diff --git "a/wandb/run-20220228_122826-3vepvy3m/files/wandb-summary.json" "b/wandb/run-20220228_122826-3vepvy3m/files/wandb-summary.json" --- "a/wandb/run-20220228_122826-3vepvy3m/files/wandb-summary.json" +++ "b/wandb/run-20220228_122826-3vepvy3m/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.3305, "train/learning_rate": 9.940000000000001e-06, "train/epoch": 0.56, "train/global_step": 500, "_runtime": 3904, "_timestamp": 1646055210, "_step": 500, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 1.0, 246.0, 762.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-66.11236572265625, -45.430301666259766, -24.74823760986328, -4.066173553466797, 16.615890502929688, 37.29795837402344, 57.980018615722656, 78.66207885742188, 99.34414672851562, 120.02621459960938, 140.70828247070312, 161.3903350830078, 182.07240295410156, 202.7544708251953, 223.4365234375, 244.11859130859375, 264.8006591796875, 285.48272705078125, 306.164794921875, 326.84686279296875, 347.5289306640625, 368.21099853515625, 388.8930358886719, 409.5751037597656, 430.2571716308594, 450.9392395019531, 471.6213073730469, 492.3033752441406, 512.9854125976562, 533.66748046875, 554.3495483398438, 575.0316162109375, 595.713623046875, 616.3956909179688, 637.0777587890625, 657.7598266601562, 678.44189453125, 699.1239624023438, 719.8060302734375, 740.488037109375, 761.170166015625, 781.8522338867188, 802.5343017578125, 823.2163696289062, 843.8984375, 864.5805053710938, 885.2625732421875, 905.944580078125, 926.6266479492188, 947.3087158203125, 967.9907836914062, 988.6728515625, 1009.3549194335938, 1030.0369873046875, 1050.718994140625, 1071.401123046875, 1092.0831298828125, 1112.76513671875, 1133.447265625, 1154.1292724609375, 1174.8114013671875, 1195.493408203125, 1216.175537109375, 1236.8575439453125, 1257.5396728515625]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 10.0, 3.0, 14.0, 13.0, 11.0, 24.0, 27.0, 32.0, 35.0, 50.0, 38.0, 43.0, 46.0, 68.0, 65.0, 54.0, 53.0, 45.0, 57.0, 51.0, 44.0, 45.0, 29.0, 32.0, 24.0, 28.0, 8.0, 14.0, 10.0, 8.0, 9.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.97714233398438, -89.7153091430664, -86.4534683227539, -83.19163513183594, -79.92979431152344, -76.66796112060547, -73.4061279296875, -70.144287109375, -66.88245391845703, -63.6206169128418, -60.35877990722656, -57.096946716308594, -53.83510971069336, -50.573272705078125, -47.311439514160156, -44.04960250854492, -40.78776550292969, -37.52592849731445, -34.26409149169922, -31.00225830078125, -27.740421295166016, -24.47858428955078, -21.21674919128418, -17.954914093017578, -14.693077087402344, -11.431241035461426, -8.169404983520508, -4.90756893157959, -1.6457328796386719, 1.6161041259765625, 4.877939224243164, 8.139774322509766, 11.401611328125, 14.663447380065918, 17.925283432006836, 21.187118530273438, 24.448955535888672, 27.710792541503906, 30.972627639770508, 34.23446273803711, 37.496299743652344, 40.75813674926758, 44.01997375488281, 47.28180694580078, 50.543643951416016, 53.80548095703125, 57.06731414794922, 60.32915115356445, 63.59098815917969, 66.85282135009766, 70.11466217041016, 73.37649536132812, 76.63833618164062, 79.9001693725586, 83.16200256347656, 86.42384338378906, 89.68567657470703, 92.947509765625, 96.2093505859375, 99.47118377685547, 102.73301696777344, 105.99485778808594, 109.2566909790039, 112.51852416992188, 115.78036499023438]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 3.0, 0.0, 6.0, 13.0, 11.0, 20.0, 16.0, 30.0, 38.0, 27.0, 48.0, 51.0, 52.0, 53.0, 69.0, 74.0, 85.0, 58.0, 66.0, 58.0, 37.0, 34.0, 35.0, 36.0, 24.0, 20.0, 14.0, 12.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1640625, -4.8896484375, -4.615234375, -4.3408203125, -4.06640625, -3.7919921875, -3.517578125, -3.2431640625, -2.96875, -2.6943359375, -2.419921875, -2.1455078125, -1.87109375, -1.5966796875, -1.322265625, -1.0478515625, -0.7734375, -0.4990234375, -0.224609375, 0.0498046875, 0.32421875, 0.5986328125, 0.873046875, 1.1474609375, 1.421875, 1.6962890625, 1.970703125, 2.2451171875, 2.51953125, 2.7939453125, 3.068359375, 3.3427734375, 3.6171875, 3.8916015625, 4.166015625, 4.4404296875, 4.71484375, 4.9892578125, 5.263671875, 5.5380859375, 5.8125, 6.0869140625, 6.361328125, 6.6357421875, 6.91015625, 7.1845703125, 7.458984375, 7.7333984375, 8.0078125, 8.2822265625, 8.556640625, 8.8310546875, 9.10546875, 9.3798828125, 9.654296875, 9.9287109375, 10.203125, 10.4775390625, 10.751953125, 11.0263671875, 11.30078125, 11.5751953125, 11.849609375, 12.1240234375, 12.3984375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 6.0, 5.0, 7.0, 16.0, 22.0, 29.0, 52.0, 54.0, 77.0, 133.0, 198.0, 321.0, 456.0, 717.0, 1150.0, 2223.0, 4863.0, 13667.0, 59172.0, 793809.0, 2888724.0, 374422.0, 35956.0, 9698.0, 3803.0, 1866.0, 1009.0, 649.0, 376.0, 280.0, 132.0, 117.0, 70.0, 54.0, 46.0, 29.0, 28.0, 16.0, 15.0, 11.0, 2.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.671875, -12.078857421875, -11.48583984375, -10.892822265625, -10.2998046875, -9.706787109375, -9.11376953125, -8.520751953125, -7.927734375, -7.334716796875, -6.74169921875, -6.148681640625, -5.5556640625, -4.962646484375, -4.36962890625, -3.776611328125, -3.18359375, -2.590576171875, -1.99755859375, -1.404541015625, -0.8115234375, -0.218505859375, 0.37451171875, 0.967529296875, 1.560546875, 2.153564453125, 2.74658203125, 3.339599609375, 3.9326171875, 4.525634765625, 5.11865234375, 5.711669921875, 6.3046875, 6.897705078125, 7.49072265625, 8.083740234375, 8.6767578125, 9.269775390625, 9.86279296875, 10.455810546875, 11.048828125, 11.641845703125, 12.23486328125, 12.827880859375, 13.4208984375, 14.013916015625, 14.60693359375, 15.199951171875, 15.79296875, 16.385986328125, 16.97900390625, 17.572021484375, 18.1650390625, 18.758056640625, 19.35107421875, 19.944091796875, 20.537109375, 21.130126953125, 21.72314453125, 22.316162109375, 22.9091796875, 23.502197265625, 24.09521484375, 24.688232421875, 25.28125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 1.0, 10.0, 13.0, 14.0, 18.0, 26.0, 45.0, 68.0, 72.0, 90.0, 155.0, 235.0, 329.0, 499.0, 536.0, 546.0, 387.0, 282.0, 211.0, 133.0, 116.0, 77.0, 50.0, 38.0, 29.0, 19.0, 15.0, 14.0, 13.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.296875, -19.6357421875, -18.974609375, -18.3134765625, -17.65234375, -16.9912109375, -16.330078125, -15.6689453125, -15.0078125, -14.3466796875, -13.685546875, -13.0244140625, -12.36328125, -11.7021484375, -11.041015625, -10.3798828125, -9.71875, -9.0576171875, -8.396484375, -7.7353515625, -7.07421875, -6.4130859375, -5.751953125, -5.0908203125, -4.4296875, -3.7685546875, -3.107421875, -2.4462890625, -1.78515625, -1.1240234375, -0.462890625, 0.1982421875, 0.859375, 1.5205078125, 2.181640625, 2.8427734375, 3.50390625, 4.1650390625, 4.826171875, 5.4873046875, 6.1484375, 6.8095703125, 7.470703125, 8.1318359375, 8.79296875, 9.4541015625, 10.115234375, 10.7763671875, 11.4375, 12.0986328125, 12.759765625, 13.4208984375, 14.08203125, 14.7431640625, 15.404296875, 16.0654296875, 16.7265625, 17.3876953125, 18.048828125, 18.7099609375, 19.37109375, 20.0322265625, 20.693359375, 21.3544921875, 22.015625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 6.0, 7.0, 12.0, 18.0, 13.0, 22.0, 20.0, 44.0, 54.0, 78.0, 95.0, 156.0, 239.0, 364.0, 620.0, 1211.0, 3232.0, 39383.0, 3811315.0, 326321.0, 6984.0, 1725.0, 842.0, 474.0, 310.0, 207.0, 136.0, 115.0, 85.0, 54.0, 42.0, 16.0, 17.0, 15.0, 10.0, 4.0, 4.0, 4.0, 5.0, 5.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-66.8125, -64.7060546875, -62.599609375, -60.4931640625, -58.38671875, -56.2802734375, -54.173828125, -52.0673828125, -49.9609375, -47.8544921875, -45.748046875, -43.6416015625, -41.53515625, -39.4287109375, -37.322265625, -35.2158203125, -33.109375, -31.0029296875, -28.896484375, -26.7900390625, -24.68359375, -22.5771484375, -20.470703125, -18.3642578125, -16.2578125, -14.1513671875, -12.044921875, -9.9384765625, -7.83203125, -5.7255859375, -3.619140625, -1.5126953125, 0.59375, 2.7001953125, 4.806640625, 6.9130859375, 9.01953125, 11.1259765625, 13.232421875, 15.3388671875, 17.4453125, 19.5517578125, 21.658203125, 23.7646484375, 25.87109375, 27.9775390625, 30.083984375, 32.1904296875, 34.296875, 36.4033203125, 38.509765625, 40.6162109375, 42.72265625, 44.8291015625, 46.935546875, 49.0419921875, 51.1484375, 53.2548828125, 55.361328125, 57.4677734375, 59.57421875, 61.6806640625, 63.787109375, 65.8935546875, 68.0]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 190.0, 730.0, 85.0, 4.0, 0.0, 0.0, 1.0], "bins": [-675.4635009765625, -663.8788452148438, -652.294189453125, -640.7095336914062, -629.1248779296875, -617.540283203125, -605.9556274414062, -594.3709716796875, -582.7863159179688, -571.20166015625, -559.6170043945312, -548.0323486328125, -536.4476928710938, -524.8630981445312, -513.2784423828125, -501.69378662109375, -490.109130859375, -478.52447509765625, -466.9398193359375, -455.3551940917969, -443.7705383300781, -432.1858825683594, -420.6012268066406, -409.0166015625, -397.4319152832031, -385.8472595214844, -374.2626037597656, -362.677978515625, -351.09332275390625, -339.5086669921875, -327.92401123046875, -316.33935546875, -304.75469970703125, -293.1700439453125, -281.58538818359375, -270.0007629394531, -258.4161071777344, -246.83145141601562, -235.24679565429688, -223.6621551513672, -212.0775146484375, -200.49285888671875, -188.90821838378906, -177.3235626220703, -165.73892211914062, -154.15426635742188, -142.56961059570312, -130.98497009277344, -119.40032196044922, -107.815673828125, -96.23102569580078, -84.64637756347656, -73.06172180175781, -61.47707748413086, -49.892425537109375, -38.307777404785156, -26.723129272460938, -15.138480186462402, -3.553831100463867, 8.030818939208984, 19.615467071533203, 31.200115203857422, 42.784767150878906, 54.369415283203125, 65.95406341552734]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 10.0, 5.0, 14.0, 19.0, 8.0, 19.0, 23.0, 26.0, 40.0, 46.0, 59.0, 43.0, 53.0, 58.0, 61.0, 58.0, 69.0, 53.0, 49.0, 50.0, 52.0, 38.0, 28.0, 33.0, 22.0, 26.0, 8.0, 11.0, 10.0, 2.0, 11.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.02938842773438, -121.90411376953125, -118.77884674072266, -115.65357208251953, -112.52830505371094, -109.40303039550781, -106.27775573730469, -103.1524887084961, -100.02721405029297, -96.90193939208984, -93.77667236328125, -90.65139770507812, -87.52613067626953, -84.4008560180664, -81.27558898925781, -78.15031433105469, -75.02503967285156, -71.89976501464844, -68.77449798583984, -65.64922332763672, -62.52395248413086, -59.398681640625, -56.27341079711914, -53.14813995361328, -50.02287292480469, -46.89760208129883, -43.77233123779297, -40.647056579589844, -37.521785736083984, -34.396514892578125, -31.271244049072266, -28.145971298217773, -25.02069854736328, -21.895427703857422, -18.77015495300293, -15.64488410949707, -12.519612312316895, -9.394340515136719, -6.269069671630859, -3.143796920776367, -0.018526077270507812, 3.106745481491089, 6.2320170402526855, 9.357288360595703, 12.482560157775879, 15.607831954956055, 18.733102798461914, 21.858375549316406, 24.983646392822266, 28.108917236328125, 31.234189987182617, 34.359458923339844, 37.48473358154297, 40.61000442504883, 43.73527526855469, 46.86054992675781, 49.985816955566406, 53.111087799072266, 56.236358642578125, 59.36163330078125, 62.48690414428711, 65.61217498779297, 68.73744201660156, 71.86271667480469, 74.98799133300781]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 10.0, 7.0, 9.0, 13.0, 16.0, 23.0, 13.0, 17.0, 27.0, 29.0, 27.0, 34.0, 35.0, 28.0, 46.0, 43.0, 47.0, 44.0, 51.0, 51.0, 47.0, 30.0, 37.0, 35.0, 43.0, 39.0, 27.0, 31.0, 20.0, 18.0, 21.0, 11.0, 14.0, 14.0, 6.0, 6.0, 13.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.16015625, -5.9569091796875, -5.753662109375, -5.5504150390625, -5.34716796875, -5.1439208984375, -4.940673828125, -4.7374267578125, -4.5341796875, -4.3309326171875, -4.127685546875, -3.9244384765625, -3.72119140625, -3.5179443359375, -3.314697265625, -3.1114501953125, -2.908203125, -2.7049560546875, -2.501708984375, -2.2984619140625, -2.09521484375, -1.8919677734375, -1.688720703125, -1.4854736328125, -1.2822265625, -1.0789794921875, -0.875732421875, -0.6724853515625, -0.46923828125, -0.2659912109375, -0.062744140625, 0.1405029296875, 0.34375, 0.5469970703125, 0.750244140625, 0.9534912109375, 1.15673828125, 1.3599853515625, 1.563232421875, 1.7664794921875, 1.9697265625, 2.1729736328125, 2.376220703125, 2.5794677734375, 2.78271484375, 2.9859619140625, 3.189208984375, 3.3924560546875, 3.595703125, 3.7989501953125, 4.002197265625, 4.2054443359375, 4.40869140625, 4.6119384765625, 4.815185546875, 5.0184326171875, 5.2216796875, 5.4249267578125, 5.628173828125, 5.8314208984375, 6.03466796875, 6.2379150390625, 6.441162109375, 6.6444091796875, 6.84765625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 1.0, 6.0, 16.0, 23.0, 18.0, 29.0, 47.0, 77.0, 90.0, 146.0, 252.0, 323.0, 565.0, 794.0, 1292.0, 1972.0, 3106.0, 5027.0, 7968.0, 13174.0, 21636.0, 37156.0, 65955.0, 128050.0, 357656.0, 195691.0, 87918.0, 48153.0, 27742.0, 16579.0, 10082.0, 6189.0, 3905.0, 2428.0, 1564.0, 971.0, 713.0, 401.0, 278.0, 190.0, 109.0, 81.0, 80.0, 28.0, 30.0, 20.0, 7.0, 6.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.38671875, -1.343017578125, -1.29931640625, -1.255615234375, -1.2119140625, -1.168212890625, -1.12451171875, -1.080810546875, -1.037109375, -0.993408203125, -0.94970703125, -0.906005859375, -0.8623046875, -0.818603515625, -0.77490234375, -0.731201171875, -0.6875, -0.643798828125, -0.60009765625, -0.556396484375, -0.5126953125, -0.468994140625, -0.42529296875, -0.381591796875, -0.337890625, -0.294189453125, -0.25048828125, -0.206787109375, -0.1630859375, -0.119384765625, -0.07568359375, -0.031982421875, 0.01171875, 0.055419921875, 0.09912109375, 0.142822265625, 0.1865234375, 0.230224609375, 0.27392578125, 0.317626953125, 0.361328125, 0.405029296875, 0.44873046875, 0.492431640625, 0.5361328125, 0.579833984375, 0.62353515625, 0.667236328125, 0.7109375, 0.754638671875, 0.79833984375, 0.842041015625, 0.8857421875, 0.929443359375, 0.97314453125, 1.016845703125, 1.060546875, 1.104248046875, 1.14794921875, 1.191650390625, 1.2353515625, 1.279052734375, 1.32275390625, 1.366455078125, 1.41015625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 6.0, 10.0, 4.0, 14.0, 7.0, 14.0, 11.0, 22.0, 16.0, 29.0, 28.0, 28.0, 35.0, 27.0, 25.0, 29.0, 41.0, 48.0, 44.0, 44.0, 1056.0, 33.0, 40.0, 39.0, 45.0, 32.0, 29.0, 38.0, 27.0, 25.0, 27.0, 21.0, 22.0, 14.0, 10.0, 9.0, 16.0, 14.0, 10.0, 11.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.927734375, -3.804046630859375, -3.68035888671875, -3.556671142578125, -3.4329833984375, -3.309295654296875, -3.18560791015625, -3.061920166015625, -2.938232421875, -2.814544677734375, -2.69085693359375, -2.567169189453125, -2.4434814453125, -2.319793701171875, -2.19610595703125, -2.072418212890625, -1.94873046875, -1.825042724609375, -1.70135498046875, -1.577667236328125, -1.4539794921875, -1.330291748046875, -1.20660400390625, -1.082916259765625, -0.959228515625, -0.835540771484375, -0.71185302734375, -0.588165283203125, -0.4644775390625, -0.340789794921875, -0.21710205078125, -0.093414306640625, 0.0302734375, 0.153961181640625, 0.27764892578125, 0.401336669921875, 0.5250244140625, 0.648712158203125, 0.77239990234375, 0.896087646484375, 1.019775390625, 1.143463134765625, 1.26715087890625, 1.390838623046875, 1.5145263671875, 1.638214111328125, 1.76190185546875, 1.885589599609375, 2.00927734375, 2.132965087890625, 2.25665283203125, 2.380340576171875, 2.5040283203125, 2.627716064453125, 2.75140380859375, 2.875091552734375, 2.998779296875, 3.122467041015625, 3.24615478515625, 3.369842529296875, 3.4935302734375, 3.617218017578125, 3.74090576171875, 3.864593505859375, 3.98828125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 9.0, 9.0, 10.0, 14.0, 15.0, 20.0, 25.0, 46.0, 57.0, 89.0, 127.0, 184.0, 288.0, 398.0, 589.0, 809.0, 1213.0, 1808.0, 2660.0, 4056.0, 5924.0, 9019.0, 13924.0, 21269.0, 33193.0, 52823.0, 93054.0, 208115.0, 1351021.0, 120413.0, 63897.0, 38826.0, 25131.0, 16407.0, 10751.0, 7031.0, 4706.0, 3069.0, 2059.0, 1317.0, 897.0, 612.0, 400.0, 256.0, 205.0, 137.0, 85.0, 45.0, 47.0, 26.0, 17.0, 14.0, 10.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.2001953125, -1.16290283203125, -1.1256103515625, -1.08831787109375, -1.051025390625, -1.01373291015625, -0.9764404296875, -0.93914794921875, -0.90185546875, -0.86456298828125, -0.8272705078125, -0.78997802734375, -0.752685546875, -0.71539306640625, -0.6781005859375, -0.64080810546875, -0.603515625, -0.56622314453125, -0.5289306640625, -0.49163818359375, -0.454345703125, -0.41705322265625, -0.3797607421875, -0.34246826171875, -0.30517578125, -0.26788330078125, -0.2305908203125, -0.19329833984375, -0.156005859375, -0.11871337890625, -0.0814208984375, -0.04412841796875, -0.0068359375, 0.03045654296875, 0.0677490234375, 0.10504150390625, 0.142333984375, 0.17962646484375, 0.2169189453125, 0.25421142578125, 0.29150390625, 0.32879638671875, 0.3660888671875, 0.40338134765625, 0.440673828125, 0.47796630859375, 0.5152587890625, 0.55255126953125, 0.58984375, 0.62713623046875, 0.6644287109375, 0.70172119140625, 0.739013671875, 0.77630615234375, 0.8135986328125, 0.85089111328125, 0.88818359375, 0.92547607421875, 0.9627685546875, 1.00006103515625, 1.037353515625, 1.07464599609375, 1.1119384765625, 1.14923095703125, 1.1865234375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 6.0, 9.0, 3.0, 8.0, 7.0, 15.0, 15.0, 20.0, 30.0, 29.0, 44.0, 59.0, 60.0, 62.0, 82.0, 96.0, 76.0, 68.0, 49.0, 52.0, 47.0, 36.0, 25.0, 19.0, 18.0, 11.0, 6.0, 7.0, 3.0, 9.0, 6.0, 4.0, 2.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0009889602661132812, -0.0009608566761016846, -0.0009327530860900879, -0.0009046494960784912, -0.0008765459060668945, -0.0008484423160552979, -0.0008203387260437012, -0.0007922351360321045, -0.0007641315460205078, -0.0007360279560089111, -0.0007079243659973145, -0.0006798207759857178, -0.0006517171859741211, -0.0006236135959625244, -0.0005955100059509277, -0.0005674064159393311, -0.0005393028259277344, -0.0005111992359161377, -0.000483095645904541, -0.00045499205589294434, -0.00042688846588134766, -0.000398784875869751, -0.0003706812858581543, -0.0003425776958465576, -0.00031447410583496094, -0.00028637051582336426, -0.0002582669258117676, -0.0002301633358001709, -0.00020205974578857422, -0.00017395615577697754, -0.00014585256576538086, -0.00011774897575378418, -8.96453857421875e-05, -6.154179573059082e-05, -3.343820571899414e-05, -5.334615707397461e-06, 2.276897430419922e-05, 5.08725643157959e-05, 7.897615432739258e-05, 0.00010707974433898926, 0.00013518333435058594, 0.00016328692436218262, 0.0001913905143737793, 0.00021949410438537598, 0.00024759769439697266, 0.00027570128440856934, 0.000303804874420166, 0.0003319084644317627, 0.0003600120544433594, 0.00038811564445495605, 0.00041621923446655273, 0.0004443228244781494, 0.0004724264144897461, 0.0005005300045013428, 0.0005286335945129395, 0.0005567371845245361, 0.0005848407745361328, 0.0006129443645477295, 0.0006410479545593262, 0.0006691515445709229, 0.0006972551345825195, 0.0007253587245941162, 0.0007534623146057129, 0.0007815659046173096, 0.0008096694946289062]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 5.0, 7.0, 11.0, 17.0, 12.0, 26.0, 19.0, 25.0, 30.0, 50.0, 76.0, 119.0, 172.0, 197.0, 297.0, 476.0, 835.0, 70687.0, 972687.0, 1090.0, 514.0, 339.0, 220.0, 175.0, 104.0, 78.0, 66.0, 49.0, 23.0, 19.0, 28.0, 17.0, 19.0, 11.0, 11.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0152435302734375, -0.014737367630004883, -0.014231204986572266, -0.013725042343139648, -0.013218879699707031, -0.012712717056274414, -0.012206554412841797, -0.01170039176940918, -0.011194229125976562, -0.010688066482543945, -0.010181903839111328, -0.009675741195678711, -0.009169578552246094, -0.008663415908813477, -0.00815725326538086, -0.007651090621948242, -0.007144927978515625, -0.006638765335083008, -0.006132602691650391, -0.0056264400482177734, -0.005120277404785156, -0.004614114761352539, -0.004107952117919922, -0.0036017894744873047, -0.0030956268310546875, -0.0025894641876220703, -0.002083301544189453, -0.001577138900756836, -0.0010709762573242188, -0.0005648136138916016, -5.8650970458984375e-05, 0.0004475116729736328, 0.00095367431640625, 0.0014598369598388672, 0.0019659996032714844, 0.0024721622467041016, 0.0029783248901367188, 0.003484487533569336, 0.003990650177001953, 0.00449681282043457, 0.0050029754638671875, 0.005509138107299805, 0.006015300750732422, 0.006521463394165039, 0.007027626037597656, 0.0075337886810302734, 0.00803995132446289, 0.008546113967895508, 0.009052276611328125, 0.009558439254760742, 0.01006460189819336, 0.010570764541625977, 0.011076927185058594, 0.011583089828491211, 0.012089252471923828, 0.012595415115356445, 0.013101577758789062, 0.01360774040222168, 0.014113903045654297, 0.014620065689086914, 0.015126228332519531, 0.01563239097595215, 0.016138553619384766, 0.016644716262817383, 0.01715087890625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 17.0, 68.0, 307.0, 456.0, 135.0, 21.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0017846140544861555, -0.001752868527546525, -0.0017211231170222163, -0.0016893777064979076, -0.0016576321795582771, -0.0016258866526186466, -0.001594141242094338, -0.0015623958315700293, -0.0015306503046303988, -0.0014989047776907682, -0.0014671593671664596, -0.0014354139566421509, -0.0014036684297025204, -0.0013719229027628899, -0.0013401774922385812, -0.0013084320817142725, -0.001276686554774642, -0.0012449410278350115, -0.0012131956173107028, -0.0011814502067863941, -0.0011497046798467636, -0.001117959152907133, -0.0010862137423828244, -0.0010544683318585157, -0.0010227228049188852, -0.0009909772779792547, -0.000959231867454946, -0.0009274863987229764, -0.0008957409299910069, -0.0008639954612590373, -0.0008322499925270677, -0.0008005045237950981, -0.0007687590550631285, -0.0007370135863311589, -0.0007052681175991893, -0.0006735226488672197, -0.0006417771801352501, -0.0006100317114032805, -0.0005782862426713109, -0.0005465407739393413, -0.0005147953052073717, -0.0004830498364754021, -0.0004513043677434325, -0.0004195588990114629, -0.00038781343027949333, -0.00035606796154752374, -0.00032432249281555414, -0.00029257702408358455, -0.0002608315844554454, -0.00022908611572347581, -0.00019734064699150622, -0.00016559517825953662, -0.00013384970952756703, -0.00010210424079559743, -7.035877206362784e-05, -3.8613303331658244e-05, -6.867834599688649e-06, 2.4877634132280946e-05, 5.662310286425054e-05, 8.836857159622014e-05, 0.00012011404032818973, 0.00015185950906015933, 0.00018360497779212892, 0.00021535044652409852, 0.0002470959152560681]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 9.0, 8.0, 7.0, 16.0, 19.0, 11.0, 17.0, 22.0, 16.0, 21.0, 30.0, 36.0, 39.0, 29.0, 41.0, 35.0, 29.0, 47.0, 33.0, 53.0, 36.0, 42.0, 42.0, 46.0, 30.0, 32.0, 25.0, 37.0, 26.0, 22.0, 19.0, 17.0, 19.0, 13.0, 18.0, 7.0, 12.0, 8.0, 8.0, 6.0, 8.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00038999319076538086, -0.00037722568958997726, -0.00036445818841457367, -0.0003516906872391701, -0.0003389231860637665, -0.0003261556848883629, -0.0003133881837129593, -0.0003006206825375557, -0.0002878531813621521, -0.0002750856801867485, -0.0002623181790113449, -0.0002495506778359413, -0.00023678317666053772, -0.00022401567548513412, -0.00021124817430973053, -0.00019848067313432693, -0.00018571317195892334, -0.00017294567078351974, -0.00016017816960811615, -0.00014741066843271255, -0.00013464316725730896, -0.00012187566608190536, -0.00010910816490650177, -9.634066373109818e-05, -8.357316255569458e-05, -7.080566138029099e-05, -5.803816020488739e-05, -4.5270659029483795e-05, -3.25031578540802e-05, -1.9735656678676605e-05, -6.96815550327301e-06, 5.799345672130585e-06, 1.856684684753418e-05, 3.1334348022937775e-05, 4.410184919834137e-05, 5.6869350373744965e-05, 6.963685154914856e-05, 8.240435272455215e-05, 9.517185389995575e-05, 0.00010793935507535934, 0.00012070685625076294, 0.00013347435742616653, 0.00014624185860157013, 0.00015900935977697372, 0.00017177686095237732, 0.00018454436212778091, 0.0001973118633031845, 0.0002100793644785881, 0.0002228468656539917, 0.0002356143668293953, 0.0002483818680047989, 0.0002611493691802025, 0.0002739168703556061, 0.0002866843715310097, 0.00029945187270641327, 0.00031221937388181686, 0.00032498687505722046, 0.00033775437623262405, 0.00035052187740802765, 0.00036328937858343124, 0.00037605687975883484, 0.00038882438093423843, 0.00040159188210964203, 0.0004143593832850456, 0.0004271268844604492]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 10.0, 7.0, 9.0, 13.0, 16.0, 23.0, 13.0, 17.0, 27.0, 29.0, 27.0, 34.0, 35.0, 28.0, 46.0, 43.0, 47.0, 44.0, 51.0, 51.0, 47.0, 30.0, 37.0, 35.0, 43.0, 39.0, 27.0, 31.0, 20.0, 18.0, 21.0, 11.0, 14.0, 14.0, 6.0, 6.0, 13.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.16015625, -5.9569091796875, -5.753662109375, -5.5504150390625, -5.34716796875, -5.1439208984375, -4.940673828125, -4.7374267578125, -4.5341796875, -4.3309326171875, -4.127685546875, -3.9244384765625, -3.72119140625, -3.5179443359375, -3.314697265625, -3.1114501953125, -2.908203125, -2.7049560546875, -2.501708984375, -2.2984619140625, -2.09521484375, -1.8919677734375, -1.688720703125, -1.4854736328125, -1.2822265625, -1.0789794921875, -0.875732421875, -0.6724853515625, -0.46923828125, -0.2659912109375, -0.062744140625, 0.1405029296875, 0.34375, 0.5469970703125, 0.750244140625, 0.9534912109375, 1.15673828125, 1.3599853515625, 1.563232421875, 1.7664794921875, 1.9697265625, 2.1729736328125, 2.376220703125, 2.5794677734375, 2.78271484375, 2.9859619140625, 3.189208984375, 3.3924560546875, 3.595703125, 3.7989501953125, 4.002197265625, 4.2054443359375, 4.40869140625, 4.6119384765625, 4.815185546875, 5.0184326171875, 5.2216796875, 5.4249267578125, 5.628173828125, 5.8314208984375, 6.03466796875, 6.2379150390625, 6.441162109375, 6.6444091796875, 6.84765625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 8.0, 15.0, 19.0, 35.0, 39.0, 41.0, 64.0, 72.0, 129.0, 151.0, 234.0, 307.0, 386.0, 582.0, 805.0, 1146.0, 1612.0, 2428.0, 3727.0, 6515.0, 13822.0, 48454.0, 844162.0, 86182.0, 16960.0, 7630.0, 4256.0, 2645.0, 1712.0, 1235.0, 920.0, 611.0, 427.0, 342.0, 232.0, 151.0, 159.0, 92.0, 60.0, 47.0, 36.0, 36.0, 17.0, 17.0, 8.0, 12.0, 5.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0], "bins": [-41.28125, -40.05322265625, -38.8251953125, -37.59716796875, -36.369140625, -35.14111328125, -33.9130859375, -32.68505859375, -31.45703125, -30.22900390625, -29.0009765625, -27.77294921875, -26.544921875, -25.31689453125, -24.0888671875, -22.86083984375, -21.6328125, -20.40478515625, -19.1767578125, -17.94873046875, -16.720703125, -15.49267578125, -14.2646484375, -13.03662109375, -11.80859375, -10.58056640625, -9.3525390625, -8.12451171875, -6.896484375, -5.66845703125, -4.4404296875, -3.21240234375, -1.984375, -0.75634765625, 0.4716796875, 1.69970703125, 2.927734375, 4.15576171875, 5.3837890625, 6.61181640625, 7.83984375, 9.06787109375, 10.2958984375, 11.52392578125, 12.751953125, 13.97998046875, 15.2080078125, 16.43603515625, 17.6640625, 18.89208984375, 20.1201171875, 21.34814453125, 22.576171875, 23.80419921875, 25.0322265625, 26.26025390625, 27.48828125, 28.71630859375, 29.9443359375, 31.17236328125, 32.400390625, 33.62841796875, 34.8564453125, 36.08447265625, 37.3125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 2.0, 3.0, 6.0, 5.0, 11.0, 8.0, 14.0, 18.0, 5.0, 18.0, 17.0, 35.0, 27.0, 28.0, 30.0, 56.0, 51.0, 61.0, 59.0, 181.0, 1723.0, 189.0, 68.0, 49.0, 51.0, 43.0, 38.0, 28.0, 31.0, 34.0, 36.0, 20.0, 11.0, 20.0, 17.0, 15.0, 9.0, 9.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.71875, -20.11865234375, -19.5185546875, -18.91845703125, -18.318359375, -17.71826171875, -17.1181640625, -16.51806640625, -15.91796875, -15.31787109375, -14.7177734375, -14.11767578125, -13.517578125, -12.91748046875, -12.3173828125, -11.71728515625, -11.1171875, -10.51708984375, -9.9169921875, -9.31689453125, -8.716796875, -8.11669921875, -7.5166015625, -6.91650390625, -6.31640625, -5.71630859375, -5.1162109375, -4.51611328125, -3.916015625, -3.31591796875, -2.7158203125, -2.11572265625, -1.515625, -0.91552734375, -0.3154296875, 0.28466796875, 0.884765625, 1.48486328125, 2.0849609375, 2.68505859375, 3.28515625, 3.88525390625, 4.4853515625, 5.08544921875, 5.685546875, 6.28564453125, 6.8857421875, 7.48583984375, 8.0859375, 8.68603515625, 9.2861328125, 9.88623046875, 10.486328125, 11.08642578125, 11.6865234375, 12.28662109375, 12.88671875, 13.48681640625, 14.0869140625, 14.68701171875, 15.287109375, 15.88720703125, 16.4873046875, 17.08740234375, 17.6875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 2.0, 8.0, 6.0, 6.0, 6.0, 12.0, 15.0, 17.0, 14.0, 15.0, 29.0, 30.0, 27.0, 33.0, 46.0, 51.0, 100.0, 156.0, 429.0, 2227.0, 3050671.0, 90119.0, 991.0, 242.0, 118.0, 82.0, 55.0, 31.0, 34.0, 22.0, 17.0, 15.0, 17.0, 10.0, 19.0, 4.0, 10.0, 6.0, 3.0, 5.0, 1.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.3125, -78.5849609375, -75.857421875, -73.1298828125, -70.40234375, -67.6748046875, -64.947265625, -62.2197265625, -59.4921875, -56.7646484375, -54.037109375, -51.3095703125, -48.58203125, -45.8544921875, -43.126953125, -40.3994140625, -37.671875, -34.9443359375, -32.216796875, -29.4892578125, -26.76171875, -24.0341796875, -21.306640625, -18.5791015625, -15.8515625, -13.1240234375, -10.396484375, -7.6689453125, -4.94140625, -2.2138671875, 0.513671875, 3.2412109375, 5.96875, 8.6962890625, 11.423828125, 14.1513671875, 16.87890625, 19.6064453125, 22.333984375, 25.0615234375, 27.7890625, 30.5166015625, 33.244140625, 35.9716796875, 38.69921875, 41.4267578125, 44.154296875, 46.8818359375, 49.609375, 52.3369140625, 55.064453125, 57.7919921875, 60.51953125, 63.2470703125, 65.974609375, 68.7021484375, 71.4296875, 74.1572265625, 76.884765625, 79.6123046875, 82.33984375, 85.0673828125, 87.794921875, 90.5224609375, 93.25]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 7.0, 84.0, 756.0, 163.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-235.33775329589844, -231.24969482421875, -227.16163635253906, -223.07359313964844, -218.98553466796875, -214.89747619628906, -210.80941772460938, -206.7213592529297, -202.63330078125, -198.5452423095703, -194.45718383789062, -190.369140625, -186.2810821533203, -182.19302368164062, -178.10496520996094, -174.01690673828125, -169.92886352539062, -165.84080505371094, -161.75274658203125, -157.66470336914062, -153.57664489746094, -149.48858642578125, -145.40052795410156, -141.31246948242188, -137.22442626953125, -133.13636779785156, -129.04830932617188, -124.96025848388672, -120.87220764160156, -116.78414916992188, -112.69609069824219, -108.6080322265625, -104.51998901367188, -100.43193054199219, -96.34387969970703, -92.25582122802734, -88.16777038574219, -84.0797119140625, -79.99165344238281, -75.90359497070312, -71.81554412841797, -67.72748565673828, -63.639434814453125, -59.55137634277344, -55.463321685791016, -51.375267028808594, -47.287208557128906, -43.199153900146484, -39.11109924316406, -35.02304458618164, -30.934988021850586, -26.84693145751953, -22.75887680053711, -18.670822143554688, -14.582765579223633, -10.494709014892578, -6.406652450561523, -2.318596839904785, 1.7694587707519531, 5.857514381408691, 9.94556999206543, 14.033624649047852, 18.121681213378906, 22.20973777770996, 26.297792434692383]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 4.0, 9.0, 10.0, 8.0, 10.0, 13.0, 13.0, 13.0, 16.0, 26.0, 20.0, 25.0, 25.0, 20.0, 28.0, 42.0, 33.0, 41.0, 37.0, 37.0, 41.0, 46.0, 46.0, 47.0, 39.0, 35.0, 34.0, 33.0, 35.0, 29.0, 30.0, 13.0, 23.0, 18.0, 15.0, 18.0, 11.0, 7.0, 14.0, 7.0, 8.0, 7.0, 8.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-62.762062072753906, -61.041603088378906, -59.321144104003906, -57.60068893432617, -55.88022994995117, -54.15977096557617, -52.43931198120117, -50.71885681152344, -48.99839782714844, -47.27793884277344, -45.55747985839844, -43.8370246887207, -42.1165657043457, -40.3961067199707, -38.6756477355957, -36.95519256591797, -35.23473358154297, -33.51427459716797, -31.7938175201416, -30.0733585357666, -28.352901458740234, -26.632442474365234, -24.911983489990234, -23.191526412963867, -21.471065521240234, -19.750606536865234, -18.030149459838867, -16.309690475463867, -14.5892333984375, -12.8687744140625, -11.148316383361816, -9.427858352661133, -7.707401275634766, -5.986943244934082, -4.266485214233398, -2.5460267066955566, -0.825568675994873, 0.8948898315429688, 2.6153478622436523, 4.335805892944336, 6.0562639236450195, 7.776721954345703, 9.497179985046387, 11.21763801574707, 12.93809700012207, 14.658555030822754, 16.379013061523438, 18.099472045898438, 19.819929122924805, 21.540388107299805, 23.260845184326172, 24.981304168701172, 26.70176124572754, 28.42222023010254, 30.142677307128906, 31.863136291503906, 33.583595275878906, 35.304054260253906, 37.024513244628906, 38.74496841430664, 40.46542739868164, 42.18588638305664, 43.90634536743164, 45.626800537109375, 47.347259521484375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 4.0, 4.0, 6.0, 4.0, 7.0, 9.0, 9.0, 22.0, 16.0, 18.0, 17.0, 18.0, 35.0, 27.0, 28.0, 30.0, 37.0, 40.0, 45.0, 38.0, 55.0, 44.0, 49.0, 44.0, 37.0, 33.0, 40.0, 35.0, 37.0, 40.0, 22.0, 27.0, 22.0, 17.0, 14.0, 12.0, 8.0, 17.0, 8.0, 8.0, 1.0, 8.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.3671875, -6.1588134765625, -5.950439453125, -5.7420654296875, -5.53369140625, -5.3253173828125, -5.116943359375, -4.9085693359375, -4.7001953125, -4.4918212890625, -4.283447265625, -4.0750732421875, -3.86669921875, -3.6583251953125, -3.449951171875, -3.2415771484375, -3.033203125, -2.8248291015625, -2.616455078125, -2.4080810546875, -2.19970703125, -1.9913330078125, -1.782958984375, -1.5745849609375, -1.3662109375, -1.1578369140625, -0.949462890625, -0.7410888671875, -0.53271484375, -0.3243408203125, -0.115966796875, 0.0924072265625, 0.30078125, 0.5091552734375, 0.717529296875, 0.9259033203125, 1.13427734375, 1.3426513671875, 1.551025390625, 1.7593994140625, 1.9677734375, 2.1761474609375, 2.384521484375, 2.5928955078125, 2.80126953125, 3.0096435546875, 3.218017578125, 3.4263916015625, 3.634765625, 3.8431396484375, 4.051513671875, 4.2598876953125, 4.46826171875, 4.6766357421875, 4.885009765625, 5.0933837890625, 5.3017578125, 5.5101318359375, 5.718505859375, 5.9268798828125, 6.13525390625, 6.3436279296875, 6.552001953125, 6.7603759765625, 6.96875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 6.0, 7.0, 10.0, 9.0, 11.0, 13.0, 20.0, 43.0, 45.0, 84.0, 86.0, 134.0, 217.0, 366.0, 612.0, 1151.0, 2111.0, 4404.0, 9380.0, 24076.0, 104128.0, 2981329.0, 982368.0, 54196.0, 16045.0, 6636.0, 3063.0, 1542.0, 857.0, 460.0, 289.0, 184.0, 115.0, 72.0, 52.0, 39.0, 35.0, 22.0, 11.0, 14.0, 6.0, 10.0, 8.0, 2.0, 5.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-35.84375, -34.6806640625, -33.517578125, -32.3544921875, -31.19140625, -30.0283203125, -28.865234375, -27.7021484375, -26.5390625, -25.3759765625, -24.212890625, -23.0498046875, -21.88671875, -20.7236328125, -19.560546875, -18.3974609375, -17.234375, -16.0712890625, -14.908203125, -13.7451171875, -12.58203125, -11.4189453125, -10.255859375, -9.0927734375, -7.9296875, -6.7666015625, -5.603515625, -4.4404296875, -3.27734375, -2.1142578125, -0.951171875, 0.2119140625, 1.375, 2.5380859375, 3.701171875, 4.8642578125, 6.02734375, 7.1904296875, 8.353515625, 9.5166015625, 10.6796875, 11.8427734375, 13.005859375, 14.1689453125, 15.33203125, 16.4951171875, 17.658203125, 18.8212890625, 19.984375, 21.1474609375, 22.310546875, 23.4736328125, 24.63671875, 25.7998046875, 26.962890625, 28.1259765625, 29.2890625, 30.4521484375, 31.615234375, 32.7783203125, 33.94140625, 35.1044921875, 36.267578125, 37.4306640625, 38.59375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 1.0, 2.0, 6.0, 6.0, 3.0, 12.0, 14.0, 20.0, 20.0, 30.0, 42.0, 54.0, 82.0, 87.0, 123.0, 169.0, 260.0, 371.0, 498.0, 587.0, 491.0, 361.0, 231.0, 144.0, 119.0, 82.0, 62.0, 54.0, 34.0, 24.0, 15.0, 24.0, 14.0, 5.0, 7.0, 5.0, 2.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-26.6875, -25.80908203125, -24.9306640625, -24.05224609375, -23.173828125, -22.29541015625, -21.4169921875, -20.53857421875, -19.66015625, -18.78173828125, -17.9033203125, -17.02490234375, -16.146484375, -15.26806640625, -14.3896484375, -13.51123046875, -12.6328125, -11.75439453125, -10.8759765625, -9.99755859375, -9.119140625, -8.24072265625, -7.3623046875, -6.48388671875, -5.60546875, -4.72705078125, -3.8486328125, -2.97021484375, -2.091796875, -1.21337890625, -0.3349609375, 0.54345703125, 1.421875, 2.30029296875, 3.1787109375, 4.05712890625, 4.935546875, 5.81396484375, 6.6923828125, 7.57080078125, 8.44921875, 9.32763671875, 10.2060546875, 11.08447265625, 11.962890625, 12.84130859375, 13.7197265625, 14.59814453125, 15.4765625, 16.35498046875, 17.2333984375, 18.11181640625, 18.990234375, 19.86865234375, 20.7470703125, 21.62548828125, 22.50390625, 23.38232421875, 24.2607421875, 25.13916015625, 26.017578125, 26.89599609375, 27.7744140625, 28.65283203125, 29.53125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 7.0, 7.0, 9.0, 22.0, 27.0, 16.0, 26.0, 52.0, 73.0, 84.0, 117.0, 195.0, 331.0, 729.0, 4906.0, 4082478.0, 102502.0, 1419.0, 442.0, 244.0, 156.0, 108.0, 77.0, 64.0, 43.0, 31.0, 24.0, 20.0, 15.0, 7.0, 6.0, 7.0, 4.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.875, -124.681640625, -120.48828125, -116.294921875, -112.1015625, -107.908203125, -103.71484375, -99.521484375, -95.328125, -91.134765625, -86.94140625, -82.748046875, -78.5546875, -74.361328125, -70.16796875, -65.974609375, -61.78125, -57.587890625, -53.39453125, -49.201171875, -45.0078125, -40.814453125, -36.62109375, -32.427734375, -28.234375, -24.041015625, -19.84765625, -15.654296875, -11.4609375, -7.267578125, -3.07421875, 1.119140625, 5.3125, 9.505859375, 13.69921875, 17.892578125, 22.0859375, 26.279296875, 30.47265625, 34.666015625, 38.859375, 43.052734375, 47.24609375, 51.439453125, 55.6328125, 59.826171875, 64.01953125, 68.212890625, 72.40625, 76.599609375, 80.79296875, 84.986328125, 89.1796875, 93.373046875, 97.56640625, 101.759765625, 105.953125, 110.146484375, 114.33984375, 118.533203125, 122.7265625, 126.919921875, 131.11328125, 135.306640625, 139.5]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 30.0, 106.0, 265.0, 347.0, 182.0, 61.0, 16.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.61618041992188, -123.90042877197266, -119.18467712402344, -114.46892547607422, -109.753173828125, -105.03741455078125, -100.32166290283203, -95.60591125488281, -90.8901596069336, -86.17440795898438, -81.45865631103516, -76.74290466308594, -72.02714538574219, -67.3114013671875, -62.59564208984375, -57.87989044189453, -53.16413879394531, -48.448387145996094, -43.732635498046875, -39.01688003540039, -34.30112838745117, -29.585376739501953, -24.8696231842041, -20.15386962890625, -15.438117980957031, -10.722365379333496, -6.006612777709961, -1.2908601760864258, 3.4248924255371094, 8.140644073486328, 12.85639762878418, 17.57215118408203, 22.28790283203125, 27.00365447998047, 31.71940803527832, 36.43516159057617, 41.15091323852539, 45.86666488647461, 50.582420349121094, 55.29817199707031, 60.01392364501953, 64.72967529296875, 69.44542694091797, 74.16117858886719, 78.87693786621094, 83.59268188476562, 88.30844116210938, 93.0241928100586, 97.73994445800781, 102.45569610595703, 107.17144775390625, 111.88719940185547, 116.60295104980469, 121.31871032714844, 126.03446197509766, 130.75021362304688, 135.46597290039062, 140.18173217773438, 144.89747619628906, 149.6132354736328, 154.3289794921875, 159.04473876953125, 163.76048278808594, 168.4762420654297, 173.19198608398438]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 5.0, 5.0, 7.0, 5.0, 7.0, 10.0, 18.0, 12.0, 14.0, 18.0, 20.0, 24.0, 30.0, 21.0, 44.0, 24.0, 32.0, 32.0, 36.0, 46.0, 42.0, 51.0, 42.0, 29.0, 52.0, 34.0, 38.0, 36.0, 33.0, 24.0, 38.0, 26.0, 23.0, 20.0, 17.0, 23.0, 15.0, 10.0, 6.0, 10.0, 7.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.61894226074219, -78.90320587158203, -76.18746948242188, -73.47174072265625, -70.7560043334961, -68.04026794433594, -65.32453918457031, -62.608802795410156, -59.89306640625, -57.177330017089844, -54.46159744262695, -51.74586486816406, -49.030128479003906, -46.31439208984375, -43.59865951538086, -40.88292694091797, -38.16719055175781, -35.451454162597656, -32.735721588134766, -30.019987106323242, -27.30425262451172, -24.588518142700195, -21.872783660888672, -19.15704917907715, -16.441314697265625, -13.725580215454102, -11.009845733642578, -8.294111251831055, -5.578376770019531, -2.862642288208008, -0.14690780639648438, 2.568826675415039, 5.284568786621094, 8.000303268432617, 10.71603775024414, 13.431772232055664, 16.147506713867188, 18.86324119567871, 21.578975677490234, 24.294710159301758, 27.01044464111328, 29.726179122924805, 32.44191360473633, 35.15764617919922, 37.873382568359375, 40.58911895751953, 43.30485153198242, 46.02058410644531, 48.73632049560547, 51.452056884765625, 54.167789459228516, 56.883522033691406, 59.59925842285156, 62.31499481201172, 65.03073120117188, 67.7464599609375, 70.46219635009766, 73.17793273925781, 75.89366149902344, 78.6093978881836, 81.32513427734375, 84.0408706665039, 86.75660705566406, 89.47233581542969, 92.18807220458984]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 1.0, 6.0, 1.0, 9.0, 9.0, 12.0, 13.0, 12.0, 13.0, 15.0, 24.0, 29.0, 37.0, 29.0, 34.0, 30.0, 30.0, 53.0, 48.0, 40.0, 44.0, 40.0, 44.0, 42.0, 47.0, 43.0, 37.0, 43.0, 34.0, 30.0, 24.0, 23.0, 15.0, 15.0, 16.0, 7.0, 12.0, 10.0, 6.0, 11.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.76953125, -6.5518798828125, -6.334228515625, -6.1165771484375, -5.89892578125, -5.6812744140625, -5.463623046875, -5.2459716796875, -5.0283203125, -4.8106689453125, -4.593017578125, -4.3753662109375, -4.15771484375, -3.9400634765625, -3.722412109375, -3.5047607421875, -3.287109375, -3.0694580078125, -2.851806640625, -2.6341552734375, -2.41650390625, -2.1988525390625, -1.981201171875, -1.7635498046875, -1.5458984375, -1.3282470703125, -1.110595703125, -0.8929443359375, -0.67529296875, -0.4576416015625, -0.239990234375, -0.0223388671875, 0.1953125, 0.4129638671875, 0.630615234375, 0.8482666015625, 1.06591796875, 1.2835693359375, 1.501220703125, 1.7188720703125, 1.9365234375, 2.1541748046875, 2.371826171875, 2.5894775390625, 2.80712890625, 3.0247802734375, 3.242431640625, 3.4600830078125, 3.677734375, 3.8953857421875, 4.113037109375, 4.3306884765625, 4.54833984375, 4.7659912109375, 4.983642578125, 5.2012939453125, 5.4189453125, 5.6365966796875, 5.854248046875, 6.0718994140625, 6.28955078125, 6.5072021484375, 6.724853515625, 6.9425048828125, 7.16015625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 8.0, 8.0, 7.0, 11.0, 22.0, 39.0, 62.0, 77.0, 99.0, 146.0, 208.0, 279.0, 414.0, 691.0, 1009.0, 1538.0, 2212.0, 3356.0, 5346.0, 8660.0, 13717.0, 22735.0, 38801.0, 68925.0, 130752.0, 322381.0, 202716.0, 94353.0, 51949.0, 29695.0, 17849.0, 11066.0, 6694.0, 4271.0, 2807.0, 1857.0, 1225.0, 808.0, 570.0, 392.0, 260.0, 159.0, 118.0, 91.0, 47.0, 38.0, 23.0, 19.0, 22.0, 14.0, 5.0, 3.0, 5.0, 2.0, 0.0, 4.0, 2.0], "bins": [-1.4755859375, -1.4305419921875, -1.385498046875, -1.3404541015625, -1.29541015625, -1.2503662109375, -1.205322265625, -1.1602783203125, -1.115234375, -1.0701904296875, -1.025146484375, -0.9801025390625, -0.93505859375, -0.8900146484375, -0.844970703125, -0.7999267578125, -0.7548828125, -0.7098388671875, -0.664794921875, -0.6197509765625, -0.57470703125, -0.5296630859375, -0.484619140625, -0.4395751953125, -0.39453125, -0.3494873046875, -0.304443359375, -0.2593994140625, -0.21435546875, -0.1693115234375, -0.124267578125, -0.0792236328125, -0.0341796875, 0.0108642578125, 0.055908203125, 0.1009521484375, 0.14599609375, 0.1910400390625, 0.236083984375, 0.2811279296875, 0.326171875, 0.3712158203125, 0.416259765625, 0.4613037109375, 0.50634765625, 0.5513916015625, 0.596435546875, 0.6414794921875, 0.6865234375, 0.7315673828125, 0.776611328125, 0.8216552734375, 0.86669921875, 0.9117431640625, 0.956787109375, 1.0018310546875, 1.046875, 1.0919189453125, 1.136962890625, 1.1820068359375, 1.22705078125, 1.2720947265625, 1.317138671875, 1.3621826171875, 1.4072265625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 9.0, 8.0, 13.0, 12.0, 17.0, 20.0, 18.0, 19.0, 20.0, 26.0, 23.0, 25.0, 33.0, 31.0, 42.0, 25.0, 36.0, 35.0, 25.0, 36.0, 1060.0, 47.0, 31.0, 43.0, 27.0, 32.0, 39.0, 24.0, 27.0, 26.0, 29.0, 31.0, 22.0, 15.0, 14.0, 15.0, 21.0, 10.0, 9.0, 7.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.9921875, -3.867767333984375, -3.74334716796875, -3.618927001953125, -3.4945068359375, -3.370086669921875, -3.24566650390625, -3.121246337890625, -2.996826171875, -2.872406005859375, -2.74798583984375, -2.623565673828125, -2.4991455078125, -2.374725341796875, -2.25030517578125, -2.125885009765625, -2.00146484375, -1.877044677734375, -1.75262451171875, -1.628204345703125, -1.5037841796875, -1.379364013671875, -1.25494384765625, -1.130523681640625, -1.006103515625, -0.881683349609375, -0.75726318359375, -0.632843017578125, -0.5084228515625, -0.384002685546875, -0.25958251953125, -0.135162353515625, -0.0107421875, 0.113677978515625, 0.23809814453125, 0.362518310546875, 0.4869384765625, 0.611358642578125, 0.73577880859375, 0.860198974609375, 0.984619140625, 1.109039306640625, 1.23345947265625, 1.357879638671875, 1.4822998046875, 1.606719970703125, 1.73114013671875, 1.855560302734375, 1.97998046875, 2.104400634765625, 2.22882080078125, 2.353240966796875, 2.4776611328125, 2.602081298828125, 2.72650146484375, 2.850921630859375, 2.975341796875, 3.099761962890625, 3.22418212890625, 3.348602294921875, 3.4730224609375, 3.597442626953125, 3.72186279296875, 3.846282958984375, 3.970703125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 11.0, 11.0, 14.0, 19.0, 28.0, 50.0, 59.0, 78.0, 126.0, 192.0, 303.0, 446.0, 627.0, 866.0, 1471.0, 2188.0, 3235.0, 4971.0, 7513.0, 11425.0, 17514.0, 26028.0, 40200.0, 63404.0, 111609.0, 1313707.0, 221852.0, 100957.0, 58973.0, 37436.0, 24451.0, 16099.0, 10780.0, 7109.0, 4608.0, 3057.0, 1966.0, 1232.0, 857.0, 534.0, 379.0, 236.0, 178.0, 127.0, 54.0, 44.0, 38.0, 20.0, 19.0, 12.0, 10.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.1904296875, -1.15313720703125, -1.1158447265625, -1.07855224609375, -1.041259765625, -1.00396728515625, -0.9666748046875, -0.92938232421875, -0.89208984375, -0.85479736328125, -0.8175048828125, -0.78021240234375, -0.742919921875, -0.70562744140625, -0.6683349609375, -0.63104248046875, -0.59375, -0.55645751953125, -0.5191650390625, -0.48187255859375, -0.444580078125, -0.40728759765625, -0.3699951171875, -0.33270263671875, -0.29541015625, -0.25811767578125, -0.2208251953125, -0.18353271484375, -0.146240234375, -0.10894775390625, -0.0716552734375, -0.03436279296875, 0.0029296875, 0.04022216796875, 0.0775146484375, 0.11480712890625, 0.152099609375, 0.18939208984375, 0.2266845703125, 0.26397705078125, 0.30126953125, 0.33856201171875, 0.3758544921875, 0.41314697265625, 0.450439453125, 0.48773193359375, 0.5250244140625, 0.56231689453125, 0.599609375, 0.63690185546875, 0.6741943359375, 0.71148681640625, 0.748779296875, 0.78607177734375, 0.8233642578125, 0.86065673828125, 0.89794921875, 0.93524169921875, 0.9725341796875, 1.00982666015625, 1.047119140625, 1.08441162109375, 1.1217041015625, 1.15899658203125, 1.1962890625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 9.0, 7.0, 9.0, 21.0, 14.0, 29.0, 43.0, 57.0, 64.0, 92.0, 110.0, 117.0, 118.0, 57.0, 59.0, 48.0, 47.0, 19.0, 18.0, 12.0, 8.0, 10.0, 7.0, 4.0, 5.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010967254638671875, -0.0010605454444885254, -0.0010243654251098633, -0.0009881854057312012, -0.0009520053863525391, -0.000915825366973877, -0.0008796453475952148, -0.0008434653282165527, -0.0008072853088378906, -0.0007711052894592285, -0.0007349252700805664, -0.0006987452507019043, -0.0006625652313232422, -0.0006263852119445801, -0.000590205192565918, -0.0005540251731872559, -0.0005178451538085938, -0.00048166513442993164, -0.00044548511505126953, -0.0004093050956726074, -0.0003731250762939453, -0.0003369450569152832, -0.0003007650375366211, -0.000264585018157959, -0.00022840499877929688, -0.00019222497940063477, -0.00015604496002197266, -0.00011986494064331055, -8.368492126464844e-05, -4.750490188598633e-05, -1.1324882507324219e-05, 2.485513687133789e-05, 6.103515625e-05, 9.721517562866211e-05, 0.00013339519500732422, 0.00016957521438598633, 0.00020575523376464844, 0.00024193525314331055, 0.00027811527252197266, 0.00031429529190063477, 0.0003504753112792969, 0.000386655330657959, 0.0004228353500366211, 0.0004590153694152832, 0.0004951953887939453, 0.0005313754081726074, 0.0005675554275512695, 0.0006037354469299316, 0.0006399154663085938, 0.0006760954856872559, 0.000712275505065918, 0.0007484555244445801, 0.0007846355438232422, 0.0008208155632019043, 0.0008569955825805664, 0.0008931756019592285, 0.0009293556213378906, 0.0009655356407165527, 0.0010017156600952148, 0.001037895679473877, 0.001074075698852539, 0.0011102557182312012, 0.0011464357376098633, 0.0011826157569885254, 0.0012187957763671875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 4.0, 8.0, 10.0, 15.0, 22.0, 41.0, 81.0, 134.0, 265.0, 583.0, 827419.0, 218846.0, 547.0, 260.0, 128.0, 67.0, 38.0, 22.0, 16.0, 10.0, 7.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03204345703125, -0.03107142448425293, -0.03009939193725586, -0.02912735939025879, -0.02815532684326172, -0.02718329429626465, -0.026211261749267578, -0.025239229202270508, -0.024267196655273438, -0.023295164108276367, -0.022323131561279297, -0.021351099014282227, -0.020379066467285156, -0.019407033920288086, -0.018435001373291016, -0.017462968826293945, -0.016490936279296875, -0.015518903732299805, -0.014546871185302734, -0.013574838638305664, -0.012602806091308594, -0.011630773544311523, -0.010658740997314453, -0.009686708450317383, -0.008714675903320312, -0.007742643356323242, -0.006770610809326172, -0.0057985782623291016, -0.004826545715332031, -0.003854513168334961, -0.0028824806213378906, -0.0019104480743408203, -0.00093841552734375, 3.361701965332031e-05, 0.0010056495666503906, 0.001977682113647461, 0.0029497146606445312, 0.0039217472076416016, 0.004893779754638672, 0.005865812301635742, 0.0068378448486328125, 0.007809877395629883, 0.008781909942626953, 0.009753942489624023, 0.010725975036621094, 0.011698007583618164, 0.012670040130615234, 0.013642072677612305, 0.014614105224609375, 0.015586137771606445, 0.016558170318603516, 0.017530202865600586, 0.018502235412597656, 0.019474267959594727, 0.020446300506591797, 0.021418333053588867, 0.022390365600585938, 0.023362398147583008, 0.024334430694580078, 0.02530646324157715, 0.02627849578857422, 0.02725052833557129, 0.02822256088256836, 0.02919459342956543, 0.0301666259765625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 951.0, 63.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.008962997235357761, -0.008796058595180511, -0.008629119955003262, -0.008462180383503437, -0.008295241743326187, -0.008128303103148937, -0.007961364462971687, -0.00779442535713315, -0.007627486251294613, -0.007460547611117363, -0.007293608505278826, -0.007126669865101576, -0.006959730759263039, -0.006792792119085789, -0.0066258530132472515, -0.006458914373070002, -0.006291975267231464, -0.0061250366270542145, -0.005958097521215677, -0.005791158881038427, -0.00562421977519989, -0.00545728113502264, -0.005290342029184103, -0.005123403389006853, -0.004956464748829603, -0.004789526108652353, -0.004622587002813816, -0.004455648362636566, -0.004288709256798029, -0.004121770616620779, -0.003954831510782242, -0.003787892870604992, -0.0036209532991051674, -0.003454014426097274, -0.0032870755530893803, -0.0031201366800814867, -0.002953197807073593, -0.0027862589340656996, -0.002619320061057806, -0.002452381420880556, -0.0022854425478726625, -0.002118503674864769, -0.0019515648018568754, -0.0017846259288489819, -0.0016176870558410883, -0.0014507481828331947, -0.001283809426240623, -0.0011168705532327294, -0.0009499316802248359, -0.0007829928072169423, -0.0006160539342090487, -0.0004491151194088161, -0.00028217624640092254, -0.00011523737339302897, 5.1701441407203674e-05, 0.00021864031441509724, 0.0003855791874229908, 0.0005525180604308844, 0.0007194569334387779, 0.0008863957482390106, 0.001053334679454565, 0.0012202735524624586, 0.0013872123090550303, 0.001554151182062924, 0.0017210900550708175]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 9.0, 2.0, 1.0, 5.0, 8.0, 10.0, 7.0, 8.0, 15.0, 8.0, 11.0, 16.0, 18.0, 7.0, 20.0, 20.0, 23.0, 31.0, 32.0, 36.0, 39.0, 36.0, 34.0, 39.0, 42.0, 40.0, 44.0, 38.0, 38.0, 41.0, 39.0, 29.0, 35.0, 39.0, 25.0, 17.0, 14.0, 21.0, 21.0, 14.0, 21.0, 16.0, 7.0, 9.0, 3.0, 8.0, 7.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0004317760467529297, -0.00041939225047826767, -0.00040700845420360565, -0.00039462465792894363, -0.0003822408616542816, -0.0003698570653796196, -0.0003574732691049576, -0.00034508947283029556, -0.00033270567655563354, -0.0003203218802809715, -0.0003079380840063095, -0.0002955542877316475, -0.0002831704914569855, -0.00027078669518232346, -0.00025840289890766144, -0.0002460191026329994, -0.0002336353063583374, -0.00022125151008367538, -0.00020886771380901337, -0.00019648391753435135, -0.00018410012125968933, -0.0001717163249850273, -0.0001593325287103653, -0.00014694873243570328, -0.00013456493616104126, -0.00012218113988637924, -0.00010979734361171722, -9.74135473370552e-05, -8.502975106239319e-05, -7.264595478773117e-05, -6.026215851306915e-05, -4.7878362238407135e-05, -3.549456596374512e-05, -2.31107696890831e-05, -1.0726973414421082e-05, 1.6568228602409363e-06, 1.4040619134902954e-05, 2.6424415409564972e-05, 3.880821168422699e-05, 5.119200795888901e-05, 6.357580423355103e-05, 7.595960050821304e-05, 8.834339678287506e-05, 0.00010072719305753708, 0.0001131109893321991, 0.00012549478560686111, 0.00013787858188152313, 0.00015026237815618515, 0.00016264617443084717, 0.00017502997070550919, 0.0001874137669801712, 0.00019979756325483322, 0.00021218135952949524, 0.00022456515580415726, 0.00023694895207881927, 0.0002493327483534813, 0.0002617165446281433, 0.00027410034090280533, 0.00028648413717746735, 0.00029886793345212936, 0.0003112517297267914, 0.0003236355260014534, 0.0003360193222761154, 0.00034840311855077744, 0.00036078691482543945]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 1.0, 6.0, 1.0, 9.0, 9.0, 12.0, 13.0, 12.0, 13.0, 15.0, 24.0, 29.0, 37.0, 29.0, 34.0, 30.0, 30.0, 53.0, 48.0, 40.0, 44.0, 40.0, 44.0, 42.0, 47.0, 43.0, 37.0, 43.0, 34.0, 30.0, 24.0, 23.0, 15.0, 15.0, 16.0, 7.0, 12.0, 10.0, 6.0, 11.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.76953125, -6.5518798828125, -6.334228515625, -6.1165771484375, -5.89892578125, -5.6812744140625, -5.463623046875, -5.2459716796875, -5.0283203125, -4.8106689453125, -4.593017578125, -4.3753662109375, -4.15771484375, -3.9400634765625, -3.722412109375, -3.5047607421875, -3.287109375, -3.0694580078125, -2.851806640625, -2.6341552734375, -2.41650390625, -2.1988525390625, -1.981201171875, -1.7635498046875, -1.5458984375, -1.3282470703125, -1.110595703125, -0.8929443359375, -0.67529296875, -0.4576416015625, -0.239990234375, -0.0223388671875, 0.1953125, 0.4129638671875, 0.630615234375, 0.8482666015625, 1.06591796875, 1.2835693359375, 1.501220703125, 1.7188720703125, 1.9365234375, 2.1541748046875, 2.371826171875, 2.5894775390625, 2.80712890625, 3.0247802734375, 3.242431640625, 3.4600830078125, 3.677734375, 3.8953857421875, 4.113037109375, 4.3306884765625, 4.54833984375, 4.7659912109375, 4.983642578125, 5.2012939453125, 5.4189453125, 5.6365966796875, 5.854248046875, 6.0718994140625, 6.28955078125, 6.5072021484375, 6.724853515625, 6.9425048828125, 7.16015625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 7.0, 4.0, 8.0, 13.0, 17.0, 27.0, 37.0, 39.0, 53.0, 78.0, 123.0, 147.0, 185.0, 286.0, 467.0, 741.0, 1199.0, 2281.0, 4784.0, 11037.0, 28636.0, 89084.0, 381128.0, 387001.0, 90260.0, 28911.0, 11328.0, 4849.0, 2386.0, 1282.0, 678.0, 413.0, 283.0, 250.0, 126.0, 94.0, 77.0, 71.0, 47.0, 34.0, 18.0, 26.0, 15.0, 4.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.2734375, -6.07110595703125, -5.8687744140625, -5.66644287109375, -5.464111328125, -5.26177978515625, -5.0594482421875, -4.85711669921875, -4.65478515625, -4.45245361328125, -4.2501220703125, -4.04779052734375, -3.845458984375, -3.64312744140625, -3.4407958984375, -3.23846435546875, -3.0361328125, -2.83380126953125, -2.6314697265625, -2.42913818359375, -2.226806640625, -2.02447509765625, -1.8221435546875, -1.61981201171875, -1.41748046875, -1.21514892578125, -1.0128173828125, -0.81048583984375, -0.608154296875, -0.40582275390625, -0.2034912109375, -0.00115966796875, 0.201171875, 0.40350341796875, 0.6058349609375, 0.80816650390625, 1.010498046875, 1.21282958984375, 1.4151611328125, 1.61749267578125, 1.81982421875, 2.02215576171875, 2.2244873046875, 2.42681884765625, 2.629150390625, 2.83148193359375, 3.0338134765625, 3.23614501953125, 3.4384765625, 3.64080810546875, 3.8431396484375, 4.04547119140625, 4.247802734375, 4.45013427734375, 4.6524658203125, 4.85479736328125, 5.05712890625, 5.25946044921875, 5.4617919921875, 5.66412353515625, 5.866455078125, 6.06878662109375, 6.2711181640625, 6.47344970703125, 6.67578125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 5.0, 3.0, 8.0, 12.0, 14.0, 14.0, 11.0, 13.0, 24.0, 35.0, 39.0, 36.0, 45.0, 53.0, 48.0, 67.0, 73.0, 148.0, 1841.0, 119.0, 51.0, 55.0, 51.0, 45.0, 42.0, 19.0, 35.0, 36.0, 11.0, 21.0, 15.0, 12.0, 13.0, 8.0, 7.0, 6.0, 4.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.171875, -26.3828125, -25.59375, -24.8046875, -24.015625, -23.2265625, -22.4375, -21.6484375, -20.859375, -20.0703125, -19.28125, -18.4921875, -17.703125, -16.9140625, -16.125, -15.3359375, -14.546875, -13.7578125, -12.96875, -12.1796875, -11.390625, -10.6015625, -9.8125, -9.0234375, -8.234375, -7.4453125, -6.65625, -5.8671875, -5.078125, -4.2890625, -3.5, -2.7109375, -1.921875, -1.1328125, -0.34375, 0.4453125, 1.234375, 2.0234375, 2.8125, 3.6015625, 4.390625, 5.1796875, 5.96875, 6.7578125, 7.546875, 8.3359375, 9.125, 9.9140625, 10.703125, 11.4921875, 12.28125, 13.0703125, 13.859375, 14.6484375, 15.4375, 16.2265625, 17.015625, 17.8046875, 18.59375, 19.3828125, 20.171875, 20.9609375, 21.75, 22.5390625, 23.328125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 1.0, 8.0, 7.0, 5.0, 18.0, 14.0, 14.0, 19.0, 15.0, 36.0, 38.0, 44.0, 64.0, 97.0, 160.0, 337.0, 1057.0, 15048.0, 3114014.0, 12839.0, 965.0, 325.0, 159.0, 96.0, 83.0, 43.0, 52.0, 38.0, 19.0, 18.0, 13.0, 14.0, 13.0, 9.0, 11.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-54.71875, -52.86279296875, -51.0068359375, -49.15087890625, -47.294921875, -45.43896484375, -43.5830078125, -41.72705078125, -39.87109375, -38.01513671875, -36.1591796875, -34.30322265625, -32.447265625, -30.59130859375, -28.7353515625, -26.87939453125, -25.0234375, -23.16748046875, -21.3115234375, -19.45556640625, -17.599609375, -15.74365234375, -13.8876953125, -12.03173828125, -10.17578125, -8.31982421875, -6.4638671875, -4.60791015625, -2.751953125, -0.89599609375, 0.9599609375, 2.81591796875, 4.671875, 6.52783203125, 8.3837890625, 10.23974609375, 12.095703125, 13.95166015625, 15.8076171875, 17.66357421875, 19.51953125, 21.37548828125, 23.2314453125, 25.08740234375, 26.943359375, 28.79931640625, 30.6552734375, 32.51123046875, 34.3671875, 36.22314453125, 38.0791015625, 39.93505859375, 41.791015625, 43.64697265625, 45.5029296875, 47.35888671875, 49.21484375, 51.07080078125, 52.9267578125, 54.78271484375, 56.638671875, 58.49462890625, 60.3505859375, 62.20654296875, 64.0625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 285.0, 731.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.956825256347656, -12.510163307189941, -1.0635013580322266, 10.383159637451172, 21.829822540283203, 33.276485443115234, 44.72314453125, 56.16980743408203, 67.61647033691406, 79.0631332397461, 90.50979614257812, 101.95645141601562, 113.40312194824219, 124.84977722167969, 136.29644775390625, 147.74310302734375, 159.18975830078125, 170.63641357421875, 182.0830841064453, 193.5297393798828, 204.97640991210938, 216.42306518554688, 227.86972045898438, 239.31639099121094, 250.7630615234375, 262.209716796875, 273.6563720703125, 285.1030578613281, 296.5497131347656, 307.9963684082031, 319.4430236816406, 330.88970947265625, 342.3363342285156, 353.7829895019531, 365.2296447753906, 376.67633056640625, 388.12298583984375, 399.56964111328125, 411.01629638671875, 422.46295166015625, 433.9096374511719, 445.3562927246094, 456.8029479980469, 468.2496337890625, 479.6962890625, 491.1429443359375, 502.589599609375, 514.0362548828125, 525.48291015625, 536.9295654296875, 548.376220703125, 559.8228759765625, 571.26953125, 582.7162475585938, 594.1629028320312, 605.6095581054688, 617.0562133789062, 628.5028686523438, 639.9495239257812, 651.3961791992188, 662.8428344726562, 674.28955078125, 685.7362060546875, 697.182861328125, 708.6295166015625]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 1.0, 7.0, 11.0, 8.0, 10.0, 11.0, 17.0, 17.0, 27.0, 22.0, 22.0, 13.0, 33.0, 37.0, 30.0, 34.0, 37.0, 33.0, 32.0, 39.0, 50.0, 43.0, 28.0, 33.0, 27.0, 34.0, 39.0, 42.0, 29.0, 36.0, 23.0, 24.0, 22.0, 28.0, 19.0, 18.0, 14.0, 11.0, 10.0, 9.0, 4.0, 6.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-70.2687759399414, -68.1363525390625, -66.0039291381836, -63.87150192260742, -61.739078521728516, -59.606651306152344, -57.47422790527344, -55.34180450439453, -53.209381103515625, -51.07695770263672, -48.94453048706055, -46.81210708618164, -44.679683685302734, -42.54725646972656, -40.414833068847656, -38.28240966796875, -36.14998245239258, -34.01755905151367, -31.885133743286133, -29.752708435058594, -27.620285034179688, -25.48785972595215, -23.35543441772461, -21.223011016845703, -19.090585708618164, -16.958160400390625, -14.825736999511719, -12.69331169128418, -10.560887336730957, -8.428462982177734, -6.296037673950195, -4.163613319396973, -2.03118896484375, 0.10123562812805176, 2.2336602210998535, 4.366085052490234, 6.498509407043457, 8.63093376159668, 10.763359069824219, 12.895783424377441, 15.028207778930664, 17.160633087158203, 19.29305648803711, 21.42548179626465, 23.557907104492188, 25.690330505371094, 27.822755813598633, 29.955181121826172, 32.08760452270508, 34.220027923583984, 36.352455139160156, 38.48487854003906, 40.61730194091797, 42.749725341796875, 44.88215255737305, 47.01457595825195, 49.147003173828125, 51.27942657470703, 53.4118537902832, 55.54427719116211, 57.676700592041016, 59.80912780761719, 61.941551208496094, 64.073974609375, 66.2063980102539]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 0.0, 2.0, 4.0, 10.0, 14.0, 9.0, 18.0, 8.0, 15.0, 23.0, 19.0, 35.0, 40.0, 35.0, 26.0, 33.0, 43.0, 47.0, 46.0, 47.0, 39.0, 49.0, 52.0, 37.0, 43.0, 40.0, 31.0, 42.0, 30.0, 27.0, 24.0, 19.0, 23.0, 7.0, 8.0, 14.0, 10.0, 1.0, 10.0, 12.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.046875, -6.82208251953125, -6.5972900390625, -6.37249755859375, -6.147705078125, -5.92291259765625, -5.6981201171875, -5.47332763671875, -5.24853515625, -5.02374267578125, -4.7989501953125, -4.57415771484375, -4.349365234375, -4.12457275390625, -3.8997802734375, -3.67498779296875, -3.4501953125, -3.22540283203125, -3.0006103515625, -2.77581787109375, -2.551025390625, -2.32623291015625, -2.1014404296875, -1.87664794921875, -1.65185546875, -1.42706298828125, -1.2022705078125, -0.97747802734375, -0.752685546875, -0.52789306640625, -0.3031005859375, -0.07830810546875, 0.146484375, 0.37127685546875, 0.5960693359375, 0.82086181640625, 1.045654296875, 1.27044677734375, 1.4952392578125, 1.72003173828125, 1.94482421875, 2.16961669921875, 2.3944091796875, 2.61920166015625, 2.843994140625, 3.06878662109375, 3.2935791015625, 3.51837158203125, 3.7431640625, 3.96795654296875, 4.1927490234375, 4.41754150390625, 4.642333984375, 4.86712646484375, 5.0919189453125, 5.31671142578125, 5.54150390625, 5.76629638671875, 5.9910888671875, 6.21588134765625, 6.440673828125, 6.66546630859375, 6.8902587890625, 7.11505126953125, 7.33984375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 3.0, 7.0, 10.0, 12.0, 9.0, 17.0, 22.0, 24.0, 34.0, 37.0, 58.0, 88.0, 126.0, 259.0, 567.0, 2302.0, 27078.0, 1343189.0, 2744764.0, 69807.0, 4206.0, 791.0, 347.0, 153.0, 91.0, 66.0, 48.0, 37.0, 27.0, 21.0, 21.0, 7.0, 10.0, 13.0, 7.0, 4.0, 2.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.171875, -26.270263671875, -25.36865234375, -24.467041015625, -23.5654296875, -22.663818359375, -21.76220703125, -20.860595703125, -19.958984375, -19.057373046875, -18.15576171875, -17.254150390625, -16.3525390625, -15.450927734375, -14.54931640625, -13.647705078125, -12.74609375, -11.844482421875, -10.94287109375, -10.041259765625, -9.1396484375, -8.238037109375, -7.33642578125, -6.434814453125, -5.533203125, -4.631591796875, -3.72998046875, -2.828369140625, -1.9267578125, -1.025146484375, -0.12353515625, 0.778076171875, 1.6796875, 2.581298828125, 3.48291015625, 4.384521484375, 5.2861328125, 6.187744140625, 7.08935546875, 7.990966796875, 8.892578125, 9.794189453125, 10.69580078125, 11.597412109375, 12.4990234375, 13.400634765625, 14.30224609375, 15.203857421875, 16.10546875, 17.007080078125, 17.90869140625, 18.810302734375, 19.7119140625, 20.613525390625, 21.51513671875, 22.416748046875, 23.318359375, 24.219970703125, 25.12158203125, 26.023193359375, 26.9248046875, 27.826416015625, 28.72802734375, 29.629638671875, 30.53125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 6.0, 13.0, 8.0, 16.0, 24.0, 44.0, 65.0, 107.0, 123.0, 224.0, 407.0, 578.0, 662.0, 624.0, 420.0, 262.0, 159.0, 118.0, 66.0, 46.0, 40.0, 19.0, 12.0, 9.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.03125, -33.987548828125, -32.94384765625, -31.900146484375, -30.8564453125, -29.812744140625, -28.76904296875, -27.725341796875, -26.681640625, -25.637939453125, -24.59423828125, -23.550537109375, -22.5068359375, -21.463134765625, -20.41943359375, -19.375732421875, -18.33203125, -17.288330078125, -16.24462890625, -15.200927734375, -14.1572265625, -13.113525390625, -12.06982421875, -11.026123046875, -9.982421875, -8.938720703125, -7.89501953125, -6.851318359375, -5.8076171875, -4.763916015625, -3.72021484375, -2.676513671875, -1.6328125, -0.589111328125, 0.45458984375, 1.498291015625, 2.5419921875, 3.585693359375, 4.62939453125, 5.673095703125, 6.716796875, 7.760498046875, 8.80419921875, 9.847900390625, 10.8916015625, 11.935302734375, 12.97900390625, 14.022705078125, 15.06640625, 16.110107421875, 17.15380859375, 18.197509765625, 19.2412109375, 20.284912109375, 21.32861328125, 22.372314453125, 23.416015625, 24.459716796875, 25.50341796875, 26.547119140625, 27.5908203125, 28.634521484375, 29.67822265625, 30.721923828125, 31.765625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 4.0, 8.0, 3.0, 12.0, 20.0, 46.0, 50.0, 98.0, 183.0, 346.0, 815.0, 9718.0, 4157125.0, 24060.0, 964.0, 379.0, 179.0, 106.0, 59.0, 35.0, 21.0, 19.0, 10.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-133.625, -129.392578125, -125.16015625, -120.927734375, -116.6953125, -112.462890625, -108.23046875, -103.998046875, -99.765625, -95.533203125, -91.30078125, -87.068359375, -82.8359375, -78.603515625, -74.37109375, -70.138671875, -65.90625, -61.673828125, -57.44140625, -53.208984375, -48.9765625, -44.744140625, -40.51171875, -36.279296875, -32.046875, -27.814453125, -23.58203125, -19.349609375, -15.1171875, -10.884765625, -6.65234375, -2.419921875, 1.8125, 6.044921875, 10.27734375, 14.509765625, 18.7421875, 22.974609375, 27.20703125, 31.439453125, 35.671875, 39.904296875, 44.13671875, 48.369140625, 52.6015625, 56.833984375, 61.06640625, 65.298828125, 69.53125, 73.763671875, 77.99609375, 82.228515625, 86.4609375, 90.693359375, 94.92578125, 99.158203125, 103.390625, 107.623046875, 111.85546875, 116.087890625, 120.3203125, 124.552734375, 128.78515625, 133.017578125, 137.25]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 93.0, 489.0, 388.0, 39.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-427.95977783203125, -417.21441650390625, -406.46905517578125, -395.72369384765625, -384.9783020019531, -374.2329406738281, -363.4875793457031, -352.7422180175781, -341.9968566894531, -331.2514953613281, -320.5061340332031, -309.7607421875, -299.015380859375, -288.27001953125, -277.524658203125, -266.779296875, -256.033935546875, -245.28857421875, -234.54319763183594, -223.79783630371094, -213.05247497558594, -202.30709838867188, -191.56173706054688, -180.81637573242188, -170.07098388671875, -159.32562255859375, -148.5802459716797, -137.8348846435547, -127.08952331542969, -116.34415435791016, -105.59878540039062, -94.85342407226562, -84.10806274414062, -73.3626937866211, -62.617332458496094, -51.87196350097656, -41.1265983581543, -30.38123321533203, -19.6358642578125, -8.8905029296875, 1.8548660278320312, 12.600232124328613, 23.345598220825195, 34.090965270996094, 44.83633041381836, 55.581695556640625, 66.32706451416016, 77.07242584228516, 87.81779479980469, 98.56316375732422, 109.30852508544922, 120.05389404296875, 130.79925537109375, 141.54461669921875, 152.2899932861328, 163.0353546142578, 173.78073120117188, 184.52609252929688, 195.27146911621094, 206.01683044433594, 216.76219177246094, 227.507568359375, 238.2529296875, 248.998291015625, 259.74365234375]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 2.0, 2.0, 10.0, 12.0, 4.0, 9.0, 12.0, 17.0, 11.0, 18.0, 24.0, 22.0, 19.0, 30.0, 33.0, 27.0, 43.0, 41.0, 40.0, 34.0, 40.0, 37.0, 39.0, 45.0, 38.0, 38.0, 34.0, 43.0, 20.0, 36.0, 23.0, 28.0, 20.0, 27.0, 17.0, 15.0, 22.0, 13.0, 8.0, 8.0, 6.0, 9.0, 8.0, 4.0, 4.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-83.39867401123047, -80.9155044555664, -78.43234252929688, -75.94917297363281, -73.46601104736328, -70.98284149169922, -68.49967956542969, -66.01651000976562, -63.53334426879883, -61.05017852783203, -58.567012786865234, -56.08384704589844, -53.600677490234375, -51.117515563964844, -48.63434600830078, -46.151180267333984, -43.66801452636719, -41.18484878540039, -38.701683044433594, -36.2185173034668, -33.7353515625, -31.25218391418457, -28.76901626586914, -26.285850524902344, -23.802684783935547, -21.31951904296875, -18.836353302001953, -16.353185653686523, -13.870019912719727, -11.38685417175293, -8.903687477111816, -6.420520782470703, -3.9373550415039062, -1.4541888236999512, 1.028977394104004, 3.512143611907959, 5.995309829711914, 8.478475570678711, 10.961642265319824, 13.444808959960938, 15.927974700927734, 18.41114044189453, 20.894306182861328, 23.377473831176758, 25.860639572143555, 28.34380531311035, 30.82697296142578, 33.31013870239258, 35.793304443359375, 38.27647018432617, 40.75963592529297, 43.242801666259766, 45.72596740722656, 48.209136962890625, 50.69230270385742, 53.17546844482422, 55.658634185791016, 58.14179992675781, 60.62496566772461, 63.108131408691406, 65.59130096435547, 68.074462890625, 70.55763244628906, 73.04080200195312, 75.52396392822266]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 3.0, 5.0, 9.0, 5.0, 8.0, 11.0, 12.0, 13.0, 27.0, 25.0, 32.0, 25.0, 28.0, 29.0, 31.0, 35.0, 43.0, 43.0, 59.0, 46.0, 50.0, 40.0, 45.0, 41.0, 40.0, 45.0, 36.0, 29.0, 33.0, 32.0, 21.0, 20.0, 14.0, 12.0, 11.0, 7.0, 7.0, 5.0, 12.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.63671875, -6.40802001953125, -6.1793212890625, -5.95062255859375, -5.721923828125, -5.49322509765625, -5.2645263671875, -5.03582763671875, -4.80712890625, -4.57843017578125, -4.3497314453125, -4.12103271484375, -3.892333984375, -3.66363525390625, -3.4349365234375, -3.20623779296875, -2.9775390625, -2.74884033203125, -2.5201416015625, -2.29144287109375, -2.062744140625, -1.83404541015625, -1.6053466796875, -1.37664794921875, -1.14794921875, -0.91925048828125, -0.6905517578125, -0.46185302734375, -0.233154296875, -0.00445556640625, 0.2242431640625, 0.45294189453125, 0.681640625, 0.91033935546875, 1.1390380859375, 1.36773681640625, 1.596435546875, 1.82513427734375, 2.0538330078125, 2.28253173828125, 2.51123046875, 2.73992919921875, 2.9686279296875, 3.19732666015625, 3.426025390625, 3.65472412109375, 3.8834228515625, 4.11212158203125, 4.3408203125, 4.56951904296875, 4.7982177734375, 5.02691650390625, 5.255615234375, 5.48431396484375, 5.7130126953125, 5.94171142578125, 6.17041015625, 6.39910888671875, 6.6278076171875, 6.85650634765625, 7.085205078125, 7.31390380859375, 7.5426025390625, 7.77130126953125, 8.0]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 8.0, 24.0, 21.0, 27.0, 57.0, 83.0, 130.0, 200.0, 299.0, 505.0, 870.0, 1522.0, 2466.0, 4316.0, 7781.0, 14582.0, 28074.0, 55665.0, 121605.0, 387125.0, 239193.0, 91332.0, 43710.0, 22129.0, 11602.0, 6533.0, 3565.0, 1981.0, 1152.0, 732.0, 471.0, 282.0, 180.0, 103.0, 67.0, 43.0, 41.0, 19.0, 19.0, 13.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.111328125, -2.0507049560546875, -1.990081787109375, -1.9294586181640625, -1.86883544921875, -1.8082122802734375, -1.747589111328125, -1.6869659423828125, -1.6263427734375, -1.5657196044921875, -1.505096435546875, -1.4444732666015625, -1.38385009765625, -1.3232269287109375, -1.262603759765625, -1.2019805908203125, -1.141357421875, -1.0807342529296875, -1.020111083984375, -0.9594879150390625, -0.89886474609375, -0.8382415771484375, -0.777618408203125, -0.7169952392578125, -0.6563720703125, -0.5957489013671875, -0.535125732421875, -0.4745025634765625, -0.41387939453125, -0.3532562255859375, -0.292633056640625, -0.2320098876953125, -0.17138671875, -0.1107635498046875, -0.050140380859375, 0.0104827880859375, 0.07110595703125, 0.1317291259765625, 0.192352294921875, 0.2529754638671875, 0.3135986328125, 0.3742218017578125, 0.434844970703125, 0.4954681396484375, 0.55609130859375, 0.6167144775390625, 0.677337646484375, 0.7379608154296875, 0.798583984375, 0.8592071533203125, 0.919830322265625, 0.9804534912109375, 1.04107666015625, 1.1016998291015625, 1.162322998046875, 1.2229461669921875, 1.2835693359375, 1.3441925048828125, 1.404815673828125, 1.4654388427734375, 1.52606201171875, 1.5866851806640625, 1.647308349609375, 1.7079315185546875, 1.7685546875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 6.0, 17.0, 9.0, 10.0, 15.0, 21.0, 25.0, 15.0, 26.0, 33.0, 18.0, 26.0, 30.0, 34.0, 25.0, 27.0, 44.0, 39.0, 38.0, 1065.0, 42.0, 40.0, 38.0, 30.0, 28.0, 43.0, 41.0, 33.0, 29.0, 16.0, 21.0, 16.0, 18.0, 21.0, 16.0, 13.0, 10.0, 7.0, 6.0, 9.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.75390625, -3.6300048828125, -3.506103515625, -3.3822021484375, -3.25830078125, -3.1343994140625, -3.010498046875, -2.8865966796875, -2.7626953125, -2.6387939453125, -2.514892578125, -2.3909912109375, -2.26708984375, -2.1431884765625, -2.019287109375, -1.8953857421875, -1.771484375, -1.6475830078125, -1.523681640625, -1.3997802734375, -1.27587890625, -1.1519775390625, -1.028076171875, -0.9041748046875, -0.7802734375, -0.6563720703125, -0.532470703125, -0.4085693359375, -0.28466796875, -0.1607666015625, -0.036865234375, 0.0870361328125, 0.2109375, 0.3348388671875, 0.458740234375, 0.5826416015625, 0.70654296875, 0.8304443359375, 0.954345703125, 1.0782470703125, 1.2021484375, 1.3260498046875, 1.449951171875, 1.5738525390625, 1.69775390625, 1.8216552734375, 1.945556640625, 2.0694580078125, 2.193359375, 2.3172607421875, 2.441162109375, 2.5650634765625, 2.68896484375, 2.8128662109375, 2.936767578125, 3.0606689453125, 3.1845703125, 3.3084716796875, 3.432373046875, 3.5562744140625, 3.68017578125, 3.8040771484375, 3.927978515625, 4.0518798828125, 4.17578125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 6.0, 14.0, 12.0, 19.0, 28.0, 32.0, 55.0, 72.0, 107.0, 160.0, 229.0, 321.0, 472.0, 687.0, 1032.0, 1436.0, 2217.0, 3348.0, 5038.0, 7602.0, 11536.0, 17220.0, 26723.0, 41439.0, 65789.0, 119141.0, 1351990.0, 196766.0, 90732.0, 53601.0, 33867.0, 22095.0, 14564.0, 9845.0, 6282.0, 4288.0, 2810.0, 1754.0, 1232.0, 847.0, 520.0, 372.0, 286.0, 170.0, 115.0, 92.0, 43.0, 37.0, 27.0, 18.0, 13.0, 8.0, 6.0, 9.0, 4.0, 2.0, 3.0], "bins": [-1.2529296875, -1.215850830078125, -1.17877197265625, -1.141693115234375, -1.1046142578125, -1.067535400390625, -1.03045654296875, -0.993377685546875, -0.956298828125, -0.919219970703125, -0.88214111328125, -0.845062255859375, -0.8079833984375, -0.770904541015625, -0.73382568359375, -0.696746826171875, -0.65966796875, -0.622589111328125, -0.58551025390625, -0.548431396484375, -0.5113525390625, -0.474273681640625, -0.43719482421875, -0.400115966796875, -0.363037109375, -0.325958251953125, -0.28887939453125, -0.251800537109375, -0.2147216796875, -0.177642822265625, -0.14056396484375, -0.103485107421875, -0.06640625, -0.029327392578125, 0.00775146484375, 0.044830322265625, 0.0819091796875, 0.118988037109375, 0.15606689453125, 0.193145751953125, 0.230224609375, 0.267303466796875, 0.30438232421875, 0.341461181640625, 0.3785400390625, 0.415618896484375, 0.45269775390625, 0.489776611328125, 0.52685546875, 0.563934326171875, 0.60101318359375, 0.638092041015625, 0.6751708984375, 0.712249755859375, 0.74932861328125, 0.786407470703125, 0.823486328125, 0.860565185546875, 0.89764404296875, 0.934722900390625, 0.9718017578125, 1.008880615234375, 1.04595947265625, 1.083038330078125, 1.1201171875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 7.0, 5.0, 5.0, 2.0, 9.0, 11.0, 14.0, 25.0, 20.0, 22.0, 35.0, 68.0, 60.0, 59.0, 58.0, 86.0, 92.0, 80.0, 67.0, 56.0, 43.0, 36.0, 44.0, 24.0, 26.0, 12.0, 4.0, 8.0, 10.0, 6.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007781982421875, -0.0007513165473937988, -0.0007244348526000977, -0.0006975531578063965, -0.0006706714630126953, -0.0006437897682189941, -0.000616908073425293, -0.0005900263786315918, -0.0005631446838378906, -0.0005362629890441895, -0.0005093812942504883, -0.0004824995994567871, -0.00045561790466308594, -0.00042873620986938477, -0.0004018545150756836, -0.0003749728202819824, -0.00034809112548828125, -0.0003212094306945801, -0.0002943277359008789, -0.00026744604110717773, -0.00024056434631347656, -0.0002136826515197754, -0.00018680095672607422, -0.00015991926193237305, -0.00013303756713867188, -0.0001061558723449707, -7.927417755126953e-05, -5.239248275756836e-05, -2.5510787963867188e-05, 1.3709068298339844e-06, 2.8252601623535156e-05, 5.513429641723633e-05, 8.20159912109375e-05, 0.00010889768600463867, 0.00013577938079833984, 0.00016266107559204102, 0.0001895427703857422, 0.00021642446517944336, 0.00024330615997314453, 0.0002701878547668457, 0.0002970695495605469, 0.00032395124435424805, 0.0003508329391479492, 0.0003777146339416504, 0.00040459632873535156, 0.00043147802352905273, 0.0004583597183227539, 0.0004852414131164551, 0.0005121231079101562, 0.0005390048027038574, 0.0005658864974975586, 0.0005927681922912598, 0.0006196498870849609, 0.0006465315818786621, 0.0006734132766723633, 0.0007002949714660645, 0.0007271766662597656, 0.0007540583610534668, 0.000780940055847168, 0.0008078217506408691, 0.0008347034454345703, 0.0008615851402282715, 0.0008884668350219727, 0.0009153485298156738, 0.000942230224609375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 5.0, 6.0, 8.0, 17.0, 22.0, 26.0, 41.0, 52.0, 95.0, 134.0, 240.0, 522.0, 13457.0, 1032175.0, 903.0, 347.0, 200.0, 99.0, 51.0, 35.0, 27.0, 20.0, 18.0, 16.0, 4.0, 6.0, 4.0, 4.0, 1.0, 8.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0267791748046875, -0.02604055404663086, -0.02530193328857422, -0.024563312530517578, -0.023824691772460938, -0.023086071014404297, -0.022347450256347656, -0.021608829498291016, -0.020870208740234375, -0.020131587982177734, -0.019392967224121094, -0.018654346466064453, -0.017915725708007812, -0.017177104949951172, -0.01643848419189453, -0.01569986343383789, -0.01496124267578125, -0.01422262191772461, -0.013484001159667969, -0.012745380401611328, -0.012006759643554688, -0.011268138885498047, -0.010529518127441406, -0.009790897369384766, -0.009052276611328125, -0.008313655853271484, -0.007575035095214844, -0.006836414337158203, -0.0060977935791015625, -0.005359172821044922, -0.004620552062988281, -0.0038819313049316406, -0.003143310546875, -0.0024046897888183594, -0.0016660690307617188, -0.0009274482727050781, -0.0001888275146484375, 0.0005497932434082031, 0.0012884140014648438, 0.0020270347595214844, 0.002765655517578125, 0.0035042762756347656, 0.004242897033691406, 0.004981517791748047, 0.0057201385498046875, 0.006458759307861328, 0.007197380065917969, 0.00793600082397461, 0.00867462158203125, 0.00941324234008789, 0.010151863098144531, 0.010890483856201172, 0.011629104614257812, 0.012367725372314453, 0.013106346130371094, 0.013844966888427734, 0.014583587646484375, 0.015322208404541016, 0.016060829162597656, 0.016799449920654297, 0.017538070678710938, 0.018276691436767578, 0.01901531219482422, 0.01975393295288086, 0.0204925537109375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 11.0, 141.0, 542.0, 293.0, 29.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00044134899508208036, -0.0003753548371605575, -0.00030936067923903465, -0.00024336649221368134, -0.00017737233429215848, -0.00011137817637063563, -4.5383989345282316e-05, 2.061016857624054e-05, 8.66043264977634e-05, 0.00015259848441928625, 0.00021859265689272434, 0.0002845868293661624, 0.0003505809872876853, 0.00041657514520920813, 0.00048256933223456144, 0.0005485634901560843, 0.0006145576480776072, 0.00068055180599913, 0.0007465459639206529, 0.0008125401800498366, 0.0008785342797636986, 0.0009445284958928823, 0.0010105227120220661, 0.001076516811735928, 0.00114251091144979, 0.0012085051275789738, 0.0012744992272928357, 0.0013404934434220195, 0.0014064875431358814, 0.0014724817592650652, 0.001538475975394249, 0.001604470075108111, 0.0016704641748219728, 0.0017364583909511566, 0.0018024524906650186, 0.0018684467067942023, 0.0019344408065080643, 0.002000435022637248, 0.002066429238766432, 0.002132423222064972, 0.0021984174381941557, 0.0022644116543233395, 0.0023304058704525232, 0.0023963998537510633, 0.002462394069880247, 0.002528388286009431, 0.0025943825021386147, 0.0026603764854371548, 0.002726370934396982, 0.002792365150526166, 0.0028583593666553497, 0.00292435334995389, 0.0029903475660830736, 0.0030563417822122574, 0.003122335998341441, 0.003188330214470625, 0.003254324197769165, 0.003320318413898349, 0.0033863126300275326, 0.0034523066133260727, 0.0035183008294552565, 0.0035842950455844402, 0.003650289261713624, 0.0037162834778428078, 0.003782277461141348]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 8.0, 8.0, 7.0, 15.0, 13.0, 15.0, 19.0, 17.0, 23.0, 20.0, 24.0, 21.0, 27.0, 42.0, 40.0, 36.0, 51.0, 34.0, 38.0, 39.0, 50.0, 50.0, 46.0, 40.0, 27.0, 32.0, 30.0, 35.0, 40.0, 19.0, 22.0, 21.0, 11.0, 20.0, 9.0, 9.0, 5.0, 9.0, 5.0, 6.0, 1.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003440380096435547, -0.00033304188400506973, -0.0003220457583665848, -0.0003110496327280998, -0.00030005350708961487, -0.0002890573814511299, -0.00027806125581264496, -0.00026706513017416, -0.00025606900453567505, -0.0002450728788971901, -0.00023407675325870514, -0.00022308062762022018, -0.00021208450198173523, -0.00020108837634325027, -0.00019009225070476532, -0.00017909612506628036, -0.0001680999994277954, -0.00015710387378931046, -0.0001461077481508255, -0.00013511162251234055, -0.0001241154968738556, -0.00011311937123537064, -0.00010212324559688568, -9.112711995840073e-05, -8.013099431991577e-05, -6.913486868143082e-05, -5.813874304294586e-05, -4.714261740446091e-05, -3.614649176597595e-05, -2.5150366127490997e-05, -1.4154240489006042e-05, -3.1581148505210876e-06, 7.838010787963867e-06, 1.8834136426448822e-05, 2.9830262064933777e-05, 4.082638770341873e-05, 5.1822513341903687e-05, 6.281863898038864e-05, 7.38147646188736e-05, 8.481089025735855e-05, 9.58070158958435e-05, 0.00010680314153432846, 0.00011779926717281342, 0.00012879539281129837, 0.00013979151844978333, 0.00015078764408826828, 0.00016178376972675323, 0.0001727798953652382, 0.00018377602100372314, 0.0001947721466422081, 0.00020576827228069305, 0.000216764397919178, 0.00022776052355766296, 0.00023875664919614792, 0.0002497527748346329, 0.00026074890047311783, 0.0002717450261116028, 0.00028274115175008774, 0.0002937372773885727, 0.00030473340302705765, 0.0003157295286655426, 0.00032672565430402756, 0.0003377217799425125, 0.00034871790558099747, 0.0003597140312194824]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 3.0, 5.0, 9.0, 5.0, 8.0, 11.0, 12.0, 13.0, 27.0, 25.0, 32.0, 25.0, 28.0, 29.0, 31.0, 35.0, 43.0, 43.0, 59.0, 46.0, 50.0, 40.0, 46.0, 40.0, 40.0, 45.0, 36.0, 29.0, 33.0, 32.0, 21.0, 20.0, 14.0, 12.0, 11.0, 7.0, 7.0, 5.0, 12.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.63671875, -6.40802001953125, -6.1793212890625, -5.95062255859375, -5.721923828125, -5.49322509765625, -5.2645263671875, -5.03582763671875, -4.80712890625, -4.57843017578125, -4.3497314453125, -4.12103271484375, -3.892333984375, -3.66363525390625, -3.4349365234375, -3.20623779296875, -2.9775390625, -2.74884033203125, -2.5201416015625, -2.29144287109375, -2.062744140625, -1.83404541015625, -1.6053466796875, -1.37664794921875, -1.14794921875, -0.91925048828125, -0.6905517578125, -0.46185302734375, -0.233154296875, -0.00445556640625, 0.2242431640625, 0.45294189453125, 0.681640625, 0.91033935546875, 1.1390380859375, 1.36773681640625, 1.596435546875, 1.82513427734375, 2.0538330078125, 2.28253173828125, 2.51123046875, 2.73992919921875, 2.9686279296875, 3.19732666015625, 3.426025390625, 3.65472412109375, 3.8834228515625, 4.11212158203125, 4.3408203125, 4.56951904296875, 4.7982177734375, 5.02691650390625, 5.255615234375, 5.48431396484375, 5.7130126953125, 5.94171142578125, 6.17041015625, 6.39910888671875, 6.6278076171875, 6.85650634765625, 7.085205078125, 7.31390380859375, 7.5426025390625, 7.77130126953125, 8.0]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 6.0, 22.0, 16.0, 31.0, 27.0, 45.0, 62.0, 90.0, 128.0, 204.0, 297.0, 457.0, 689.0, 1226.0, 1940.0, 3679.0, 7024.0, 15121.0, 36158.0, 97834.0, 329411.0, 373157.0, 107849.0, 39597.0, 16362.0, 7709.0, 3851.0, 2201.0, 1165.0, 720.0, 484.0, 315.0, 206.0, 149.0, 89.0, 72.0, 52.0, 27.0, 19.0, 20.0, 12.0, 11.0, 5.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41796875, -4.265869140625, -4.11376953125, -3.961669921875, -3.8095703125, -3.657470703125, -3.50537109375, -3.353271484375, -3.201171875, -3.049072265625, -2.89697265625, -2.744873046875, -2.5927734375, -2.440673828125, -2.28857421875, -2.136474609375, -1.984375, -1.832275390625, -1.68017578125, -1.528076171875, -1.3759765625, -1.223876953125, -1.07177734375, -0.919677734375, -0.767578125, -0.615478515625, -0.46337890625, -0.311279296875, -0.1591796875, -0.007080078125, 0.14501953125, 0.297119140625, 0.44921875, 0.601318359375, 0.75341796875, 0.905517578125, 1.0576171875, 1.209716796875, 1.36181640625, 1.513916015625, 1.666015625, 1.818115234375, 1.97021484375, 2.122314453125, 2.2744140625, 2.426513671875, 2.57861328125, 2.730712890625, 2.8828125, 3.034912109375, 3.18701171875, 3.339111328125, 3.4912109375, 3.643310546875, 3.79541015625, 3.947509765625, 4.099609375, 4.251708984375, 4.40380859375, 4.555908203125, 4.7080078125, 4.860107421875, 5.01220703125, 5.164306640625, 5.31640625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 7.0, 7.0, 8.0, 12.0, 17.0, 15.0, 23.0, 23.0, 26.0, 27.0, 34.0, 36.0, 39.0, 45.0, 52.0, 66.0, 176.0, 1851.0, 133.0, 62.0, 52.0, 49.0, 44.0, 37.0, 37.0, 30.0, 25.0, 24.0, 19.0, 15.0, 8.0, 13.0, 14.0, 6.0, 9.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.390625, -27.5146484375, -26.638671875, -25.7626953125, -24.88671875, -24.0107421875, -23.134765625, -22.2587890625, -21.3828125, -20.5068359375, -19.630859375, -18.7548828125, -17.87890625, -17.0029296875, -16.126953125, -15.2509765625, -14.375, -13.4990234375, -12.623046875, -11.7470703125, -10.87109375, -9.9951171875, -9.119140625, -8.2431640625, -7.3671875, -6.4912109375, -5.615234375, -4.7392578125, -3.86328125, -2.9873046875, -2.111328125, -1.2353515625, -0.359375, 0.5166015625, 1.392578125, 2.2685546875, 3.14453125, 4.0205078125, 4.896484375, 5.7724609375, 6.6484375, 7.5244140625, 8.400390625, 9.2763671875, 10.15234375, 11.0283203125, 11.904296875, 12.7802734375, 13.65625, 14.5322265625, 15.408203125, 16.2841796875, 17.16015625, 18.0361328125, 18.912109375, 19.7880859375, 20.6640625, 21.5400390625, 22.416015625, 23.2919921875, 24.16796875, 25.0439453125, 25.919921875, 26.7958984375, 27.671875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 7.0, 12.0, 14.0, 9.0, 9.0, 16.0, 21.0, 22.0, 22.0, 38.0, 55.0, 55.0, 104.0, 174.0, 295.0, 822.0, 6493.0, 2874184.0, 259279.0, 2786.0, 548.0, 254.0, 141.0, 90.0, 40.0, 45.0, 36.0, 23.0, 24.0, 21.0, 16.0, 12.0, 10.0, 8.0, 8.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.3125, -44.8583984375, -43.404296875, -41.9501953125, -40.49609375, -39.0419921875, -37.587890625, -36.1337890625, -34.6796875, -33.2255859375, -31.771484375, -30.3173828125, -28.86328125, -27.4091796875, -25.955078125, -24.5009765625, -23.046875, -21.5927734375, -20.138671875, -18.6845703125, -17.23046875, -15.7763671875, -14.322265625, -12.8681640625, -11.4140625, -9.9599609375, -8.505859375, -7.0517578125, -5.59765625, -4.1435546875, -2.689453125, -1.2353515625, 0.21875, 1.6728515625, 3.126953125, 4.5810546875, 6.03515625, 7.4892578125, 8.943359375, 10.3974609375, 11.8515625, 13.3056640625, 14.759765625, 16.2138671875, 17.66796875, 19.1220703125, 20.576171875, 22.0302734375, 23.484375, 24.9384765625, 26.392578125, 27.8466796875, 29.30078125, 30.7548828125, 32.208984375, 33.6630859375, 35.1171875, 36.5712890625, 38.025390625, 39.4794921875, 40.93359375, 42.3876953125, 43.841796875, 45.2958984375, 46.75]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [25.0, 677.0, 315.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.908289909362793, -5.010406017303467, 0.8874778747558594, 6.785361289978027, 12.683245658874512, 18.581130981445312, 24.47901153564453, 30.376895904541016, 36.2747802734375, 42.172664642333984, 48.07054901123047, 53.96842956542969, 59.86631774902344, 65.76419830322266, 71.66207885742188, 77.55996704101562, 83.45785522460938, 89.3557357788086, 95.25362396240234, 101.15150451660156, 107.04939270019531, 112.94727325439453, 118.84515380859375, 124.7430419921875, 130.64093017578125, 136.538818359375, 142.4366912841797, 148.33457946777344, 154.2324676513672, 160.13035583496094, 166.02822875976562, 171.92611694335938, 177.82398986816406, 183.7218780517578, 189.6197509765625, 195.51763916015625, 201.41552734375, 207.31341552734375, 213.21128845214844, 219.1091766357422, 225.00706481933594, 230.9049530029297, 236.80282592773438, 242.70071411132812, 248.59860229492188, 254.49649047851562, 260.3943786621094, 266.292236328125, 272.19012451171875, 278.0880126953125, 283.98590087890625, 289.8837890625, 295.7816467285156, 301.6795349121094, 307.5774230957031, 313.4753112792969, 319.3731994628906, 325.2710876464844, 331.1689758300781, 337.0668640136719, 342.9647216796875, 348.86260986328125, 354.760498046875, 360.65838623046875, 366.5562744140625]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 10.0, 7.0, 15.0, 8.0, 13.0, 16.0, 13.0, 32.0, 17.0, 33.0, 24.0, 25.0, 28.0, 32.0, 31.0, 31.0, 36.0, 39.0, 56.0, 38.0, 39.0, 43.0, 36.0, 49.0, 32.0, 29.0, 32.0, 34.0, 25.0, 27.0, 21.0, 19.0, 21.0, 16.0, 14.0, 12.0, 7.0, 8.0, 3.0, 2.0, 5.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-71.33573150634766, -68.8845443725586, -66.433349609375, -63.98215866088867, -61.530967712402344, -59.079776763916016, -56.62858581542969, -54.177398681640625, -51.72620391845703, -49.2750129699707, -46.823822021484375, -44.37263107299805, -41.92144012451172, -39.47024917602539, -37.01905822753906, -34.56787109375, -32.11668014526367, -29.665489196777344, -27.214298248291016, -24.763107299804688, -22.31191635131836, -19.86072540283203, -17.409536361694336, -14.958345413208008, -12.50715446472168, -10.055963516235352, -7.604773044586182, -5.153582572937012, -2.7023916244506836, -0.25120067596435547, 2.1999893188476562, 4.651180267333984, 7.1023712158203125, 9.55356216430664, 12.004753112792969, 14.45594310760498, 16.907135009765625, 19.358325958251953, 21.80951499938965, 24.260705947875977, 26.711896896362305, 29.163087844848633, 31.61427879333496, 34.065467834472656, 36.516658782958984, 38.96784973144531, 41.41904067993164, 43.87023162841797, 46.3214225769043, 48.772613525390625, 51.22380447387695, 53.67499542236328, 56.12618637084961, 58.57737731933594, 61.028564453125, 63.479759216308594, 65.93094635009766, 68.38213348388672, 70.83332824707031, 73.28451538085938, 75.73571014404297, 78.18689727783203, 80.63809204101562, 83.08927917480469, 85.54047393798828]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 7.0, 4.0, 5.0, 7.0, 9.0, 14.0, 10.0, 28.0, 22.0, 26.0, 25.0, 24.0, 31.0, 35.0, 29.0, 45.0, 47.0, 46.0, 49.0, 45.0, 46.0, 39.0, 51.0, 39.0, 47.0, 42.0, 26.0, 39.0, 26.0, 28.0, 22.0, 18.0, 9.0, 13.0, 7.0, 7.0, 7.0, 13.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.79296875, -6.55511474609375, -6.3172607421875, -6.07940673828125, -5.841552734375, -5.60369873046875, -5.3658447265625, -5.12799072265625, -4.89013671875, -4.65228271484375, -4.4144287109375, -4.17657470703125, -3.938720703125, -3.70086669921875, -3.4630126953125, -3.22515869140625, -2.9873046875, -2.74945068359375, -2.5115966796875, -2.27374267578125, -2.035888671875, -1.79803466796875, -1.5601806640625, -1.32232666015625, -1.08447265625, -0.84661865234375, -0.6087646484375, -0.37091064453125, -0.133056640625, 0.10479736328125, 0.3426513671875, 0.58050537109375, 0.818359375, 1.05621337890625, 1.2940673828125, 1.53192138671875, 1.769775390625, 2.00762939453125, 2.2454833984375, 2.48333740234375, 2.72119140625, 2.95904541015625, 3.1968994140625, 3.43475341796875, 3.672607421875, 3.91046142578125, 4.1483154296875, 4.38616943359375, 4.6240234375, 4.86187744140625, 5.0997314453125, 5.33758544921875, 5.575439453125, 5.81329345703125, 6.0511474609375, 6.28900146484375, 6.52685546875, 6.76470947265625, 7.0025634765625, 7.24041748046875, 7.478271484375, 7.71612548828125, 7.9539794921875, 8.19183349609375, 8.4296875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 4.0, 5.0, 7.0, 14.0, 10.0, 12.0, 20.0, 28.0, 17.0, 30.0, 34.0, 24.0, 33.0, 50.0, 77.0, 209.0, 1232.0, 105644.0, 4037595.0, 47708.0, 961.0, 174.0, 84.0, 42.0, 40.0, 40.0, 36.0, 27.0, 21.0, 16.0, 12.0, 16.0, 11.0, 11.0, 8.0, 10.0, 7.0, 7.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.78125, -43.20654296875, -41.6318359375, -40.05712890625, -38.482421875, -36.90771484375, -35.3330078125, -33.75830078125, -32.18359375, -30.60888671875, -29.0341796875, -27.45947265625, -25.884765625, -24.31005859375, -22.7353515625, -21.16064453125, -19.5859375, -18.01123046875, -16.4365234375, -14.86181640625, -13.287109375, -11.71240234375, -10.1376953125, -8.56298828125, -6.98828125, -5.41357421875, -3.8388671875, -2.26416015625, -0.689453125, 0.88525390625, 2.4599609375, 4.03466796875, 5.609375, 7.18408203125, 8.7587890625, 10.33349609375, 11.908203125, 13.48291015625, 15.0576171875, 16.63232421875, 18.20703125, 19.78173828125, 21.3564453125, 22.93115234375, 24.505859375, 26.08056640625, 27.6552734375, 29.22998046875, 30.8046875, 32.37939453125, 33.9541015625, 35.52880859375, 37.103515625, 38.67822265625, 40.2529296875, 41.82763671875, 43.40234375, 44.97705078125, 46.5517578125, 48.12646484375, 49.701171875, 51.27587890625, 52.8505859375, 54.42529296875, 56.0]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 5.0, 4.0, 9.0, 14.0, 19.0, 33.0, 37.0, 65.0, 88.0, 124.0, 162.0, 209.0, 369.0, 481.0, 610.0, 539.0, 429.0, 279.0, 194.0, 125.0, 90.0, 60.0, 41.0, 37.0, 23.0, 10.0, 7.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.359375, -24.55908203125, -23.7587890625, -22.95849609375, -22.158203125, -21.35791015625, -20.5576171875, -19.75732421875, -18.95703125, -18.15673828125, -17.3564453125, -16.55615234375, -15.755859375, -14.95556640625, -14.1552734375, -13.35498046875, -12.5546875, -11.75439453125, -10.9541015625, -10.15380859375, -9.353515625, -8.55322265625, -7.7529296875, -6.95263671875, -6.15234375, -5.35205078125, -4.5517578125, -3.75146484375, -2.951171875, -2.15087890625, -1.3505859375, -0.55029296875, 0.25, 1.05029296875, 1.8505859375, 2.65087890625, 3.451171875, 4.25146484375, 5.0517578125, 5.85205078125, 6.65234375, 7.45263671875, 8.2529296875, 9.05322265625, 9.853515625, 10.65380859375, 11.4541015625, 12.25439453125, 13.0546875, 13.85498046875, 14.6552734375, 15.45556640625, 16.255859375, 17.05615234375, 17.8564453125, 18.65673828125, 19.45703125, 20.25732421875, 21.0576171875, 21.85791015625, 22.658203125, 23.45849609375, 24.2587890625, 25.05908203125, 25.859375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 5.0, 8.0, 13.0, 12.0, 25.0, 40.0, 64.0, 98.0, 125.0, 153.0, 296.0, 673.0, 7922.0, 4113725.0, 68962.0, 1061.0, 423.0, 215.0, 149.0, 107.0, 69.0, 57.0, 31.0, 15.0, 15.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.6875, -114.939453125, -111.19140625, -107.443359375, -103.6953125, -99.947265625, -96.19921875, -92.451171875, -88.703125, -84.955078125, -81.20703125, -77.458984375, -73.7109375, -69.962890625, -66.21484375, -62.466796875, -58.71875, -54.970703125, -51.22265625, -47.474609375, -43.7265625, -39.978515625, -36.23046875, -32.482421875, -28.734375, -24.986328125, -21.23828125, -17.490234375, -13.7421875, -9.994140625, -6.24609375, -2.498046875, 1.25, 4.998046875, 8.74609375, 12.494140625, 16.2421875, 19.990234375, 23.73828125, 27.486328125, 31.234375, 34.982421875, 38.73046875, 42.478515625, 46.2265625, 49.974609375, 53.72265625, 57.470703125, 61.21875, 64.966796875, 68.71484375, 72.462890625, 76.2109375, 79.958984375, 83.70703125, 87.455078125, 91.203125, 94.951171875, 98.69921875, 102.447265625, 106.1953125, 109.943359375, 113.69140625, 117.439453125, 121.1875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 7.0, 50.0, 243.0, 398.0, 239.0, 76.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.334232330322266, -26.81269645690918, -19.291160583496094, -11.769622802734375, -4.248086929321289, 3.273448944091797, 10.794986724853516, 18.31652069091797, 25.838058471679688, 33.359596252441406, 40.88113021850586, 48.40266799926758, 55.92420196533203, 63.44573974609375, 70.96727752685547, 78.48881530761719, 86.01034545898438, 93.5318832397461, 101.05342102050781, 108.574951171875, 116.09648895263672, 123.61802673339844, 131.13955688476562, 138.66110229492188, 146.18264770507812, 153.7041778564453, 161.22572326660156, 168.74725341796875, 176.268798828125, 183.7903289794922, 191.31185913085938, 198.83340454101562, 206.3549346923828, 213.87646484375, 221.39801025390625, 228.91954040527344, 236.4410858154297, 243.96261596679688, 251.48416137695312, 259.00567626953125, 266.5272216796875, 274.04876708984375, 281.5702819824219, 289.0918273925781, 296.6133728027344, 304.1348876953125, 311.65643310546875, 319.177978515625, 326.69952392578125, 334.2210693359375, 341.7425842285156, 349.2641296386719, 356.7856750488281, 364.30718994140625, 371.8287353515625, 379.35028076171875, 386.8717956542969, 394.3933410644531, 401.91485595703125, 409.4364013671875, 416.95794677734375, 424.4794921875, 432.0010070800781, 439.5225524902344, 447.0440979003906]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 8.0, 9.0, 8.0, 10.0, 13.0, 23.0, 16.0, 21.0, 25.0, 33.0, 36.0, 42.0, 32.0, 34.0, 48.0, 55.0, 43.0, 47.0, 43.0, 59.0, 45.0, 32.0, 52.0, 38.0, 33.0, 24.0, 30.0, 29.0, 18.0, 21.0, 17.0, 11.0, 12.0, 8.0, 8.0, 4.0, 7.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.67984008789062, -78.16622924804688, -75.6526107788086, -73.13899993896484, -70.62538146972656, -68.11177062988281, -65.59815979003906, -63.08454513549805, -60.57093048095703, -58.057315826416016, -55.543701171875, -53.03009033203125, -50.516475677490234, -48.00286102294922, -45.48925018310547, -42.97563552856445, -40.46202087402344, -37.94840621948242, -35.434791564941406, -32.921180725097656, -30.40756607055664, -27.893951416015625, -25.380338668823242, -22.86672592163086, -20.353111267089844, -17.839496612548828, -15.325883865356445, -12.812270164489746, -10.298656463623047, -7.785042762756348, -5.271429061889648, -2.7578163146972656, -0.24420166015625, 2.269412040710449, 4.783025741577148, 7.296639442443848, 9.810253143310547, 12.323866844177246, 14.837480545043945, 17.351093292236328, 19.864707946777344, 22.37832260131836, 24.891935348510742, 27.405548095703125, 29.91916275024414, 32.432777404785156, 34.946388244628906, 37.46000289916992, 39.97361755371094, 42.48723220825195, 45.00084686279297, 47.51445770263672, 50.028072357177734, 52.54168701171875, 55.0552978515625, 57.568912506103516, 60.08252716064453, 62.59614181518555, 65.10975646972656, 67.62336730957031, 70.13697814941406, 72.65059661865234, 75.1642074584961, 77.67782592773438, 80.19143676757812]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 1.0, 3.0, 5.0, 1.0, 2.0, 5.0, 5.0, 6.0, 8.0, 16.0, 25.0, 17.0, 18.0, 26.0, 24.0, 25.0, 31.0, 34.0, 39.0, 36.0, 38.0, 32.0, 53.0, 56.0, 51.0, 45.0, 53.0, 37.0, 42.0, 40.0, 31.0, 24.0, 26.0, 38.0, 20.0, 18.0, 13.0, 17.0, 11.0, 12.0, 8.0, 4.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.51171875, -7.26715087890625, -7.0225830078125, -6.77801513671875, -6.533447265625, -6.28887939453125, -6.0443115234375, -5.79974365234375, -5.55517578125, -5.31060791015625, -5.0660400390625, -4.82147216796875, -4.576904296875, -4.33233642578125, -4.0877685546875, -3.84320068359375, -3.5986328125, -3.35406494140625, -3.1094970703125, -2.86492919921875, -2.620361328125, -2.37579345703125, -2.1312255859375, -1.88665771484375, -1.64208984375, -1.39752197265625, -1.1529541015625, -0.90838623046875, -0.663818359375, -0.41925048828125, -0.1746826171875, 0.06988525390625, 0.314453125, 0.55902099609375, 0.8035888671875, 1.04815673828125, 1.292724609375, 1.53729248046875, 1.7818603515625, 2.02642822265625, 2.27099609375, 2.51556396484375, 2.7601318359375, 3.00469970703125, 3.249267578125, 3.49383544921875, 3.7384033203125, 3.98297119140625, 4.2275390625, 4.47210693359375, 4.7166748046875, 4.96124267578125, 5.205810546875, 5.45037841796875, 5.6949462890625, 5.93951416015625, 6.18408203125, 6.42864990234375, 6.6732177734375, 6.91778564453125, 7.162353515625, 7.40692138671875, 7.6514892578125, 7.89605712890625, 8.140625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 9.0, 7.0, 22.0, 26.0, 29.0, 53.0, 104.0, 133.0, 193.0, 267.0, 432.0, 706.0, 1060.0, 1687.0, 2667.0, 4313.0, 7242.0, 11720.0, 19212.0, 32732.0, 55794.0, 101187.0, 241158.0, 302030.0, 113499.0, 61926.0, 35551.0, 21373.0, 12805.0, 7790.0, 4815.0, 2894.0, 1874.0, 1142.0, 757.0, 471.0, 313.0, 190.0, 132.0, 86.0, 49.0, 42.0, 19.0, 14.0, 13.0, 8.0, 4.0, 3.0, 8.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.6923828125, -1.6412353515625, -1.590087890625, -1.5389404296875, -1.48779296875, -1.4366455078125, -1.385498046875, -1.3343505859375, -1.283203125, -1.2320556640625, -1.180908203125, -1.1297607421875, -1.07861328125, -1.0274658203125, -0.976318359375, -0.9251708984375, -0.8740234375, -0.8228759765625, -0.771728515625, -0.7205810546875, -0.66943359375, -0.6182861328125, -0.567138671875, -0.5159912109375, -0.46484375, -0.4136962890625, -0.362548828125, -0.3114013671875, -0.26025390625, -0.2091064453125, -0.157958984375, -0.1068115234375, -0.0556640625, -0.0045166015625, 0.046630859375, 0.0977783203125, 0.14892578125, 0.2000732421875, 0.251220703125, 0.3023681640625, 0.353515625, 0.4046630859375, 0.455810546875, 0.5069580078125, 0.55810546875, 0.6092529296875, 0.660400390625, 0.7115478515625, 0.7626953125, 0.8138427734375, 0.864990234375, 0.9161376953125, 0.96728515625, 1.0184326171875, 1.069580078125, 1.1207275390625, 1.171875, 1.2230224609375, 1.274169921875, 1.3253173828125, 1.37646484375, 1.4276123046875, 1.478759765625, 1.5299072265625, 1.5810546875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 4.0, 6.0, 3.0, 16.0, 14.0, 16.0, 14.0, 15.0, 19.0, 17.0, 23.0, 31.0, 33.0, 24.0, 47.0, 39.0, 48.0, 50.0, 41.0, 30.0, 1059.0, 46.0, 45.0, 42.0, 48.0, 35.0, 43.0, 31.0, 18.0, 22.0, 19.0, 26.0, 26.0, 14.0, 15.0, 11.0, 8.0, 7.0, 5.0, 1.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.5523681640625, -4.401611328125, -4.2508544921875, -4.10009765625, -3.9493408203125, -3.798583984375, -3.6478271484375, -3.4970703125, -3.3463134765625, -3.195556640625, -3.0447998046875, -2.89404296875, -2.7432861328125, -2.592529296875, -2.4417724609375, -2.291015625, -2.1402587890625, -1.989501953125, -1.8387451171875, -1.68798828125, -1.5372314453125, -1.386474609375, -1.2357177734375, -1.0849609375, -0.9342041015625, -0.783447265625, -0.6326904296875, -0.48193359375, -0.3311767578125, -0.180419921875, -0.0296630859375, 0.12109375, 0.2718505859375, 0.422607421875, 0.5733642578125, 0.72412109375, 0.8748779296875, 1.025634765625, 1.1763916015625, 1.3271484375, 1.4779052734375, 1.628662109375, 1.7794189453125, 1.93017578125, 2.0809326171875, 2.231689453125, 2.3824462890625, 2.533203125, 2.6839599609375, 2.834716796875, 2.9854736328125, 3.13623046875, 3.2869873046875, 3.437744140625, 3.5885009765625, 3.7392578125, 3.8900146484375, 4.040771484375, 4.1915283203125, 4.34228515625, 4.4930419921875, 4.643798828125, 4.7945556640625, 4.9453125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 5.0, 10.0, 21.0, 20.0, 32.0, 63.0, 70.0, 102.0, 166.0, 256.0, 381.0, 556.0, 856.0, 1356.0, 2098.0, 3220.0, 5162.0, 8163.0, 12801.0, 19909.0, 32079.0, 54170.0, 101795.0, 243446.0, 1340452.0, 115369.0, 59608.0, 35108.0, 21575.0, 13675.0, 8746.0, 5634.0, 3654.0, 2258.0, 1481.0, 973.0, 604.0, 409.0, 298.0, 179.0, 108.0, 78.0, 60.0, 43.0, 25.0, 18.0, 14.0, 5.0, 8.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-1.5048828125, -1.4593963623046875, -1.413909912109375, -1.3684234619140625, -1.32293701171875, -1.2774505615234375, -1.231964111328125, -1.1864776611328125, -1.1409912109375, -1.0955047607421875, -1.050018310546875, -1.0045318603515625, -0.95904541015625, -0.9135589599609375, -0.868072509765625, -0.8225860595703125, -0.777099609375, -0.7316131591796875, -0.686126708984375, -0.6406402587890625, -0.59515380859375, -0.5496673583984375, -0.504180908203125, -0.4586944580078125, -0.4132080078125, -0.3677215576171875, -0.322235107421875, -0.2767486572265625, -0.23126220703125, -0.1857757568359375, -0.140289306640625, -0.0948028564453125, -0.04931640625, -0.0038299560546875, 0.041656494140625, 0.0871429443359375, 0.13262939453125, 0.1781158447265625, 0.223602294921875, 0.2690887451171875, 0.3145751953125, 0.3600616455078125, 0.405548095703125, 0.4510345458984375, 0.49652099609375, 0.5420074462890625, 0.587493896484375, 0.6329803466796875, 0.678466796875, 0.7239532470703125, 0.769439697265625, 0.8149261474609375, 0.86041259765625, 0.9058990478515625, 0.951385498046875, 0.9968719482421875, 1.0423583984375, 1.0878448486328125, 1.133331298828125, 1.1788177490234375, 1.22430419921875, 1.2697906494140625, 1.315277099609375, 1.3607635498046875, 1.40625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 5.0, 6.0, 5.0, 8.0, 11.0, 9.0, 6.0, 7.0, 11.0, 20.0, 20.0, 22.0, 28.0, 32.0, 37.0, 54.0, 54.0, 63.0, 58.0, 78.0, 68.0, 74.0, 61.0, 44.0, 42.0, 31.0, 28.0, 17.0, 19.0, 12.0, 10.0, 5.0, 9.0, 10.0, 7.0, 8.0, 9.0, 3.0, 4.0, 2.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007925033569335938, -0.0007638037204742432, -0.0007351040840148926, -0.000706404447555542, -0.0006777048110961914, -0.0006490051746368408, -0.0006203055381774902, -0.0005916059017181396, -0.0005629062652587891, -0.0005342066287994385, -0.0005055069923400879, -0.0004768073558807373, -0.0004481077194213867, -0.00041940808296203613, -0.00039070844650268555, -0.00036200881004333496, -0.0003333091735839844, -0.0003046095371246338, -0.0002759099006652832, -0.0002472102642059326, -0.00021851062774658203, -0.00018981099128723145, -0.00016111135482788086, -0.00013241171836853027, -0.00010371208190917969, -7.50124454498291e-05, -4.6312808990478516e-05, -1.761317253112793e-05, 1.1086463928222656e-05, 3.978610038757324e-05, 6.848573684692383e-05, 9.718537330627441e-05, 0.000125885009765625, 0.00015458464622497559, 0.00018328428268432617, 0.00021198391914367676, 0.00024068355560302734, 0.00026938319206237793, 0.0002980828285217285, 0.0003267824649810791, 0.0003554821014404297, 0.0003841817378997803, 0.00041288137435913086, 0.00044158101081848145, 0.00047028064727783203, 0.0004989802837371826, 0.0005276799201965332, 0.0005563795566558838, 0.0005850791931152344, 0.000613778829574585, 0.0006424784660339355, 0.0006711781024932861, 0.0006998777389526367, 0.0007285773754119873, 0.0007572770118713379, 0.0007859766483306885, 0.0008146762847900391, 0.0008433759212493896, 0.0008720755577087402, 0.0009007751941680908, 0.0009294748306274414, 0.000958174467086792, 0.0009868741035461426, 0.0010155737400054932, 0.0010442733764648438]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 6.0, 1.0, 3.0, 3.0, 3.0, 8.0, 8.0, 13.0, 11.0, 15.0, 15.0, 25.0, 31.0, 60.0, 90.0, 153.0, 206.0, 398.0, 1301.0, 1034390.0, 10475.0, 563.0, 299.0, 156.0, 84.0, 49.0, 40.0, 34.0, 28.0, 12.0, 11.0, 13.0, 12.0, 8.0, 7.0, 7.0, 9.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.02764892578125, -0.026874303817749023, -0.026099681854248047, -0.02532505989074707, -0.024550437927246094, -0.023775815963745117, -0.02300119400024414, -0.022226572036743164, -0.021451950073242188, -0.02067732810974121, -0.019902706146240234, -0.019128084182739258, -0.01835346221923828, -0.017578840255737305, -0.016804218292236328, -0.01602959632873535, -0.015254974365234375, -0.014480352401733398, -0.013705730438232422, -0.012931108474731445, -0.012156486511230469, -0.011381864547729492, -0.010607242584228516, -0.009832620620727539, -0.009057998657226562, -0.008283376693725586, -0.007508754730224609, -0.006734132766723633, -0.005959510803222656, -0.00518488883972168, -0.004410266876220703, -0.0036356449127197266, -0.00286102294921875, -0.0020864009857177734, -0.0013117790222167969, -0.0005371570587158203, 0.00023746490478515625, 0.0010120868682861328, 0.0017867088317871094, 0.002561330795288086, 0.0033359527587890625, 0.004110574722290039, 0.004885196685791016, 0.005659818649291992, 0.006434440612792969, 0.007209062576293945, 0.007983684539794922, 0.008758306503295898, 0.009532928466796875, 0.010307550430297852, 0.011082172393798828, 0.011856794357299805, 0.012631416320800781, 0.013406038284301758, 0.014180660247802734, 0.014955282211303711, 0.015729904174804688, 0.016504526138305664, 0.01727914810180664, 0.018053770065307617, 0.018828392028808594, 0.01960301399230957, 0.020377635955810547, 0.021152257919311523, 0.0219268798828125]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 25.0, 126.0, 361.0, 370.0, 102.0, 22.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010926652466878295, -0.0010429599788039923, -0.0009932545945048332, -0.000943549326620996, -0.0008938440587371588, -0.0008441387326456606, -0.0007944334065541625, -0.0007447281386703253, -0.0006950228125788271, -0.000645317486487329, -0.0005956122186034918, -0.0005459068925119936, -0.0004962015664204955, -0.0004464962985366583, -0.00039679097244516015, -0.00034708567545749247, -0.0002973803784698248, -0.0002476750814821571, -0.0001979697699425742, -0.0001482644584029913, -9.855916141532362e-05, -4.8853864427655935e-05, 8.514616638422012e-07, 5.055675865150988e-05, 0.00010026205563917756, 0.00014996735262684524, 0.00019967266416642815, 0.00024937797570601106, 0.00029908327269367874, 0.0003487885696813464, 0.00039849389577284455, 0.00044819919276051223, 0.0004979046061635017, 0.0005476099322549999, 0.0005973152001388371, 0.0006470205262303352, 0.0006967257941141725, 0.0007464311202056706, 0.0007961364462971687, 0.000845841714181006, 0.0008955470402725041, 0.0009452523663640022, 0.0009949576342478395, 0.0010446629021316767, 0.0010943682864308357, 0.001144073554314673, 0.0011937788221985102, 0.0012434842064976692, 0.0012931894743815064, 0.0013428947422653437, 0.0013926001265645027, 0.00144230539444834, 0.0014920106623321772, 0.0015417160466313362, 0.0015914213145151734, 0.0016411265823990107, 0.0016908319666981697, 0.001740537234582007, 0.001790242618881166, 0.0018399478867650032, 0.0018896531546488404, 0.0019393584225326777, 0.0019890638068318367, 0.0020387691911309958, 0.002088474342599511]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 6.0, 8.0, 6.0, 7.0, 10.0, 16.0, 14.0, 18.0, 23.0, 29.0, 28.0, 23.0, 38.0, 34.0, 38.0, 30.0, 37.0, 41.0, 35.0, 49.0, 29.0, 42.0, 45.0, 37.0, 32.0, 35.0, 44.0, 30.0, 20.0, 28.0, 25.0, 14.0, 23.0, 12.0, 15.0, 9.0, 10.0, 9.0, 8.0, 2.0, 9.0, 7.0, 6.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00045108795166015625, -0.0004370715469121933, -0.00042305514216423035, -0.0004090387374162674, -0.00039502233266830444, -0.0003810059279203415, -0.00036698952317237854, -0.0003529731184244156, -0.00033895671367645264, -0.0003249403089284897, -0.00031092390418052673, -0.0002969074994325638, -0.00028289109468460083, -0.0002688746899366379, -0.0002548582851886749, -0.00024084188044071198, -0.00022682547569274902, -0.00021280907094478607, -0.00019879266619682312, -0.00018477626144886017, -0.00017075985670089722, -0.00015674345195293427, -0.0001427270472049713, -0.00012871064245700836, -0.00011469423770904541, -0.00010067783296108246, -8.666142821311951e-05, -7.264502346515656e-05, -5.8628618717193604e-05, -4.461221396923065e-05, -3.05958092212677e-05, -1.657940447330475e-05, -2.562999725341797e-06, 1.1453405022621155e-05, 2.5469809770584106e-05, 3.948621451854706e-05, 5.350261926651001e-05, 6.751902401447296e-05, 8.153542876243591e-05, 9.555183351039886e-05, 0.00010956823825836182, 0.00012358464300632477, 0.00013760104775428772, 0.00015161745250225067, 0.00016563385725021362, 0.00017965026199817657, 0.00019366666674613953, 0.00020768307149410248, 0.00022169947624206543, 0.00023571588099002838, 0.00024973228573799133, 0.0002637486904859543, 0.00027776509523391724, 0.0002917814999818802, 0.00030579790472984314, 0.0003198143094778061, 0.00033383071422576904, 0.000347847118973732, 0.00036186352372169495, 0.0003758799284696579, 0.00038989633321762085, 0.0004039127379655838, 0.00041792914271354675, 0.0004319455474615097, 0.00044596195220947266]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 1.0, 3.0, 5.0, 1.0, 2.0, 5.0, 5.0, 6.0, 8.0, 16.0, 25.0, 17.0, 18.0, 26.0, 24.0, 25.0, 31.0, 34.0, 39.0, 36.0, 38.0, 32.0, 53.0, 56.0, 51.0, 46.0, 52.0, 37.0, 42.0, 40.0, 31.0, 24.0, 26.0, 38.0, 20.0, 18.0, 13.0, 17.0, 11.0, 12.0, 8.0, 4.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.51171875, -7.26715087890625, -7.0225830078125, -6.77801513671875, -6.533447265625, -6.28887939453125, -6.0443115234375, -5.79974365234375, -5.55517578125, -5.31060791015625, -5.0660400390625, -4.82147216796875, -4.576904296875, -4.33233642578125, -4.0877685546875, -3.84320068359375, -3.5986328125, -3.35406494140625, -3.1094970703125, -2.86492919921875, -2.620361328125, -2.37579345703125, -2.1312255859375, -1.88665771484375, -1.64208984375, -1.39752197265625, -1.1529541015625, -0.90838623046875, -0.663818359375, -0.41925048828125, -0.1746826171875, 0.06988525390625, 0.314453125, 0.55902099609375, 0.8035888671875, 1.04815673828125, 1.292724609375, 1.53729248046875, 1.7818603515625, 2.02642822265625, 2.27099609375, 2.51556396484375, 2.7601318359375, 3.00469970703125, 3.249267578125, 3.49383544921875, 3.7384033203125, 3.98297119140625, 4.2275390625, 4.47210693359375, 4.7166748046875, 4.96124267578125, 5.205810546875, 5.45037841796875, 5.6949462890625, 5.93951416015625, 6.18408203125, 6.42864990234375, 6.6732177734375, 6.91778564453125, 7.162353515625, 7.40692138671875, 7.6514892578125, 7.89605712890625, 8.140625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 14.0, 8.0, 11.0, 19.0, 33.0, 32.0, 48.0, 57.0, 90.0, 134.0, 195.0, 336.0, 504.0, 752.0, 1282.0, 2255.0, 4323.0, 9113.0, 22236.0, 74943.0, 407461.0, 408919.0, 74233.0, 22378.0, 9089.0, 4228.0, 2302.0, 1276.0, 761.0, 512.0, 306.0, 213.0, 138.0, 103.0, 66.0, 55.0, 44.0, 23.0, 23.0, 8.0, 6.0, 9.0, 3.0, 3.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.08984375, -5.8995361328125, -5.709228515625, -5.5189208984375, -5.32861328125, -5.1383056640625, -4.947998046875, -4.7576904296875, -4.5673828125, -4.3770751953125, -4.186767578125, -3.9964599609375, -3.80615234375, -3.6158447265625, -3.425537109375, -3.2352294921875, -3.044921875, -2.8546142578125, -2.664306640625, -2.4739990234375, -2.28369140625, -2.0933837890625, -1.903076171875, -1.7127685546875, -1.5224609375, -1.3321533203125, -1.141845703125, -0.9515380859375, -0.76123046875, -0.5709228515625, -0.380615234375, -0.1903076171875, 0.0, 0.1903076171875, 0.380615234375, 0.5709228515625, 0.76123046875, 0.9515380859375, 1.141845703125, 1.3321533203125, 1.5224609375, 1.7127685546875, 1.903076171875, 2.0933837890625, 2.28369140625, 2.4739990234375, 2.664306640625, 2.8546142578125, 3.044921875, 3.2352294921875, 3.425537109375, 3.6158447265625, 3.80615234375, 3.9964599609375, 4.186767578125, 4.3770751953125, 4.5673828125, 4.7576904296875, 4.947998046875, 5.1383056640625, 5.32861328125, 5.5189208984375, 5.709228515625, 5.8995361328125, 6.08984375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 6.0, 10.0, 14.0, 11.0, 9.0, 12.0, 22.0, 29.0, 23.0, 25.0, 31.0, 34.0, 38.0, 29.0, 52.0, 47.0, 98.0, 1726.0, 308.0, 73.0, 62.0, 49.0, 53.0, 40.0, 35.0, 27.0, 33.0, 23.0, 20.0, 17.0, 17.0, 11.0, 5.0, 13.0, 9.0, 7.0, 5.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-27.0625, -26.262451171875, -25.46240234375, -24.662353515625, -23.8623046875, -23.062255859375, -22.26220703125, -21.462158203125, -20.662109375, -19.862060546875, -19.06201171875, -18.261962890625, -17.4619140625, -16.661865234375, -15.86181640625, -15.061767578125, -14.26171875, -13.461669921875, -12.66162109375, -11.861572265625, -11.0615234375, -10.261474609375, -9.46142578125, -8.661376953125, -7.861328125, -7.061279296875, -6.26123046875, -5.461181640625, -4.6611328125, -3.861083984375, -3.06103515625, -2.260986328125, -1.4609375, -0.660888671875, 0.13916015625, 0.939208984375, 1.7392578125, 2.539306640625, 3.33935546875, 4.139404296875, 4.939453125, 5.739501953125, 6.53955078125, 7.339599609375, 8.1396484375, 8.939697265625, 9.73974609375, 10.539794921875, 11.33984375, 12.139892578125, 12.93994140625, 13.739990234375, 14.5400390625, 15.340087890625, 16.14013671875, 16.940185546875, 17.740234375, 18.540283203125, 19.34033203125, 20.140380859375, 20.9404296875, 21.740478515625, 22.54052734375, 23.340576171875, 24.140625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 5.0, 5.0, 5.0, 13.0, 13.0, 5.0, 13.0, 14.0, 19.0, 24.0, 30.0, 46.0, 52.0, 73.0, 109.0, 166.0, 240.0, 605.0, 3074.0, 225950.0, 2907865.0, 5649.0, 784.0, 335.0, 159.0, 118.0, 76.0, 49.0, 37.0, 30.0, 30.0, 26.0, 16.0, 13.0, 10.0, 13.0, 9.0, 5.0, 7.0, 6.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.1875, -38.853515625, -37.51953125, -36.185546875, -34.8515625, -33.517578125, -32.18359375, -30.849609375, -29.515625, -28.181640625, -26.84765625, -25.513671875, -24.1796875, -22.845703125, -21.51171875, -20.177734375, -18.84375, -17.509765625, -16.17578125, -14.841796875, -13.5078125, -12.173828125, -10.83984375, -9.505859375, -8.171875, -6.837890625, -5.50390625, -4.169921875, -2.8359375, -1.501953125, -0.16796875, 1.166015625, 2.5, 3.833984375, 5.16796875, 6.501953125, 7.8359375, 9.169921875, 10.50390625, 11.837890625, 13.171875, 14.505859375, 15.83984375, 17.173828125, 18.5078125, 19.841796875, 21.17578125, 22.509765625, 23.84375, 25.177734375, 26.51171875, 27.845703125, 29.1796875, 30.513671875, 31.84765625, 33.181640625, 34.515625, 35.849609375, 37.18359375, 38.517578125, 39.8515625, 41.185546875, 42.51953125, 43.853515625, 45.1875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 10.0, 20.0, 33.0, 63.0, 92.0, 173.0, 220.0, 165.0, 119.0, 58.0, 33.0, 15.0, 5.0, 2.0, 0.0, 0.0, 3.0], "bins": [-42.61725997924805, -41.82050323486328, -41.023746490478516, -40.22698974609375, -39.430233001708984, -38.63347625732422, -37.83671951293945, -37.03996276855469, -36.24320602416992, -35.446449279785156, -34.64969253540039, -33.852935791015625, -33.05617904663086, -32.259422302246094, -31.462665557861328, -30.665908813476562, -29.86915397644043, -29.072397232055664, -28.2756404876709, -27.478883743286133, -26.682126998901367, -25.8853702545166, -25.08861541748047, -24.291858673095703, -23.495101928710938, -22.698345184326172, -21.901588439941406, -21.10483169555664, -20.308074951171875, -19.51131820678711, -18.714561462402344, -17.917804718017578, -17.121047973632812, -16.324291229248047, -15.527534484863281, -14.730777740478516, -13.93402099609375, -13.137264251708984, -12.340508460998535, -11.54375171661377, -10.74699592590332, -9.950239181518555, -9.153482437133789, -8.356725692749023, -7.559969425201416, -6.76321268081665, -5.966456413269043, -5.169699668884277, -4.372942924499512, -3.576186180114746, -2.7794296741485596, -1.982673168182373, -1.1859164237976074, -0.3891596794128418, 0.4075965881347656, 1.2043533325195312, 2.001110076904297, 2.7978668212890625, 3.594623327255249, 4.3913798332214355, 5.188136577606201, 5.984893321990967, 6.781649589538574, 7.57840633392334, 8.375163078308105]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 5.0, 5.0, 11.0, 11.0, 12.0, 15.0, 15.0, 18.0, 21.0, 15.0, 26.0, 23.0, 32.0, 30.0, 28.0, 27.0, 42.0, 38.0, 42.0, 26.0, 33.0, 36.0, 44.0, 43.0, 42.0, 38.0, 30.0, 36.0, 31.0, 20.0, 21.0, 23.0, 28.0, 18.0, 22.0, 13.0, 15.0, 13.0, 13.0, 7.0, 7.0, 6.0, 1.0, 3.0, 3.0, 7.0, 3.0, 3.0, 0.0, 1.0], "bins": [-80.3304443359375, -78.02043151855469, -75.7104263305664, -73.4004135131836, -71.09040069580078, -68.7803955078125, -66.47038269042969, -64.16036987304688, -61.85036087036133, -59.54035186767578, -57.23033905029297, -54.92033004760742, -52.610321044921875, -50.30030822753906, -47.990299224853516, -45.68029022216797, -43.370277404785156, -41.06026840209961, -38.7502555847168, -36.44024658203125, -34.13023376464844, -31.82022476196289, -29.510215759277344, -27.200204849243164, -24.890193939208984, -22.580183029174805, -20.270172119140625, -17.960163116455078, -15.650152206420898, -13.340141296386719, -11.030131340026855, -8.720121383666992, -6.410118103027344, -4.100107669830322, -1.7900972366333008, 0.5199131965637207, 2.829923629760742, 5.139934539794922, 7.449944496154785, 9.759954452514648, 12.069965362548828, 14.379976272583008, 16.689987182617188, 18.999996185302734, 21.310007095336914, 23.620018005371094, 25.93002700805664, 28.24003791809082, 30.550048828125, 32.86005783081055, 35.17007064819336, 37.480079650878906, 39.79009246826172, 42.100101470947266, 44.41011047363281, 46.720123291015625, 49.03013229370117, 51.34014129638672, 53.65015411376953, 55.96016311645508, 58.270172119140625, 60.58018493652344, 62.890193939208984, 65.20020294189453, 67.51021575927734]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 7.0, 7.0, 12.0, 16.0, 19.0, 25.0, 27.0, 25.0, 14.0, 34.0, 35.0, 32.0, 33.0, 40.0, 39.0, 41.0, 49.0, 59.0, 50.0, 46.0, 51.0, 36.0, 43.0, 40.0, 29.0, 21.0, 32.0, 25.0, 23.0, 10.0, 19.0, 12.0, 15.0, 10.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.60546875, -7.35418701171875, -7.1029052734375, -6.85162353515625, -6.600341796875, -6.34906005859375, -6.0977783203125, -5.84649658203125, -5.59521484375, -5.34393310546875, -5.0926513671875, -4.84136962890625, -4.590087890625, -4.33880615234375, -4.0875244140625, -3.83624267578125, -3.5849609375, -3.33367919921875, -3.0823974609375, -2.83111572265625, -2.579833984375, -2.32855224609375, -2.0772705078125, -1.82598876953125, -1.57470703125, -1.32342529296875, -1.0721435546875, -0.82086181640625, -0.569580078125, -0.31829833984375, -0.0670166015625, 0.18426513671875, 0.435546875, 0.68682861328125, 0.9381103515625, 1.18939208984375, 1.440673828125, 1.69195556640625, 1.9432373046875, 2.19451904296875, 2.44580078125, 2.69708251953125, 2.9483642578125, 3.19964599609375, 3.450927734375, 3.70220947265625, 3.9534912109375, 4.20477294921875, 4.4560546875, 4.70733642578125, 4.9586181640625, 5.20989990234375, 5.461181640625, 5.71246337890625, 5.9637451171875, 6.21502685546875, 6.46630859375, 6.71759033203125, 6.9688720703125, 7.22015380859375, 7.471435546875, 7.72271728515625, 7.9739990234375, 8.22528076171875, 8.4765625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 2.0, 1.0, 8.0, 7.0, 9.0, 13.0, 22.0, 27.0, 32.0, 33.0, 65.0, 105.0, 192.0, 312.0, 772.0, 2565.0, 13217.0, 108481.0, 1381685.0, 2365755.0, 288430.0, 25970.0, 4423.0, 1090.0, 463.0, 209.0, 127.0, 75.0, 48.0, 37.0, 29.0, 25.0, 18.0, 10.0, 10.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.859375, -16.30078125, -15.7421875, -15.18359375, -14.625, -14.06640625, -13.5078125, -12.94921875, -12.390625, -11.83203125, -11.2734375, -10.71484375, -10.15625, -9.59765625, -9.0390625, -8.48046875, -7.921875, -7.36328125, -6.8046875, -6.24609375, -5.6875, -5.12890625, -4.5703125, -4.01171875, -3.453125, -2.89453125, -2.3359375, -1.77734375, -1.21875, -0.66015625, -0.1015625, 0.45703125, 1.015625, 1.57421875, 2.1328125, 2.69140625, 3.25, 3.80859375, 4.3671875, 4.92578125, 5.484375, 6.04296875, 6.6015625, 7.16015625, 7.71875, 8.27734375, 8.8359375, 9.39453125, 9.953125, 10.51171875, 11.0703125, 11.62890625, 12.1875, 12.74609375, 13.3046875, 13.86328125, 14.421875, 14.98046875, 15.5390625, 16.09765625, 16.65625, 17.21484375, 17.7734375, 18.33203125, 18.890625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 4.0, 5.0, 14.0, 21.0, 41.0, 58.0, 66.0, 84.0, 154.0, 245.0, 406.0, 590.0, 690.0, 559.0, 412.0, 275.0, 156.0, 110.0, 64.0, 46.0, 19.0, 14.0, 13.0, 12.0, 7.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.59375, -27.654296875, -26.71484375, -25.775390625, -24.8359375, -23.896484375, -22.95703125, -22.017578125, -21.078125, -20.138671875, -19.19921875, -18.259765625, -17.3203125, -16.380859375, -15.44140625, -14.501953125, -13.5625, -12.623046875, -11.68359375, -10.744140625, -9.8046875, -8.865234375, -7.92578125, -6.986328125, -6.046875, -5.107421875, -4.16796875, -3.228515625, -2.2890625, -1.349609375, -0.41015625, 0.529296875, 1.46875, 2.408203125, 3.34765625, 4.287109375, 5.2265625, 6.166015625, 7.10546875, 8.044921875, 8.984375, 9.923828125, 10.86328125, 11.802734375, 12.7421875, 13.681640625, 14.62109375, 15.560546875, 16.5, 17.439453125, 18.37890625, 19.318359375, 20.2578125, 21.197265625, 22.13671875, 23.076171875, 24.015625, 24.955078125, 25.89453125, 26.833984375, 27.7734375, 28.712890625, 29.65234375, 30.591796875, 31.53125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 3.0, 5.0, 8.0, 11.0, 12.0, 29.0, 42.0, 54.0, 97.0, 114.0, 216.0, 373.0, 1573.0, 93694.0, 4085363.0, 11001.0, 843.0, 298.0, 171.0, 128.0, 69.0, 55.0, 30.0, 26.0, 16.0, 19.0, 10.0, 7.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.0625, -78.5439453125, -75.025390625, -71.5068359375, -67.98828125, -64.4697265625, -60.951171875, -57.4326171875, -53.9140625, -50.3955078125, -46.876953125, -43.3583984375, -39.83984375, -36.3212890625, -32.802734375, -29.2841796875, -25.765625, -22.2470703125, -18.728515625, -15.2099609375, -11.69140625, -8.1728515625, -4.654296875, -1.1357421875, 2.3828125, 5.9013671875, 9.419921875, 12.9384765625, 16.45703125, 19.9755859375, 23.494140625, 27.0126953125, 30.53125, 34.0498046875, 37.568359375, 41.0869140625, 44.60546875, 48.1240234375, 51.642578125, 55.1611328125, 58.6796875, 62.1982421875, 65.716796875, 69.2353515625, 72.75390625, 76.2724609375, 79.791015625, 83.3095703125, 86.828125, 90.3466796875, 93.865234375, 97.3837890625, 100.90234375, 104.4208984375, 107.939453125, 111.4580078125, 114.9765625, 118.4951171875, 122.013671875, 125.5322265625, 129.05078125, 132.5693359375, 136.087890625, 139.6064453125, 143.125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 9.0, 36.0, 166.0, 303.0, 299.0, 157.0, 34.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-284.6612854003906, -277.87799072265625, -271.0946960449219, -264.3114013671875, -257.5281066894531, -250.74481201171875, -243.96151733398438, -237.17823791503906, -230.3949432373047, -223.6116485595703, -216.82835388183594, -210.04505920410156, -203.2617645263672, -196.47848510742188, -189.6951904296875, -182.91189575195312, -176.12860107421875, -169.34530639648438, -162.56201171875, -155.77871704101562, -148.99542236328125, -142.21212768554688, -135.4288330078125, -128.6455535888672, -121.86224365234375, -115.07894897460938, -108.295654296875, -101.51235961914062, -94.72907257080078, -87.9457778930664, -81.16248321533203, -74.37919616699219, -67.59590148925781, -60.81260681152344, -54.02931594848633, -47.24602127075195, -40.462730407714844, -33.67943572998047, -26.896141052246094, -20.112850189208984, -13.32955551147461, -6.546262264251709, 0.2370309829711914, 7.02032470703125, 13.803617477416992, 20.586910247802734, 27.37020492553711, 34.15349578857422, 40.936790466308594, 47.72008514404297, 54.50337600708008, 61.28667068481445, 68.06996154785156, 74.85325622558594, 81.63655090332031, 88.41984558105469, 95.20314025878906, 101.98643493652344, 108.76972961425781, 115.55302429199219, 122.33631134033203, 129.11959838867188, 135.90289306640625, 142.68618774414062, 149.469482421875]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 10.0, 13.0, 17.0, 15.0, 17.0, 17.0, 24.0, 24.0, 37.0, 29.0, 31.0, 48.0, 38.0, 49.0, 51.0, 47.0, 44.0, 38.0, 35.0, 46.0, 39.0, 34.0, 47.0, 33.0, 40.0, 27.0, 32.0, 29.0, 14.0, 21.0, 9.0, 5.0, 10.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-91.22701263427734, -88.80516815185547, -86.3833236694336, -83.96147155761719, -81.53962707519531, -79.11778259277344, -76.69593811035156, -74.27409362792969, -71.85224914550781, -69.43040466308594, -67.00856018066406, -64.58671569824219, -62.16486740112305, -59.743019104003906, -57.32117462158203, -54.899330139160156, -52.477481842041016, -50.05563735961914, -47.6337890625, -45.211944580078125, -42.79010009765625, -40.368255615234375, -37.946407318115234, -35.52456283569336, -33.10271453857422, -30.68086814880371, -28.259023666381836, -25.837177276611328, -23.415332794189453, -20.993486404418945, -18.571640014648438, -16.149795532226562, -13.727951049804688, -11.306105613708496, -8.884260177612305, -6.462413787841797, -4.0405683517456055, -1.618722915649414, 0.8031234741210938, 3.2249679565429688, 5.646814346313477, 8.068659782409668, 10.49050521850586, 12.912351608276367, 15.334197044372559, 17.75604248046875, 20.177888870239258, 22.599733352661133, 25.02157974243164, 27.44342613220215, 29.865270614624023, 32.28711700439453, 34.708961486816406, 37.13080596923828, 39.55265426635742, 41.9744987487793, 44.39634704589844, 46.81819152832031, 49.24003982543945, 51.66188430786133, 54.0837287902832, 56.505577087402344, 58.92742156982422, 61.349266052246094, 63.77111053466797]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 5.0, 7.0, 3.0, 2.0, 6.0, 9.0, 11.0, 16.0, 27.0, 26.0, 14.0, 33.0, 25.0, 35.0, 31.0, 40.0, 52.0, 47.0, 55.0, 45.0, 45.0, 62.0, 37.0, 43.0, 46.0, 47.0, 46.0, 30.0, 33.0, 28.0, 13.0, 15.0, 17.0, 16.0, 10.0, 6.0, 8.0, 8.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.703125, -7.42919921875, -7.1552734375, -6.88134765625, -6.607421875, -6.33349609375, -6.0595703125, -5.78564453125, -5.51171875, -5.23779296875, -4.9638671875, -4.68994140625, -4.416015625, -4.14208984375, -3.8681640625, -3.59423828125, -3.3203125, -3.04638671875, -2.7724609375, -2.49853515625, -2.224609375, -1.95068359375, -1.6767578125, -1.40283203125, -1.12890625, -0.85498046875, -0.5810546875, -0.30712890625, -0.033203125, 0.24072265625, 0.5146484375, 0.78857421875, 1.0625, 1.33642578125, 1.6103515625, 1.88427734375, 2.158203125, 2.43212890625, 2.7060546875, 2.97998046875, 3.25390625, 3.52783203125, 3.8017578125, 4.07568359375, 4.349609375, 4.62353515625, 4.8974609375, 5.17138671875, 5.4453125, 5.71923828125, 5.9931640625, 6.26708984375, 6.541015625, 6.81494140625, 7.0888671875, 7.36279296875, 7.63671875, 7.91064453125, 8.1845703125, 8.45849609375, 8.732421875, 9.00634765625, 9.2802734375, 9.55419921875, 9.828125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 12.0, 16.0, 27.0, 37.0, 46.0, 84.0, 133.0, 159.0, 270.0, 447.0, 650.0, 988.0, 1656.0, 2750.0, 4489.0, 7191.0, 12203.0, 20791.0, 35994.0, 65373.0, 132256.0, 368613.0, 197883.0, 85469.0, 45865.0, 26001.0, 15525.0, 9176.0, 5330.0, 3413.0, 2061.0, 1249.0, 852.0, 521.0, 370.0, 219.0, 149.0, 87.0, 64.0, 41.0, 29.0, 18.0, 14.0, 6.0, 6.0, 7.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.8837890625, -1.827911376953125, -1.77203369140625, -1.716156005859375, -1.6602783203125, -1.604400634765625, -1.54852294921875, -1.492645263671875, -1.436767578125, -1.380889892578125, -1.32501220703125, -1.269134521484375, -1.2132568359375, -1.157379150390625, -1.10150146484375, -1.045623779296875, -0.98974609375, -0.933868408203125, -0.87799072265625, -0.822113037109375, -0.7662353515625, -0.710357666015625, -0.65447998046875, -0.598602294921875, -0.542724609375, -0.486846923828125, -0.43096923828125, -0.375091552734375, -0.3192138671875, -0.263336181640625, -0.20745849609375, -0.151580810546875, -0.095703125, -0.039825439453125, 0.01605224609375, 0.071929931640625, 0.1278076171875, 0.183685302734375, 0.23956298828125, 0.295440673828125, 0.351318359375, 0.407196044921875, 0.46307373046875, 0.518951416015625, 0.5748291015625, 0.630706787109375, 0.68658447265625, 0.742462158203125, 0.79833984375, 0.854217529296875, 0.91009521484375, 0.965972900390625, 1.0218505859375, 1.077728271484375, 1.13360595703125, 1.189483642578125, 1.245361328125, 1.301239013671875, 1.35711669921875, 1.412994384765625, 1.4688720703125, 1.524749755859375, 1.58062744140625, 1.636505126953125, 1.6923828125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 8.0, 6.0, 6.0, 10.0, 17.0, 11.0, 15.0, 19.0, 23.0, 21.0, 26.0, 23.0, 23.0, 25.0, 38.0, 38.0, 43.0, 40.0, 29.0, 37.0, 1055.0, 38.0, 42.0, 43.0, 43.0, 30.0, 35.0, 24.0, 40.0, 29.0, 16.0, 30.0, 27.0, 13.0, 22.0, 14.0, 12.0, 10.0, 7.0, 8.0, 2.0, 5.0, 1.0, 3.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.359375, -4.2208251953125, -4.082275390625, -3.9437255859375, -3.80517578125, -3.6666259765625, -3.528076171875, -3.3895263671875, -3.2509765625, -3.1124267578125, -2.973876953125, -2.8353271484375, -2.69677734375, -2.5582275390625, -2.419677734375, -2.2811279296875, -2.142578125, -2.0040283203125, -1.865478515625, -1.7269287109375, -1.58837890625, -1.4498291015625, -1.311279296875, -1.1727294921875, -1.0341796875, -0.8956298828125, -0.757080078125, -0.6185302734375, -0.47998046875, -0.3414306640625, -0.202880859375, -0.0643310546875, 0.07421875, 0.2127685546875, 0.351318359375, 0.4898681640625, 0.62841796875, 0.7669677734375, 0.905517578125, 1.0440673828125, 1.1826171875, 1.3211669921875, 1.459716796875, 1.5982666015625, 1.73681640625, 1.8753662109375, 2.013916015625, 2.1524658203125, 2.291015625, 2.4295654296875, 2.568115234375, 2.7066650390625, 2.84521484375, 2.9837646484375, 3.122314453125, 3.2608642578125, 3.3994140625, 3.5379638671875, 3.676513671875, 3.8150634765625, 3.95361328125, 4.0921630859375, 4.230712890625, 4.3692626953125, 4.5078125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 10.0, 14.0, 11.0, 25.0, 28.0, 44.0, 37.0, 60.0, 114.0, 157.0, 223.0, 320.0, 478.0, 719.0, 1032.0, 1408.0, 2129.0, 3213.0, 4718.0, 7243.0, 10911.0, 16769.0, 25382.0, 39024.0, 64038.0, 117750.0, 1333149.0, 214576.0, 97440.0, 55618.0, 34478.0, 22270.0, 14597.0, 9714.0, 6374.0, 4329.0, 2717.0, 1946.0, 1300.0, 862.0, 590.0, 426.0, 279.0, 191.0, 135.0, 81.0, 57.0, 45.0, 30.0, 26.0, 13.0, 12.0, 8.0, 4.0, 6.0, 4.0, 1.0, 1.0], "bins": [-1.3623046875, -1.3208465576171875, -1.279388427734375, -1.2379302978515625, -1.19647216796875, -1.1550140380859375, -1.113555908203125, -1.0720977783203125, -1.0306396484375, -0.9891815185546875, -0.947723388671875, -0.9062652587890625, -0.86480712890625, -0.8233489990234375, -0.781890869140625, -0.7404327392578125, -0.698974609375, -0.6575164794921875, -0.616058349609375, -0.5746002197265625, -0.53314208984375, -0.4916839599609375, -0.450225830078125, -0.4087677001953125, -0.3673095703125, -0.3258514404296875, -0.284393310546875, -0.2429351806640625, -0.20147705078125, -0.1600189208984375, -0.118560791015625, -0.0771026611328125, -0.03564453125, 0.0058135986328125, 0.047271728515625, 0.0887298583984375, 0.13018798828125, 0.1716461181640625, 0.213104248046875, 0.2545623779296875, 0.2960205078125, 0.3374786376953125, 0.378936767578125, 0.4203948974609375, 0.46185302734375, 0.5033111572265625, 0.544769287109375, 0.5862274169921875, 0.627685546875, 0.6691436767578125, 0.710601806640625, 0.7520599365234375, 0.79351806640625, 0.8349761962890625, 0.876434326171875, 0.9178924560546875, 0.9593505859375, 1.0008087158203125, 1.042266845703125, 1.0837249755859375, 1.12518310546875, 1.1666412353515625, 1.208099365234375, 1.2495574951171875, 1.291015625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 13.0, 20.0, 20.0, 34.0, 48.0, 53.0, 77.0, 114.0, 110.0, 135.0, 112.0, 65.0, 43.0, 45.0, 21.0, 19.0, 18.0, 11.0, 7.0, 7.0, 3.0, 7.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00148773193359375, -0.0014438778162002563, -0.0014000236988067627, -0.001356169581413269, -0.0013123154640197754, -0.0012684613466262817, -0.001224607229232788, -0.0011807531118392944, -0.0011368989944458008, -0.0010930448770523071, -0.0010491907596588135, -0.0010053366422653198, -0.0009614825248718262, -0.0009176284074783325, -0.0008737742900848389, -0.0008299201726913452, -0.0007860660552978516, -0.0007422119379043579, -0.0006983578205108643, -0.0006545037031173706, -0.000610649585723877, -0.0005667954683303833, -0.0005229413509368896, -0.000479087233543396, -0.00043523311614990234, -0.0003913789987564087, -0.00034752488136291504, -0.0003036707639694214, -0.00025981664657592773, -0.00021596252918243408, -0.00017210841178894043, -0.00012825429439544678, -8.440017700195312e-05, -4.054605960845947e-05, 3.3080577850341797e-06, 4.716217517852783e-05, 9.101629257202148e-05, 0.00013487040996551514, 0.0001787245273590088, 0.00022257864475250244, 0.0002664327621459961, 0.00031028687953948975, 0.0003541409969329834, 0.00039799511432647705, 0.0004418492317199707, 0.00048570334911346436, 0.000529557466506958, 0.0005734115839004517, 0.0006172657012939453, 0.000661119818687439, 0.0007049739360809326, 0.0007488280534744263, 0.0007926821708679199, 0.0008365362882614136, 0.0008803904056549072, 0.0009242445230484009, 0.0009680986404418945, 0.0010119527578353882, 0.0010558068752288818, 0.0010996609926223755, 0.0011435151100158691, 0.0011873692274093628, 0.0012312233448028564, 0.00127507746219635, 0.0013189315795898438]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 3.0, 11.0, 8.0, 14.0, 17.0, 20.0, 30.0, 54.0, 76.0, 166.0, 307.0, 777.0, 628817.0, 416846.0, 689.0, 278.0, 161.0, 85.0, 58.0, 41.0, 19.0, 13.0, 18.0, 10.0, 14.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026947021484375, -0.0260772705078125, -0.02520751953125, -0.0243377685546875, -0.023468017578125, -0.0225982666015625, -0.021728515625, -0.0208587646484375, -0.019989013671875, -0.0191192626953125, -0.01824951171875, -0.0173797607421875, -0.016510009765625, -0.0156402587890625, -0.0147705078125, -0.0139007568359375, -0.013031005859375, -0.0121612548828125, -0.01129150390625, -0.0104217529296875, -0.009552001953125, -0.0086822509765625, -0.0078125, -0.0069427490234375, -0.006072998046875, -0.0052032470703125, -0.00433349609375, -0.0034637451171875, -0.002593994140625, -0.0017242431640625, -0.0008544921875, 1.52587890625e-05, 0.000885009765625, 0.0017547607421875, 0.00262451171875, 0.0034942626953125, 0.004364013671875, 0.0052337646484375, 0.006103515625, 0.0069732666015625, 0.007843017578125, 0.0087127685546875, 0.00958251953125, 0.0104522705078125, 0.011322021484375, 0.0121917724609375, 0.0130615234375, 0.0139312744140625, 0.014801025390625, 0.0156707763671875, 0.01654052734375, 0.0174102783203125, 0.018280029296875, 0.0191497802734375, 0.02001953125, 0.0208892822265625, 0.021759033203125, 0.0226287841796875, 0.02349853515625, 0.0243682861328125, 0.025238037109375, 0.0261077880859375, 0.0269775390625, 0.0278472900390625, 0.028717041015625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 112.0, 829.0, 75.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006324330344796181, -0.00618203729391098, -0.006039744708687067, -0.0058974516578018665, -0.005755158606916666, -0.005612866021692753, -0.005470572970807552, -0.005328279919922352, -0.005185986869037151, -0.005043693818151951, -0.004901401232928038, -0.004759108182042837, -0.004616815131157637, -0.0044745225459337234, -0.004332229495048523, -0.0041899364441633224, -0.004047643858939409, -0.0039053510408848524, -0.003763057989999652, -0.003620765171945095, -0.0034784721210598946, -0.0033361793030053377, -0.003193886484950781, -0.0030515934340655804, -0.0029093006160110235, -0.0027670077979564667, -0.002624714747071266, -0.0024824219290167093, -0.0023401291109621525, -0.002197836060076952, -0.002055543242022395, -0.0019132503075525165, -0.0017709576059132814, -0.0016286646714434028, -0.001486371736973524, -0.0013440789189189672, -0.0012017859844490886, -0.00105949304997921, -0.0009172001737169921, -0.0007749072974547744, -0.0006326143629848957, -0.000490321428515017, -0.00034802855225279927, -0.00020573564688675106, -6.344274152070284e-05, 7.885019294917583e-05, 0.0002211430692113936, 0.00036343594547361135, 0.00050572887994349, 0.0006480218144133687, 0.0007903146906755865, 0.0009326075669378042, 0.001074900501407683, 0.0012171934358775616, 0.0013594862539321184, 0.001501779188401997, 0.0016440721228718758, 0.0017863650573417544, 0.0019286579918116331, 0.00207095080986619, 0.0022132438607513905, 0.0023555366788059473, 0.002497829496860504, 0.0026401225477457047, 0.0027824153658002615]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 10.0, 9.0, 9.0, 8.0, 15.0, 19.0, 18.0, 27.0, 17.0, 35.0, 32.0, 42.0, 26.0, 36.0, 40.0, 47.0, 48.0, 54.0, 38.0, 37.0, 44.0, 48.0, 31.0, 20.0, 30.0, 50.0, 29.0, 26.0, 28.0, 21.0, 15.0, 15.0, 15.0, 18.0, 8.0, 8.0, 12.0, 4.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0004774928092956543, -0.0004622172564268112, -0.00044694170355796814, -0.00043166615068912506, -0.000416390597820282, -0.0004011150449514389, -0.0003858394920825958, -0.00037056393921375275, -0.00035528838634490967, -0.0003400128334760666, -0.0003247372806072235, -0.00030946172773838043, -0.00029418617486953735, -0.0002789106220006943, -0.0002636350691318512, -0.0002483595162630081, -0.00023308396339416504, -0.00021780841052532196, -0.00020253285765647888, -0.0001872573047876358, -0.00017198175191879272, -0.00015670619904994965, -0.00014143064618110657, -0.0001261550933122635, -0.00011087954044342041, -9.560398757457733e-05, -8.032843470573425e-05, -6.505288183689117e-05, -4.9777328968048096e-05, -3.450177609920502e-05, -1.922622323036194e-05, -3.95067036151886e-06, 1.1324882507324219e-05, 2.6600435376167297e-05, 4.1875988245010376e-05, 5.7151541113853455e-05, 7.242709398269653e-05, 8.770264685153961e-05, 0.00010297819972038269, 0.00011825375258922577, 0.00013352930545806885, 0.00014880485832691193, 0.000164080411195755, 0.00017935596406459808, 0.00019463151693344116, 0.00020990706980228424, 0.00022518262267112732, 0.0002404581755399704, 0.0002557337284088135, 0.00027100928127765656, 0.00028628483414649963, 0.0003015603870153427, 0.0003168359398841858, 0.00033211149275302887, 0.00034738704562187195, 0.000362662598490715, 0.0003779381513595581, 0.0003932137042284012, 0.00040848925709724426, 0.00042376480996608734, 0.0004390403628349304, 0.0004543159157037735, 0.0004695914685726166, 0.00048486702144145966, 0.0005001425743103027]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 5.0, 7.0, 3.0, 2.0, 6.0, 9.0, 11.0, 16.0, 27.0, 26.0, 14.0, 33.0, 25.0, 35.0, 31.0, 40.0, 52.0, 47.0, 55.0, 45.0, 45.0, 62.0, 37.0, 43.0, 46.0, 47.0, 46.0, 30.0, 33.0, 28.0, 13.0, 15.0, 17.0, 16.0, 10.0, 6.0, 8.0, 8.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.703125, -7.42919921875, -7.1552734375, -6.88134765625, -6.607421875, -6.33349609375, -6.0595703125, -5.78564453125, -5.51171875, -5.23779296875, -4.9638671875, -4.68994140625, -4.416015625, -4.14208984375, -3.8681640625, -3.59423828125, -3.3203125, -3.04638671875, -2.7724609375, -2.49853515625, -2.224609375, -1.95068359375, -1.6767578125, -1.40283203125, -1.12890625, -0.85498046875, -0.5810546875, -0.30712890625, -0.033203125, 0.24072265625, 0.5146484375, 0.78857421875, 1.0625, 1.33642578125, 1.6103515625, 1.88427734375, 2.158203125, 2.43212890625, 2.7060546875, 2.97998046875, 3.25390625, 3.52783203125, 3.8017578125, 4.07568359375, 4.349609375, 4.62353515625, 4.8974609375, 5.17138671875, 5.4453125, 5.71923828125, 5.9931640625, 6.26708984375, 6.541015625, 6.81494140625, 7.0888671875, 7.36279296875, 7.63671875, 7.91064453125, 8.1845703125, 8.45849609375, 8.732421875, 9.00634765625, 9.2802734375, 9.55419921875, 9.828125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 5.0, 7.0, 4.0, 3.0, 6.0, 10.0, 18.0, 31.0, 40.0, 62.0, 83.0, 168.0, 290.0, 571.0, 1206.0, 2522.0, 6231.0, 17154.0, 58874.0, 263566.0, 523713.0, 123974.0, 32001.0, 10401.0, 4003.0, 1722.0, 882.0, 424.0, 241.0, 141.0, 56.0, 40.0, 36.0, 22.0, 17.0, 9.0, 9.0, 9.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.80078125, -4.63092041015625, -4.4610595703125, -4.29119873046875, -4.121337890625, -3.95147705078125, -3.7816162109375, -3.61175537109375, -3.44189453125, -3.27203369140625, -3.1021728515625, -2.93231201171875, -2.762451171875, -2.59259033203125, -2.4227294921875, -2.25286865234375, -2.0830078125, -1.91314697265625, -1.7432861328125, -1.57342529296875, -1.403564453125, -1.23370361328125, -1.0638427734375, -0.89398193359375, -0.72412109375, -0.55426025390625, -0.3843994140625, -0.21453857421875, -0.044677734375, 0.12518310546875, 0.2950439453125, 0.46490478515625, 0.634765625, 0.80462646484375, 0.9744873046875, 1.14434814453125, 1.314208984375, 1.48406982421875, 1.6539306640625, 1.82379150390625, 1.99365234375, 2.16351318359375, 2.3333740234375, 2.50323486328125, 2.673095703125, 2.84295654296875, 3.0128173828125, 3.18267822265625, 3.3525390625, 3.52239990234375, 3.6922607421875, 3.86212158203125, 4.031982421875, 4.20184326171875, 4.3717041015625, 4.54156494140625, 4.71142578125, 4.88128662109375, 5.0511474609375, 5.22100830078125, 5.390869140625, 5.56072998046875, 5.7305908203125, 5.90045166015625, 6.0703125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 6.0, 2.0, 9.0, 10.0, 13.0, 15.0, 23.0, 17.0, 23.0, 27.0, 29.0, 30.0, 32.0, 34.0, 42.0, 43.0, 52.0, 94.0, 1561.0, 469.0, 90.0, 51.0, 50.0, 45.0, 27.0, 34.0, 30.0, 21.0, 25.0, 26.0, 19.0, 13.0, 11.0, 15.0, 14.0, 9.0, 5.0, 4.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-24.1875, -23.32275390625, -22.4580078125, -21.59326171875, -20.728515625, -19.86376953125, -18.9990234375, -18.13427734375, -17.26953125, -16.40478515625, -15.5400390625, -14.67529296875, -13.810546875, -12.94580078125, -12.0810546875, -11.21630859375, -10.3515625, -9.48681640625, -8.6220703125, -7.75732421875, -6.892578125, -6.02783203125, -5.1630859375, -4.29833984375, -3.43359375, -2.56884765625, -1.7041015625, -0.83935546875, 0.025390625, 0.89013671875, 1.7548828125, 2.61962890625, 3.484375, 4.34912109375, 5.2138671875, 6.07861328125, 6.943359375, 7.80810546875, 8.6728515625, 9.53759765625, 10.40234375, 11.26708984375, 12.1318359375, 12.99658203125, 13.861328125, 14.72607421875, 15.5908203125, 16.45556640625, 17.3203125, 18.18505859375, 19.0498046875, 19.91455078125, 20.779296875, 21.64404296875, 22.5087890625, 23.37353515625, 24.23828125, 25.10302734375, 25.9677734375, 26.83251953125, 27.697265625, 28.56201171875, 29.4267578125, 30.29150390625, 31.15625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 8.0, 8.0, 11.0, 18.0, 18.0, 16.0, 24.0, 34.0, 32.0, 34.0, 62.0, 59.0, 109.0, 180.0, 342.0, 709.0, 4385.0, 2581564.0, 553358.0, 3175.0, 620.0, 293.0, 179.0, 118.0, 74.0, 49.0, 44.0, 37.0, 26.0, 18.0, 16.0, 21.0, 11.0, 11.0, 7.0, 2.0, 6.0, 6.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-52.71875, -51.251953125, -49.78515625, -48.318359375, -46.8515625, -45.384765625, -43.91796875, -42.451171875, -40.984375, -39.517578125, -38.05078125, -36.583984375, -35.1171875, -33.650390625, -32.18359375, -30.716796875, -29.25, -27.783203125, -26.31640625, -24.849609375, -23.3828125, -21.916015625, -20.44921875, -18.982421875, -17.515625, -16.048828125, -14.58203125, -13.115234375, -11.6484375, -10.181640625, -8.71484375, -7.248046875, -5.78125, -4.314453125, -2.84765625, -1.380859375, 0.0859375, 1.552734375, 3.01953125, 4.486328125, 5.953125, 7.419921875, 8.88671875, 10.353515625, 11.8203125, 13.287109375, 14.75390625, 16.220703125, 17.6875, 19.154296875, 20.62109375, 22.087890625, 23.5546875, 25.021484375, 26.48828125, 27.955078125, 29.421875, 30.888671875, 32.35546875, 33.822265625, 35.2890625, 36.755859375, 38.22265625, 39.689453125, 41.15625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 30.0, 432.0, 509.0, 43.0, 2.0, 0.0, 1.0], "bins": [-249.012939453125, -244.79678344726562, -240.5806121826172, -236.3644561767578, -232.14828491210938, -227.93212890625, -223.71597290039062, -219.4998016357422, -215.2836456298828, -211.06748962402344, -206.851318359375, -202.63516235351562, -198.4189910888672, -194.2028350830078, -189.98666381835938, -185.7705078125, -181.55435180664062, -177.33819580078125, -173.1220245361328, -168.90586853027344, -164.689697265625, -160.47354125976562, -156.25738525390625, -152.0412139892578, -147.82504272460938, -143.60888671875, -139.39271545410156, -135.1765594482422, -130.96038818359375, -126.74423217773438, -122.52806854248047, -118.31190490722656, -114.09574890136719, -109.87958526611328, -105.66342163085938, -101.447265625, -97.2311019897461, -93.01493835449219, -88.79877471923828, -84.58261108398438, -80.36644744873047, -76.15028381347656, -71.93412017822266, -67.71795654296875, -63.501800537109375, -59.28563690185547, -55.06947326660156, -50.853309631347656, -46.63715362548828, -42.420989990234375, -38.204830169677734, -33.98866653442383, -29.772504806518555, -25.55634307861328, -21.340179443359375, -17.1240177154541, -12.907854080200195, -8.691692352294922, -4.475529670715332, -0.2593669891357422, 3.9567947387695312, 8.172956466674805, 12.389120101928711, 16.605281829833984, 20.821443557739258]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 11.0, 9.0, 8.0, 12.0, 9.0, 6.0, 15.0, 21.0, 23.0, 23.0, 24.0, 24.0, 36.0, 37.0, 37.0, 39.0, 41.0, 37.0, 43.0, 29.0, 38.0, 31.0, 41.0, 40.0, 34.0, 31.0, 31.0, 36.0, 40.0, 32.0, 17.0, 19.0, 18.0, 19.0, 19.0, 14.0, 22.0, 8.0, 6.0, 6.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-80.9436264038086, -78.33077239990234, -75.71792602539062, -73.10507202148438, -70.49221801757812, -67.87936401367188, -65.26651763916016, -62.653663635253906, -60.04081344604492, -57.42796325683594, -54.81510925292969, -52.2022590637207, -49.58940887451172, -46.97655487060547, -44.363704681396484, -41.7508544921875, -39.13800048828125, -36.525150299072266, -33.912296295166016, -31.29944610595703, -28.686594009399414, -26.073741912841797, -23.460891723632812, -20.848039627075195, -18.235187530517578, -15.622335433959961, -13.00948429107666, -10.39663314819336, -7.783781051635742, -5.170928955078125, -2.558077812194824, 0.05477333068847656, 2.6676254272460938, 5.280477046966553, 7.893328666687012, 10.506179809570312, 13.11903190612793, 15.731884002685547, 18.34473419189453, 20.95758628845215, 23.570438385009766, 26.183290481567383, 28.796142578125, 31.408992767333984, 34.02184295654297, 36.63469696044922, 39.2475471496582, 41.86039733886719, 44.47325134277344, 47.08610153198242, 49.69895553588867, 52.311805725097656, 54.924659729003906, 57.53750991821289, 60.150360107421875, 62.763214111328125, 65.37606811523438, 67.98892211914062, 70.60176849365234, 73.2146224975586, 75.82747650146484, 78.44032287597656, 81.05317687988281, 83.66603088378906, 86.27887725830078]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 5.0, 2.0, 5.0, 4.0, 5.0, 2.0, 10.0, 14.0, 19.0, 15.0, 27.0, 25.0, 24.0, 36.0, 29.0, 32.0, 35.0, 51.0, 62.0, 41.0, 58.0, 41.0, 62.0, 31.0, 43.0, 54.0, 47.0, 41.0, 31.0, 28.0, 31.0, 14.0, 14.0, 21.0, 14.0, 8.0, 7.0, 8.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.90234375, -7.62066650390625, -7.3389892578125, -7.05731201171875, -6.775634765625, -6.49395751953125, -6.2122802734375, -5.93060302734375, -5.64892578125, -5.36724853515625, -5.0855712890625, -4.80389404296875, -4.522216796875, -4.24053955078125, -3.9588623046875, -3.67718505859375, -3.3955078125, -3.11383056640625, -2.8321533203125, -2.55047607421875, -2.268798828125, -1.98712158203125, -1.7054443359375, -1.42376708984375, -1.14208984375, -0.86041259765625, -0.5787353515625, -0.29705810546875, -0.015380859375, 0.26629638671875, 0.5479736328125, 0.82965087890625, 1.111328125, 1.39300537109375, 1.6746826171875, 1.95635986328125, 2.238037109375, 2.51971435546875, 2.8013916015625, 3.08306884765625, 3.36474609375, 3.64642333984375, 3.9281005859375, 4.20977783203125, 4.491455078125, 4.77313232421875, 5.0548095703125, 5.33648681640625, 5.6181640625, 5.89984130859375, 6.1815185546875, 6.46319580078125, 6.744873046875, 7.02655029296875, 7.3082275390625, 7.58990478515625, 7.87158203125, 8.15325927734375, 8.4349365234375, 8.71661376953125, 8.998291015625, 9.27996826171875, 9.5616455078125, 9.84332275390625, 10.125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 6.0, 10.0, 19.0, 11.0, 18.0, 25.0, 23.0, 24.0, 48.0, 76.0, 73.0, 148.0, 414.0, 1548.0, 15832.0, 523551.0, 3454944.0, 188055.0, 7724.0, 952.0, 296.0, 158.0, 77.0, 46.0, 47.0, 23.0, 26.0, 21.0, 12.0, 16.0, 14.0, 10.0, 9.0, 6.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.015625, -27.09326171875, -26.1708984375, -25.24853515625, -24.326171875, -23.40380859375, -22.4814453125, -21.55908203125, -20.63671875, -19.71435546875, -18.7919921875, -17.86962890625, -16.947265625, -16.02490234375, -15.1025390625, -14.18017578125, -13.2578125, -12.33544921875, -11.4130859375, -10.49072265625, -9.568359375, -8.64599609375, -7.7236328125, -6.80126953125, -5.87890625, -4.95654296875, -4.0341796875, -3.11181640625, -2.189453125, -1.26708984375, -0.3447265625, 0.57763671875, 1.5, 2.42236328125, 3.3447265625, 4.26708984375, 5.189453125, 6.11181640625, 7.0341796875, 7.95654296875, 8.87890625, 9.80126953125, 10.7236328125, 11.64599609375, 12.568359375, 13.49072265625, 14.4130859375, 15.33544921875, 16.2578125, 17.18017578125, 18.1025390625, 19.02490234375, 19.947265625, 20.86962890625, 21.7919921875, 22.71435546875, 23.63671875, 24.55908203125, 25.4814453125, 26.40380859375, 27.326171875, 28.24853515625, 29.1708984375, 30.09326171875, 31.015625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 5.0, 13.0, 6.0, 7.0, 9.0, 20.0, 23.0, 47.0, 46.0, 72.0, 74.0, 145.0, 175.0, 266.0, 357.0, 493.0, 598.0, 486.0, 367.0, 243.0, 183.0, 136.0, 77.0, 70.0, 45.0, 40.0, 25.0, 22.0, 7.0, 7.0, 5.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-31.140625, -30.3896484375, -29.638671875, -28.8876953125, -28.13671875, -27.3857421875, -26.634765625, -25.8837890625, -25.1328125, -24.3818359375, -23.630859375, -22.8798828125, -22.12890625, -21.3779296875, -20.626953125, -19.8759765625, -19.125, -18.3740234375, -17.623046875, -16.8720703125, -16.12109375, -15.3701171875, -14.619140625, -13.8681640625, -13.1171875, -12.3662109375, -11.615234375, -10.8642578125, -10.11328125, -9.3623046875, -8.611328125, -7.8603515625, -7.109375, -6.3583984375, -5.607421875, -4.8564453125, -4.10546875, -3.3544921875, -2.603515625, -1.8525390625, -1.1015625, -0.3505859375, 0.400390625, 1.1513671875, 1.90234375, 2.6533203125, 3.404296875, 4.1552734375, 4.90625, 5.6572265625, 6.408203125, 7.1591796875, 7.91015625, 8.6611328125, 9.412109375, 10.1630859375, 10.9140625, 11.6650390625, 12.416015625, 13.1669921875, 13.91796875, 14.6689453125, 15.419921875, 16.1708984375, 16.921875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 6.0, 5.0, 14.0, 16.0, 22.0, 29.0, 48.0, 59.0, 132.0, 183.0, 311.0, 582.0, 3509.0, 3543556.0, 642581.0, 2003.0, 482.0, 240.0, 161.0, 113.0, 66.0, 45.0, 39.0, 27.0, 18.0, 13.0, 8.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.6875, -96.1142578125, -92.541015625, -88.9677734375, -85.39453125, -81.8212890625, -78.248046875, -74.6748046875, -71.1015625, -67.5283203125, -63.955078125, -60.3818359375, -56.80859375, -53.2353515625, -49.662109375, -46.0888671875, -42.515625, -38.9423828125, -35.369140625, -31.7958984375, -28.22265625, -24.6494140625, -21.076171875, -17.5029296875, -13.9296875, -10.3564453125, -6.783203125, -3.2099609375, 0.36328125, 3.9365234375, 7.509765625, 11.0830078125, 14.65625, 18.2294921875, 21.802734375, 25.3759765625, 28.94921875, 32.5224609375, 36.095703125, 39.6689453125, 43.2421875, 46.8154296875, 50.388671875, 53.9619140625, 57.53515625, 61.1083984375, 64.681640625, 68.2548828125, 71.828125, 75.4013671875, 78.974609375, 82.5478515625, 86.12109375, 89.6943359375, 93.267578125, 96.8408203125, 100.4140625, 103.9873046875, 107.560546875, 111.1337890625, 114.70703125, 118.2802734375, 121.853515625, 125.4267578125, 129.0]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 17.0, 110.0, 313.0, 376.0, 156.0, 36.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-252.63304138183594, -244.53671264648438, -236.4403839111328, -228.34405517578125, -220.24771118164062, -212.15139770507812, -204.0550537109375, -195.95872497558594, -187.86239624023438, -179.7660675048828, -171.66973876953125, -163.5734100341797, -155.47708129882812, -147.3807373046875, -139.28440856933594, -131.18807983398438, -123.09175109863281, -114.99542236328125, -106.89909362792969, -98.8027572631836, -90.70642852783203, -82.61009979248047, -74.51376342773438, -66.41743469238281, -58.32110595703125, -50.22477722167969, -42.12844467163086, -34.03211212158203, -25.93578338623047, -17.839454650878906, -9.743122100830078, -1.64678955078125, 6.449554443359375, 14.54588508605957, 22.642215728759766, 30.73854637145996, 38.834877014160156, 46.93120574951172, 55.02753829956055, 63.123870849609375, 71.22019958496094, 79.3165283203125, 87.41285705566406, 95.50919342041016, 103.60552215576172, 111.70185089111328, 119.79818725585938, 127.89451599121094, 135.9908447265625, 144.08717346191406, 152.18350219726562, 160.2798309326172, 168.37615966796875, 176.47250366210938, 184.56883239746094, 192.6651611328125, 200.76148986816406, 208.85781860351562, 216.9541473388672, 225.05047607421875, 233.14682006835938, 241.24313354492188, 249.3394775390625, 257.435791015625, 265.5321350097656]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 7.0, 13.0, 12.0, 18.0, 21.0, 11.0, 22.0, 17.0, 31.0, 36.0, 32.0, 39.0, 36.0, 29.0, 48.0, 38.0, 35.0, 45.0, 34.0, 49.0, 40.0, 32.0, 40.0, 32.0, 25.0, 30.0, 37.0, 28.0, 28.0, 19.0, 20.0, 12.0, 13.0, 7.0, 12.0, 7.0, 8.0, 2.0, 6.0, 4.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0], "bins": [-80.74872589111328, -78.43477630615234, -76.12081909179688, -73.80686950683594, -71.492919921875, -69.17897033691406, -66.8650131225586, -64.55106353759766, -62.23711013793945, -59.92315673828125, -57.60920715332031, -55.29525375366211, -52.981300354003906, -50.66735076904297, -48.353397369384766, -46.03944396972656, -43.725494384765625, -41.41154098510742, -39.097591400146484, -36.78363800048828, -34.469688415527344, -32.15573501586914, -29.841781616210938, -27.527830123901367, -25.213878631591797, -22.899927139282227, -20.585975646972656, -18.272022247314453, -15.958070755004883, -13.644119262695312, -11.330166816711426, -9.016214370727539, -6.7022552490234375, -4.388303279876709, -2.0743513107299805, 0.23960065841674805, 2.5535526275634766, 4.867504119873047, 7.181456565856934, 9.49540901184082, 11.80936050415039, 14.123311996459961, 16.43726348876953, 18.751216888427734, 21.065168380737305, 23.379119873046875, 25.693073272705078, 28.00702476501465, 30.32097625732422, 32.63492965698242, 34.94887924194336, 37.26283264160156, 39.5767822265625, 41.8907356262207, 44.204689025878906, 46.518638610839844, 48.83259201049805, 51.14654541015625, 53.46049499511719, 55.77444839477539, 58.088401794433594, 60.40235137939453, 62.716304779052734, 65.03025817871094, 67.34420776367188]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 3.0, 9.0, 12.0, 12.0, 16.0, 19.0, 27.0, 23.0, 33.0, 43.0, 35.0, 32.0, 45.0, 45.0, 53.0, 46.0, 52.0, 55.0, 54.0, 46.0, 44.0, 36.0, 34.0, 42.0, 38.0, 26.0, 24.0, 15.0, 12.0, 15.0, 11.0, 12.0, 8.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1640625, -7.8782958984375, -7.592529296875, -7.3067626953125, -7.02099609375, -6.7352294921875, -6.449462890625, -6.1636962890625, -5.8779296875, -5.5921630859375, -5.306396484375, -5.0206298828125, -4.73486328125, -4.4490966796875, -4.163330078125, -3.8775634765625, -3.591796875, -3.3060302734375, -3.020263671875, -2.7344970703125, -2.44873046875, -2.1629638671875, -1.877197265625, -1.5914306640625, -1.3056640625, -1.0198974609375, -0.734130859375, -0.4483642578125, -0.16259765625, 0.1231689453125, 0.408935546875, 0.6947021484375, 0.98046875, 1.2662353515625, 1.552001953125, 1.8377685546875, 2.12353515625, 2.4093017578125, 2.695068359375, 2.9808349609375, 3.2666015625, 3.5523681640625, 3.838134765625, 4.1239013671875, 4.40966796875, 4.6954345703125, 4.981201171875, 5.2669677734375, 5.552734375, 5.8385009765625, 6.124267578125, 6.4100341796875, 6.69580078125, 6.9815673828125, 7.267333984375, 7.5531005859375, 7.8388671875, 8.1246337890625, 8.410400390625, 8.6961669921875, 8.98193359375, 9.2677001953125, 9.553466796875, 9.8392333984375, 10.125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 0.0, 8.0, 7.0, 11.0, 20.0, 25.0, 26.0, 42.0, 68.0, 87.0, 109.0, 182.0, 227.0, 327.0, 476.0, 733.0, 1097.0, 1608.0, 2330.0, 3581.0, 5507.0, 8824.0, 14379.0, 23695.0, 40481.0, 71717.0, 138492.0, 344952.0, 181402.0, 86274.0, 48311.0, 27891.0, 16367.0, 10510.0, 6391.0, 4123.0, 2607.0, 1756.0, 1243.0, 815.0, 580.0, 387.0, 278.0, 187.0, 124.0, 106.0, 51.0, 49.0, 24.0, 21.0, 19.0, 11.0, 9.0, 7.0, 1.0, 5.0, 2.0, 3.0, 2.0, 1.0], "bins": [-1.748046875, -1.6928253173828125, -1.637603759765625, -1.5823822021484375, -1.52716064453125, -1.4719390869140625, -1.416717529296875, -1.3614959716796875, -1.3062744140625, -1.2510528564453125, -1.195831298828125, -1.1406097412109375, -1.08538818359375, -1.0301666259765625, -0.974945068359375, -0.9197235107421875, -0.864501953125, -0.8092803955078125, -0.754058837890625, -0.6988372802734375, -0.64361572265625, -0.5883941650390625, -0.533172607421875, -0.4779510498046875, -0.4227294921875, -0.3675079345703125, -0.312286376953125, -0.2570648193359375, -0.20184326171875, -0.1466217041015625, -0.091400146484375, -0.0361785888671875, 0.01904296875, 0.0742645263671875, 0.129486083984375, 0.1847076416015625, 0.23992919921875, 0.2951507568359375, 0.350372314453125, 0.4055938720703125, 0.4608154296875, 0.5160369873046875, 0.571258544921875, 0.6264801025390625, 0.68170166015625, 0.7369232177734375, 0.792144775390625, 0.8473663330078125, 0.902587890625, 0.9578094482421875, 1.013031005859375, 1.0682525634765625, 1.12347412109375, 1.1786956787109375, 1.233917236328125, 1.2891387939453125, 1.3443603515625, 1.3995819091796875, 1.454803466796875, 1.5100250244140625, 1.56524658203125, 1.6204681396484375, 1.675689697265625, 1.7309112548828125, 1.7861328125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 4.0, 7.0, 7.0, 7.0, 14.0, 16.0, 16.0, 13.0, 25.0, 18.0, 26.0, 30.0, 40.0, 35.0, 28.0, 50.0, 31.0, 48.0, 29.0, 33.0, 1067.0, 32.0, 43.0, 30.0, 38.0, 38.0, 38.0, 39.0, 30.0, 27.0, 21.0, 25.0, 23.0, 22.0, 15.0, 11.0, 6.0, 8.0, 6.0, 5.0, 4.0, 9.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-5.30078125, -5.14373779296875, -4.9866943359375, -4.82965087890625, -4.672607421875, -4.51556396484375, -4.3585205078125, -4.20147705078125, -4.04443359375, -3.88739013671875, -3.7303466796875, -3.57330322265625, -3.416259765625, -3.25921630859375, -3.1021728515625, -2.94512939453125, -2.7880859375, -2.63104248046875, -2.4739990234375, -2.31695556640625, -2.159912109375, -2.00286865234375, -1.8458251953125, -1.68878173828125, -1.53173828125, -1.37469482421875, -1.2176513671875, -1.06060791015625, -0.903564453125, -0.74652099609375, -0.5894775390625, -0.43243408203125, -0.275390625, -0.11834716796875, 0.0386962890625, 0.19573974609375, 0.352783203125, 0.50982666015625, 0.6668701171875, 0.82391357421875, 0.98095703125, 1.13800048828125, 1.2950439453125, 1.45208740234375, 1.609130859375, 1.76617431640625, 1.9232177734375, 2.08026123046875, 2.2373046875, 2.39434814453125, 2.5513916015625, 2.70843505859375, 2.865478515625, 3.02252197265625, 3.1795654296875, 3.33660888671875, 3.49365234375, 3.65069580078125, 3.8077392578125, 3.96478271484375, 4.121826171875, 4.27886962890625, 4.4359130859375, 4.59295654296875, 4.75]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 6.0, 6.0, 6.0, 8.0, 14.0, 15.0, 43.0, 51.0, 68.0, 90.0, 129.0, 214.0, 300.0, 473.0, 651.0, 1034.0, 1575.0, 2375.0, 3502.0, 5463.0, 8500.0, 13369.0, 21011.0, 33592.0, 55175.0, 95893.0, 201875.0, 1349092.0, 122989.0, 67952.0, 40652.0, 25376.0, 15901.0, 10227.0, 6663.0, 4400.0, 2779.0, 1915.0, 1219.0, 862.0, 528.0, 361.0, 251.0, 154.0, 111.0, 100.0, 52.0, 39.0, 24.0, 15.0, 15.0, 7.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4208984375, -1.37384033203125, -1.3267822265625, -1.27972412109375, -1.232666015625, -1.18560791015625, -1.1385498046875, -1.09149169921875, -1.04443359375, -0.99737548828125, -0.9503173828125, -0.90325927734375, -0.856201171875, -0.80914306640625, -0.7620849609375, -0.71502685546875, -0.66796875, -0.62091064453125, -0.5738525390625, -0.52679443359375, -0.479736328125, -0.43267822265625, -0.3856201171875, -0.33856201171875, -0.29150390625, -0.24444580078125, -0.1973876953125, -0.15032958984375, -0.103271484375, -0.05621337890625, -0.0091552734375, 0.03790283203125, 0.0849609375, 0.13201904296875, 0.1790771484375, 0.22613525390625, 0.273193359375, 0.32025146484375, 0.3673095703125, 0.41436767578125, 0.46142578125, 0.50848388671875, 0.5555419921875, 0.60260009765625, 0.649658203125, 0.69671630859375, 0.7437744140625, 0.79083251953125, 0.837890625, 0.88494873046875, 0.9320068359375, 0.97906494140625, 1.026123046875, 1.07318115234375, 1.1202392578125, 1.16729736328125, 1.21435546875, 1.26141357421875, 1.3084716796875, 1.35552978515625, 1.402587890625, 1.44964599609375, 1.4967041015625, 1.54376220703125, 1.5908203125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 5.0, 3.0, 5.0, 4.0, 8.0, 7.0, 8.0, 4.0, 15.0, 11.0, 14.0, 21.0, 23.0, 27.0, 30.0, 41.0, 37.0, 51.0, 57.0, 61.0, 68.0, 50.0, 72.0, 56.0, 43.0, 39.0, 32.0, 26.0, 21.0, 29.0, 30.0, 13.0, 20.0, 13.0, 10.0, 13.0, 6.0, 6.0, 7.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0008687973022460938, -0.0008419007062911987, -0.0008150041103363037, -0.0007881075143814087, -0.0007612109184265137, -0.0007343143224716187, -0.0007074177265167236, -0.0006805211305618286, -0.0006536245346069336, -0.0006267279386520386, -0.0005998313426971436, -0.0005729347467422485, -0.0005460381507873535, -0.0005191415548324585, -0.0004922449588775635, -0.00046534836292266846, -0.00043845176696777344, -0.0004115551710128784, -0.0003846585750579834, -0.0003577619791030884, -0.00033086538314819336, -0.00030396878719329834, -0.0002770721912384033, -0.0002501755952835083, -0.00022327899932861328, -0.00019638240337371826, -0.00016948580741882324, -0.00014258921146392822, -0.0001156926155090332, -8.879601955413818e-05, -6.189942359924316e-05, -3.5002827644348145e-05, -8.106231689453125e-06, 1.8790364265441895e-05, 4.5686960220336914e-05, 7.258355617523193e-05, 9.948015213012695e-05, 0.00012637674808502197, 0.000153273344039917, 0.000180169939994812, 0.00020706653594970703, 0.00023396313190460205, 0.00026085972785949707, 0.0002877563238143921, 0.0003146529197692871, 0.00034154951572418213, 0.00036844611167907715, 0.00039534270763397217, 0.0004222393035888672, 0.0004491358995437622, 0.0004760324954986572, 0.0005029290914535522, 0.0005298256874084473, 0.0005567222833633423, 0.0005836188793182373, 0.0006105154752731323, 0.0006374120712280273, 0.0006643086671829224, 0.0006912052631378174, 0.0007181018590927124, 0.0007449984550476074, 0.0007718950510025024, 0.0007987916469573975, 0.0008256882429122925, 0.0008525848388671875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 2.0, 5.0, 15.0, 9.0, 14.0, 8.0, 21.0, 18.0, 25.0, 31.0, 44.0, 50.0, 63.0, 119.0, 182.0, 371.0, 1163.0, 866085.0, 178564.0, 804.0, 342.0, 170.0, 110.0, 70.0, 61.0, 28.0, 30.0, 23.0, 18.0, 14.0, 20.0, 5.0, 12.0, 8.0, 10.0, 9.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0208587646484375, -0.020204782485961914, -0.019550800323486328, -0.018896818161010742, -0.018242835998535156, -0.01758885383605957, -0.016934871673583984, -0.0162808895111084, -0.015626907348632812, -0.014972925186157227, -0.01431894302368164, -0.013664960861206055, -0.013010978698730469, -0.012356996536254883, -0.011703014373779297, -0.011049032211303711, -0.010395050048828125, -0.009741067886352539, -0.009087085723876953, -0.008433103561401367, -0.007779121398925781, -0.007125139236450195, -0.006471157073974609, -0.0058171749114990234, -0.0051631927490234375, -0.0045092105865478516, -0.0038552284240722656, -0.0032012462615966797, -0.0025472640991210938, -0.0018932819366455078, -0.0012392997741699219, -0.0005853176116943359, 6.866455078125e-05, 0.0007226467132568359, 0.0013766288757324219, 0.002030611038208008, 0.0026845932006835938, 0.0033385753631591797, 0.003992557525634766, 0.0046465396881103516, 0.0053005218505859375, 0.0059545040130615234, 0.006608486175537109, 0.007262468338012695, 0.007916450500488281, 0.008570432662963867, 0.009224414825439453, 0.009878396987915039, 0.010532379150390625, 0.011186361312866211, 0.011840343475341797, 0.012494325637817383, 0.013148307800292969, 0.013802289962768555, 0.01445627212524414, 0.015110254287719727, 0.015764236450195312, 0.0164182186126709, 0.017072200775146484, 0.01772618293762207, 0.018380165100097656, 0.019034147262573242, 0.019688129425048828, 0.020342111587524414, 0.02099609375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 19.0, 249.0, 555.0, 169.0, 22.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016488254768773913, -0.0015681134536862373, -0.0014874013140797615, -0.0014066892908886075, -0.0013259772676974535, -0.0012452651280909777, -0.0011645531048998237, -0.0010838410817086697, -0.0010031289421021938, -0.0009224168607033789, -0.0008417048375122249, -0.00076099275611341, -0.000680280732922256, -0.0005995686515234411, -0.0005188565701246262, -0.00043814454693347216, -0.00035743252374231815, -0.0002767204714473337, -0.000196008404600434, -0.00011529633775353432, -3.458428545854986e-05, 4.61277668364346e-05, 0.00012683984823524952, 0.00020755187142640352, 0.00028826395282521844, 0.0003689760051202029, 0.00044968805741518736, 0.0005304001388140023, 0.0006111122202128172, 0.0006918242434039712, 0.0007725363248027861, 0.0008532483479939401, 0.0009339605458080769, 0.0010146725689992309, 0.0010953847086057067, 0.0011760967317968607, 0.0012568087549880147, 0.0013375207781791687, 0.0014182329177856445, 0.0014989449409767985, 0.0015796569641679525, 0.0016603689873591065, 0.0017410811269655824, 0.0018217931501567364, 0.0019025051733478904, 0.0019832171965390444, 0.00206392933614552, 0.0021446412429213524, 0.002225353382527828, 0.002306065522134304, 0.0023867774289101362, 0.002467489568516612, 0.002548201708123088, 0.00262891361489892, 0.002709625754505396, 0.0027903378941118717, 0.0028710500337183475, 0.0029517621733248234, 0.0030324740801006556, 0.0031131862197071314, 0.003193898359313607, 0.0032746102660894394, 0.0033553224056959152, 0.003436034545302391, 0.0035167464520782232]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 9.0, 9.0, 15.0, 13.0, 22.0, 16.0, 25.0, 27.0, 23.0, 32.0, 33.0, 36.0, 35.0, 45.0, 39.0, 45.0, 40.0, 32.0, 36.0, 45.0, 45.0, 43.0, 37.0, 34.0, 38.0, 24.0, 31.0, 23.0, 19.0, 24.0, 28.0, 12.0, 11.0, 11.0, 11.0, 6.0, 4.0, 4.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0004642605781555176, -0.00044866278767585754, -0.0004330649971961975, -0.0004174672067165375, -0.00040186941623687744, -0.0003862716257572174, -0.0003706738352775574, -0.00035507604479789734, -0.0003394782543182373, -0.00032388046383857727, -0.00030828267335891724, -0.0002926848828792572, -0.00027708709239959717, -0.00026148930191993713, -0.0002458915114402771, -0.00023029372096061707, -0.00021469593048095703, -0.000199098140001297, -0.00018350034952163696, -0.00016790255904197693, -0.0001523047685623169, -0.00013670697808265686, -0.00012110918760299683, -0.00010551139712333679, -8.991360664367676e-05, -7.431581616401672e-05, -5.871802568435669e-05, -4.3120235204696655e-05, -2.752244472503662e-05, -1.1924654245376587e-05, 3.6731362342834473e-06, 1.927092671394348e-05, 3.4868717193603516e-05, 5.046650767326355e-05, 6.606429815292358e-05, 8.166208863258362e-05, 9.725987911224365e-05, 0.00011285766959190369, 0.00012845546007156372, 0.00014405325055122375, 0.0001596510410308838, 0.00017524883151054382, 0.00019084662199020386, 0.0002064444124698639, 0.00022204220294952393, 0.00023763999342918396, 0.000253237783908844, 0.00026883557438850403, 0.00028443336486816406, 0.0003000311553478241, 0.00031562894582748413, 0.00033122673630714417, 0.0003468245267868042, 0.00036242231726646423, 0.00037802010774612427, 0.0003936178982257843, 0.00040921568870544434, 0.00042481347918510437, 0.0004404112696647644, 0.00045600906014442444, 0.00047160685062408447, 0.0004872046411037445, 0.0005028024315834045, 0.0005184002220630646, 0.0005339980125427246]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 3.0, 9.0, 12.0, 12.0, 16.0, 19.0, 27.0, 23.0, 33.0, 43.0, 35.0, 32.0, 45.0, 45.0, 53.0, 46.0, 52.0, 55.0, 54.0, 46.0, 44.0, 36.0, 34.0, 42.0, 38.0, 26.0, 24.0, 15.0, 12.0, 15.0, 11.0, 12.0, 8.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1640625, -7.8782958984375, -7.592529296875, -7.3067626953125, -7.02099609375, -6.7352294921875, -6.449462890625, -6.1636962890625, -5.8779296875, -5.5921630859375, -5.306396484375, -5.0206298828125, -4.73486328125, -4.4490966796875, -4.163330078125, -3.8775634765625, -3.591796875, -3.3060302734375, -3.020263671875, -2.7344970703125, -2.44873046875, -2.1629638671875, -1.877197265625, -1.5914306640625, -1.3056640625, -1.0198974609375, -0.734130859375, -0.4483642578125, -0.16259765625, 0.1231689453125, 0.408935546875, 0.6947021484375, 0.98046875, 1.2662353515625, 1.552001953125, 1.8377685546875, 2.12353515625, 2.4093017578125, 2.695068359375, 2.9808349609375, 3.2666015625, 3.5523681640625, 3.838134765625, 4.1239013671875, 4.40966796875, 4.6954345703125, 4.981201171875, 5.2669677734375, 5.552734375, 5.8385009765625, 6.124267578125, 6.4100341796875, 6.69580078125, 6.9815673828125, 7.267333984375, 7.5531005859375, 7.8388671875, 8.1246337890625, 8.410400390625, 8.6961669921875, 8.98193359375, 9.2677001953125, 9.553466796875, 9.8392333984375, 10.125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 6.0, 3.0, 7.0, 8.0, 18.0, 21.0, 26.0, 37.0, 46.0, 72.0, 95.0, 135.0, 211.0, 272.0, 386.0, 622.0, 848.0, 1189.0, 1856.0, 2774.0, 4187.0, 6789.0, 11578.0, 21715.0, 49457.0, 159915.0, 498707.0, 178773.0, 53400.0, 23070.0, 12025.0, 6897.0, 4459.0, 2912.0, 1951.0, 1248.0, 868.0, 604.0, 421.0, 304.0, 211.0, 127.0, 94.0, 67.0, 40.0, 29.0, 26.0, 18.0, 12.0, 8.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.4609375, -4.30462646484375, -4.1483154296875, -3.99200439453125, -3.835693359375, -3.67938232421875, -3.5230712890625, -3.36676025390625, -3.21044921875, -3.05413818359375, -2.8978271484375, -2.74151611328125, -2.585205078125, -2.42889404296875, -2.2725830078125, -2.11627197265625, -1.9599609375, -1.80364990234375, -1.6473388671875, -1.49102783203125, -1.334716796875, -1.17840576171875, -1.0220947265625, -0.86578369140625, -0.70947265625, -0.55316162109375, -0.3968505859375, -0.24053955078125, -0.084228515625, 0.07208251953125, 0.2283935546875, 0.38470458984375, 0.541015625, 0.69732666015625, 0.8536376953125, 1.00994873046875, 1.166259765625, 1.32257080078125, 1.4788818359375, 1.63519287109375, 1.79150390625, 1.94781494140625, 2.1041259765625, 2.26043701171875, 2.416748046875, 2.57305908203125, 2.7293701171875, 2.88568115234375, 3.0419921875, 3.19830322265625, 3.3546142578125, 3.51092529296875, 3.667236328125, 3.82354736328125, 3.9798583984375, 4.13616943359375, 4.29248046875, 4.44879150390625, 4.6051025390625, 4.76141357421875, 4.917724609375, 5.07403564453125, 5.2303466796875, 5.38665771484375, 5.54296875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 6.0, 11.0, 6.0, 6.0, 18.0, 16.0, 29.0, 19.0, 23.0, 38.0, 40.0, 26.0, 46.0, 46.0, 55.0, 84.0, 243.0, 1742.0, 119.0, 54.0, 65.0, 57.0, 48.0, 31.0, 40.0, 31.0, 20.0, 28.0, 21.0, 16.0, 11.0, 14.0, 7.0, 11.0, 4.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.171875, -30.175537109375, -29.17919921875, -28.182861328125, -27.1865234375, -26.190185546875, -25.19384765625, -24.197509765625, -23.201171875, -22.204833984375, -21.20849609375, -20.212158203125, -19.2158203125, -18.219482421875, -17.22314453125, -16.226806640625, -15.23046875, -14.234130859375, -13.23779296875, -12.241455078125, -11.2451171875, -10.248779296875, -9.25244140625, -8.256103515625, -7.259765625, -6.263427734375, -5.26708984375, -4.270751953125, -3.2744140625, -2.278076171875, -1.28173828125, -0.285400390625, 0.7109375, 1.707275390625, 2.70361328125, 3.699951171875, 4.6962890625, 5.692626953125, 6.68896484375, 7.685302734375, 8.681640625, 9.677978515625, 10.67431640625, 11.670654296875, 12.6669921875, 13.663330078125, 14.65966796875, 15.656005859375, 16.65234375, 17.648681640625, 18.64501953125, 19.641357421875, 20.6376953125, 21.634033203125, 22.63037109375, 23.626708984375, 24.623046875, 25.619384765625, 26.61572265625, 27.612060546875, 28.6083984375, 29.604736328125, 30.60107421875, 31.597412109375, 32.59375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 7.0, 1.0, 7.0, 6.0, 12.0, 11.0, 19.0, 15.0, 24.0, 20.0, 31.0, 38.0, 68.0, 76.0, 95.0, 177.0, 240.0, 504.0, 1419.0, 17883.0, 3076164.0, 45421.0, 2008.0, 571.0, 273.0, 160.0, 100.0, 90.0, 72.0, 40.0, 35.0, 29.0, 26.0, 14.0, 8.0, 12.0, 10.0, 9.0, 5.0, 6.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.78125, -56.978515625, -55.17578125, -53.373046875, -51.5703125, -49.767578125, -47.96484375, -46.162109375, -44.359375, -42.556640625, -40.75390625, -38.951171875, -37.1484375, -35.345703125, -33.54296875, -31.740234375, -29.9375, -28.134765625, -26.33203125, -24.529296875, -22.7265625, -20.923828125, -19.12109375, -17.318359375, -15.515625, -13.712890625, -11.91015625, -10.107421875, -8.3046875, -6.501953125, -4.69921875, -2.896484375, -1.09375, 0.708984375, 2.51171875, 4.314453125, 6.1171875, 7.919921875, 9.72265625, 11.525390625, 13.328125, 15.130859375, 16.93359375, 18.736328125, 20.5390625, 22.341796875, 24.14453125, 25.947265625, 27.75, 29.552734375, 31.35546875, 33.158203125, 34.9609375, 36.763671875, 38.56640625, 40.369140625, 42.171875, 43.974609375, 45.77734375, 47.580078125, 49.3828125, 51.185546875, 52.98828125, 54.791015625, 56.59375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 11.0, 22.0, 53.0, 122.0, 208.0, 199.0, 173.0, 109.0, 59.0, 21.0, 20.0, 7.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.68754959106445, -34.22761917114258, -32.7676887512207, -31.307756423950195, -29.84782600402832, -28.387895584106445, -26.927963256835938, -25.468032836914062, -24.008102416992188, -22.548171997070312, -21.088241577148438, -19.62830924987793, -18.168378829956055, -16.70844841003418, -15.248517036437988, -13.788585662841797, -12.328655242919922, -10.868724822998047, -9.408793449401855, -7.948862552642822, -6.488931655883789, -5.029000759124756, -3.5690698623657227, -2.1091384887695312, -0.6492080688476562, 0.810722827911377, 2.27065372467041, 3.7305846214294434, 5.190515518188477, 6.65044641494751, 8.110377311706543, 9.570308685302734, 11.030242919921875, 12.49017333984375, 13.950104713439941, 15.410036087036133, 16.869966506958008, 18.329896926879883, 19.78982925415039, 21.249759674072266, 22.70969009399414, 24.169620513916016, 25.62955093383789, 27.0894832611084, 28.549413681030273, 30.00934410095215, 31.469276428222656, 32.92920684814453, 34.389137268066406, 35.84906768798828, 37.308998107910156, 38.76892852783203, 40.228858947753906, 41.68879318237305, 43.14872360229492, 44.6086540222168, 46.06858444213867, 47.52851486206055, 48.98844528198242, 50.4483757019043, 51.90830993652344, 53.36824035644531, 54.82817077636719, 56.28810119628906, 57.74803161621094]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 9.0, 4.0, 5.0, 5.0, 12.0, 6.0, 17.0, 18.0, 9.0, 11.0, 22.0, 19.0, 26.0, 20.0, 44.0, 47.0, 44.0, 39.0, 40.0, 26.0, 38.0, 47.0, 40.0, 40.0, 37.0, 39.0, 31.0, 33.0, 33.0, 43.0, 31.0, 26.0, 17.0, 20.0, 22.0, 23.0, 12.0, 9.0, 14.0, 4.0, 5.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.5935287475586, -85.85505676269531, -83.11659240722656, -80.37812042236328, -77.6396484375, -74.90118408203125, -72.16271209716797, -69.42424011230469, -66.68577575683594, -63.94730758666992, -61.20883560180664, -58.470367431640625, -55.731895446777344, -52.99342727661133, -50.25495910644531, -47.51648712158203, -44.77801513671875, -42.039546966552734, -39.30107498168945, -36.56260681152344, -33.824134826660156, -31.08566665649414, -28.347198486328125, -25.608728408813477, -22.870258331298828, -20.13178825378418, -17.39331817626953, -14.654850006103516, -11.916379928588867, -9.177909851074219, -6.439441680908203, -3.7009716033935547, -0.9625091552734375, 1.7759604454040527, 4.514430046081543, 7.252899169921875, 9.991369247436523, 12.729839324951172, 15.468307495117188, 18.206777572631836, 20.945247650146484, 23.683717727661133, 26.42218780517578, 29.160655975341797, 31.899126052856445, 34.637596130371094, 37.37606430053711, 40.114532470703125, 42.853004455566406, 45.59147262573242, 48.3299446105957, 51.06841278076172, 53.806884765625, 56.545352935791016, 59.28382110595703, 62.02229309082031, 64.76075744628906, 67.49922943115234, 70.2376937866211, 72.97616577148438, 75.71463775634766, 78.45310974121094, 81.19157409667969, 83.93004608154297, 86.66851806640625]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 0.0, 6.0, 10.0, 10.0, 17.0, 21.0, 16.0, 27.0, 37.0, 28.0, 43.0, 32.0, 43.0, 40.0, 48.0, 45.0, 54.0, 59.0, 53.0, 51.0, 44.0, 43.0, 32.0, 40.0, 33.0, 38.0, 27.0, 18.0, 10.0, 17.0, 10.0, 15.0, 9.0, 4.0, 6.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4921875, -8.2005615234375, -7.908935546875, -7.6173095703125, -7.32568359375, -7.0340576171875, -6.742431640625, -6.4508056640625, -6.1591796875, -5.8675537109375, -5.575927734375, -5.2843017578125, -4.99267578125, -4.7010498046875, -4.409423828125, -4.1177978515625, -3.826171875, -3.5345458984375, -3.242919921875, -2.9512939453125, -2.65966796875, -2.3680419921875, -2.076416015625, -1.7847900390625, -1.4931640625, -1.2015380859375, -0.909912109375, -0.6182861328125, -0.32666015625, -0.0350341796875, 0.256591796875, 0.5482177734375, 0.83984375, 1.1314697265625, 1.423095703125, 1.7147216796875, 2.00634765625, 2.2979736328125, 2.589599609375, 2.8812255859375, 3.1728515625, 3.4644775390625, 3.756103515625, 4.0477294921875, 4.33935546875, 4.6309814453125, 4.922607421875, 5.2142333984375, 5.505859375, 5.7974853515625, 6.089111328125, 6.3807373046875, 6.67236328125, 6.9639892578125, 7.255615234375, 7.5472412109375, 7.8388671875, 8.1304931640625, 8.422119140625, 8.7137451171875, 9.00537109375, 9.2969970703125, 9.588623046875, 9.8802490234375, 10.171875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 7.0, 10.0, 15.0, 19.0, 30.0, 44.0, 55.0, 100.0, 144.0, 327.0, 522.0, 1000.0, 2058.0, 4838.0, 11836.0, 33825.0, 125036.0, 558639.0, 1600166.0, 1343766.0, 379135.0, 90931.0, 25894.0, 8774.0, 3621.0, 1610.0, 829.0, 428.0, 216.0, 131.0, 92.0, 66.0, 37.0, 23.0, 23.0, 11.0, 10.0, 5.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.953125, -10.6297607421875, -10.306396484375, -9.9830322265625, -9.65966796875, -9.3363037109375, -9.012939453125, -8.6895751953125, -8.3662109375, -8.0428466796875, -7.719482421875, -7.3961181640625, -7.07275390625, -6.7493896484375, -6.426025390625, -6.1026611328125, -5.779296875, -5.4559326171875, -5.132568359375, -4.8092041015625, -4.48583984375, -4.1624755859375, -3.839111328125, -3.5157470703125, -3.1923828125, -2.8690185546875, -2.545654296875, -2.2222900390625, -1.89892578125, -1.5755615234375, -1.252197265625, -0.9288330078125, -0.60546875, -0.2821044921875, 0.041259765625, 0.3646240234375, 0.68798828125, 1.0113525390625, 1.334716796875, 1.6580810546875, 1.9814453125, 2.3048095703125, 2.628173828125, 2.9515380859375, 3.27490234375, 3.5982666015625, 3.921630859375, 4.2449951171875, 4.568359375, 4.8917236328125, 5.215087890625, 5.5384521484375, 5.86181640625, 6.1851806640625, 6.508544921875, 6.8319091796875, 7.1552734375, 7.4786376953125, 7.802001953125, 8.1253662109375, 8.44873046875, 8.7720947265625, 9.095458984375, 9.4188232421875, 9.7421875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 7.0, 14.0, 16.0, 38.0, 35.0, 60.0, 78.0, 100.0, 162.0, 243.0, 287.0, 391.0, 520.0, 487.0, 411.0, 340.0, 250.0, 179.0, 132.0, 102.0, 64.0, 48.0, 30.0, 27.0, 20.0, 3.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.59375, -20.900146484375, -20.20654296875, -19.512939453125, -18.8193359375, -18.125732421875, -17.43212890625, -16.738525390625, -16.044921875, -15.351318359375, -14.65771484375, -13.964111328125, -13.2705078125, -12.576904296875, -11.88330078125, -11.189697265625, -10.49609375, -9.802490234375, -9.10888671875, -8.415283203125, -7.7216796875, -7.028076171875, -6.33447265625, -5.640869140625, -4.947265625, -4.253662109375, -3.56005859375, -2.866455078125, -2.1728515625, -1.479248046875, -0.78564453125, -0.092041015625, 0.6015625, 1.295166015625, 1.98876953125, 2.682373046875, 3.3759765625, 4.069580078125, 4.76318359375, 5.456787109375, 6.150390625, 6.843994140625, 7.53759765625, 8.231201171875, 8.9248046875, 9.618408203125, 10.31201171875, 11.005615234375, 11.69921875, 12.392822265625, 13.08642578125, 13.780029296875, 14.4736328125, 15.167236328125, 15.86083984375, 16.554443359375, 17.248046875, 17.941650390625, 18.63525390625, 19.328857421875, 20.0224609375, 20.716064453125, 21.40966796875, 22.103271484375, 22.796875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 9.0, 13.0, 18.0, 30.0, 44.0, 71.0, 93.0, 140.0, 258.0, 599.0, 4449.0, 3961132.0, 225208.0, 1300.0, 380.0, 192.0, 104.0, 77.0, 52.0, 30.0, 32.0, 14.0, 10.0, 7.0, 8.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.75, -103.04296875, -99.3359375, -95.62890625, -91.921875, -88.21484375, -84.5078125, -80.80078125, -77.09375, -73.38671875, -69.6796875, -65.97265625, -62.265625, -58.55859375, -54.8515625, -51.14453125, -47.4375, -43.73046875, -40.0234375, -36.31640625, -32.609375, -28.90234375, -25.1953125, -21.48828125, -17.78125, -14.07421875, -10.3671875, -6.66015625, -2.953125, 0.75390625, 4.4609375, 8.16796875, 11.875, 15.58203125, 19.2890625, 22.99609375, 26.703125, 30.41015625, 34.1171875, 37.82421875, 41.53125, 45.23828125, 48.9453125, 52.65234375, 56.359375, 60.06640625, 63.7734375, 67.48046875, 71.1875, 74.89453125, 78.6015625, 82.30859375, 86.015625, 89.72265625, 93.4296875, 97.13671875, 100.84375, 104.55078125, 108.2578125, 111.96484375, 115.671875, 119.37890625, 123.0859375, 126.79296875, 130.5]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 32.0, 125.0, 382.0, 339.0, 101.0, 27.0, 4.0, 0.0, 2.0], "bins": [-505.6151428222656, -496.8895263671875, -488.16387939453125, -479.4382629394531, -470.712646484375, -461.98699951171875, -453.2613830566406, -444.5357666015625, -435.81011962890625, -427.0845031738281, -418.3588562011719, -409.63323974609375, -400.9076232910156, -392.1820068359375, -383.45635986328125, -374.7307434082031, -366.005126953125, -357.2795104980469, -348.5538635253906, -339.8282470703125, -331.1026306152344, -322.37701416015625, -313.6513671875, -304.9257507324219, -296.20013427734375, -287.4745178222656, -278.7488708496094, -270.02325439453125, -261.2976379394531, -252.57200622558594, -243.84637451171875, -235.12075805664062, -226.3950958251953, -217.66946411132812, -208.94384765625, -200.2182159423828, -191.49258422851562, -182.7669677734375, -174.0413360595703, -165.31570434570312, -156.590087890625, -147.8644561767578, -139.1388397216797, -130.4132080078125, -121.68758392333984, -112.96195983886719, -104.236328125, -95.51070404052734, -86.78507995605469, -78.05945587158203, -69.33383178710938, -60.60820007324219, -51.88257598876953, -43.156951904296875, -34.43132400512695, -25.70569610595703, -16.98006820678711, -8.25444221496582, 0.47118377685546875, 9.196809768676758, 17.922435760498047, 26.648059844970703, 35.373687744140625, 44.09931564331055, 52.8249397277832]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 15.0, 12.0, 8.0, 16.0, 19.0, 28.0, 18.0, 25.0, 26.0, 32.0, 33.0, 45.0, 37.0, 48.0, 44.0, 40.0, 47.0, 47.0, 43.0, 49.0, 54.0, 39.0, 36.0, 31.0, 30.0, 26.0, 22.0, 27.0, 21.0, 15.0, 17.0, 15.0, 9.0, 8.0, 4.0, 4.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-76.72566223144531, -74.46015167236328, -72.19464111328125, -69.92913055419922, -67.66361999511719, -65.39810943603516, -63.13259506225586, -60.86708450317383, -58.6015739440918, -56.336063385009766, -54.070552825927734, -51.8050422668457, -49.539527893066406, -47.274017333984375, -45.008506774902344, -42.74299621582031, -40.47748565673828, -38.21197509765625, -35.94646453857422, -33.68095397949219, -31.415441513061523, -29.149930953979492, -26.884418487548828, -24.618907928466797, -22.353397369384766, -20.087886810302734, -17.822376251220703, -15.556863784790039, -13.291353225708008, -11.025842666625977, -8.760331153869629, -6.494819641113281, -4.229301452636719, -1.9637904167175293, 0.30172061920166016, 2.5672316551208496, 4.832742691040039, 7.09825325012207, 9.363764762878418, 11.629276275634766, 13.894786834716797, 16.160297393798828, 18.42580795288086, 20.691320419311523, 22.956830978393555, 25.222341537475586, 27.48785400390625, 29.75336456298828, 32.01887512207031, 34.284385681152344, 36.549896240234375, 38.815406799316406, 41.08091735839844, 43.34642791748047, 45.611942291259766, 47.8774528503418, 50.14296340942383, 52.40847396850586, 54.67398452758789, 56.93949508666992, 59.20500946044922, 61.47052001953125, 63.73603057861328, 66.00154113769531, 68.26705169677734]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 9.0, 8.0, 11.0, 13.0, 19.0, 36.0, 40.0, 32.0, 25.0, 40.0, 31.0, 40.0, 40.0, 52.0, 48.0, 54.0, 39.0, 50.0, 43.0, 52.0, 44.0, 50.0, 35.0, 30.0, 35.0, 17.0, 20.0, 14.0, 17.0, 16.0, 5.0, 5.0, 10.0, 4.0, 1.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6640625, -8.372314453125, -8.08056640625, -7.788818359375, -7.4970703125, -7.205322265625, -6.91357421875, -6.621826171875, -6.330078125, -6.038330078125, -5.74658203125, -5.454833984375, -5.1630859375, -4.871337890625, -4.57958984375, -4.287841796875, -3.99609375, -3.704345703125, -3.41259765625, -3.120849609375, -2.8291015625, -2.537353515625, -2.24560546875, -1.953857421875, -1.662109375, -1.370361328125, -1.07861328125, -0.786865234375, -0.4951171875, -0.203369140625, 0.08837890625, 0.380126953125, 0.671875, 0.963623046875, 1.25537109375, 1.547119140625, 1.8388671875, 2.130615234375, 2.42236328125, 2.714111328125, 3.005859375, 3.297607421875, 3.58935546875, 3.881103515625, 4.1728515625, 4.464599609375, 4.75634765625, 5.048095703125, 5.33984375, 5.631591796875, 5.92333984375, 6.215087890625, 6.5068359375, 6.798583984375, 7.09033203125, 7.382080078125, 7.673828125, 7.965576171875, 8.25732421875, 8.549072265625, 8.8408203125, 9.132568359375, 9.42431640625, 9.716064453125, 10.0078125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 9.0, 7.0, 11.0, 18.0, 36.0, 50.0, 65.0, 87.0, 139.0, 226.0, 289.0, 428.0, 636.0, 879.0, 1351.0, 2120.0, 3040.0, 4973.0, 7672.0, 12197.0, 19816.0, 32203.0, 53255.0, 95600.0, 220588.0, 316554.0, 115541.0, 62481.0, 36819.0, 22474.0, 14011.0, 8845.0, 5527.0, 3599.0, 2270.0, 1549.0, 983.0, 683.0, 455.0, 321.0, 233.0, 161.0, 113.0, 67.0, 50.0, 43.0, 27.0, 21.0, 14.0, 6.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0], "bins": [-1.7177734375, -1.6659393310546875, -1.614105224609375, -1.5622711181640625, -1.51043701171875, -1.4586029052734375, -1.406768798828125, -1.3549346923828125, -1.3031005859375, -1.2512664794921875, -1.199432373046875, -1.1475982666015625, -1.09576416015625, -1.0439300537109375, -0.992095947265625, -0.9402618408203125, -0.888427734375, -0.8365936279296875, -0.784759521484375, -0.7329254150390625, -0.68109130859375, -0.6292572021484375, -0.577423095703125, -0.5255889892578125, -0.4737548828125, -0.4219207763671875, -0.370086669921875, -0.3182525634765625, -0.26641845703125, -0.2145843505859375, -0.162750244140625, -0.1109161376953125, -0.05908203125, -0.0072479248046875, 0.044586181640625, 0.0964202880859375, 0.14825439453125, 0.2000885009765625, 0.251922607421875, 0.3037567138671875, 0.3555908203125, 0.4074249267578125, 0.459259033203125, 0.5110931396484375, 0.56292724609375, 0.6147613525390625, 0.666595458984375, 0.7184295654296875, 0.770263671875, 0.8220977783203125, 0.873931884765625, 0.9257659912109375, 0.97760009765625, 1.0294342041015625, 1.081268310546875, 1.1331024169921875, 1.1849365234375, 1.2367706298828125, 1.288604736328125, 1.3404388427734375, 1.39227294921875, 1.4441070556640625, 1.495941162109375, 1.5477752685546875, 1.599609375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 0.0, 2.0, 3.0, 5.0, 2.0, 3.0, 11.0, 12.0, 9.0, 16.0, 13.0, 12.0, 15.0, 33.0, 25.0, 27.0, 31.0, 34.0, 31.0, 35.0, 45.0, 39.0, 33.0, 34.0, 1069.0, 42.0, 44.0, 38.0, 29.0, 36.0, 32.0, 33.0, 23.0, 24.0, 21.0, 18.0, 12.0, 15.0, 22.0, 12.0, 19.0, 10.0, 13.0, 13.0, 9.0, 14.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0], "bins": [-4.65234375, -4.506591796875, -4.36083984375, -4.215087890625, -4.0693359375, -3.923583984375, -3.77783203125, -3.632080078125, -3.486328125, -3.340576171875, -3.19482421875, -3.049072265625, -2.9033203125, -2.757568359375, -2.61181640625, -2.466064453125, -2.3203125, -2.174560546875, -2.02880859375, -1.883056640625, -1.7373046875, -1.591552734375, -1.44580078125, -1.300048828125, -1.154296875, -1.008544921875, -0.86279296875, -0.717041015625, -0.5712890625, -0.425537109375, -0.27978515625, -0.134033203125, 0.01171875, 0.157470703125, 0.30322265625, 0.448974609375, 0.5947265625, 0.740478515625, 0.88623046875, 1.031982421875, 1.177734375, 1.323486328125, 1.46923828125, 1.614990234375, 1.7607421875, 1.906494140625, 2.05224609375, 2.197998046875, 2.34375, 2.489501953125, 2.63525390625, 2.781005859375, 2.9267578125, 3.072509765625, 3.21826171875, 3.364013671875, 3.509765625, 3.655517578125, 3.80126953125, 3.947021484375, 4.0927734375, 4.238525390625, 4.38427734375, 4.530029296875, 4.67578125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 11.0, 8.0, 9.0, 29.0, 35.0, 48.0, 66.0, 104.0, 160.0, 208.0, 335.0, 454.0, 679.0, 970.0, 1484.0, 2313.0, 3409.0, 5057.0, 7339.0, 10759.0, 16020.0, 24156.0, 38063.0, 61746.0, 111538.0, 1337385.0, 220575.0, 96741.0, 55013.0, 34500.0, 22721.0, 15085.0, 9954.0, 6691.0, 4460.0, 3049.0, 1894.0, 1332.0, 882.0, 582.0, 399.0, 266.0, 203.0, 132.0, 91.0, 37.0, 40.0, 29.0, 27.0, 11.0, 5.0, 11.0, 8.0, 2.0, 3.0, 3.0, 0.0, 2.0], "bins": [-1.4013671875, -1.357421875, -1.3134765625, -1.26953125, -1.2255859375, -1.181640625, -1.1376953125, -1.09375, -1.0498046875, -1.005859375, -0.9619140625, -0.91796875, -0.8740234375, -0.830078125, -0.7861328125, -0.7421875, -0.6982421875, -0.654296875, -0.6103515625, -0.56640625, -0.5224609375, -0.478515625, -0.4345703125, -0.390625, -0.3466796875, -0.302734375, -0.2587890625, -0.21484375, -0.1708984375, -0.126953125, -0.0830078125, -0.0390625, 0.0048828125, 0.048828125, 0.0927734375, 0.13671875, 0.1806640625, 0.224609375, 0.2685546875, 0.3125, 0.3564453125, 0.400390625, 0.4443359375, 0.48828125, 0.5322265625, 0.576171875, 0.6201171875, 0.6640625, 0.7080078125, 0.751953125, 0.7958984375, 0.83984375, 0.8837890625, 0.927734375, 0.9716796875, 1.015625, 1.0595703125, 1.103515625, 1.1474609375, 1.19140625, 1.2353515625, 1.279296875, 1.3232421875, 1.3671875, 1.4111328125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 6.0, 3.0, 7.0, 6.0, 13.0, 13.0, 14.0, 25.0, 24.0, 32.0, 37.0, 37.0, 52.0, 87.0, 71.0, 91.0, 73.0, 83.0, 64.0, 48.0, 37.0, 38.0, 28.0, 25.0, 18.0, 12.0, 8.0, 15.0, 10.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0009341239929199219, -0.0009048283100128174, -0.0008755326271057129, -0.0008462369441986084, -0.0008169412612915039, -0.0007876455783843994, -0.0007583498954772949, -0.0007290542125701904, -0.0006997585296630859, -0.0006704628467559814, -0.000641167163848877, -0.0006118714809417725, -0.000582575798034668, -0.0005532801151275635, -0.000523984432220459, -0.0004946887493133545, -0.00046539306640625, -0.0004360973834991455, -0.000406801700592041, -0.0003775060176849365, -0.00034821033477783203, -0.00031891465187072754, -0.00028961896896362305, -0.00026032328605651855, -0.00023102760314941406, -0.00020173192024230957, -0.00017243623733520508, -0.00014314055442810059, -0.0001138448715209961, -8.45491886138916e-05, -5.525350570678711e-05, -2.5957822799682617e-05, 3.337860107421875e-06, 3.263354301452637e-05, 6.192922592163086e-05, 9.122490882873535e-05, 0.00012052059173583984, 0.00014981627464294434, 0.00017911195755004883, 0.00020840764045715332, 0.0002377033233642578, 0.0002669990062713623, 0.0002962946891784668, 0.0003255903720855713, 0.0003548860549926758, 0.0003841817378997803, 0.00041347742080688477, 0.00044277310371398926, 0.00047206878662109375, 0.0005013644695281982, 0.0005306601524353027, 0.0005599558353424072, 0.0005892515182495117, 0.0006185472011566162, 0.0006478428840637207, 0.0006771385669708252, 0.0007064342498779297, 0.0007357299327850342, 0.0007650256156921387, 0.0007943212985992432, 0.0008236169815063477, 0.0008529126644134521, 0.0008822083473205566, 0.0009115040302276611, 0.0009407997131347656]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 10.0, 7.0, 12.0, 17.0, 24.0, 38.0, 50.0, 71.0, 120.0, 210.0, 438.0, 1368.0, 938913.0, 105617.0, 838.0, 348.0, 178.0, 96.0, 53.0, 39.0, 23.0, 22.0, 14.0, 15.0, 7.0, 4.0, 4.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0251312255859375, -0.024366140365600586, -0.023601055145263672, -0.022835969924926758, -0.022070884704589844, -0.02130579948425293, -0.020540714263916016, -0.0197756290435791, -0.019010543823242188, -0.018245458602905273, -0.01748037338256836, -0.016715288162231445, -0.01595020294189453, -0.015185117721557617, -0.014420032501220703, -0.013654947280883789, -0.012889862060546875, -0.012124776840209961, -0.011359691619873047, -0.010594606399536133, -0.009829521179199219, -0.009064435958862305, -0.00829935073852539, -0.0075342655181884766, -0.0067691802978515625, -0.0060040950775146484, -0.005239009857177734, -0.00447392463684082, -0.0037088394165039062, -0.002943754196166992, -0.002178668975830078, -0.001413583755493164, -0.00064849853515625, 0.00011658668518066406, 0.0008816719055175781, 0.0016467571258544922, 0.0024118423461914062, 0.0031769275665283203, 0.003942012786865234, 0.0047070980072021484, 0.0054721832275390625, 0.0062372684478759766, 0.007002353668212891, 0.007767438888549805, 0.008532524108886719, 0.009297609329223633, 0.010062694549560547, 0.010827779769897461, 0.011592864990234375, 0.012357950210571289, 0.013123035430908203, 0.013888120651245117, 0.014653205871582031, 0.015418291091918945, 0.01618337631225586, 0.016948461532592773, 0.017713546752929688, 0.0184786319732666, 0.019243717193603516, 0.02000880241394043, 0.020773887634277344, 0.021538972854614258, 0.022304058074951172, 0.023069143295288086, 0.023834228515625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 8.0, 23.0, 170.0, 421.0, 285.0, 88.0, 19.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00039740331703796983, -0.00032775328145362437, -0.0002581032458692789, -0.00018845321028493345, -0.00011880317470058799, -4.915313911624253e-05, 2.0496896468102932e-05, 9.014693205244839e-05, 0.00015979696763679385, 0.0002294470032211393, 0.00029909703880548477, 0.00036874707438983023, 0.0004383971099741757, 0.0005080471746623516, 0.0005776971811428666, 0.0006473471876233816, 0.0007169972523115575, 0.0007866473169997334, 0.0008562973234802485, 0.0009259473299607635, 0.0009955973364412785, 0.0010652474593371153, 0.0011348974658176303, 0.0012045474722981453, 0.0012741975951939821, 0.0013438476016744971, 0.0014134976081550121, 0.001483147731050849, 0.001552797737531364, 0.001622447744011879, 0.0016920978669077158, 0.0017617478733882308, 0.0018313978798687458, 0.0019010478863492608, 0.001970697892829776, 0.0020403480157256126, 0.002109997905790806, 0.0021796480286866426, 0.0022492981515824795, 0.0023189480416476727, 0.0023885981645435095, 0.0024582482874393463, 0.0025278981775045395, 0.0025975483004003763, 0.002667198423296213, 0.0027368483133614063, 0.002806498436257243, 0.0028761483263224363, 0.002945798449218273, 0.00301544857211411, 0.003085098462179303, 0.00315474858507514, 0.003224398475140333, 0.00329404859803617, 0.003363698720932007, 0.0034333486109972, 0.003502998733893037, 0.0035726488567888737, 0.003642298746854067, 0.0037119488697499037, 0.0037815989926457405, 0.0038512488827109337, 0.003920898772776127, 0.003990549128502607, 0.0040601990185678005]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 12.0, 12.0, 16.0, 14.0, 21.0, 21.0, 30.0, 24.0, 32.0, 28.0, 30.0, 30.0, 41.0, 32.0, 31.0, 37.0, 41.0, 47.0, 29.0, 43.0, 43.0, 37.0, 41.0, 30.0, 32.0, 30.0, 20.0, 31.0, 18.0, 23.0, 17.0, 19.0, 16.0, 15.0, 9.0, 4.0, 4.0, 8.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.00044715404510498047, -0.0004346594214439392, -0.00042216479778289795, -0.0004096701741218567, -0.00039717555046081543, -0.00038468092679977417, -0.0003721863031387329, -0.00035969167947769165, -0.0003471970558166504, -0.00033470243215560913, -0.00032220780849456787, -0.0003097131848335266, -0.00029721856117248535, -0.0002847239375114441, -0.00027222931385040283, -0.00025973469018936157, -0.0002472400665283203, -0.00023474544286727905, -0.0002222508192062378, -0.00020975619554519653, -0.00019726157188415527, -0.00018476694822311401, -0.00017227232456207275, -0.0001597777009010315, -0.00014728307723999023, -0.00013478845357894897, -0.00012229382991790771, -0.00010979920625686646, -9.73045825958252e-05, -8.480995893478394e-05, -7.231533527374268e-05, -5.9820711612701416e-05, -4.7326087951660156e-05, -3.4831464290618896e-05, -2.2336840629577637e-05, -9.842216968536377e-06, 2.652406692504883e-06, 1.5147030353546143e-05, 2.7641654014587402e-05, 4.013627767562866e-05, 5.263090133666992e-05, 6.512552499771118e-05, 7.762014865875244e-05, 9.01147723197937e-05, 0.00010260939598083496, 0.00011510401964187622, 0.00012759864330291748, 0.00014009326696395874, 0.000152587890625, 0.00016508251428604126, 0.00017757713794708252, 0.00019007176160812378, 0.00020256638526916504, 0.0002150610089302063, 0.00022755563259124756, 0.00024005025625228882, 0.0002525448799133301, 0.00026503950357437134, 0.0002775341272354126, 0.00029002875089645386, 0.0003025233745574951, 0.0003150179982185364, 0.00032751262187957764, 0.0003400072455406189, 0.00035250186920166016]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 9.0, 8.0, 11.0, 13.0, 19.0, 36.0, 40.0, 32.0, 25.0, 40.0, 31.0, 40.0, 40.0, 52.0, 48.0, 54.0, 39.0, 50.0, 43.0, 52.0, 44.0, 50.0, 35.0, 30.0, 35.0, 17.0, 20.0, 14.0, 17.0, 16.0, 5.0, 5.0, 10.0, 4.0, 1.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6640625, -8.372314453125, -8.08056640625, -7.788818359375, -7.4970703125, -7.205322265625, -6.91357421875, -6.621826171875, -6.330078125, -6.038330078125, -5.74658203125, -5.454833984375, -5.1630859375, -4.871337890625, -4.57958984375, -4.287841796875, -3.99609375, -3.704345703125, -3.41259765625, -3.120849609375, -2.8291015625, -2.537353515625, -2.24560546875, -1.953857421875, -1.662109375, -1.370361328125, -1.07861328125, -0.786865234375, -0.4951171875, -0.203369140625, 0.08837890625, 0.380126953125, 0.671875, 0.963623046875, 1.25537109375, 1.547119140625, 1.8388671875, 2.130615234375, 2.42236328125, 2.714111328125, 3.005859375, 3.297607421875, 3.58935546875, 3.881103515625, 4.1728515625, 4.464599609375, 4.75634765625, 5.048095703125, 5.33984375, 5.631591796875, 5.92333984375, 6.215087890625, 6.5068359375, 6.798583984375, 7.09033203125, 7.382080078125, 7.673828125, 7.965576171875, 8.25732421875, 8.549072265625, 8.8408203125, 9.132568359375, 9.42431640625, 9.716064453125, 10.0078125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 8.0, 12.0, 8.0, 20.0, 29.0, 38.0, 58.0, 106.0, 140.0, 225.0, 446.0, 775.0, 1564.0, 3091.0, 6929.0, 18139.0, 51951.0, 189971.0, 534639.0, 164897.0, 46672.0, 16265.0, 6500.0, 2944.0, 1389.0, 691.0, 369.0, 254.0, 133.0, 88.0, 66.0, 49.0, 28.0, 17.0, 15.0, 4.0, 6.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.26171875, -6.05609130859375, -5.8504638671875, -5.64483642578125, -5.439208984375, -5.23358154296875, -5.0279541015625, -4.82232666015625, -4.61669921875, -4.41107177734375, -4.2054443359375, -3.99981689453125, -3.794189453125, -3.58856201171875, -3.3829345703125, -3.17730712890625, -2.9716796875, -2.76605224609375, -2.5604248046875, -2.35479736328125, -2.149169921875, -1.94354248046875, -1.7379150390625, -1.53228759765625, -1.32666015625, -1.12103271484375, -0.9154052734375, -0.70977783203125, -0.504150390625, -0.29852294921875, -0.0928955078125, 0.11273193359375, 0.318359375, 0.52398681640625, 0.7296142578125, 0.93524169921875, 1.140869140625, 1.34649658203125, 1.5521240234375, 1.75775146484375, 1.96337890625, 2.16900634765625, 2.3746337890625, 2.58026123046875, 2.785888671875, 2.99151611328125, 3.1971435546875, 3.40277099609375, 3.6083984375, 3.81402587890625, 4.0196533203125, 4.22528076171875, 4.430908203125, 4.63653564453125, 4.8421630859375, 5.04779052734375, 5.25341796875, 5.45904541015625, 5.6646728515625, 5.87030029296875, 6.075927734375, 6.28155517578125, 6.4871826171875, 6.69281005859375, 6.8984375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 10.0, 8.0, 11.0, 9.0, 9.0, 13.0, 16.0, 14.0, 28.0, 18.0, 20.0, 28.0, 42.0, 35.0, 55.0, 45.0, 55.0, 78.0, 174.0, 1669.0, 174.0, 84.0, 70.0, 43.0, 45.0, 41.0, 42.0, 28.0, 28.0, 26.0, 21.0, 22.0, 12.0, 11.0, 15.0, 12.0, 5.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.140625, -24.257568359375, -23.37451171875, -22.491455078125, -21.6083984375, -20.725341796875, -19.84228515625, -18.959228515625, -18.076171875, -17.193115234375, -16.31005859375, -15.427001953125, -14.5439453125, -13.660888671875, -12.77783203125, -11.894775390625, -11.01171875, -10.128662109375, -9.24560546875, -8.362548828125, -7.4794921875, -6.596435546875, -5.71337890625, -4.830322265625, -3.947265625, -3.064208984375, -2.18115234375, -1.298095703125, -0.4150390625, 0.468017578125, 1.35107421875, 2.234130859375, 3.1171875, 4.000244140625, 4.88330078125, 5.766357421875, 6.6494140625, 7.532470703125, 8.41552734375, 9.298583984375, 10.181640625, 11.064697265625, 11.94775390625, 12.830810546875, 13.7138671875, 14.596923828125, 15.47998046875, 16.363037109375, 17.24609375, 18.129150390625, 19.01220703125, 19.895263671875, 20.7783203125, 21.661376953125, 22.54443359375, 23.427490234375, 24.310546875, 25.193603515625, 26.07666015625, 26.959716796875, 27.8427734375, 28.725830078125, 29.60888671875, 30.491943359375, 31.375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 14.0, 26.0, 39.0, 60.0, 104.0, 215.0, 450.0, 1935.0, 3080681.0, 60441.0, 1058.0, 313.0, 150.0, 71.0, 47.0, 36.0, 28.0, 15.0, 13.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-175.375, -171.0810546875, -166.787109375, -162.4931640625, -158.19921875, -153.9052734375, -149.611328125, -145.3173828125, -141.0234375, -136.7294921875, -132.435546875, -128.1416015625, -123.84765625, -119.5537109375, -115.259765625, -110.9658203125, -106.671875, -102.3779296875, -98.083984375, -93.7900390625, -89.49609375, -85.2021484375, -80.908203125, -76.6142578125, -72.3203125, -68.0263671875, -63.732421875, -59.4384765625, -55.14453125, -50.8505859375, -46.556640625, -42.2626953125, -37.96875, -33.6748046875, -29.380859375, -25.0869140625, -20.79296875, -16.4990234375, -12.205078125, -7.9111328125, -3.6171875, 0.6767578125, 4.970703125, 9.2646484375, 13.55859375, 17.8525390625, 22.146484375, 26.4404296875, 30.734375, 35.0283203125, 39.322265625, 43.6162109375, 47.91015625, 52.2041015625, 56.498046875, 60.7919921875, 65.0859375, 69.3798828125, 73.673828125, 77.9677734375, 82.26171875, 86.5556640625, 90.849609375, 95.1435546875, 99.4375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 6.0, 578.0, 431.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.53816223144531, -52.896820068359375, -42.25547790527344, -31.614131927490234, -20.972789764404297, -10.33144760131836, 0.30989837646484375, 10.951240539550781, 21.59258270263672, 32.233924865722656, 42.875267028808594, 53.5166130065918, 64.157958984375, 74.79930114746094, 85.44064331054688, 96.08198547363281, 106.72332763671875, 117.36466979980469, 128.00601196289062, 138.64735412597656, 149.2886962890625, 159.93003845214844, 170.57138061523438, 181.21273803710938, 191.85406494140625, 202.4954071044922, 213.13674926757812, 223.77809143066406, 234.41943359375, 245.06077575683594, 255.70211791992188, 266.3434753417969, 276.9848327636719, 287.6261901855469, 298.26751708984375, 308.90887451171875, 319.5502014160156, 330.1915588378906, 340.8328857421875, 351.4742431640625, 362.1155700683594, 372.7569274902344, 383.39825439453125, 394.03961181640625, 404.6809387207031, 415.3222961425781, 425.963623046875, 436.60498046875, 447.246337890625, 457.8876953125, 468.5290222167969, 479.1703796386719, 489.81170654296875, 500.45306396484375, 511.0943908691406, 521.7357177734375, 532.3770751953125, 543.0184326171875, 553.6597900390625, 564.3010864257812, 574.9424438476562, 585.5838012695312, 596.2251586914062, 606.866455078125, 617.5078125]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 9.0, 9.0, 9.0, 8.0, 8.0, 16.0, 9.0, 14.0, 11.0, 16.0, 23.0, 28.0, 23.0, 20.0, 21.0, 35.0, 29.0, 38.0, 29.0, 45.0, 31.0, 53.0, 34.0, 42.0, 29.0, 38.0, 38.0, 32.0, 30.0, 32.0, 38.0, 19.0, 25.0, 25.0, 19.0, 17.0, 15.0, 17.0, 18.0, 16.0, 6.0, 3.0, 10.0, 3.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-71.00201416015625, -68.90438842773438, -66.8067626953125, -64.70913696289062, -62.61151123046875, -60.513885498046875, -58.416255950927734, -56.31863021850586, -54.221004486083984, -52.12337875366211, -50.025753021240234, -47.92812728881836, -45.83049774169922, -43.732872009277344, -41.63524627685547, -39.537620544433594, -37.43999481201172, -35.342369079589844, -33.24474334716797, -31.14711570739746, -29.049489974975586, -26.95186424255371, -24.854236602783203, -22.756610870361328, -20.658985137939453, -18.561359405517578, -16.463733673095703, -14.366106033325195, -12.26848030090332, -10.170854568481445, -8.073227882385254, -5.9756011962890625, -3.877979278564453, -1.78035306930542, 0.3172731399536133, 2.4148993492126465, 4.51252555847168, 6.610151290893555, 8.707777976989746, 10.805404663085938, 12.903030395507812, 15.000656127929688, 17.098281860351562, 19.19590950012207, 21.293535232543945, 23.39116096496582, 25.488788604736328, 27.586414337158203, 29.684040069580078, 31.781665802001953, 33.87929153442383, 35.9769172668457, 38.074546813964844, 40.17217254638672, 42.269798278808594, 44.36742401123047, 46.465049743652344, 48.56267547607422, 50.660301208496094, 52.75792694091797, 54.855552673339844, 56.95317840576172, 59.05080795288086, 61.148433685302734, 63.24605941772461]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 6.0, 8.0, 4.0, 13.0, 14.0, 30.0, 26.0, 29.0, 31.0, 30.0, 25.0, 41.0, 40.0, 36.0, 54.0, 35.0, 46.0, 45.0, 48.0, 46.0, 44.0, 51.0, 44.0, 37.0, 33.0, 35.0, 19.0, 28.0, 22.0, 12.0, 16.0, 7.0, 11.0, 7.0, 8.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.406494140625, -8.11767578125, -7.828857421875, -7.5400390625, -7.251220703125, -6.96240234375, -6.673583984375, -6.384765625, -6.095947265625, -5.80712890625, -5.518310546875, -5.2294921875, -4.940673828125, -4.65185546875, -4.363037109375, -4.07421875, -3.785400390625, -3.49658203125, -3.207763671875, -2.9189453125, -2.630126953125, -2.34130859375, -2.052490234375, -1.763671875, -1.474853515625, -1.18603515625, -0.897216796875, -0.6083984375, -0.319580078125, -0.03076171875, 0.258056640625, 0.546875, 0.835693359375, 1.12451171875, 1.413330078125, 1.7021484375, 1.990966796875, 2.27978515625, 2.568603515625, 2.857421875, 3.146240234375, 3.43505859375, 3.723876953125, 4.0126953125, 4.301513671875, 4.59033203125, 4.879150390625, 5.16796875, 5.456787109375, 5.74560546875, 6.034423828125, 6.3232421875, 6.612060546875, 6.90087890625, 7.189697265625, 7.478515625, 7.767333984375, 8.05615234375, 8.344970703125, 8.6337890625, 8.922607421875, 9.21142578125, 9.500244140625, 9.7890625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 8.0, 11.0, 11.0, 11.0, 15.0, 28.0, 30.0, 39.0, 27.0, 40.0, 56.0, 102.0, 131.0, 244.0, 926.0, 27546.0, 3866458.0, 295240.0, 2354.0, 339.0, 185.0, 133.0, 83.0, 55.0, 26.0, 31.0, 28.0, 27.0, 15.0, 16.0, 10.0, 9.0, 10.0, 8.0, 4.0, 6.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.0, -45.4169921875, -43.833984375, -42.2509765625, -40.66796875, -39.0849609375, -37.501953125, -35.9189453125, -34.3359375, -32.7529296875, -31.169921875, -29.5869140625, -28.00390625, -26.4208984375, -24.837890625, -23.2548828125, -21.671875, -20.0888671875, -18.505859375, -16.9228515625, -15.33984375, -13.7568359375, -12.173828125, -10.5908203125, -9.0078125, -7.4248046875, -5.841796875, -4.2587890625, -2.67578125, -1.0927734375, 0.490234375, 2.0732421875, 3.65625, 5.2392578125, 6.822265625, 8.4052734375, 9.98828125, 11.5712890625, 13.154296875, 14.7373046875, 16.3203125, 17.9033203125, 19.486328125, 21.0693359375, 22.65234375, 24.2353515625, 25.818359375, 27.4013671875, 28.984375, 30.5673828125, 32.150390625, 33.7333984375, 35.31640625, 36.8994140625, 38.482421875, 40.0654296875, 41.6484375, 43.2314453125, 44.814453125, 46.3974609375, 47.98046875, 49.5634765625, 51.146484375, 52.7294921875, 54.3125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 9.0, 8.0, 10.0, 10.0, 18.0, 38.0, 51.0, 86.0, 94.0, 172.0, 241.0, 413.0, 532.0, 632.0, 505.0, 431.0, 273.0, 213.0, 120.0, 69.0, 49.0, 39.0, 22.0, 18.0, 12.0, 6.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.796875, -22.026123046875, -21.25537109375, -20.484619140625, -19.7138671875, -18.943115234375, -18.17236328125, -17.401611328125, -16.630859375, -15.860107421875, -15.08935546875, -14.318603515625, -13.5478515625, -12.777099609375, -12.00634765625, -11.235595703125, -10.46484375, -9.694091796875, -8.92333984375, -8.152587890625, -7.3818359375, -6.611083984375, -5.84033203125, -5.069580078125, -4.298828125, -3.528076171875, -2.75732421875, -1.986572265625, -1.2158203125, -0.445068359375, 0.32568359375, 1.096435546875, 1.8671875, 2.637939453125, 3.40869140625, 4.179443359375, 4.9501953125, 5.720947265625, 6.49169921875, 7.262451171875, 8.033203125, 8.803955078125, 9.57470703125, 10.345458984375, 11.1162109375, 11.886962890625, 12.65771484375, 13.428466796875, 14.19921875, 14.969970703125, 15.74072265625, 16.511474609375, 17.2822265625, 18.052978515625, 18.82373046875, 19.594482421875, 20.365234375, 21.135986328125, 21.90673828125, 22.677490234375, 23.4482421875, 24.218994140625, 24.98974609375, 25.760498046875, 26.53125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 10.0, 13.0, 6.0, 3.0, 20.0, 29.0, 28.0, 44.0, 53.0, 57.0, 84.0, 103.0, 162.0, 243.0, 362.0, 683.0, 1838.0, 38526.0, 4005184.0, 141776.0, 2969.0, 772.0, 388.0, 230.0, 161.0, 123.0, 71.0, 70.0, 54.0, 47.0, 43.0, 28.0, 22.0, 18.0, 16.0, 15.0, 7.0, 4.0, 5.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-77.125, -74.8310546875, -72.537109375, -70.2431640625, -67.94921875, -65.6552734375, -63.361328125, -61.0673828125, -58.7734375, -56.4794921875, -54.185546875, -51.8916015625, -49.59765625, -47.3037109375, -45.009765625, -42.7158203125, -40.421875, -38.1279296875, -35.833984375, -33.5400390625, -31.24609375, -28.9521484375, -26.658203125, -24.3642578125, -22.0703125, -19.7763671875, -17.482421875, -15.1884765625, -12.89453125, -10.6005859375, -8.306640625, -6.0126953125, -3.71875, -1.4248046875, 0.869140625, 3.1630859375, 5.45703125, 7.7509765625, 10.044921875, 12.3388671875, 14.6328125, 16.9267578125, 19.220703125, 21.5146484375, 23.80859375, 26.1025390625, 28.396484375, 30.6904296875, 32.984375, 35.2783203125, 37.572265625, 39.8662109375, 42.16015625, 44.4541015625, 46.748046875, 49.0419921875, 51.3359375, 53.6298828125, 55.923828125, 58.2177734375, 60.51171875, 62.8056640625, 65.099609375, 67.3935546875, 69.6875]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 16.0, 55.0, 144.0, 208.0, 243.0, 186.0, 106.0, 28.0, 14.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-202.00889587402344, -197.00038146972656, -191.99188232421875, -186.98336791992188, -181.974853515625, -176.9663543701172, -171.9578399658203, -166.9493408203125, -161.94082641601562, -156.93231201171875, -151.92381286621094, -146.91529846191406, -141.9067840576172, -136.89828491210938, -131.8897705078125, -126.88126373291016, -121.87274932861328, -116.86424255371094, -111.85572814941406, -106.84722137451172, -101.83871459960938, -96.8302001953125, -91.82169342041016, -86.81318664550781, -81.80467224121094, -76.7961654663086, -71.78765106201172, -66.77914428710938, -61.77063751220703, -56.76212692260742, -51.75361633300781, -46.74510955810547, -41.736595153808594, -36.728084564208984, -31.71957778930664, -26.71106719970703, -21.702558517456055, -16.694049835205078, -11.685539245605469, -6.677032470703125, -1.6685218811035156, 3.339987277984619, 8.348496437072754, 13.357006072998047, 18.365514755249023, 23.3740234375, 28.38253402709961, 33.39104080200195, 38.39955139160156, 43.40806198120117, 48.416568756103516, 53.425079345703125, 58.43358612060547, 63.44209671020508, 68.45060729980469, 73.45911407470703, 78.46762084960938, 83.47612762451172, 88.4846420288086, 93.49314880371094, 98.50165557861328, 103.51016235351562, 108.5186767578125, 113.52718353271484, 118.53569793701172]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 3.0, 5.0, 15.0, 9.0, 11.0, 14.0, 13.0, 13.0, 16.0, 19.0, 25.0, 28.0, 32.0, 25.0, 40.0, 29.0, 36.0, 52.0, 34.0, 43.0, 39.0, 40.0, 41.0, 36.0, 44.0, 46.0, 38.0, 29.0, 21.0, 31.0, 21.0, 20.0, 12.0, 16.0, 14.0, 20.0, 7.0, 16.0, 10.0, 12.0, 4.0, 2.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.48942184448242, -53.6074104309082, -51.72539520263672, -49.8433837890625, -47.96137237548828, -46.0793571472168, -44.19734573364258, -42.315330505371094, -40.433319091796875, -38.551307678222656, -36.66929244995117, -34.78728103637695, -32.90526580810547, -31.02325439453125, -29.14124298095703, -27.25922966003418, -25.377216339111328, -23.495203018188477, -21.613189697265625, -19.731178283691406, -17.849164962768555, -15.967151641845703, -14.085139274597168, -12.203126907348633, -10.321113586425781, -8.43910026550293, -6.5570878982543945, -4.675075054168701, -2.793062210083008, -0.9110488891601562, 0.9709634780883789, 2.852975845336914, 4.734992980957031, 6.617005825042725, 8.499018669128418, 10.381031036376953, 12.263044357299805, 14.145057678222656, 16.027069091796875, 17.909082412719727, 19.791095733642578, 21.67310905456543, 23.55512237548828, 25.4371337890625, 27.31914710998535, 29.201160430908203, 31.083171844482422, 32.965187072753906, 34.847198486328125, 36.729209899902344, 38.61122512817383, 40.49323654174805, 42.37525177001953, 44.25726318359375, 46.13927459716797, 48.02128601074219, 49.90330123901367, 51.78531265258789, 53.667327880859375, 55.549339294433594, 57.43135070800781, 59.3133659362793, 61.195377349853516, 63.077392578125, 64.95940399169922]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 1.0, 5.0, 6.0, 5.0, 2.0, 7.0, 10.0, 9.0, 14.0, 23.0, 24.0, 33.0, 29.0, 31.0, 35.0, 46.0, 29.0, 34.0, 43.0, 44.0, 42.0, 41.0, 55.0, 53.0, 44.0, 45.0, 31.0, 26.0, 40.0, 40.0, 35.0, 19.0, 18.0, 16.0, 15.0, 9.0, 10.0, 11.0, 9.0, 2.0, 6.0, 3.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0078125, -8.7197265625, -8.431640625, -8.1435546875, -7.85546875, -7.5673828125, -7.279296875, -6.9912109375, -6.703125, -6.4150390625, -6.126953125, -5.8388671875, -5.55078125, -5.2626953125, -4.974609375, -4.6865234375, -4.3984375, -4.1103515625, -3.822265625, -3.5341796875, -3.24609375, -2.9580078125, -2.669921875, -2.3818359375, -2.09375, -1.8056640625, -1.517578125, -1.2294921875, -0.94140625, -0.6533203125, -0.365234375, -0.0771484375, 0.2109375, 0.4990234375, 0.787109375, 1.0751953125, 1.36328125, 1.6513671875, 1.939453125, 2.2275390625, 2.515625, 2.8037109375, 3.091796875, 3.3798828125, 3.66796875, 3.9560546875, 4.244140625, 4.5322265625, 4.8203125, 5.1083984375, 5.396484375, 5.6845703125, 5.97265625, 6.2607421875, 6.548828125, 6.8369140625, 7.125, 7.4130859375, 7.701171875, 7.9892578125, 8.27734375, 8.5654296875, 8.853515625, 9.1416015625, 9.4296875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 10.0, 10.0, 17.0, 26.0, 24.0, 40.0, 73.0, 118.0, 212.0, 292.0, 474.0, 730.0, 1171.0, 1767.0, 2886.0, 4775.0, 8304.0, 14491.0, 25577.0, 46705.0, 87048.0, 195216.0, 369666.0, 135523.0, 67616.0, 36678.0, 20462.0, 11431.0, 6690.0, 4048.0, 2486.0, 1441.0, 920.0, 557.0, 381.0, 238.0, 159.0, 88.0, 59.0, 54.0, 32.0, 29.0, 14.0, 6.0, 4.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9970703125, -1.9332733154296875, -1.869476318359375, -1.8056793212890625, -1.74188232421875, -1.6780853271484375, -1.614288330078125, -1.5504913330078125, -1.4866943359375, -1.4228973388671875, -1.359100341796875, -1.2953033447265625, -1.23150634765625, -1.1677093505859375, -1.103912353515625, -1.0401153564453125, -0.976318359375, -0.9125213623046875, -0.848724365234375, -0.7849273681640625, -0.72113037109375, -0.6573333740234375, -0.593536376953125, -0.5297393798828125, -0.4659423828125, -0.4021453857421875, -0.338348388671875, -0.2745513916015625, -0.21075439453125, -0.1469573974609375, -0.083160400390625, -0.0193634033203125, 0.04443359375, 0.1082305908203125, 0.172027587890625, 0.2358245849609375, 0.29962158203125, 0.3634185791015625, 0.427215576171875, 0.4910125732421875, 0.5548095703125, 0.6186065673828125, 0.682403564453125, 0.7462005615234375, 0.80999755859375, 0.8737945556640625, 0.937591552734375, 1.0013885498046875, 1.065185546875, 1.1289825439453125, 1.192779541015625, 1.2565765380859375, 1.32037353515625, 1.3841705322265625, 1.447967529296875, 1.5117645263671875, 1.5755615234375, 1.6393585205078125, 1.703155517578125, 1.7669525146484375, 1.83074951171875, 1.8945465087890625, 1.958343505859375, 2.0221405029296875, 2.0859375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 2.0, 5.0, 5.0, 3.0, 8.0, 10.0, 12.0, 9.0, 16.0, 8.0, 17.0, 18.0, 19.0, 34.0, 30.0, 19.0, 30.0, 29.0, 35.0, 34.0, 34.0, 35.0, 40.0, 1065.0, 48.0, 41.0, 46.0, 37.0, 34.0, 22.0, 33.0, 32.0, 28.0, 19.0, 21.0, 24.0, 15.0, 15.0, 13.0, 17.0, 10.0, 12.0, 9.0, 7.0, 8.0, 6.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-5.1875, -5.03265380859375, -4.8778076171875, -4.72296142578125, -4.568115234375, -4.41326904296875, -4.2584228515625, -4.10357666015625, -3.94873046875, -3.79388427734375, -3.6390380859375, -3.48419189453125, -3.329345703125, -3.17449951171875, -3.0196533203125, -2.86480712890625, -2.7099609375, -2.55511474609375, -2.4002685546875, -2.24542236328125, -2.090576171875, -1.93572998046875, -1.7808837890625, -1.62603759765625, -1.47119140625, -1.31634521484375, -1.1614990234375, -1.00665283203125, -0.851806640625, -0.69696044921875, -0.5421142578125, -0.38726806640625, -0.232421875, -0.07757568359375, 0.0772705078125, 0.23211669921875, 0.386962890625, 0.54180908203125, 0.6966552734375, 0.85150146484375, 1.00634765625, 1.16119384765625, 1.3160400390625, 1.47088623046875, 1.625732421875, 1.78057861328125, 1.9354248046875, 2.09027099609375, 2.2451171875, 2.39996337890625, 2.5548095703125, 2.70965576171875, 2.864501953125, 3.01934814453125, 3.1741943359375, 3.32904052734375, 3.48388671875, 3.63873291015625, 3.7935791015625, 3.94842529296875, 4.103271484375, 4.25811767578125, 4.4129638671875, 4.56781005859375, 4.72265625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 1.0, 6.0, 6.0, 9.0, 7.0, 10.0, 15.0, 29.0, 43.0, 70.0, 97.0, 117.0, 165.0, 274.0, 399.0, 570.0, 780.0, 1220.0, 1841.0, 2712.0, 3951.0, 5889.0, 8495.0, 12649.0, 18979.0, 28800.0, 45098.0, 74651.0, 146406.0, 1383790.0, 150377.0, 75895.0, 45578.0, 29302.0, 19488.0, 12859.0, 8347.0, 5823.0, 3953.0, 2661.0, 1787.0, 1275.0, 839.0, 577.0, 396.0, 275.0, 181.0, 141.0, 94.0, 53.0, 44.0, 43.0, 17.0, 19.0, 12.0, 10.0, 8.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0], "bins": [-1.4267578125, -1.3800048828125, -1.333251953125, -1.2864990234375, -1.23974609375, -1.1929931640625, -1.146240234375, -1.0994873046875, -1.052734375, -1.0059814453125, -0.959228515625, -0.9124755859375, -0.86572265625, -0.8189697265625, -0.772216796875, -0.7254638671875, -0.6787109375, -0.6319580078125, -0.585205078125, -0.5384521484375, -0.49169921875, -0.4449462890625, -0.398193359375, -0.3514404296875, -0.3046875, -0.2579345703125, -0.211181640625, -0.1644287109375, -0.11767578125, -0.0709228515625, -0.024169921875, 0.0225830078125, 0.0693359375, 0.1160888671875, 0.162841796875, 0.2095947265625, 0.25634765625, 0.3031005859375, 0.349853515625, 0.3966064453125, 0.443359375, 0.4901123046875, 0.536865234375, 0.5836181640625, 0.63037109375, 0.6771240234375, 0.723876953125, 0.7706298828125, 0.8173828125, 0.8641357421875, 0.910888671875, 0.9576416015625, 1.00439453125, 1.0511474609375, 1.097900390625, 1.1446533203125, 1.19140625, 1.2381591796875, 1.284912109375, 1.3316650390625, 1.37841796875, 1.4251708984375, 1.471923828125, 1.5186767578125, 1.5654296875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 3.0, 2.0, 4.0, 8.0, 6.0, 10.0, 7.0, 20.0, 18.0, 23.0, 50.0, 39.0, 62.0, 65.0, 81.0, 97.0, 79.0, 90.0, 73.0, 63.0, 66.0, 28.0, 28.0, 20.0, 8.0, 10.0, 4.0, 6.0, 4.0, 6.0, 5.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00136566162109375, -0.0013307034969329834, -0.0012957453727722168, -0.0012607872486114502, -0.0012258291244506836, -0.001190871000289917, -0.0011559128761291504, -0.0011209547519683838, -0.0010859966278076172, -0.0010510385036468506, -0.001016080379486084, -0.0009811222553253174, -0.0009461641311645508, -0.0009112060070037842, -0.0008762478828430176, -0.000841289758682251, -0.0008063316345214844, -0.0007713735103607178, -0.0007364153861999512, -0.0007014572620391846, -0.000666499137878418, -0.0006315410137176514, -0.0005965828895568848, -0.0005616247653961182, -0.0005266666412353516, -0.000491708517074585, -0.00045675039291381836, -0.00042179226875305176, -0.00038683414459228516, -0.00035187602043151855, -0.00031691789627075195, -0.00028195977210998535, -0.00024700164794921875, -0.00021204352378845215, -0.00017708539962768555, -0.00014212727546691895, -0.00010716915130615234, -7.221102714538574e-05, -3.725290298461914e-05, -2.294778823852539e-06, 3.266334533691406e-05, 6.762146949768066e-05, 0.00010257959365844727, 0.00013753771781921387, 0.00017249584197998047, 0.00020745396614074707, 0.00024241209030151367, 0.0002773702144622803, 0.0003123283386230469, 0.0003472864627838135, 0.0003822445869445801, 0.0004172027111053467, 0.0004521608352661133, 0.0004871189594268799, 0.0005220770835876465, 0.0005570352077484131, 0.0005919933319091797, 0.0006269514560699463, 0.0006619095802307129, 0.0006968677043914795, 0.0007318258285522461, 0.0007667839527130127, 0.0008017420768737793, 0.0008367002010345459, 0.0008716583251953125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 2.0, 6.0, 3.0, 6.0, 4.0, 12.0, 16.0, 22.0, 26.0, 34.0, 49.0, 97.0, 169.0, 354.0, 1432.0, 974412.0, 70495.0, 757.0, 266.0, 120.0, 71.0, 47.0, 39.0, 29.0, 14.0, 10.0, 10.0, 11.0, 4.0, 5.0, 4.0, 7.0, 2.0, 3.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0213623046875, -0.02056574821472168, -0.01976919174194336, -0.01897263526916504, -0.01817607879638672, -0.0173795223236084, -0.016582965850830078, -0.015786409378051758, -0.014989852905273438, -0.014193296432495117, -0.013396739959716797, -0.012600183486938477, -0.011803627014160156, -0.011007070541381836, -0.010210514068603516, -0.009413957595825195, -0.008617401123046875, -0.007820844650268555, -0.007024288177490234, -0.006227731704711914, -0.005431175231933594, -0.0046346187591552734, -0.003838062286376953, -0.003041505813598633, -0.0022449493408203125, -0.0014483928680419922, -0.0006518363952636719, 0.00014472007751464844, 0.0009412765502929688, 0.001737833023071289, 0.0025343894958496094, 0.0033309459686279297, 0.00412750244140625, 0.00492405891418457, 0.005720615386962891, 0.006517171859741211, 0.007313728332519531, 0.008110284805297852, 0.008906841278076172, 0.009703397750854492, 0.010499954223632812, 0.011296510696411133, 0.012093067169189453, 0.012889623641967773, 0.013686180114746094, 0.014482736587524414, 0.015279293060302734, 0.016075849533081055, 0.016872406005859375, 0.017668962478637695, 0.018465518951416016, 0.019262075424194336, 0.020058631896972656, 0.020855188369750977, 0.021651744842529297, 0.022448301315307617, 0.023244857788085938, 0.024041414260864258, 0.024837970733642578, 0.0256345272064209, 0.02643108367919922, 0.02722764015197754, 0.02802419662475586, 0.02882075309753418, 0.0296173095703125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 11.0, 222.0, 615.0, 154.0, 15.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003652448358479887, -0.0002585456822998822, -0.00015184655785560608, -4.514740430749953e-05, 6.155172013677657e-05, 0.00016825084458105266, 0.00027495002723298967, 0.00038164915167726576, 0.0004883483052253723, 0.0005950474296696484, 0.0007017465541139245, 0.0008084457367658615, 0.0009151448612101376, 0.0010218439856544137, 0.0011285431683063507, 0.0012352422345429659, 0.001341941417194903, 0.00144864059984684, 0.001555339666083455, 0.001662038848735392, 0.001768738031387329, 0.0018754370976239443, 0.0019821361638605595, 0.0020888354629278183, 0.0021955345291644335, 0.0023022335954010487, 0.0024089328944683075, 0.0025156319607049227, 0.002622331026941538, 0.0027290303260087967, 0.002835729392245412, 0.002942428458482027, 0.003049127757549286, 0.003155826823785901, 0.00326252612285316, 0.003369225189089775, 0.0034759242553263903, 0.0035826233215630054, 0.0036893226206302643, 0.0037960216868668795, 0.0039027207531034946, 0.0040094200521707535, 0.004116118885576725, 0.004222818184643984, 0.004329517483711243, 0.004436216317117214, 0.004542915616184473, 0.004649614915251732, 0.004756313748657703, 0.004863013047724962, 0.004969711881130934, 0.005076411180198193, 0.005183110479265451, 0.005289809312671423, 0.005396508611738682, 0.005503207910805941, 0.0056099072098731995, 0.005716606508940458, 0.00582330534234643, 0.005930004641413689, 0.0060367039404809475, 0.006143402773886919, 0.006250102072954178, 0.006356801372021437, 0.006463500205427408]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 3.0, 6.0, 7.0, 15.0, 15.0, 13.0, 14.0, 18.0, 27.0, 25.0, 24.0, 27.0, 26.0, 34.0, 37.0, 40.0, 52.0, 43.0, 42.0, 40.0, 55.0, 42.0, 31.0, 41.0, 41.0, 42.0, 42.0, 25.0, 27.0, 21.0, 20.0, 17.0, 15.0, 12.0, 16.0, 11.0, 4.0, 5.0, 1.0, 6.0, 3.0, 7.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0004323720932006836, -0.00041732750833034515, -0.0004022829234600067, -0.0003872383385896683, -0.00037219375371932983, -0.0003571491688489914, -0.00034210458397865295, -0.0003270599991083145, -0.0003120154142379761, -0.00029697082936763763, -0.0002819262444972992, -0.00026688165962696075, -0.0002518370747566223, -0.00023679248988628387, -0.00022174790501594543, -0.000206703320145607, -0.00019165873527526855, -0.00017661415040493011, -0.00016156956553459167, -0.00014652498066425323, -0.0001314803957939148, -0.00011643581092357635, -0.00010139122605323792, -8.634664118289948e-05, -7.130205631256104e-05, -5.6257471442222595e-05, -4.1212886571884155e-05, -2.6168301701545715e-05, -1.1123716831207275e-05, 3.9208680391311646e-06, 1.8965452909469604e-05, 3.4010037779808044e-05, 4.9054622650146484e-05, 6.409920752048492e-05, 7.914379239082336e-05, 9.41883772611618e-05, 0.00010923296213150024, 0.00012427754700183868, 0.00013932213187217712, 0.00015436671674251556, 0.000169411301612854, 0.00018445588648319244, 0.00019950047135353088, 0.00021454505622386932, 0.00022958964109420776, 0.0002446342259645462, 0.00025967881083488464, 0.0002747233957052231, 0.0002897679805755615, 0.00030481256544589996, 0.0003198571503162384, 0.00033490173518657684, 0.0003499463200569153, 0.0003649909049272537, 0.00038003548979759216, 0.0003950800746679306, 0.00041012465953826904, 0.0004251692444086075, 0.0004402138292789459, 0.00045525841414928436, 0.0004703029990196228, 0.00048534758388996124, 0.0005003921687602997, 0.0005154367536306381, 0.0005304813385009766]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 1.0, 5.0, 6.0, 5.0, 2.0, 7.0, 10.0, 9.0, 14.0, 23.0, 24.0, 33.0, 30.0, 30.0, 35.0, 46.0, 29.0, 34.0, 43.0, 44.0, 42.0, 41.0, 55.0, 53.0, 44.0, 45.0, 31.0, 26.0, 40.0, 40.0, 35.0, 19.0, 18.0, 16.0, 15.0, 9.0, 10.0, 11.0, 9.0, 2.0, 6.0, 3.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0078125, -8.7197265625, -8.431640625, -8.1435546875, -7.85546875, -7.5673828125, -7.279296875, -6.9912109375, -6.703125, -6.4150390625, -6.126953125, -5.8388671875, -5.55078125, -5.2626953125, -4.974609375, -4.6865234375, -4.3984375, -4.1103515625, -3.822265625, -3.5341796875, -3.24609375, -2.9580078125, -2.669921875, -2.3818359375, -2.09375, -1.8056640625, -1.517578125, -1.2294921875, -0.94140625, -0.6533203125, -0.365234375, -0.0771484375, 0.2109375, 0.4990234375, 0.787109375, 1.0751953125, 1.36328125, 1.6513671875, 1.939453125, 2.2275390625, 2.515625, 2.8037109375, 3.091796875, 3.3798828125, 3.66796875, 3.9560546875, 4.244140625, 4.5322265625, 4.8203125, 5.1083984375, 5.396484375, 5.6845703125, 5.97265625, 6.2607421875, 6.548828125, 6.8369140625, 7.125, 7.4130859375, 7.701171875, 7.9892578125, 8.27734375, 8.5654296875, 8.853515625, 9.1416015625, 9.4296875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 10.0, 14.0, 16.0, 30.0, 51.0, 57.0, 109.0, 178.0, 275.0, 443.0, 715.0, 1280.0, 2338.0, 4209.0, 8152.0, 15846.0, 34129.0, 83173.0, 266996.0, 423070.0, 118751.0, 45743.0, 20684.0, 10177.0, 5258.0, 2937.0, 1653.0, 896.0, 508.0, 293.0, 218.0, 129.0, 70.0, 46.0, 31.0, 21.0, 13.0, 13.0, 10.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1640625, -4.987060546875, -4.81005859375, -4.633056640625, -4.4560546875, -4.279052734375, -4.10205078125, -3.925048828125, -3.748046875, -3.571044921875, -3.39404296875, -3.217041015625, -3.0400390625, -2.863037109375, -2.68603515625, -2.509033203125, -2.33203125, -2.155029296875, -1.97802734375, -1.801025390625, -1.6240234375, -1.447021484375, -1.27001953125, -1.093017578125, -0.916015625, -0.739013671875, -0.56201171875, -0.385009765625, -0.2080078125, -0.031005859375, 0.14599609375, 0.322998046875, 0.5, 0.677001953125, 0.85400390625, 1.031005859375, 1.2080078125, 1.385009765625, 1.56201171875, 1.739013671875, 1.916015625, 2.093017578125, 2.27001953125, 2.447021484375, 2.6240234375, 2.801025390625, 2.97802734375, 3.155029296875, 3.33203125, 3.509033203125, 3.68603515625, 3.863037109375, 4.0400390625, 4.217041015625, 4.39404296875, 4.571044921875, 4.748046875, 4.925048828125, 5.10205078125, 5.279052734375, 5.4560546875, 5.633056640625, 5.81005859375, 5.987060546875, 6.1640625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 2.0, 4.0, 6.0, 9.0, 16.0, 11.0, 6.0, 20.0, 22.0, 29.0, 39.0, 42.0, 37.0, 43.0, 53.0, 68.0, 107.0, 229.0, 1710.0, 148.0, 61.0, 55.0, 51.0, 45.0, 32.0, 40.0, 30.0, 14.0, 29.0, 14.0, 14.0, 12.0, 14.0, 9.0, 8.0, 2.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.0625, -36.8857421875, -35.708984375, -34.5322265625, -33.35546875, -32.1787109375, -31.001953125, -29.8251953125, -28.6484375, -27.4716796875, -26.294921875, -25.1181640625, -23.94140625, -22.7646484375, -21.587890625, -20.4111328125, -19.234375, -18.0576171875, -16.880859375, -15.7041015625, -14.52734375, -13.3505859375, -12.173828125, -10.9970703125, -9.8203125, -8.6435546875, -7.466796875, -6.2900390625, -5.11328125, -3.9365234375, -2.759765625, -1.5830078125, -0.40625, 0.7705078125, 1.947265625, 3.1240234375, 4.30078125, 5.4775390625, 6.654296875, 7.8310546875, 9.0078125, 10.1845703125, 11.361328125, 12.5380859375, 13.71484375, 14.8916015625, 16.068359375, 17.2451171875, 18.421875, 19.5986328125, 20.775390625, 21.9521484375, 23.12890625, 24.3056640625, 25.482421875, 26.6591796875, 27.8359375, 29.0126953125, 30.189453125, 31.3662109375, 32.54296875, 33.7197265625, 34.896484375, 36.0732421875, 37.25]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 10.0, 10.0, 23.0, 41.0, 34.0, 69.0, 79.0, 148.0, 252.0, 506.0, 2306.0, 2981924.0, 157833.0, 1398.0, 446.0, 216.0, 131.0, 88.0, 47.0, 34.0, 34.0, 21.0, 16.0, 9.0, 6.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-126.9375, -123.3994140625, -119.861328125, -116.3232421875, -112.78515625, -109.2470703125, -105.708984375, -102.1708984375, -98.6328125, -95.0947265625, -91.556640625, -88.0185546875, -84.48046875, -80.9423828125, -77.404296875, -73.8662109375, -70.328125, -66.7900390625, -63.251953125, -59.7138671875, -56.17578125, -52.6376953125, -49.099609375, -45.5615234375, -42.0234375, -38.4853515625, -34.947265625, -31.4091796875, -27.87109375, -24.3330078125, -20.794921875, -17.2568359375, -13.71875, -10.1806640625, -6.642578125, -3.1044921875, 0.43359375, 3.9716796875, 7.509765625, 11.0478515625, 14.5859375, 18.1240234375, 21.662109375, 25.2001953125, 28.73828125, 32.2763671875, 35.814453125, 39.3525390625, 42.890625, 46.4287109375, 49.966796875, 53.5048828125, 57.04296875, 60.5810546875, 64.119140625, 67.6572265625, 71.1953125, 74.7333984375, 78.271484375, 81.8095703125, 85.34765625, 88.8857421875, 92.423828125, 95.9619140625, 99.5]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 12.0, 96.0, 408.0, 416.0, 68.0, 10.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-253.13516235351562, -248.52536010742188, -243.91555786132812, -239.30577087402344, -234.6959686279297, -230.08616638183594, -225.4763641357422, -220.86656188964844, -216.25677490234375, -211.64697265625, -207.03717041015625, -202.42738342285156, -197.8175811767578, -193.20777893066406, -188.5979766845703, -183.98817443847656, -179.3783721923828, -174.76856994628906, -170.1587677001953, -165.54898071289062, -160.93917846679688, -156.32937622070312, -151.71957397460938, -147.10977172851562, -142.49996948242188, -137.89016723632812, -133.28036499023438, -128.6705780029297, -124.06077575683594, -119.45097351074219, -114.84117126464844, -110.23136901855469, -105.62156677246094, -101.01176452636719, -96.40196990966797, -91.79216766357422, -87.182373046875, -82.57257080078125, -77.9627685546875, -73.35296630859375, -68.74317169189453, -64.13336944580078, -59.52357482910156, -54.91377258300781, -50.30397415161133, -45.694175720214844, -41.084373474121094, -36.47457504272461, -31.864776611328125, -27.25497817993164, -22.645177841186523, -18.035377502441406, -13.425579071044922, -8.815780639648438, -4.20598030090332, 0.4038200378417969, 5.013618469238281, 9.623417854309082, 14.233217239379883, 18.843017578125, 23.452816009521484, 28.06261444091797, 32.67241668701172, 37.2822151184082, 41.89201354980469]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 8.0, 0.0, 2.0, 1.0, 10.0, 5.0, 18.0, 13.0, 14.0, 10.0, 14.0, 15.0, 15.0, 22.0, 24.0, 27.0, 40.0, 32.0, 60.0, 31.0, 35.0, 39.0, 53.0, 35.0, 47.0, 53.0, 39.0, 41.0, 43.0, 33.0, 28.0, 29.0, 28.0, 29.0, 14.0, 15.0, 15.0, 13.0, 14.0, 12.0, 10.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.61297607421875, -79.75787353515625, -76.90277099609375, -74.04766082763672, -71.19255828857422, -68.33745574951172, -65.48234558105469, -62.62724304199219, -59.77214050292969, -56.91703796386719, -54.06193161010742, -51.206825256347656, -48.351722717285156, -45.496620178222656, -42.64151382446289, -39.786407470703125, -36.931304931640625, -34.076202392578125, -31.22109603881836, -28.365991592407227, -25.510887145996094, -22.65578269958496, -19.800678253173828, -16.945573806762695, -14.090469360351562, -11.23536491394043, -8.380260467529297, -5.525156021118164, -2.6700515747070312, 0.18505287170410156, 3.0401573181152344, 5.895261764526367, 8.750358581542969, 11.605463027954102, 14.460567474365234, 17.315671920776367, 20.1707763671875, 23.025880813598633, 25.880985260009766, 28.7360897064209, 31.59119415283203, 34.44629669189453, 37.3014030456543, 40.15650939941406, 43.01161193847656, 45.86671447753906, 48.72182083129883, 51.576927185058594, 54.432029724121094, 57.287132263183594, 60.14223861694336, 62.997344970703125, 65.85244750976562, 68.70755004882812, 71.56265258789062, 74.41776275634766, 77.27286529541016, 80.12796783447266, 82.98307800292969, 85.83818054199219, 88.69328308105469, 91.54838562011719, 94.40348815917969, 97.25859832763672, 100.11370086669922]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 6.0, 9.0, 5.0, 6.0, 6.0, 16.0, 16.0, 20.0, 29.0, 19.0, 30.0, 40.0, 46.0, 36.0, 27.0, 38.0, 44.0, 47.0, 33.0, 44.0, 48.0, 49.0, 41.0, 44.0, 32.0, 43.0, 24.0, 30.0, 40.0, 25.0, 13.0, 18.0, 15.0, 16.0, 12.0, 10.0, 2.0, 5.0, 5.0, 4.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.296875, -8.99853515625, -8.7001953125, -8.40185546875, -8.103515625, -7.80517578125, -7.5068359375, -7.20849609375, -6.91015625, -6.61181640625, -6.3134765625, -6.01513671875, -5.716796875, -5.41845703125, -5.1201171875, -4.82177734375, -4.5234375, -4.22509765625, -3.9267578125, -3.62841796875, -3.330078125, -3.03173828125, -2.7333984375, -2.43505859375, -2.13671875, -1.83837890625, -1.5400390625, -1.24169921875, -0.943359375, -0.64501953125, -0.3466796875, -0.04833984375, 0.25, 0.54833984375, 0.8466796875, 1.14501953125, 1.443359375, 1.74169921875, 2.0400390625, 2.33837890625, 2.63671875, 2.93505859375, 3.2333984375, 3.53173828125, 3.830078125, 4.12841796875, 4.4267578125, 4.72509765625, 5.0234375, 5.32177734375, 5.6201171875, 5.91845703125, 6.216796875, 6.51513671875, 6.8134765625, 7.11181640625, 7.41015625, 7.70849609375, 8.0068359375, 8.30517578125, 8.603515625, 8.90185546875, 9.2001953125, 9.49853515625, 9.796875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 6.0, 8.0, 13.0, 10.0, 16.0, 34.0, 41.0, 44.0, 56.0, 81.0, 123.0, 198.0, 307.0, 544.0, 986.0, 1899.0, 4598.0, 12102.0, 40938.0, 203893.0, 947451.0, 1758420.0, 943003.0, 213865.0, 44962.0, 12064.0, 4393.0, 1911.0, 885.0, 493.0, 293.0, 184.0, 133.0, 96.0, 57.0, 39.0, 39.0, 22.0, 24.0, 12.0, 16.0, 5.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.421875, -12.0618896484375, -11.701904296875, -11.3419189453125, -10.98193359375, -10.6219482421875, -10.261962890625, -9.9019775390625, -9.5419921875, -9.1820068359375, -8.822021484375, -8.4620361328125, -8.10205078125, -7.7420654296875, -7.382080078125, -7.0220947265625, -6.662109375, -6.3021240234375, -5.942138671875, -5.5821533203125, -5.22216796875, -4.8621826171875, -4.502197265625, -4.1422119140625, -3.7822265625, -3.4222412109375, -3.062255859375, -2.7022705078125, -2.34228515625, -1.9822998046875, -1.622314453125, -1.2623291015625, -0.90234375, -0.5423583984375, -0.182373046875, 0.1776123046875, 0.53759765625, 0.8975830078125, 1.257568359375, 1.6175537109375, 1.9775390625, 2.3375244140625, 2.697509765625, 3.0574951171875, 3.41748046875, 3.7774658203125, 4.137451171875, 4.4974365234375, 4.857421875, 5.2174072265625, 5.577392578125, 5.9373779296875, 6.29736328125, 6.6573486328125, 7.017333984375, 7.3773193359375, 7.7373046875, 8.0972900390625, 8.457275390625, 8.8172607421875, 9.17724609375, 9.5372314453125, 9.897216796875, 10.2572021484375, 10.6171875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 7.0, 11.0, 19.0, 25.0, 47.0, 73.0, 129.0, 210.0, 369.0, 650.0, 912.0, 662.0, 392.0, 266.0, 129.0, 76.0, 45.0, 24.0, 15.0, 10.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.578125, -21.481201171875, -20.38427734375, -19.287353515625, -18.1904296875, -17.093505859375, -15.99658203125, -14.899658203125, -13.802734375, -12.705810546875, -11.60888671875, -10.511962890625, -9.4150390625, -8.318115234375, -7.22119140625, -6.124267578125, -5.02734375, -3.930419921875, -2.83349609375, -1.736572265625, -0.6396484375, 0.457275390625, 1.55419921875, 2.651123046875, 3.748046875, 4.844970703125, 5.94189453125, 7.038818359375, 8.1357421875, 9.232666015625, 10.32958984375, 11.426513671875, 12.5234375, 13.620361328125, 14.71728515625, 15.814208984375, 16.9111328125, 18.008056640625, 19.10498046875, 20.201904296875, 21.298828125, 22.395751953125, 23.49267578125, 24.589599609375, 25.6865234375, 26.783447265625, 27.88037109375, 28.977294921875, 30.07421875, 31.171142578125, 32.26806640625, 33.364990234375, 34.4619140625, 35.558837890625, 36.65576171875, 37.752685546875, 38.849609375, 39.946533203125, 41.04345703125, 42.140380859375, 43.2373046875, 44.334228515625, 45.43115234375, 46.528076171875, 47.625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 4.0, 12.0, 15.0, 22.0, 17.0, 29.0, 41.0, 58.0, 65.0, 89.0, 158.0, 202.0, 395.0, 863.0, 4303.0, 2090806.0, 2090764.0, 4388.0, 858.0, 427.0, 216.0, 152.0, 94.0, 69.0, 52.0, 44.0, 33.0, 20.0, 16.0, 11.0, 12.0, 9.0, 10.0, 8.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-89.75, -86.9453125, -84.140625, -81.3359375, -78.53125, -75.7265625, -72.921875, -70.1171875, -67.3125, -64.5078125, -61.703125, -58.8984375, -56.09375, -53.2890625, -50.484375, -47.6796875, -44.875, -42.0703125, -39.265625, -36.4609375, -33.65625, -30.8515625, -28.046875, -25.2421875, -22.4375, -19.6328125, -16.828125, -14.0234375, -11.21875, -8.4140625, -5.609375, -2.8046875, 0.0, 2.8046875, 5.609375, 8.4140625, 11.21875, 14.0234375, 16.828125, 19.6328125, 22.4375, 25.2421875, 28.046875, 30.8515625, 33.65625, 36.4609375, 39.265625, 42.0703125, 44.875, 47.6796875, 50.484375, 53.2890625, 56.09375, 58.8984375, 61.703125, 64.5078125, 67.3125, 70.1171875, 72.921875, 75.7265625, 78.53125, 81.3359375, 84.140625, 86.9453125, 89.75]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 12.0, 41.0, 112.0, 229.0, 302.0, 190.0, 92.0, 22.0, 6.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-283.7770080566406, -277.78961181640625, -271.8022155761719, -265.8148193359375, -259.8274230957031, -253.8400421142578, -247.85264587402344, -241.86524963378906, -235.87786865234375, -229.89047241210938, -223.903076171875, -217.91567993164062, -211.9282989501953, -205.94090270996094, -199.95350646972656, -193.9661102294922, -187.9787139892578, -181.99131774902344, -176.00392150878906, -170.01654052734375, -164.02914428710938, -158.041748046875, -152.05435180664062, -146.06695556640625, -140.07955932617188, -134.0921630859375, -128.10476684570312, -122.11737823486328, -116.12998962402344, -110.14259338378906, -104.15519714355469, -98.16780090332031, -92.180419921875, -86.19302368164062, -80.20563507080078, -74.2182388305664, -68.23085021972656, -62.24345397949219, -56.25605773925781, -50.2686653137207, -44.281272888183594, -38.293880462646484, -32.306488037109375, -26.319091796875, -20.33169937133789, -14.344306945800781, -8.356910705566406, -2.369518280029297, 3.6178741455078125, 9.605267524719238, 15.592660903930664, 21.580055236816406, 27.567447662353516, 33.554840087890625, 39.542236328125, 45.52962875366211, 51.51702117919922, 57.50441360473633, 63.49180603027344, 69.47920227050781, 75.46659851074219, 81.45398712158203, 87.4413833618164, 93.42877197265625, 99.41616821289062]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 7.0, 10.0, 15.0, 8.0, 14.0, 16.0, 13.0, 19.0, 27.0, 32.0, 20.0, 35.0, 22.0, 36.0, 40.0, 45.0, 41.0, 44.0, 46.0, 42.0, 39.0, 45.0, 35.0, 36.0, 33.0, 26.0, 38.0, 30.0, 25.0, 16.0, 22.0, 17.0, 20.0, 18.0, 20.0, 10.0, 6.0, 7.0, 5.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-66.99694061279297, -64.9664535522461, -62.93596267700195, -60.90547180175781, -58.87498474121094, -56.84449768066406, -54.81400680541992, -52.78351593017578, -50.753028869628906, -48.72254180908203, -46.69205093383789, -44.66156005859375, -42.631072998046875, -40.6005859375, -38.57009506225586, -36.53960418701172, -34.509117126464844, -32.47863006591797, -30.448139190673828, -28.41765022277832, -26.387161254882812, -24.356672286987305, -22.326183319091797, -20.29569435119629, -18.26520538330078, -16.234716415405273, -14.204227447509766, -12.173738479614258, -10.14324951171875, -8.112760543823242, -6.082271575927734, -4.051782608032227, -2.02130126953125, 0.009187698364257812, 2.0396766662597656, 4.070165634155273, 6.100654602050781, 8.131143569946289, 10.161632537841797, 12.192121505737305, 14.222610473632812, 16.25309944152832, 18.283588409423828, 20.314077377319336, 22.344566345214844, 24.37505531311035, 26.40554428100586, 28.436033248901367, 30.466522216796875, 32.49700927734375, 34.52750015258789, 36.55799102783203, 38.588478088378906, 40.61896514892578, 42.64945602416992, 44.67994689941406, 46.71043395996094, 48.74092102050781, 50.77141189575195, 52.801902770996094, 54.83238983154297, 56.862876892089844, 58.893367767333984, 60.923858642578125, 62.954345703125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 9.0, 3.0, 7.0, 7.0, 10.0, 12.0, 12.0, 21.0, 22.0, 32.0, 30.0, 32.0, 36.0, 37.0, 41.0, 52.0, 46.0, 41.0, 42.0, 51.0, 38.0, 38.0, 35.0, 42.0, 35.0, 35.0, 35.0, 31.0, 36.0, 28.0, 21.0, 20.0, 9.0, 13.0, 5.0, 9.0, 7.0, 4.0, 9.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.140625, -9.83349609375, -9.5263671875, -9.21923828125, -8.912109375, -8.60498046875, -8.2978515625, -7.99072265625, -7.68359375, -7.37646484375, -7.0693359375, -6.76220703125, -6.455078125, -6.14794921875, -5.8408203125, -5.53369140625, -5.2265625, -4.91943359375, -4.6123046875, -4.30517578125, -3.998046875, -3.69091796875, -3.3837890625, -3.07666015625, -2.76953125, -2.46240234375, -2.1552734375, -1.84814453125, -1.541015625, -1.23388671875, -0.9267578125, -0.61962890625, -0.3125, -0.00537109375, 0.3017578125, 0.60888671875, 0.916015625, 1.22314453125, 1.5302734375, 1.83740234375, 2.14453125, 2.45166015625, 2.7587890625, 3.06591796875, 3.373046875, 3.68017578125, 3.9873046875, 4.29443359375, 4.6015625, 4.90869140625, 5.2158203125, 5.52294921875, 5.830078125, 6.13720703125, 6.4443359375, 6.75146484375, 7.05859375, 7.36572265625, 7.6728515625, 7.97998046875, 8.287109375, 8.59423828125, 8.9013671875, 9.20849609375, 9.515625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 11.0, 13.0, 7.0, 19.0, 21.0, 34.0, 36.0, 69.0, 81.0, 151.0, 225.0, 276.0, 396.0, 573.0, 770.0, 1154.0, 1659.0, 2542.0, 3754.0, 5651.0, 8781.0, 13451.0, 21377.0, 34288.0, 54795.0, 94117.0, 190947.0, 299592.0, 125666.0, 70376.0, 42477.0, 26684.0, 16631.0, 10762.0, 6933.0, 4597.0, 3097.0, 2065.0, 1356.0, 935.0, 623.0, 469.0, 292.0, 271.0, 164.0, 104.0, 81.0, 51.0, 36.0, 29.0, 21.0, 14.0, 9.0, 5.0, 7.0, 10.0, 2.0, 2.0], "bins": [-1.7734375, -1.7200775146484375, -1.666717529296875, -1.6133575439453125, -1.55999755859375, -1.5066375732421875, -1.453277587890625, -1.3999176025390625, -1.3465576171875, -1.2931976318359375, -1.239837646484375, -1.1864776611328125, -1.13311767578125, -1.0797576904296875, -1.026397705078125, -0.9730377197265625, -0.919677734375, -0.8663177490234375, -0.812957763671875, -0.7595977783203125, -0.70623779296875, -0.6528778076171875, -0.599517822265625, -0.5461578369140625, -0.4927978515625, -0.4394378662109375, -0.386077880859375, -0.3327178955078125, -0.27935791015625, -0.2259979248046875, -0.172637939453125, -0.1192779541015625, -0.06591796875, -0.0125579833984375, 0.040802001953125, 0.0941619873046875, 0.14752197265625, 0.2008819580078125, 0.254241943359375, 0.3076019287109375, 0.3609619140625, 0.4143218994140625, 0.467681884765625, 0.5210418701171875, 0.57440185546875, 0.6277618408203125, 0.681121826171875, 0.7344818115234375, 0.787841796875, 0.8412017822265625, 0.894561767578125, 0.9479217529296875, 1.00128173828125, 1.0546417236328125, 1.108001708984375, 1.1613616943359375, 1.2147216796875, 1.2680816650390625, 1.321441650390625, 1.3748016357421875, 1.42816162109375, 1.4815216064453125, 1.534881591796875, 1.5882415771484375, 1.6416015625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 2.0, 7.0, 10.0, 6.0, 14.0, 5.0, 16.0, 13.0, 17.0, 23.0, 29.0, 39.0, 34.0, 40.0, 32.0, 33.0, 40.0, 42.0, 46.0, 31.0, 36.0, 1056.0, 36.0, 43.0, 35.0, 24.0, 41.0, 30.0, 35.0, 31.0, 21.0, 19.0, 17.0, 19.0, 20.0, 8.0, 15.0, 17.0, 10.0, 10.0, 8.0, 5.0, 3.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.36328125, -6.18707275390625, -6.0108642578125, -5.83465576171875, -5.658447265625, -5.48223876953125, -5.3060302734375, -5.12982177734375, -4.95361328125, -4.77740478515625, -4.6011962890625, -4.42498779296875, -4.248779296875, -4.07257080078125, -3.8963623046875, -3.72015380859375, -3.5439453125, -3.36773681640625, -3.1915283203125, -3.01531982421875, -2.839111328125, -2.66290283203125, -2.4866943359375, -2.31048583984375, -2.13427734375, -1.95806884765625, -1.7818603515625, -1.60565185546875, -1.429443359375, -1.25323486328125, -1.0770263671875, -0.90081787109375, -0.724609375, -0.54840087890625, -0.3721923828125, -0.19598388671875, -0.019775390625, 0.15643310546875, 0.3326416015625, 0.50885009765625, 0.68505859375, 0.86126708984375, 1.0374755859375, 1.21368408203125, 1.389892578125, 1.56610107421875, 1.7423095703125, 1.91851806640625, 2.0947265625, 2.27093505859375, 2.4471435546875, 2.62335205078125, 2.799560546875, 2.97576904296875, 3.1519775390625, 3.32818603515625, 3.50439453125, 3.68060302734375, 3.8568115234375, 4.03302001953125, 4.209228515625, 4.38543701171875, 4.5616455078125, 4.73785400390625, 4.9140625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 10.0, 13.0, 22.0, 33.0, 41.0, 55.0, 79.0, 160.0, 222.0, 316.0, 521.0, 840.0, 1398.0, 2082.0, 3439.0, 5281.0, 8230.0, 12889.0, 20801.0, 33989.0, 57017.0, 101922.0, 235413.0, 1334386.0, 115926.0, 62701.0, 37552.0, 23094.0, 14408.0, 8922.0, 5683.0, 3541.0, 2328.0, 1414.0, 890.0, 528.0, 348.0, 210.0, 156.0, 88.0, 61.0, 49.0, 31.0, 19.0, 13.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.69921875, -1.6427459716796875, -1.586273193359375, -1.5298004150390625, -1.47332763671875, -1.4168548583984375, -1.360382080078125, -1.3039093017578125, -1.2474365234375, -1.1909637451171875, -1.134490966796875, -1.0780181884765625, -1.02154541015625, -0.9650726318359375, -0.908599853515625, -0.8521270751953125, -0.795654296875, -0.7391815185546875, -0.682708740234375, -0.6262359619140625, -0.56976318359375, -0.5132904052734375, -0.456817626953125, -0.4003448486328125, -0.3438720703125, -0.2873992919921875, -0.230926513671875, -0.1744537353515625, -0.11798095703125, -0.0615081787109375, -0.005035400390625, 0.0514373779296875, 0.10791015625, 0.1643829345703125, 0.220855712890625, 0.2773284912109375, 0.33380126953125, 0.3902740478515625, 0.446746826171875, 0.5032196044921875, 0.5596923828125, 0.6161651611328125, 0.672637939453125, 0.7291107177734375, 0.78558349609375, 0.8420562744140625, 0.898529052734375, 0.9550018310546875, 1.011474609375, 1.0679473876953125, 1.124420166015625, 1.1808929443359375, 1.23736572265625, 1.2938385009765625, 1.350311279296875, 1.4067840576171875, 1.4632568359375, 1.5197296142578125, 1.576202392578125, 1.6326751708984375, 1.68914794921875, 1.7456207275390625, 1.802093505859375, 1.8585662841796875, 1.9150390625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 6.0, 9.0, 9.0, 8.0, 11.0, 10.0, 17.0, 31.0, 30.0, 25.0, 40.0, 43.0, 73.0, 53.0, 75.0, 86.0, 78.0, 75.0, 59.0, 57.0, 39.0, 33.0, 24.0, 21.0, 17.0, 13.0, 7.0, 8.0, 9.0, 6.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0011854171752929688, -0.0011502355337142944, -0.0011150538921356201, -0.0010798722505569458, -0.0010446906089782715, -0.0010095089673995972, -0.0009743273258209229, -0.0009391456842422485, -0.0009039640426635742, -0.0008687824010848999, -0.0008336007595062256, -0.0007984191179275513, -0.000763237476348877, -0.0007280558347702026, -0.0006928741931915283, -0.000657692551612854, -0.0006225109100341797, -0.0005873292684555054, -0.0005521476268768311, -0.0005169659852981567, -0.0004817843437194824, -0.0004466027021408081, -0.0004114210605621338, -0.00037623941898345947, -0.00034105777740478516, -0.00030587613582611084, -0.0002706944942474365, -0.0002355128526687622, -0.0002003312110900879, -0.00016514956951141357, -0.00012996792793273926, -9.478628635406494e-05, -5.9604644775390625e-05, -2.442300319671631e-05, 1.0758638381958008e-05, 4.5940279960632324e-05, 8.112192153930664e-05, 0.00011630356311798096, 0.00015148520469665527, 0.0001866668462753296, 0.0002218484878540039, 0.0002570301294326782, 0.00029221177101135254, 0.00032739341259002686, 0.00036257505416870117, 0.0003977566957473755, 0.0004329383373260498, 0.0004681199789047241, 0.0005033016204833984, 0.0005384832620620728, 0.0005736649036407471, 0.0006088465452194214, 0.0006440281867980957, 0.00067920982837677, 0.0007143914699554443, 0.0007495731115341187, 0.000784754753112793, 0.0008199363946914673, 0.0008551180362701416, 0.0008902996778488159, 0.0009254813194274902, 0.0009606629610061646, 0.0009958446025848389, 0.0010310262441635132, 0.0010662078857421875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 0.0, 3.0, 4.0, 10.0, 7.0, 11.0, 10.0, 14.0, 21.0, 23.0, 39.0, 56.0, 94.0, 139.0, 264.0, 729.0, 16963.0, 1026766.0, 2271.0, 527.0, 202.0, 111.0, 72.0, 47.0, 38.0, 32.0, 25.0, 12.0, 15.0, 11.0, 7.0, 8.0, 5.0, 7.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.027557373046875, -0.026704788208007812, -0.025852203369140625, -0.024999618530273438, -0.02414703369140625, -0.023294448852539062, -0.022441864013671875, -0.021589279174804688, -0.0207366943359375, -0.019884109497070312, -0.019031524658203125, -0.018178939819335938, -0.01732635498046875, -0.016473770141601562, -0.015621185302734375, -0.014768600463867188, -0.013916015625, -0.013063430786132812, -0.012210845947265625, -0.011358261108398438, -0.01050567626953125, -0.009653091430664062, -0.008800506591796875, -0.007947921752929688, -0.0070953369140625, -0.0062427520751953125, -0.005390167236328125, -0.0045375823974609375, -0.00368499755859375, -0.0028324127197265625, -0.001979827880859375, -0.0011272430419921875, -0.000274658203125, 0.0005779266357421875, 0.001430511474609375, 0.0022830963134765625, 0.00313568115234375, 0.0039882659912109375, 0.004840850830078125, 0.0056934356689453125, 0.0065460205078125, 0.0073986053466796875, 0.008251190185546875, 0.009103775024414062, 0.00995635986328125, 0.010808944702148438, 0.011661529541015625, 0.012514114379882812, 0.01336669921875, 0.014219284057617188, 0.015071868896484375, 0.015924453735351562, 0.01677703857421875, 0.017629623413085938, 0.018482208251953125, 0.019334793090820312, 0.0201873779296875, 0.021039962768554688, 0.021892547607421875, 0.022745132446289062, 0.02359771728515625, 0.024450302124023438, 0.025302886962890625, 0.026155471801757812, 0.027008056640625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 17.0, 125.0, 431.0, 340.0, 91.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015701367519795895, -0.0014949573669582605, -0.0014197780983522534, -0.0013445987133309245, -0.0012694194447249174, -0.0011942400597035885, -0.0011190606746822596, -0.0010438812896609306, -0.0009687020210549235, -0.0008935226942412555, -0.0008183433674275875, -0.0007431639824062586, -0.0006679846555925906, -0.0005928053287789226, -0.0005176259437575936, -0.0004424466169439256, -0.0003672672901302576, -0.0002920879633165896, -0.00021690860739909112, -0.00014172926603350788, -6.654992466792464e-05, 8.62940214574337e-06, 8.380875806324184e-05, 0.0001589881139807403, 0.00023416744079440832, 0.00030934676760807633, 0.0003845261235255748, 0.00045970547944307327, 0.0005348848062567413, 0.0006100641330704093, 0.0006852435180917382, 0.0007604228449054062, 0.0008356024045497179, 0.0009107817313633859, 0.000985961058177054, 0.0010611404431983829, 0.00113631971180439, 0.0012114990968257189, 0.0012866784818470478, 0.0013618578668683767, 0.0014370371354743838, 0.0015122165204957128, 0.0015873957891017199, 0.0016625751741230488, 0.0017377545591443777, 0.0018129338277503848, 0.0018881132127717137, 0.001963292481377721, 0.0020384718663990498, 0.0021136512514203787, 0.0021888306364417076, 0.002264009788632393, 0.002339189173653722, 0.0024143685586750507, 0.0024895479436963797, 0.0025647273287177086, 0.002639906480908394, 0.002715085865929723, 0.0027902652509510517, 0.002865444403141737, 0.002940623788163066, 0.003015803173184395, 0.0030909825582057238, 0.0031661619432270527, 0.0032413413282483816]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 9.0, 5.0, 5.0, 8.0, 6.0, 7.0, 8.0, 15.0, 13.0, 13.0, 11.0, 15.0, 18.0, 22.0, 32.0, 37.0, 32.0, 44.0, 37.0, 35.0, 41.0, 32.0, 47.0, 42.0, 36.0, 37.0, 39.0, 27.0, 32.0, 34.0, 31.0, 32.0, 29.0, 27.0, 24.0, 20.0, 12.0, 16.0, 14.0, 10.0, 7.0, 8.0, 9.0, 6.0, 5.0, 9.0, 4.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0], "bins": [-0.0005207657814025879, -0.0005055731162428856, -0.0004903804510831833, -0.000475187785923481, -0.0004599951207637787, -0.0004448024556040764, -0.0004296097904443741, -0.0004144171252846718, -0.0003992244601249695, -0.0003840317949652672, -0.0003688391298055649, -0.0003536464646458626, -0.0003384537994861603, -0.000323261134326458, -0.0003080684691667557, -0.0002928758040070534, -0.0002776831388473511, -0.0002624904736876488, -0.00024729780852794647, -0.00023210514336824417, -0.00021691247820854187, -0.00020171981304883957, -0.00018652714788913727, -0.00017133448272943497, -0.00015614181756973267, -0.00014094915241003036, -0.00012575648725032806, -0.00011056382209062576, -9.537115693092346e-05, -8.017849177122116e-05, -6.498582661151886e-05, -4.979316145181656e-05, -3.460049629211426e-05, -1.9407831132411957e-05, -4.215165972709656e-06, 1.0977499186992645e-05, 2.6170164346694946e-05, 4.136282950639725e-05, 5.655549466609955e-05, 7.174815982580185e-05, 8.694082498550415e-05, 0.00010213349014520645, 0.00011732615530490875, 0.00013251882046461105, 0.00014771148562431335, 0.00016290415078401566, 0.00017809681594371796, 0.00019328948110342026, 0.00020848214626312256, 0.00022367481142282486, 0.00023886747658252716, 0.00025406014174222946, 0.00026925280690193176, 0.00028444547206163406, 0.00029963813722133636, 0.00031483080238103867, 0.00033002346754074097, 0.00034521613270044327, 0.00036040879786014557, 0.00037560146301984787, 0.00039079412817955017, 0.00040598679333925247, 0.0004211794584989548, 0.0004363721236586571, 0.0004515647888183594]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 9.0, 3.0, 7.0, 7.0, 10.0, 12.0, 12.0, 21.0, 22.0, 32.0, 30.0, 32.0, 36.0, 37.0, 41.0, 52.0, 46.0, 41.0, 42.0, 51.0, 38.0, 38.0, 35.0, 42.0, 35.0, 35.0, 35.0, 31.0, 36.0, 28.0, 21.0, 20.0, 9.0, 13.0, 5.0, 9.0, 7.0, 4.0, 9.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.140625, -9.83349609375, -9.5263671875, -9.21923828125, -8.912109375, -8.60498046875, -8.2978515625, -7.99072265625, -7.68359375, -7.37646484375, -7.0693359375, -6.76220703125, -6.455078125, -6.14794921875, -5.8408203125, -5.53369140625, -5.2265625, -4.91943359375, -4.6123046875, -4.30517578125, -3.998046875, -3.69091796875, -3.3837890625, -3.07666015625, -2.76953125, -2.46240234375, -2.1552734375, -1.84814453125, -1.541015625, -1.23388671875, -0.9267578125, -0.61962890625, -0.3125, -0.00537109375, 0.3017578125, 0.60888671875, 0.916015625, 1.22314453125, 1.5302734375, 1.83740234375, 2.14453125, 2.45166015625, 2.7587890625, 3.06591796875, 3.373046875, 3.68017578125, 3.9873046875, 4.29443359375, 4.6015625, 4.90869140625, 5.2158203125, 5.52294921875, 5.830078125, 6.13720703125, 6.4443359375, 6.75146484375, 7.05859375, 7.36572265625, 7.6728515625, 7.97998046875, 8.287109375, 8.59423828125, 8.9013671875, 9.20849609375, 9.515625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 7.0, 11.0, 18.0, 23.0, 35.0, 33.0, 50.0, 85.0, 120.0, 191.0, 303.0, 459.0, 749.0, 1241.0, 2518.0, 4722.0, 10694.0, 24673.0, 63423.0, 203431.0, 480439.0, 162107.0, 53682.0, 20886.0, 9206.0, 4238.0, 2064.0, 1154.0, 730.0, 442.0, 271.0, 190.0, 127.0, 61.0, 51.0, 31.0, 31.0, 21.0, 20.0, 4.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0], "bins": [-7.6015625, -7.38690185546875, -7.1722412109375, -6.95758056640625, -6.742919921875, -6.52825927734375, -6.3135986328125, -6.09893798828125, -5.88427734375, -5.66961669921875, -5.4549560546875, -5.24029541015625, -5.025634765625, -4.81097412109375, -4.5963134765625, -4.38165283203125, -4.1669921875, -3.95233154296875, -3.7376708984375, -3.52301025390625, -3.308349609375, -3.09368896484375, -2.8790283203125, -2.66436767578125, -2.44970703125, -2.23504638671875, -2.0203857421875, -1.80572509765625, -1.591064453125, -1.37640380859375, -1.1617431640625, -0.94708251953125, -0.732421875, -0.51776123046875, -0.3031005859375, -0.08843994140625, 0.126220703125, 0.34088134765625, 0.5555419921875, 0.77020263671875, 0.98486328125, 1.19952392578125, 1.4141845703125, 1.62884521484375, 1.843505859375, 2.05816650390625, 2.2728271484375, 2.48748779296875, 2.7021484375, 2.91680908203125, 3.1314697265625, 3.34613037109375, 3.560791015625, 3.77545166015625, 3.9901123046875, 4.20477294921875, 4.41943359375, 4.63409423828125, 4.8487548828125, 5.06341552734375, 5.278076171875, 5.49273681640625, 5.7073974609375, 5.92205810546875, 6.13671875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 9.0, 7.0, 11.0, 11.0, 11.0, 20.0, 13.0, 12.0, 30.0, 28.0, 32.0, 35.0, 38.0, 64.0, 59.0, 81.0, 188.0, 1685.0, 181.0, 74.0, 67.0, 58.0, 44.0, 33.0, 41.0, 31.0, 21.0, 25.0, 25.0, 18.0, 13.0, 14.0, 7.0, 8.0, 6.0, 12.0, 4.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-35.84375, -34.77294921875, -33.7021484375, -32.63134765625, -31.560546875, -30.48974609375, -29.4189453125, -28.34814453125, -27.27734375, -26.20654296875, -25.1357421875, -24.06494140625, -22.994140625, -21.92333984375, -20.8525390625, -19.78173828125, -18.7109375, -17.64013671875, -16.5693359375, -15.49853515625, -14.427734375, -13.35693359375, -12.2861328125, -11.21533203125, -10.14453125, -9.07373046875, -8.0029296875, -6.93212890625, -5.861328125, -4.79052734375, -3.7197265625, -2.64892578125, -1.578125, -0.50732421875, 0.5634765625, 1.63427734375, 2.705078125, 3.77587890625, 4.8466796875, 5.91748046875, 6.98828125, 8.05908203125, 9.1298828125, 10.20068359375, 11.271484375, 12.34228515625, 13.4130859375, 14.48388671875, 15.5546875, 16.62548828125, 17.6962890625, 18.76708984375, 19.837890625, 20.90869140625, 21.9794921875, 23.05029296875, 24.12109375, 25.19189453125, 26.2626953125, 27.33349609375, 28.404296875, 29.47509765625, 30.5458984375, 31.61669921875, 32.6875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 6.0, 12.0, 9.0, 6.0, 14.0, 22.0, 23.0, 28.0, 40.0, 65.0, 63.0, 117.0, 142.0, 162.0, 274.0, 461.0, 1464.0, 65576.0, 3069811.0, 5552.0, 761.0, 304.0, 194.0, 132.0, 99.0, 85.0, 69.0, 39.0, 40.0, 36.0, 13.0, 17.0, 14.0, 14.0, 10.0, 2.0, 11.0, 3.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-87.4375, -84.80859375, -82.1796875, -79.55078125, -76.921875, -74.29296875, -71.6640625, -69.03515625, -66.40625, -63.77734375, -61.1484375, -58.51953125, -55.890625, -53.26171875, -50.6328125, -48.00390625, -45.375, -42.74609375, -40.1171875, -37.48828125, -34.859375, -32.23046875, -29.6015625, -26.97265625, -24.34375, -21.71484375, -19.0859375, -16.45703125, -13.828125, -11.19921875, -8.5703125, -5.94140625, -3.3125, -0.68359375, 1.9453125, 4.57421875, 7.203125, 9.83203125, 12.4609375, 15.08984375, 17.71875, 20.34765625, 22.9765625, 25.60546875, 28.234375, 30.86328125, 33.4921875, 36.12109375, 38.75, 41.37890625, 44.0078125, 46.63671875, 49.265625, 51.89453125, 54.5234375, 57.15234375, 59.78125, 62.41015625, 65.0390625, 67.66796875, 70.296875, 72.92578125, 75.5546875, 78.18359375, 80.8125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [4.0, 747.0, 267.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.430574417114258, -10.227721214294434, 1.9751319885253906, 14.177984237670898, 26.38083839416504, 38.58369445800781, 50.78654479980469, 62.989402770996094, 75.19225311279297, 87.39510345458984, 99.59796142578125, 111.80081176757812, 124.003662109375, 136.20651245117188, 148.40936279296875, 160.6122283935547, 172.81507873535156, 185.01792907714844, 197.2207794189453, 209.42364501953125, 221.62649536132812, 233.829345703125, 246.03219604492188, 258.23504638671875, 270.4378967285156, 282.6407470703125, 294.8435974121094, 307.04644775390625, 319.2492980957031, 331.4521484375, 343.655029296875, 355.8578796386719, 368.0606994628906, 380.2635498046875, 392.4664001464844, 404.66925048828125, 416.8721008300781, 429.074951171875, 441.27783203125, 453.4806823730469, 465.68353271484375, 477.8863830566406, 490.0892333984375, 502.2920837402344, 514.4949340820312, 526.6978149414062, 538.900634765625, 551.103515625, 563.3063354492188, 575.5092163085938, 587.7120361328125, 599.9149169921875, 612.1177368164062, 624.3206176757812, 636.5234375, 648.726318359375, 660.92919921875, 673.132080078125, 685.3348999023438, 697.5377807617188, 709.7406005859375, 721.9434814453125, 734.1463012695312, 746.3491821289062, 758.552001953125]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 8.0, 7.0, 1.0, 7.0, 9.0, 4.0, 13.0, 16.0, 20.0, 22.0, 29.0, 29.0, 39.0, 39.0, 34.0, 38.0, 51.0, 41.0, 46.0, 45.0, 57.0, 52.0, 34.0, 45.0, 45.0, 41.0, 28.0, 34.0, 25.0, 28.0, 19.0, 24.0, 20.0, 9.0, 9.0, 11.0, 6.0, 7.0, 3.0, 5.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.43708038330078, -93.23727416992188, -90.03746032714844, -86.83765411376953, -83.6378402709961, -80.43803405761719, -77.23822021484375, -74.03841400146484, -70.83860778808594, -67.63880157470703, -64.4389877319336, -61.23918151855469, -58.03936767578125, -54.839561462402344, -51.63975143432617, -48.43994140625, -45.24012756347656, -42.04031753540039, -38.84050750732422, -35.64070129394531, -32.440887451171875, -29.241079330444336, -26.041271209716797, -22.841461181640625, -19.641651153564453, -16.44184112548828, -13.242032051086426, -10.04222297668457, -6.842412948608398, -3.6426029205322266, -0.4427947998046875, 2.7570152282714844, 5.9568328857421875, 9.15664291381836, 12.356451988220215, 15.55626106262207, 18.756071090698242, 21.955881118774414, 25.155689239501953, 28.355499267578125, 31.555309295654297, 34.75511932373047, 37.95492935180664, 41.15473937988281, 44.35454559326172, 47.554359436035156, 50.75416564941406, 53.953975677490234, 57.153785705566406, 60.35359573364258, 63.55340576171875, 66.75321197509766, 69.9530258178711, 73.15283203125, 76.35264587402344, 79.55245208740234, 82.75225830078125, 85.95206451416016, 89.1518783569336, 92.3516845703125, 95.55149841308594, 98.75130462646484, 101.95111083984375, 105.15092468261719, 108.35073852539062]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 5.0, 1.0, 4.0, 6.0, 11.0, 10.0, 9.0, 20.0, 13.0, 20.0, 19.0, 25.0, 30.0, 19.0, 32.0, 47.0, 40.0, 39.0, 44.0, 33.0, 58.0, 35.0, 30.0, 37.0, 43.0, 34.0, 34.0, 38.0, 34.0, 23.0, 33.0, 28.0, 23.0, 22.0, 22.0, 14.0, 15.0, 10.0, 7.0, 5.0, 11.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.1875, -9.8929443359375, -9.598388671875, -9.3038330078125, -9.00927734375, -8.7147216796875, -8.420166015625, -8.1256103515625, -7.8310546875, -7.5364990234375, -7.241943359375, -6.9473876953125, -6.65283203125, -6.3582763671875, -6.063720703125, -5.7691650390625, -5.474609375, -5.1800537109375, -4.885498046875, -4.5909423828125, -4.29638671875, -4.0018310546875, -3.707275390625, -3.4127197265625, -3.1181640625, -2.8236083984375, -2.529052734375, -2.2344970703125, -1.93994140625, -1.6453857421875, -1.350830078125, -1.0562744140625, -0.76171875, -0.4671630859375, -0.172607421875, 0.1219482421875, 0.41650390625, 0.7110595703125, 1.005615234375, 1.3001708984375, 1.5947265625, 1.8892822265625, 2.183837890625, 2.4783935546875, 2.77294921875, 3.0675048828125, 3.362060546875, 3.6566162109375, 3.951171875, 4.2457275390625, 4.540283203125, 4.8348388671875, 5.12939453125, 5.4239501953125, 5.718505859375, 6.0130615234375, 6.3076171875, 6.6021728515625, 6.896728515625, 7.1912841796875, 7.48583984375, 7.7803955078125, 8.074951171875, 8.3695068359375, 8.6640625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 9.0, 8.0, 10.0, 13.0, 13.0, 19.0, 17.0, 15.0, 24.0, 20.0, 46.0, 57.0, 97.0, 110.0, 192.0, 352.0, 1008.0, 5421.0, 133264.0, 3558221.0, 483347.0, 9475.0, 1385.0, 421.0, 191.0, 132.0, 101.0, 59.0, 48.0, 31.0, 21.0, 25.0, 23.0, 22.0, 15.0, 11.0, 7.0, 8.0, 7.0, 6.0, 7.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-38.71875, -37.6005859375, -36.482421875, -35.3642578125, -34.24609375, -33.1279296875, -32.009765625, -30.8916015625, -29.7734375, -28.6552734375, -27.537109375, -26.4189453125, -25.30078125, -24.1826171875, -23.064453125, -21.9462890625, -20.828125, -19.7099609375, -18.591796875, -17.4736328125, -16.35546875, -15.2373046875, -14.119140625, -13.0009765625, -11.8828125, -10.7646484375, -9.646484375, -8.5283203125, -7.41015625, -6.2919921875, -5.173828125, -4.0556640625, -2.9375, -1.8193359375, -0.701171875, 0.4169921875, 1.53515625, 2.6533203125, 3.771484375, 4.8896484375, 6.0078125, 7.1259765625, 8.244140625, 9.3623046875, 10.48046875, 11.5986328125, 12.716796875, 13.8349609375, 14.953125, 16.0712890625, 17.189453125, 18.3076171875, 19.42578125, 20.5439453125, 21.662109375, 22.7802734375, 23.8984375, 25.0166015625, 26.134765625, 27.2529296875, 28.37109375, 29.4892578125, 30.607421875, 31.7255859375, 32.84375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 6.0, 5.0, 8.0, 16.0, 24.0, 22.0, 46.0, 67.0, 89.0, 119.0, 195.0, 279.0, 460.0, 604.0, 608.0, 504.0, 345.0, 221.0, 152.0, 93.0, 64.0, 49.0, 31.0, 23.0, 9.0, 7.0, 10.0, 10.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-33.09375, -32.3271484375, -31.560546875, -30.7939453125, -30.02734375, -29.2607421875, -28.494140625, -27.7275390625, -26.9609375, -26.1943359375, -25.427734375, -24.6611328125, -23.89453125, -23.1279296875, -22.361328125, -21.5947265625, -20.828125, -20.0615234375, -19.294921875, -18.5283203125, -17.76171875, -16.9951171875, -16.228515625, -15.4619140625, -14.6953125, -13.9287109375, -13.162109375, -12.3955078125, -11.62890625, -10.8623046875, -10.095703125, -9.3291015625, -8.5625, -7.7958984375, -7.029296875, -6.2626953125, -5.49609375, -4.7294921875, -3.962890625, -3.1962890625, -2.4296875, -1.6630859375, -0.896484375, -0.1298828125, 0.63671875, 1.4033203125, 2.169921875, 2.9365234375, 3.703125, 4.4697265625, 5.236328125, 6.0029296875, 6.76953125, 7.5361328125, 8.302734375, 9.0693359375, 9.8359375, 10.6025390625, 11.369140625, 12.1357421875, 12.90234375, 13.6689453125, 14.435546875, 15.2021484375, 15.96875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 9.0, 7.0, 11.0, 14.0, 16.0, 25.0, 34.0, 68.0, 76.0, 78.0, 124.0, 234.0, 412.0, 1263.0, 43551.0, 4134332.0, 12045.0, 923.0, 385.0, 208.0, 129.0, 97.0, 62.0, 47.0, 39.0, 23.0, 15.0, 12.0, 9.0, 9.0, 7.0, 5.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.625, -93.22265625, -89.8203125, -86.41796875, -83.015625, -79.61328125, -76.2109375, -72.80859375, -69.40625, -66.00390625, -62.6015625, -59.19921875, -55.796875, -52.39453125, -48.9921875, -45.58984375, -42.1875, -38.78515625, -35.3828125, -31.98046875, -28.578125, -25.17578125, -21.7734375, -18.37109375, -14.96875, -11.56640625, -8.1640625, -4.76171875, -1.359375, 2.04296875, 5.4453125, 8.84765625, 12.25, 15.65234375, 19.0546875, 22.45703125, 25.859375, 29.26171875, 32.6640625, 36.06640625, 39.46875, 42.87109375, 46.2734375, 49.67578125, 53.078125, 56.48046875, 59.8828125, 63.28515625, 66.6875, 70.08984375, 73.4921875, 76.89453125, 80.296875, 83.69921875, 87.1015625, 90.50390625, 93.90625, 97.30859375, 100.7109375, 104.11328125, 107.515625, 110.91796875, 114.3203125, 117.72265625, 121.125]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 67.0, 159.0, 326.0, 292.0, 110.0, 38.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.42677307128906, -134.02392578125, -127.6210708618164, -121.21821594238281, -114.81536865234375, -108.41252136230469, -102.0096664428711, -95.6068115234375, -89.20396423339844, -82.80111694335938, -76.39826202392578, -69.99540710449219, -63.592559814453125, -57.1897087097168, -50.78685760498047, -44.38400650024414, -37.98115539550781, -31.578304290771484, -25.175453186035156, -18.772602081298828, -12.3697509765625, -5.966899871826172, 0.43595123291015625, 6.838802337646484, 13.241653442382812, 19.64450454711914, 26.04735565185547, 32.4502067565918, 38.853057861328125, 45.25590896606445, 51.65876007080078, 58.06161117553711, 64.46444702148438, 70.86729431152344, 77.27014923095703, 83.67300415039062, 90.07585144042969, 96.47869873046875, 102.88155364990234, 109.28440856933594, 115.687255859375, 122.09010314941406, 128.49295043945312, 134.89581298828125, 141.2986602783203, 147.70150756835938, 154.1043701171875, 160.50721740722656, 166.91006469726562, 173.3129119873047, 179.71575927734375, 186.11862182617188, 192.52146911621094, 198.92431640625, 205.32717895507812, 211.7300262451172, 218.13287353515625, 224.5357208251953, 230.93856811523438, 237.3414306640625, 243.74427795410156, 250.14712524414062, 256.54998779296875, 262.95281982421875, 269.3556823730469]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 7.0, 6.0, 10.0, 7.0, 12.0, 7.0, 12.0, 11.0, 13.0, 16.0, 19.0, 13.0, 17.0, 26.0, 19.0, 28.0, 30.0, 28.0, 31.0, 25.0, 24.0, 24.0, 34.0, 39.0, 38.0, 24.0, 27.0, 38.0, 35.0, 41.0, 30.0, 35.0, 23.0, 27.0, 25.0, 19.0, 20.0, 24.0, 24.0, 23.0, 16.0, 12.0, 10.0, 14.0, 11.0, 11.0, 8.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-59.25963592529297, -57.50947570800781, -55.759315490722656, -54.0091552734375, -52.25899887084961, -50.50883865356445, -48.7586784362793, -47.00851821899414, -45.25836181640625, -43.508201599121094, -41.75804138183594, -40.00788116455078, -38.25772476196289, -36.507564544677734, -34.75740432739258, -33.00724411010742, -31.257083892822266, -29.50692367553711, -27.756765365600586, -26.00660514831543, -24.256446838378906, -22.50628662109375, -20.756126403808594, -19.005966186523438, -17.255807876586914, -15.505648612976074, -13.755489349365234, -12.005329132080078, -10.255169868469238, -8.505010604858398, -6.754850387573242, -5.004691123962402, -3.254535675048828, -1.5043761730194092, 0.24578332901000977, 1.9959430694580078, 3.7461023330688477, 5.4962615966796875, 7.246421813964844, 8.996581077575684, 10.746740341186523, 12.496899604797363, 14.247058868408203, 15.99721908569336, 17.747379302978516, 19.49753761291504, 21.247697830200195, 22.99785614013672, 24.748016357421875, 26.49817657470703, 28.248334884643555, 29.99849510192871, 31.748653411865234, 33.49881362915039, 35.24897384643555, 36.9991340637207, 38.749290466308594, 40.49945068359375, 42.249610900878906, 43.99977111816406, 45.74992752075195, 47.50008773803711, 49.250247955322266, 51.00040817260742, 52.75056838989258]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 6.0, 8.0, 7.0, 9.0, 14.0, 15.0, 14.0, 23.0, 30.0, 26.0, 29.0, 43.0, 39.0, 49.0, 45.0, 46.0, 44.0, 42.0, 41.0, 47.0, 37.0, 51.0, 34.0, 43.0, 41.0, 41.0, 32.0, 25.0, 30.0, 18.0, 12.0, 10.0, 13.0, 8.0, 13.0, 4.0, 4.0, 0.0, 2.0, 6.0], "bins": [-14.34375, -14.00152587890625, -13.6593017578125, -13.31707763671875, -12.974853515625, -12.63262939453125, -12.2904052734375, -11.94818115234375, -11.60595703125, -11.26373291015625, -10.9215087890625, -10.57928466796875, -10.237060546875, -9.89483642578125, -9.5526123046875, -9.21038818359375, -8.8681640625, -8.52593994140625, -8.1837158203125, -7.84149169921875, -7.499267578125, -7.15704345703125, -6.8148193359375, -6.47259521484375, -6.13037109375, -5.78814697265625, -5.4459228515625, -5.10369873046875, -4.761474609375, -4.41925048828125, -4.0770263671875, -3.73480224609375, -3.392578125, -3.05035400390625, -2.7081298828125, -2.36590576171875, -2.023681640625, -1.68145751953125, -1.3392333984375, -0.99700927734375, -0.65478515625, -0.31256103515625, 0.0296630859375, 0.37188720703125, 0.714111328125, 1.05633544921875, 1.3985595703125, 1.74078369140625, 2.0830078125, 2.42523193359375, 2.7674560546875, 3.10968017578125, 3.451904296875, 3.79412841796875, 4.1363525390625, 4.47857666015625, 4.82080078125, 5.16302490234375, 5.5052490234375, 5.84747314453125, 6.189697265625, 6.53192138671875, 6.8741455078125, 7.21636962890625, 7.55859375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 9.0, 11.0, 13.0, 14.0, 21.0, 46.0, 79.0, 112.0, 187.0, 306.0, 526.0, 1055.0, 1753.0, 3056.0, 5695.0, 10583.0, 20432.0, 40585.0, 85994.0, 215270.0, 410357.0, 131673.0, 59362.0, 29183.0, 14761.0, 7851.0, 4193.0, 2283.0, 1307.0, 753.0, 448.0, 223.0, 140.0, 101.0, 65.0, 34.0, 28.0, 9.0, 8.0, 10.0, 8.0, 8.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.73046875, -2.640228271484375, -2.54998779296875, -2.459747314453125, -2.3695068359375, -2.279266357421875, -2.18902587890625, -2.098785400390625, -2.008544921875, -1.918304443359375, -1.82806396484375, -1.737823486328125, -1.6475830078125, -1.557342529296875, -1.46710205078125, -1.376861572265625, -1.28662109375, -1.196380615234375, -1.10614013671875, -1.015899658203125, -0.9256591796875, -0.835418701171875, -0.74517822265625, -0.654937744140625, -0.564697265625, -0.474456787109375, -0.38421630859375, -0.293975830078125, -0.2037353515625, -0.113494873046875, -0.02325439453125, 0.066986083984375, 0.1572265625, 0.247467041015625, 0.33770751953125, 0.427947998046875, 0.5181884765625, 0.608428955078125, 0.69866943359375, 0.788909912109375, 0.879150390625, 0.969390869140625, 1.05963134765625, 1.149871826171875, 1.2401123046875, 1.330352783203125, 1.42059326171875, 1.510833740234375, 1.60107421875, 1.691314697265625, 1.78155517578125, 1.871795654296875, 1.9620361328125, 2.052276611328125, 2.14251708984375, 2.232757568359375, 2.322998046875, 2.413238525390625, 2.50347900390625, 2.593719482421875, 2.6839599609375, 2.774200439453125, 2.86444091796875, 2.954681396484375, 3.044921875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 10.0, 6.0, 3.0, 7.0, 12.0, 7.0, 9.0, 22.0, 14.0, 19.0, 17.0, 19.0, 18.0, 30.0, 30.0, 28.0, 32.0, 37.0, 33.0, 44.0, 26.0, 1063.0, 38.0, 43.0, 44.0, 36.0, 29.0, 38.0, 42.0, 48.0, 21.0, 28.0, 26.0, 16.0, 23.0, 15.0, 16.0, 20.0, 9.0, 14.0, 6.0, 8.0, 10.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.67578125, -5.4913330078125, -5.306884765625, -5.1224365234375, -4.93798828125, -4.7535400390625, -4.569091796875, -4.3846435546875, -4.2001953125, -4.0157470703125, -3.831298828125, -3.6468505859375, -3.46240234375, -3.2779541015625, -3.093505859375, -2.9090576171875, -2.724609375, -2.5401611328125, -2.355712890625, -2.1712646484375, -1.98681640625, -1.8023681640625, -1.617919921875, -1.4334716796875, -1.2490234375, -1.0645751953125, -0.880126953125, -0.6956787109375, -0.51123046875, -0.3267822265625, -0.142333984375, 0.0421142578125, 0.2265625, 0.4110107421875, 0.595458984375, 0.7799072265625, 0.96435546875, 1.1488037109375, 1.333251953125, 1.5177001953125, 1.7021484375, 1.8865966796875, 2.071044921875, 2.2554931640625, 2.43994140625, 2.6243896484375, 2.808837890625, 2.9932861328125, 3.177734375, 3.3621826171875, 3.546630859375, 3.7310791015625, 3.91552734375, 4.0999755859375, 4.284423828125, 4.4688720703125, 4.6533203125, 4.8377685546875, 5.022216796875, 5.2066650390625, 5.39111328125, 5.5755615234375, 5.760009765625, 5.9444580078125, 6.12890625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 6.0, 12.0, 10.0, 19.0, 16.0, 27.0, 44.0, 52.0, 106.0, 135.0, 182.0, 268.0, 419.0, 609.0, 908.0, 1234.0, 1935.0, 2926.0, 4306.0, 6573.0, 9635.0, 14558.0, 22070.0, 34580.0, 55524.0, 96282.0, 211056.0, 1339627.0, 116784.0, 64762.0, 39346.0, 24741.0, 16155.0, 10723.0, 7191.0, 4722.0, 3223.0, 2067.0, 1426.0, 967.0, 575.0, 425.0, 298.0, 178.0, 137.0, 99.0, 63.0, 40.0, 33.0, 19.0, 11.0, 12.0, 4.0, 7.0, 5.0, 3.0, 1.0, 2.0], "bins": [-1.8408203125, -1.7852935791015625, -1.729766845703125, -1.6742401123046875, -1.61871337890625, -1.5631866455078125, -1.507659912109375, -1.4521331787109375, -1.3966064453125, -1.3410797119140625, -1.285552978515625, -1.2300262451171875, -1.17449951171875, -1.1189727783203125, -1.063446044921875, -1.0079193115234375, -0.952392578125, -0.8968658447265625, -0.841339111328125, -0.7858123779296875, -0.73028564453125, -0.6747589111328125, -0.619232177734375, -0.5637054443359375, -0.5081787109375, -0.4526519775390625, -0.397125244140625, -0.3415985107421875, -0.28607177734375, -0.2305450439453125, -0.175018310546875, -0.1194915771484375, -0.06396484375, -0.0084381103515625, 0.047088623046875, 0.1026153564453125, 0.15814208984375, 0.2136688232421875, 0.269195556640625, 0.3247222900390625, 0.3802490234375, 0.4357757568359375, 0.491302490234375, 0.5468292236328125, 0.60235595703125, 0.6578826904296875, 0.713409423828125, 0.7689361572265625, 0.824462890625, 0.8799896240234375, 0.935516357421875, 0.9910430908203125, 1.04656982421875, 1.1020965576171875, 1.157623291015625, 1.2131500244140625, 1.2686767578125, 1.3242034912109375, 1.379730224609375, 1.4352569580078125, 1.49078369140625, 1.5463104248046875, 1.601837158203125, 1.6573638916015625, 1.712890625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 8.0, 14.0, 11.0, 8.0, 7.0, 18.0, 15.0, 26.0, 35.0, 43.0, 47.0, 58.0, 74.0, 84.0, 96.0, 93.0, 73.0, 68.0, 50.0, 42.0, 32.0, 17.0, 16.0, 16.0, 14.0, 11.0, 5.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0014486312866210938, -0.0014041811227798462, -0.0013597309589385986, -0.001315280795097351, -0.0012708306312561035, -0.001226380467414856, -0.0011819303035736084, -0.0011374801397323608, -0.0010930299758911133, -0.0010485798120498657, -0.0010041296482086182, -0.0009596794843673706, -0.000915229320526123, -0.0008707791566848755, -0.0008263289928436279, -0.0007818788290023804, -0.0007374286651611328, -0.0006929785013198853, -0.0006485283374786377, -0.0006040781736373901, -0.0005596280097961426, -0.000515177845954895, -0.00047072768211364746, -0.0004262775182723999, -0.00038182735443115234, -0.0003373771905899048, -0.0002929270267486572, -0.00024847686290740967, -0.0002040266990661621, -0.00015957653522491455, -0.00011512637138366699, -7.067620754241943e-05, -2.6226043701171875e-05, 1.8224120140075684e-05, 6.267428398132324e-05, 0.0001071244478225708, 0.00015157461166381836, 0.00019602477550506592, 0.00024047493934631348, 0.00028492510318756104, 0.0003293752670288086, 0.00037382543087005615, 0.0004182755947113037, 0.00046272575855255127, 0.0005071759223937988, 0.0005516260862350464, 0.0005960762500762939, 0.0006405264139175415, 0.0006849765777587891, 0.0007294267416000366, 0.0007738769054412842, 0.0008183270692825317, 0.0008627772331237793, 0.0009072273969650269, 0.0009516775608062744, 0.000996127724647522, 0.0010405778884887695, 0.001085028052330017, 0.0011294782161712646, 0.0011739283800125122, 0.0012183785438537598, 0.0012628287076950073, 0.0013072788715362549, 0.0013517290353775024, 0.00139617919921875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 11.0, 19.0, 20.0, 13.0, 21.0, 34.0, 64.0, 107.0, 170.0, 528.0, 16779.0, 1028892.0, 1203.0, 282.0, 116.0, 86.0, 44.0, 37.0, 23.0, 18.0, 18.0, 7.0, 8.0, 12.0, 8.0, 9.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0347900390625, -0.0336766242980957, -0.032563209533691406, -0.03144979476928711, -0.030336380004882812, -0.029222965240478516, -0.02810955047607422, -0.026996135711669922, -0.025882720947265625, -0.024769306182861328, -0.02365589141845703, -0.022542476654052734, -0.021429061889648438, -0.02031564712524414, -0.019202232360839844, -0.018088817596435547, -0.01697540283203125, -0.015861988067626953, -0.014748573303222656, -0.01363515853881836, -0.012521743774414062, -0.011408329010009766, -0.010294914245605469, -0.009181499481201172, -0.008068084716796875, -0.006954669952392578, -0.005841255187988281, -0.004727840423583984, -0.0036144256591796875, -0.0025010108947753906, -0.0013875961303710938, -0.0002741813659667969, 0.0008392333984375, 0.0019526481628417969, 0.0030660629272460938, 0.004179477691650391, 0.0052928924560546875, 0.006406307220458984, 0.007519721984863281, 0.008633136749267578, 0.009746551513671875, 0.010859966278076172, 0.011973381042480469, 0.013086795806884766, 0.014200210571289062, 0.01531362533569336, 0.016427040100097656, 0.017540454864501953, 0.01865386962890625, 0.019767284393310547, 0.020880699157714844, 0.02199411392211914, 0.023107528686523438, 0.024220943450927734, 0.02533435821533203, 0.026447772979736328, 0.027561187744140625, 0.028674602508544922, 0.02978801727294922, 0.030901432037353516, 0.03201484680175781, 0.03312826156616211, 0.034241676330566406, 0.0353550910949707, 0.036468505859375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 83.0, 549.0, 349.0, 29.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000771817984059453, -0.0006589174154214561, -0.0005460168467834592, -0.0004331162781454623, -0.00032021570950746536, -0.00020731514086946845, -9.441457223147154e-05, 1.8485996406525373e-05, 0.00013138656504452229, 0.0002442871336825192, 0.0003571877023205161, 0.000470088270958513, 0.0005829888395965099, 0.0006958894082345068, 0.0008087899768725038, 0.0009216905455105007, 0.0010345911141484976, 0.0011474916245788336, 0.0012603922514244914, 0.0013732928782701492, 0.0014861933887004852, 0.0015990938991308212, 0.001711994525976479, 0.0018248951528221369, 0.0019377956632524729, 0.002050696173682809, 0.0021635969169437885, 0.0022764974273741245, 0.0023893979378044605, 0.0025022984482347965, 0.0026151989586651325, 0.002728099701926112, 0.002841000445187092, 0.002953900955617428, 0.003066801466047764, 0.0031797022093087435, 0.0032926027197390795, 0.0034055032301694155, 0.003518403973430395, 0.003631304483860731, 0.003744204994291067, 0.003857105504721403, 0.003970006015151739, 0.004082906525582075, 0.004195807501673698, 0.004308708012104034, 0.00442160852253437, 0.004534509032964706, 0.004647409543395042, 0.004760310053825378, 0.004873210564255714, 0.00498611107468605, 0.005099011585116386, 0.00521191256120801, 0.005324813071638346, 0.005437713582068682, 0.005550614092499018, 0.005663514602929354, 0.00577641511335969, 0.005889315623790026, 0.006002216599881649, 0.006115117110311985, 0.006228017620742321, 0.006340918131172657, 0.006453818641602993]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 3.0, 6.0, 10.0, 4.0, 11.0, 7.0, 12.0, 11.0, 15.0, 11.0, 19.0, 27.0, 29.0, 30.0, 31.0, 36.0, 38.0, 35.0, 50.0, 35.0, 54.0, 50.0, 43.0, 41.0, 40.0, 49.0, 34.0, 37.0, 27.0, 26.0, 23.0, 27.0, 29.0, 18.0, 23.0, 13.0, 15.0, 7.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006404519081115723, -0.000621275044977665, -0.0006020981818437576, -0.0005829213187098503, -0.000563744455575943, -0.0005445675924420357, -0.0005253907293081284, -0.000506213866174221, -0.0004870370030403137, -0.0004678601399064064, -0.0004486832767724991, -0.00042950641363859177, -0.00041032955050468445, -0.00039115268737077713, -0.0003719758242368698, -0.0003527989611029625, -0.0003336220979690552, -0.00031444523483514786, -0.00029526837170124054, -0.0002760915085673332, -0.0002569146454334259, -0.00023773778229951859, -0.00021856091916561127, -0.00019938405603170395, -0.00018020719289779663, -0.0001610303297638893, -0.000141853466629982, -0.00012267660349607468, -0.00010349974036216736, -8.432287722826004e-05, -6.514601409435272e-05, -4.5969150960445404e-05, -2.6792287826538086e-05, -7.615424692630768e-06, 1.156143844127655e-05, 3.073830157518387e-05, 4.9915164709091187e-05, 6.90920278429985e-05, 8.826889097690582e-05, 0.00010744575411081314, 0.00012662261724472046, 0.00014579948037862778, 0.0001649763435125351, 0.0001841532066464424, 0.00020333006978034973, 0.00022250693291425705, 0.00024168379604816437, 0.0002608606591820717, 0.000280037522315979, 0.0002992143854498863, 0.00031839124858379364, 0.00033756811171770096, 0.0003567449748516083, 0.0003759218379855156, 0.0003950987011194229, 0.00041427556425333023, 0.00043345242738723755, 0.00045262929052114487, 0.0004718061536550522, 0.0004909830167889595, 0.0005101598799228668, 0.0005293367430567741, 0.0005485136061906815, 0.0005676904693245888, 0.0005868673324584961]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 6.0, 8.0, 7.0, 9.0, 14.0, 15.0, 14.0, 23.0, 30.0, 26.0, 29.0, 43.0, 39.0, 50.0, 44.0, 46.0, 44.0, 42.0, 41.0, 47.0, 37.0, 51.0, 34.0, 43.0, 41.0, 41.0, 32.0, 25.0, 30.0, 18.0, 12.0, 10.0, 13.0, 8.0, 13.0, 4.0, 4.0, 0.0, 2.0, 6.0], "bins": [-14.34375, -14.00152587890625, -13.6593017578125, -13.31707763671875, -12.974853515625, -12.63262939453125, -12.2904052734375, -11.94818115234375, -11.60595703125, -11.26373291015625, -10.9215087890625, -10.57928466796875, -10.237060546875, -9.89483642578125, -9.5526123046875, -9.21038818359375, -8.8681640625, -8.52593994140625, -8.1837158203125, -7.84149169921875, -7.499267578125, -7.15704345703125, -6.8148193359375, -6.47259521484375, -6.13037109375, -5.78814697265625, -5.4459228515625, -5.10369873046875, -4.761474609375, -4.41925048828125, -4.0770263671875, -3.73480224609375, -3.392578125, -3.05035400390625, -2.7081298828125, -2.36590576171875, -2.023681640625, -1.68145751953125, -1.3392333984375, -0.99700927734375, -0.65478515625, -0.31256103515625, 0.0296630859375, 0.37188720703125, 0.714111328125, 1.05633544921875, 1.3985595703125, 1.74078369140625, 2.0830078125, 2.42523193359375, 2.7674560546875, 3.10968017578125, 3.451904296875, 3.79412841796875, 4.1363525390625, 4.47857666015625, 4.82080078125, 5.16302490234375, 5.5052490234375, 5.84747314453125, 6.189697265625, 6.53192138671875, 6.8741455078125, 7.21636962890625, 7.55859375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 10.0, 11.0, 14.0, 32.0, 31.0, 36.0, 59.0, 86.0, 140.0, 202.0, 279.0, 469.0, 730.0, 1339.0, 2492.0, 6501.0, 24827.0, 195278.0, 718116.0, 75456.0, 13488.0, 4175.0, 1963.0, 1014.0, 640.0, 392.0, 251.0, 150.0, 106.0, 78.0, 59.0, 38.0, 31.0, 24.0, 9.0, 15.0, 13.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.859375, -17.3533935546875, -16.847412109375, -16.3414306640625, -15.83544921875, -15.3294677734375, -14.823486328125, -14.3175048828125, -13.8115234375, -13.3055419921875, -12.799560546875, -12.2935791015625, -11.78759765625, -11.2816162109375, -10.775634765625, -10.2696533203125, -9.763671875, -9.2576904296875, -8.751708984375, -8.2457275390625, -7.73974609375, -7.2337646484375, -6.727783203125, -6.2218017578125, -5.7158203125, -5.2098388671875, -4.703857421875, -4.1978759765625, -3.69189453125, -3.1859130859375, -2.679931640625, -2.1739501953125, -1.66796875, -1.1619873046875, -0.656005859375, -0.1500244140625, 0.35595703125, 0.8619384765625, 1.367919921875, 1.8739013671875, 2.3798828125, 2.8858642578125, 3.391845703125, 3.8978271484375, 4.40380859375, 4.9097900390625, 5.415771484375, 5.9217529296875, 6.427734375, 6.9337158203125, 7.439697265625, 7.9456787109375, 8.45166015625, 8.9576416015625, 9.463623046875, 9.9696044921875, 10.4755859375, 10.9815673828125, 11.487548828125, 11.9935302734375, 12.49951171875, 13.0054931640625, 13.511474609375, 14.0174560546875, 14.5234375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 4.0, 2.0, 8.0, 8.0, 12.0, 23.0, 13.0, 21.0, 29.0, 26.0, 34.0, 37.0, 31.0, 43.0, 42.0, 54.0, 65.0, 180.0, 1709.0, 212.0, 82.0, 58.0, 45.0, 45.0, 39.0, 41.0, 28.0, 17.0, 30.0, 20.0, 15.0, 13.0, 8.0, 9.0, 13.0, 8.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.3125, -31.25439453125, -30.1962890625, -29.13818359375, -28.080078125, -27.02197265625, -25.9638671875, -24.90576171875, -23.84765625, -22.78955078125, -21.7314453125, -20.67333984375, -19.615234375, -18.55712890625, -17.4990234375, -16.44091796875, -15.3828125, -14.32470703125, -13.2666015625, -12.20849609375, -11.150390625, -10.09228515625, -9.0341796875, -7.97607421875, -6.91796875, -5.85986328125, -4.8017578125, -3.74365234375, -2.685546875, -1.62744140625, -0.5693359375, 0.48876953125, 1.546875, 2.60498046875, 3.6630859375, 4.72119140625, 5.779296875, 6.83740234375, 7.8955078125, 8.95361328125, 10.01171875, 11.06982421875, 12.1279296875, 13.18603515625, 14.244140625, 15.30224609375, 16.3603515625, 17.41845703125, 18.4765625, 19.53466796875, 20.5927734375, 21.65087890625, 22.708984375, 23.76708984375, 24.8251953125, 25.88330078125, 26.94140625, 27.99951171875, 29.0576171875, 30.11572265625, 31.173828125, 32.23193359375, 33.2900390625, 34.34814453125, 35.40625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 10.0, 10.0, 19.0, 28.0, 23.0, 43.0, 67.0, 93.0, 174.0, 277.0, 548.0, 2565.0, 3038637.0, 100873.0, 1243.0, 439.0, 198.0, 128.0, 95.0, 80.0, 50.0, 33.0, 15.0, 11.0, 11.0, 15.0, 6.0, 10.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-135.875, -132.083984375, -128.29296875, -124.501953125, -120.7109375, -116.919921875, -113.12890625, -109.337890625, -105.546875, -101.755859375, -97.96484375, -94.173828125, -90.3828125, -86.591796875, -82.80078125, -79.009765625, -75.21875, -71.427734375, -67.63671875, -63.845703125, -60.0546875, -56.263671875, -52.47265625, -48.681640625, -44.890625, -41.099609375, -37.30859375, -33.517578125, -29.7265625, -25.935546875, -22.14453125, -18.353515625, -14.5625, -10.771484375, -6.98046875, -3.189453125, 0.6015625, 4.392578125, 8.18359375, 11.974609375, 15.765625, 19.556640625, 23.34765625, 27.138671875, 30.9296875, 34.720703125, 38.51171875, 42.302734375, 46.09375, 49.884765625, 53.67578125, 57.466796875, 61.2578125, 65.048828125, 68.83984375, 72.630859375, 76.421875, 80.212890625, 84.00390625, 87.794921875, 91.5859375, 95.376953125, 99.16796875, 102.958984375, 106.75]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 16.0, 263.0, 658.0, 77.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.21563720703125, -40.60871505737305, -33.001792907714844, -25.394868850708008, -17.787946701049805, -10.181022644042969, -2.5741004943847656, 5.0328216552734375, 12.63974380493164, 20.246665954589844, 27.853588104248047, 35.46051025390625, 43.06743621826172, 50.67435836791992, 58.281280517578125, 65.88819885253906, 73.49512481689453, 81.10205078125, 88.70896911621094, 96.3158950805664, 103.92281341552734, 111.52973937988281, 119.13665771484375, 126.74358367919922, 134.3505096435547, 141.95742797851562, 149.56436157226562, 157.17127990722656, 164.7781982421875, 172.3851318359375, 179.99205017089844, 187.59896850585938, 195.2058868408203, 202.81280517578125, 210.41973876953125, 218.0266571044922, 225.63357543945312, 233.24050903320312, 240.84742736816406, 248.454345703125, 256.061279296875, 263.668212890625, 271.2751159667969, 278.8820495605469, 286.4889831542969, 294.09588623046875, 301.70281982421875, 309.30975341796875, 316.9166564941406, 324.5235900878906, 332.1304931640625, 339.7374267578125, 347.3443603515625, 354.9512634277344, 362.5581970214844, 370.16510009765625, 377.77203369140625, 385.37896728515625, 392.9858703613281, 400.5928039550781, 408.1997375488281, 415.806640625, 423.41357421875, 431.0205078125, 438.6274108886719]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 3.0, 8.0, 8.0, 4.0, 9.0, 8.0, 22.0, 14.0, 15.0, 24.0, 25.0, 20.0, 21.0, 31.0, 39.0, 38.0, 41.0, 42.0, 39.0, 42.0, 49.0, 40.0, 39.0, 39.0, 32.0, 43.0, 51.0, 34.0, 29.0, 36.0, 17.0, 32.0, 18.0, 18.0, 14.0, 13.0, 10.0, 11.0, 2.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-102.98809814453125, -100.13245391845703, -97.27680206298828, -94.42115783691406, -91.56550598144531, -88.7098617553711, -85.85420989990234, -82.99856567382812, -80.14291381835938, -77.28726959228516, -74.4316177368164, -71.57597351074219, -68.72032165527344, -65.86467742919922, -63.00902557373047, -60.15338134765625, -57.297733306884766, -54.44208526611328, -51.5864372253418, -48.73078918457031, -45.87514114379883, -43.019493103027344, -40.163848876953125, -37.308197021484375, -34.452552795410156, -31.596904754638672, -28.741256713867188, -25.885608673095703, -23.02996063232422, -20.174312591552734, -17.318666458129883, -14.463018417358398, -11.607368469238281, -8.751720428466797, -5.896072864532471, -3.0404253005981445, -0.18477725982666016, 2.670870780944824, 5.526517868041992, 8.382165908813477, 11.237813949584961, 14.093461990356445, 16.94911003112793, 19.80475616455078, 22.660404205322266, 25.51605224609375, 28.371700286865234, 31.22734832763672, 34.0829963684082, 36.93864440917969, 39.79429244995117, 42.649940490722656, 45.50558853149414, 48.361236572265625, 51.216880798339844, 54.072532653808594, 56.92817687988281, 59.7838249206543, 62.63947296142578, 65.4951171875, 68.35076904296875, 71.20641326904297, 74.06206512451172, 76.91770935058594, 79.77336120605469]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 9.0, 7.0, 5.0, 6.0, 13.0, 12.0, 14.0, 24.0, 28.0, 17.0, 39.0, 41.0, 35.0, 45.0, 39.0, 43.0, 44.0, 49.0, 36.0, 46.0, 55.0, 41.0, 42.0, 48.0, 30.0, 37.0, 39.0, 32.0, 18.0, 27.0, 15.0, 17.0, 14.0, 6.0, 7.0, 8.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0], "bins": [-15.140625, -14.7657470703125, -14.390869140625, -14.0159912109375, -13.64111328125, -13.2662353515625, -12.891357421875, -12.5164794921875, -12.1416015625, -11.7667236328125, -11.391845703125, -11.0169677734375, -10.64208984375, -10.2672119140625, -9.892333984375, -9.5174560546875, -9.142578125, -8.7677001953125, -8.392822265625, -8.0179443359375, -7.64306640625, -7.2681884765625, -6.893310546875, -6.5184326171875, -6.1435546875, -5.7686767578125, -5.393798828125, -5.0189208984375, -4.64404296875, -4.2691650390625, -3.894287109375, -3.5194091796875, -3.14453125, -2.7696533203125, -2.394775390625, -2.0198974609375, -1.64501953125, -1.2701416015625, -0.895263671875, -0.5203857421875, -0.1455078125, 0.2293701171875, 0.604248046875, 0.9791259765625, 1.35400390625, 1.7288818359375, 2.103759765625, 2.4786376953125, 2.853515625, 3.2283935546875, 3.603271484375, 3.9781494140625, 4.35302734375, 4.7279052734375, 5.102783203125, 5.4776611328125, 5.8525390625, 6.2274169921875, 6.602294921875, 6.9771728515625, 7.35205078125, 7.7269287109375, 8.101806640625, 8.4766845703125, 8.8515625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 5.0, 5.0, 9.0, 4.0, 7.0, 6.0, 10.0, 14.0, 15.0, 20.0, 25.0, 24.0, 41.0, 43.0, 54.0, 67.0, 198.0, 615.0, 3680.0, 131710.0, 3871048.0, 181646.0, 3923.0, 606.0, 175.0, 59.0, 49.0, 31.0, 41.0, 31.0, 25.0, 20.0, 23.0, 20.0, 10.0, 11.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-56.90625, -55.46630859375, -54.0263671875, -52.58642578125, -51.146484375, -49.70654296875, -48.2666015625, -46.82666015625, -45.38671875, -43.94677734375, -42.5068359375, -41.06689453125, -39.626953125, -38.18701171875, -36.7470703125, -35.30712890625, -33.8671875, -32.42724609375, -30.9873046875, -29.54736328125, -28.107421875, -26.66748046875, -25.2275390625, -23.78759765625, -22.34765625, -20.90771484375, -19.4677734375, -18.02783203125, -16.587890625, -15.14794921875, -13.7080078125, -12.26806640625, -10.828125, -9.38818359375, -7.9482421875, -6.50830078125, -5.068359375, -3.62841796875, -2.1884765625, -0.74853515625, 0.69140625, 2.13134765625, 3.5712890625, 5.01123046875, 6.451171875, 7.89111328125, 9.3310546875, 10.77099609375, 12.2109375, 13.65087890625, 15.0908203125, 16.53076171875, 17.970703125, 19.41064453125, 20.8505859375, 22.29052734375, 23.73046875, 25.17041015625, 26.6103515625, 28.05029296875, 29.490234375, 30.93017578125, 32.3701171875, 33.81005859375, 35.25]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 7.0, 8.0, 13.0, 21.0, 16.0, 46.0, 46.0, 79.0, 125.0, 195.0, 277.0, 489.0, 693.0, 618.0, 500.0, 305.0, 240.0, 133.0, 84.0, 54.0, 46.0, 29.0, 18.0, 12.0, 7.0, 8.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.640625, -29.79052734375, -28.9404296875, -28.09033203125, -27.240234375, -26.39013671875, -25.5400390625, -24.68994140625, -23.83984375, -22.98974609375, -22.1396484375, -21.28955078125, -20.439453125, -19.58935546875, -18.7392578125, -17.88916015625, -17.0390625, -16.18896484375, -15.3388671875, -14.48876953125, -13.638671875, -12.78857421875, -11.9384765625, -11.08837890625, -10.23828125, -9.38818359375, -8.5380859375, -7.68798828125, -6.837890625, -5.98779296875, -5.1376953125, -4.28759765625, -3.4375, -2.58740234375, -1.7373046875, -0.88720703125, -0.037109375, 0.81298828125, 1.6630859375, 2.51318359375, 3.36328125, 4.21337890625, 5.0634765625, 5.91357421875, 6.763671875, 7.61376953125, 8.4638671875, 9.31396484375, 10.1640625, 11.01416015625, 11.8642578125, 12.71435546875, 13.564453125, 14.41455078125, 15.2646484375, 16.11474609375, 16.96484375, 17.81494140625, 18.6650390625, 19.51513671875, 20.365234375, 21.21533203125, 22.0654296875, 22.91552734375, 23.765625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 5.0, 8.0, 6.0, 3.0, 11.0, 12.0, 30.0, 27.0, 40.0, 34.0, 63.0, 83.0, 108.0, 139.0, 183.0, 254.0, 434.0, 924.0, 8472.0, 4005607.0, 174326.0, 1840.0, 534.0, 286.0, 221.0, 149.0, 104.0, 93.0, 68.0, 51.0, 47.0, 28.0, 25.0, 17.0, 15.0, 9.0, 4.0, 3.0, 6.0, 3.0, 4.0, 5.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.0, -86.0078125, -83.015625, -80.0234375, -77.03125, -74.0390625, -71.046875, -68.0546875, -65.0625, -62.0703125, -59.078125, -56.0859375, -53.09375, -50.1015625, -47.109375, -44.1171875, -41.125, -38.1328125, -35.140625, -32.1484375, -29.15625, -26.1640625, -23.171875, -20.1796875, -17.1875, -14.1953125, -11.203125, -8.2109375, -5.21875, -2.2265625, 0.765625, 3.7578125, 6.75, 9.7421875, 12.734375, 15.7265625, 18.71875, 21.7109375, 24.703125, 27.6953125, 30.6875, 33.6796875, 36.671875, 39.6640625, 42.65625, 45.6484375, 48.640625, 51.6328125, 54.625, 57.6171875, 60.609375, 63.6015625, 66.59375, 69.5859375, 72.578125, 75.5703125, 78.5625, 81.5546875, 84.546875, 87.5390625, 90.53125, 93.5234375, 96.515625, 99.5078125, 102.5]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 50.0, 260.0, 448.0, 207.0, 37.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.01313018798828, -102.00872039794922, -93.00431823730469, -83.99990844726562, -74.99549865722656, -65.9910888671875, -56.9866828918457, -47.982276916503906, -38.977867126464844, -29.973459243774414, -20.969051361083984, -11.964643478393555, -2.960235595703125, 6.0441741943359375, 15.048580169677734, 24.05298614501953, 33.057395935058594, 42.061805725097656, 51.06621170043945, 60.07061767578125, 69.07502746582031, 78.07943725585938, 87.08384704589844, 96.08824920654297, 105.09265899658203, 114.0970687866211, 123.10147094726562, 132.1058807373047, 141.11029052734375, 150.1147003173828, 159.11911010742188, 168.12350463867188, 177.1279296875, 186.13233947753906, 195.13674926757812, 204.1411590576172, 213.14556884765625, 222.14996337890625, 231.1543731689453, 240.15878295898438, 249.16319274902344, 258.1676025390625, 267.1719970703125, 276.1764221191406, 285.1808166503906, 294.18524169921875, 303.18963623046875, 312.19403076171875, 321.1984558105469, 330.2028503417969, 339.207275390625, 348.211669921875, 357.2160949707031, 366.2204895019531, 375.22491455078125, 384.22930908203125, 393.23370361328125, 402.23809814453125, 411.2425231933594, 420.2469177246094, 429.2513427734375, 438.2557373046875, 447.2601623535156, 456.2645568847656, 465.26898193359375]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 5.0, 5.0, 7.0, 3.0, 6.0, 12.0, 17.0, 14.0, 21.0, 20.0, 11.0, 18.0, 21.0, 24.0, 23.0, 33.0, 35.0, 39.0, 36.0, 39.0, 41.0, 46.0, 34.0, 37.0, 49.0, 37.0, 34.0, 28.0, 30.0, 35.0, 24.0, 26.0, 24.0, 29.0, 19.0, 16.0, 20.0, 9.0, 13.0, 10.0, 10.0, 5.0, 8.0, 5.0, 6.0, 5.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-54.7250862121582, -52.86930847167969, -51.013526916503906, -49.15774917602539, -47.30196762084961, -45.446189880371094, -43.59040832519531, -41.7346305847168, -39.87885284423828, -38.023075103759766, -36.167293548583984, -34.31151580810547, -32.45573425292969, -30.599956512451172, -28.744176864624023, -26.888397216796875, -25.032615661621094, -23.176836013793945, -21.321056365966797, -19.46527862548828, -17.6094970703125, -15.753718376159668, -13.897939682006836, -12.042160034179688, -10.186380386352539, -8.33060073852539, -6.4748215675354, -4.61904239654541, -2.7632627487182617, -0.9074831008911133, 0.9482955932617188, 2.804075241088867, 4.659858703613281, 6.51563835144043, 8.371417999267578, 10.22719669342041, 12.082976341247559, 13.938755989074707, 15.794534683227539, 17.650314331054688, 19.506093978881836, 21.361873626708984, 23.217653274536133, 25.07343292236328, 26.929210662841797, 28.784992218017578, 30.640769958496094, 32.496551513671875, 34.35232925415039, 36.208106994628906, 38.06388854980469, 39.9196662902832, 41.775447845458984, 43.6312255859375, 45.48700714111328, 47.3427848815918, 49.19856262207031, 51.05434036254883, 52.91012191772461, 54.765899658203125, 56.621681213378906, 58.47745895385742, 60.33323669433594, 62.18901824951172, 64.0447998046875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 6.0, 10.0, 4.0, 2.0, 12.0, 13.0, 11.0, 24.0, 19.0, 18.0, 26.0, 31.0, 28.0, 33.0, 37.0, 43.0, 28.0, 40.0, 44.0, 49.0, 53.0, 46.0, 41.0, 36.0, 51.0, 43.0, 50.0, 25.0, 31.0, 29.0, 20.0, 18.0, 11.0, 18.0, 13.0, 22.0, 4.0, 7.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.9609375, -12.6121826171875, -12.263427734375, -11.9146728515625, -11.56591796875, -11.2171630859375, -10.868408203125, -10.5196533203125, -10.1708984375, -9.8221435546875, -9.473388671875, -9.1246337890625, -8.77587890625, -8.4271240234375, -8.078369140625, -7.7296142578125, -7.380859375, -7.0321044921875, -6.683349609375, -6.3345947265625, -5.98583984375, -5.6370849609375, -5.288330078125, -4.9395751953125, -4.5908203125, -4.2420654296875, -3.893310546875, -3.5445556640625, -3.19580078125, -2.8470458984375, -2.498291015625, -2.1495361328125, -1.80078125, -1.4520263671875, -1.103271484375, -0.7545166015625, -0.40576171875, -0.0570068359375, 0.291748046875, 0.6405029296875, 0.9892578125, 1.3380126953125, 1.686767578125, 2.0355224609375, 2.38427734375, 2.7330322265625, 3.081787109375, 3.4305419921875, 3.779296875, 4.1280517578125, 4.476806640625, 4.8255615234375, 5.17431640625, 5.5230712890625, 5.871826171875, 6.2205810546875, 6.5693359375, 6.9180908203125, 7.266845703125, 7.6156005859375, 7.96435546875, 8.3131103515625, 8.661865234375, 9.0106201171875, 9.359375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 10.0, 9.0, 4.0, 7.0, 13.0, 27.0, 31.0, 43.0, 73.0, 107.0, 147.0, 178.0, 345.0, 483.0, 675.0, 1092.0, 1611.0, 2358.0, 3671.0, 5802.0, 8800.0, 13169.0, 21087.0, 33641.0, 56969.0, 103078.0, 252530.0, 279585.0, 107174.0, 59191.0, 34740.0, 21690.0, 13874.0, 9023.0, 6009.0, 3741.0, 2421.0, 1780.0, 1128.0, 735.0, 489.0, 328.0, 212.0, 154.0, 77.0, 75.0, 57.0, 41.0, 19.0, 10.0, 8.0, 7.0, 5.0, 6.0, 2.0, 6.0, 5.0, 2.0], "bins": [-2.119140625, -2.05499267578125, -1.9908447265625, -1.92669677734375, -1.862548828125, -1.79840087890625, -1.7342529296875, -1.67010498046875, -1.60595703125, -1.54180908203125, -1.4776611328125, -1.41351318359375, -1.349365234375, -1.28521728515625, -1.2210693359375, -1.15692138671875, -1.0927734375, -1.02862548828125, -0.9644775390625, -0.90032958984375, -0.836181640625, -0.77203369140625, -0.7078857421875, -0.64373779296875, -0.57958984375, -0.51544189453125, -0.4512939453125, -0.38714599609375, -0.322998046875, -0.25885009765625, -0.1947021484375, -0.13055419921875, -0.06640625, -0.00225830078125, 0.0618896484375, 0.12603759765625, 0.190185546875, 0.25433349609375, 0.3184814453125, 0.38262939453125, 0.44677734375, 0.51092529296875, 0.5750732421875, 0.63922119140625, 0.703369140625, 0.76751708984375, 0.8316650390625, 0.89581298828125, 0.9599609375, 1.02410888671875, 1.0882568359375, 1.15240478515625, 1.216552734375, 1.28070068359375, 1.3448486328125, 1.40899658203125, 1.47314453125, 1.53729248046875, 1.6014404296875, 1.66558837890625, 1.729736328125, 1.79388427734375, 1.8580322265625, 1.92218017578125, 1.986328125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 4.0, 6.0, 18.0, 11.0, 15.0, 14.0, 11.0, 10.0, 15.0, 11.0, 23.0, 31.0, 28.0, 44.0, 32.0, 34.0, 39.0, 38.0, 50.0, 1057.0, 46.0, 49.0, 41.0, 42.0, 30.0, 37.0, 35.0, 29.0, 33.0, 26.0, 29.0, 12.0, 27.0, 13.0, 13.0, 10.0, 12.0, 13.0, 10.0, 7.0, 3.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-7.05078125, -6.84893798828125, -6.6470947265625, -6.44525146484375, -6.243408203125, -6.04156494140625, -5.8397216796875, -5.63787841796875, -5.43603515625, -5.23419189453125, -5.0323486328125, -4.83050537109375, -4.628662109375, -4.42681884765625, -4.2249755859375, -4.02313232421875, -3.8212890625, -3.61944580078125, -3.4176025390625, -3.21575927734375, -3.013916015625, -2.81207275390625, -2.6102294921875, -2.40838623046875, -2.20654296875, -2.00469970703125, -1.8028564453125, -1.60101318359375, -1.399169921875, -1.19732666015625, -0.9954833984375, -0.79364013671875, -0.591796875, -0.38995361328125, -0.1881103515625, 0.01373291015625, 0.215576171875, 0.41741943359375, 0.6192626953125, 0.82110595703125, 1.02294921875, 1.22479248046875, 1.4266357421875, 1.62847900390625, 1.830322265625, 2.03216552734375, 2.2340087890625, 2.43585205078125, 2.6376953125, 2.83953857421875, 3.0413818359375, 3.24322509765625, 3.445068359375, 3.64691162109375, 3.8487548828125, 4.05059814453125, 4.25244140625, 4.45428466796875, 4.6561279296875, 4.85797119140625, 5.059814453125, 5.26165771484375, 5.4635009765625, 5.66534423828125, 5.8671875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 12.0, 8.0, 20.0, 30.0, 39.0, 54.0, 61.0, 130.0, 190.0, 292.0, 413.0, 644.0, 934.0, 1569.0, 2378.0, 3601.0, 5580.0, 8368.0, 12866.0, 20134.0, 31826.0, 52976.0, 96236.0, 233045.0, 1354923.0, 112793.0, 60211.0, 35709.0, 21939.0, 13833.0, 9075.0, 6115.0, 3962.0, 2491.0, 1635.0, 1030.0, 681.0, 423.0, 315.0, 191.0, 142.0, 83.0, 50.0, 39.0, 31.0, 23.0, 9.0, 11.0, 8.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8974609375, -1.8344573974609375, -1.771453857421875, -1.7084503173828125, -1.64544677734375, -1.5824432373046875, -1.519439697265625, -1.4564361572265625, -1.3934326171875, -1.3304290771484375, -1.267425537109375, -1.2044219970703125, -1.14141845703125, -1.0784149169921875, -1.015411376953125, -0.9524078369140625, -0.889404296875, -0.8264007568359375, -0.763397216796875, -0.7003936767578125, -0.63739013671875, -0.5743865966796875, -0.511383056640625, -0.4483795166015625, -0.3853759765625, -0.3223724365234375, -0.259368896484375, -0.1963653564453125, -0.13336181640625, -0.0703582763671875, -0.007354736328125, 0.0556488037109375, 0.11865234375, 0.1816558837890625, 0.244659423828125, 0.3076629638671875, 0.37066650390625, 0.4336700439453125, 0.496673583984375, 0.5596771240234375, 0.6226806640625, 0.6856842041015625, 0.748687744140625, 0.8116912841796875, 0.87469482421875, 0.9376983642578125, 1.000701904296875, 1.0637054443359375, 1.126708984375, 1.1897125244140625, 1.252716064453125, 1.3157196044921875, 1.37872314453125, 1.4417266845703125, 1.504730224609375, 1.5677337646484375, 1.6307373046875, 1.6937408447265625, 1.756744384765625, 1.8197479248046875, 1.88275146484375, 1.9457550048828125, 2.008758544921875, 2.0717620849609375, 2.134765625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 10.0, 8.0, 13.0, 14.0, 15.0, 24.0, 36.0, 42.0, 45.0, 54.0, 85.0, 92.0, 82.0, 96.0, 82.0, 66.0, 48.0, 43.0, 35.0, 24.0, 18.0, 17.0, 9.0, 2.0, 7.0, 5.0, 5.0, 3.0, 4.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013246536254882812, -0.0012767314910888672, -0.0012288093566894531, -0.001180887222290039, -0.001132965087890625, -0.001085042953491211, -0.0010371208190917969, -0.0009891986846923828, -0.0009412765502929688, -0.0008933544158935547, -0.0008454322814941406, -0.0007975101470947266, -0.0007495880126953125, -0.0007016658782958984, -0.0006537437438964844, -0.0006058216094970703, -0.0005578994750976562, -0.0005099773406982422, -0.0004620552062988281, -0.00041413307189941406, -0.0003662109375, -0.00031828880310058594, -0.0002703666687011719, -0.0002224445343017578, -0.00017452239990234375, -0.0001266002655029297, -7.867813110351562e-05, -3.075599670410156e-05, 1.71661376953125e-05, 6.508827209472656e-05, 0.00011301040649414062, 0.0001609325408935547, 0.00020885467529296875, 0.0002567768096923828, 0.0003046989440917969, 0.00035262107849121094, 0.000400543212890625, 0.00044846534729003906, 0.0004963874816894531, 0.0005443096160888672, 0.0005922317504882812, 0.0006401538848876953, 0.0006880760192871094, 0.0007359981536865234, 0.0007839202880859375, 0.0008318424224853516, 0.0008797645568847656, 0.0009276866912841797, 0.0009756088256835938, 0.0010235309600830078, 0.0010714530944824219, 0.001119375228881836, 0.00116729736328125, 0.001215219497680664, 0.0012631416320800781, 0.0013110637664794922, 0.0013589859008789062, 0.0014069080352783203, 0.0014548301696777344, 0.0015027523040771484, 0.0015506744384765625, 0.0015985965728759766, 0.0016465187072753906, 0.0016944408416748047, 0.0017423629760742188]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 6.0, 4.0, 3.0, 5.0, 8.0, 8.0, 14.0, 13.0, 16.0, 41.0, 54.0, 66.0, 100.0, 192.0, 483.0, 5972.0, 1038589.0, 2102.0, 389.0, 173.0, 85.0, 53.0, 45.0, 25.0, 26.0, 21.0, 18.0, 12.0, 9.0, 5.0, 7.0, 2.0, 5.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.04296875, -0.04187798500061035, -0.0407872200012207, -0.039696455001831055, -0.038605690002441406, -0.03751492500305176, -0.03642416000366211, -0.03533339500427246, -0.03424263000488281, -0.033151865005493164, -0.032061100006103516, -0.030970335006713867, -0.02987957000732422, -0.02878880500793457, -0.027698040008544922, -0.026607275009155273, -0.025516510009765625, -0.024425745010375977, -0.023334980010986328, -0.02224421501159668, -0.02115345001220703, -0.020062685012817383, -0.018971920013427734, -0.017881155014038086, -0.016790390014648438, -0.01569962501525879, -0.01460886001586914, -0.013518095016479492, -0.012427330017089844, -0.011336565017700195, -0.010245800018310547, -0.009155035018920898, -0.00806427001953125, -0.0069735050201416016, -0.005882740020751953, -0.004791975021362305, -0.0037012100219726562, -0.002610445022583008, -0.0015196800231933594, -0.00042891502380371094, 0.0006618499755859375, 0.001752614974975586, 0.0028433799743652344, 0.003934144973754883, 0.005024909973144531, 0.00611567497253418, 0.007206439971923828, 0.008297204971313477, 0.009387969970703125, 0.010478734970092773, 0.011569499969482422, 0.01266026496887207, 0.013751029968261719, 0.014841794967651367, 0.015932559967041016, 0.017023324966430664, 0.018114089965820312, 0.01920485496520996, 0.02029561996459961, 0.021386384963989258, 0.022477149963378906, 0.023567914962768555, 0.024658679962158203, 0.02574944496154785, 0.0268402099609375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 16.0, 48.0, 99.0, 229.0, 276.0, 196.0, 91.0, 39.0, 10.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002055614721029997, -0.002011307515203953, -0.001967000076547265, -0.001922692870721221, -0.0018783856648951769, -0.001834078342653811, -0.001789771020412445, -0.001745463814586401, -0.001701156608760357, -0.001656849286518991, -0.001612542080692947, -0.001568234758451581, -0.001523927552625537, -0.001479620230384171, -0.001435312908142805, -0.001391005702316761, -0.001346698380075395, -0.0013023910578340292, -0.0012580838520079851, -0.0012137765297666192, -0.0011694693239405751, -0.0011251620016992092, -0.0010808547958731651, -0.0010365474736317992, -0.0009922401513904333, -0.0009479328873567283, -0.0009036256233230233, -0.0008593183010816574, -0.0008150110952556133, -0.0007707037730142474, -0.0007263965089805424, -0.0006820892449468374, -0.0006377821555361152, -0.0005934748915024102, -0.0005491676274687052, -0.0005048603052273393, -0.00046055307029746473, -0.00041624580626375973, -0.0003719385131262243, -0.0003276312490925193, -0.0002833239850588143, -0.0002390167210251093, -0.00019470944243948907, -0.00015040216385386884, -0.00010609489982016385, -6.178763578645885e-05, -1.7480342648923397e-05, 2.68269213847816e-05, 7.11341854184866e-05, 0.0001154414567281492, 0.00015974872803781182, 0.00020405600662343204, 0.00024836327065713704, 0.00029267053469084203, 0.0003369778278283775, 0.0003812850918620825, 0.0004255923558957875, 0.0004698996199294925, 0.0005142068839631975, 0.0005585141479969025, 0.0006028214702382684, 0.0006471286760643125, 0.0006914359983056784, 0.0007357432623393834, 0.0007800505263730884]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 5.0, 7.0, 8.0, 11.0, 12.0, 16.0, 13.0, 11.0, 17.0, 16.0, 31.0, 20.0, 33.0, 35.0, 27.0, 42.0, 39.0, 48.0, 40.0, 45.0, 44.0, 42.0, 32.0, 40.0, 37.0, 45.0, 36.0, 32.0, 38.0, 20.0, 25.0, 25.0, 17.0, 24.0, 11.0, 5.0, 9.0, 10.0, 8.0, 5.0, 3.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0006409883499145508, -0.0006217369809746742, -0.0006024856120347977, -0.0005832342430949211, -0.0005639828741550446, -0.000544731505215168, -0.0005254801362752914, -0.0005062287673354149, -0.00048697739839553833, -0.0004677260294556618, -0.0004484746605157852, -0.00042922329157590866, -0.0004099719226360321, -0.00039072055369615555, -0.000371469184756279, -0.00035221781581640244, -0.0003329664468765259, -0.0003137150779366493, -0.00029446370899677277, -0.0002752123400568962, -0.00025596097111701965, -0.0002367096021771431, -0.00021745823323726654, -0.00019820686429738998, -0.00017895549535751343, -0.00015970412641763687, -0.00014045275747776031, -0.00012120138853788376, -0.0001019500195980072, -8.269865065813065e-05, -6.344728171825409e-05, -4.419591277837753e-05, -2.4944543838500977e-05, -5.69317489862442e-06, 1.3558194041252136e-05, 3.280956298112869e-05, 5.206093192100525e-05, 7.13123008608818e-05, 9.056366980075836e-05, 0.00010981503874063492, 0.00012906640768051147, 0.00014831777662038803, 0.0001675691455602646, 0.00018682051450014114, 0.0002060718834400177, 0.00022532325237989426, 0.0002445746213197708, 0.00026382599025964737, 0.0002830773591995239, 0.0003023287281394005, 0.00032158009707927704, 0.0003408314660191536, 0.00036008283495903015, 0.0003793342038989067, 0.00039858557283878326, 0.0004178369417786598, 0.0004370883107185364, 0.00045633967965841293, 0.0004755910485982895, 0.000494842417538166, 0.0005140937864780426, 0.0005333451554179192, 0.0005525965243577957, 0.0005718478932976723, 0.0005910992622375488]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 6.0, 10.0, 4.0, 2.0, 12.0, 13.0, 11.0, 24.0, 19.0, 18.0, 26.0, 31.0, 28.0, 33.0, 37.0, 43.0, 28.0, 40.0, 44.0, 49.0, 53.0, 46.0, 41.0, 36.0, 51.0, 43.0, 50.0, 25.0, 31.0, 29.0, 20.0, 18.0, 11.0, 18.0, 13.0, 22.0, 4.0, 7.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.9609375, -12.6121826171875, -12.263427734375, -11.9146728515625, -11.56591796875, -11.2171630859375, -10.868408203125, -10.5196533203125, -10.1708984375, -9.8221435546875, -9.473388671875, -9.1246337890625, -8.77587890625, -8.4271240234375, -8.078369140625, -7.7296142578125, -7.380859375, -7.0321044921875, -6.683349609375, -6.3345947265625, -5.98583984375, -5.6370849609375, -5.288330078125, -4.9395751953125, -4.5908203125, -4.2420654296875, -3.893310546875, -3.5445556640625, -3.19580078125, -2.8470458984375, -2.498291015625, -2.1495361328125, -1.80078125, -1.4520263671875, -1.103271484375, -0.7545166015625, -0.40576171875, -0.0570068359375, 0.291748046875, 0.6405029296875, 0.9892578125, 1.3380126953125, 1.686767578125, 2.0355224609375, 2.38427734375, 2.7330322265625, 3.081787109375, 3.4305419921875, 3.779296875, 4.1280517578125, 4.476806640625, 4.8255615234375, 5.17431640625, 5.5230712890625, 5.871826171875, 6.2205810546875, 6.5693359375, 6.9180908203125, 7.266845703125, 7.6156005859375, 7.96435546875, 8.3131103515625, 8.661865234375, 9.0106201171875, 9.359375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 21.0, 25.0, 41.0, 56.0, 100.0, 195.0, 297.0, 601.0, 1154.0, 2883.0, 8099.0, 30254.0, 198516.0, 670824.0, 105949.0, 19531.0, 5838.0, 2079.0, 992.0, 455.0, 243.0, 169.0, 93.0, 53.0, 20.0, 19.0, 13.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-15.234375, -14.865966796875, -14.49755859375, -14.129150390625, -13.7607421875, -13.392333984375, -13.02392578125, -12.655517578125, -12.287109375, -11.918701171875, -11.55029296875, -11.181884765625, -10.8134765625, -10.445068359375, -10.07666015625, -9.708251953125, -9.33984375, -8.971435546875, -8.60302734375, -8.234619140625, -7.8662109375, -7.497802734375, -7.12939453125, -6.760986328125, -6.392578125, -6.024169921875, -5.65576171875, -5.287353515625, -4.9189453125, -4.550537109375, -4.18212890625, -3.813720703125, -3.4453125, -3.076904296875, -2.70849609375, -2.340087890625, -1.9716796875, -1.603271484375, -1.23486328125, -0.866455078125, -0.498046875, -0.129638671875, 0.23876953125, 0.607177734375, 0.9755859375, 1.343994140625, 1.71240234375, 2.080810546875, 2.44921875, 2.817626953125, 3.18603515625, 3.554443359375, 3.9228515625, 4.291259765625, 4.65966796875, 5.028076171875, 5.396484375, 5.764892578125, 6.13330078125, 6.501708984375, 6.8701171875, 7.238525390625, 7.60693359375, 7.975341796875, 8.34375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 6.0, 3.0, 8.0, 14.0, 16.0, 24.0, 27.0, 22.0, 25.0, 49.0, 49.0, 59.0, 53.0, 82.0, 166.0, 1850.0, 153.0, 72.0, 72.0, 53.0, 38.0, 43.0, 33.0, 25.0, 26.0, 19.0, 14.0, 10.0, 6.0, 8.0, 4.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.3125, -49.00537109375, -47.6982421875, -46.39111328125, -45.083984375, -43.77685546875, -42.4697265625, -41.16259765625, -39.85546875, -38.54833984375, -37.2412109375, -35.93408203125, -34.626953125, -33.31982421875, -32.0126953125, -30.70556640625, -29.3984375, -28.09130859375, -26.7841796875, -25.47705078125, -24.169921875, -22.86279296875, -21.5556640625, -20.24853515625, -18.94140625, -17.63427734375, -16.3271484375, -15.02001953125, -13.712890625, -12.40576171875, -11.0986328125, -9.79150390625, -8.484375, -7.17724609375, -5.8701171875, -4.56298828125, -3.255859375, -1.94873046875, -0.6416015625, 0.66552734375, 1.97265625, 3.27978515625, 4.5869140625, 5.89404296875, 7.201171875, 8.50830078125, 9.8154296875, 11.12255859375, 12.4296875, 13.73681640625, 15.0439453125, 16.35107421875, 17.658203125, 18.96533203125, 20.2724609375, 21.57958984375, 22.88671875, 24.19384765625, 25.5009765625, 26.80810546875, 28.115234375, 29.42236328125, 30.7294921875, 32.03662109375, 33.34375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 4.0, 9.0, 7.0, 19.0, 19.0, 29.0, 39.0, 51.0, 75.0, 92.0, 127.0, 176.0, 259.0, 425.0, 1247.0, 110387.0, 3028519.0, 2592.0, 533.0, 298.0, 213.0, 156.0, 108.0, 83.0, 58.0, 48.0, 34.0, 30.0, 8.0, 13.0, 12.0, 8.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-83.0625, -80.2138671875, -77.365234375, -74.5166015625, -71.66796875, -68.8193359375, -65.970703125, -63.1220703125, -60.2734375, -57.4248046875, -54.576171875, -51.7275390625, -48.87890625, -46.0302734375, -43.181640625, -40.3330078125, -37.484375, -34.6357421875, -31.787109375, -28.9384765625, -26.08984375, -23.2412109375, -20.392578125, -17.5439453125, -14.6953125, -11.8466796875, -8.998046875, -6.1494140625, -3.30078125, -0.4521484375, 2.396484375, 5.2451171875, 8.09375, 10.9423828125, 13.791015625, 16.6396484375, 19.48828125, 22.3369140625, 25.185546875, 28.0341796875, 30.8828125, 33.7314453125, 36.580078125, 39.4287109375, 42.27734375, 45.1259765625, 47.974609375, 50.8232421875, 53.671875, 56.5205078125, 59.369140625, 62.2177734375, 65.06640625, 67.9150390625, 70.763671875, 73.6123046875, 76.4609375, 79.3095703125, 82.158203125, 85.0068359375, 87.85546875, 90.7041015625, 93.552734375, 96.4013671875, 99.25]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 26.0, 427.0, 512.0, 46.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-274.1693420410156, -269.0989990234375, -264.0286865234375, -258.9583435058594, -253.88800048828125, -248.8176727294922, -243.74732971191406, -238.677001953125, -233.60665893554688, -228.5363311767578, -223.4659881591797, -218.39566040039062, -213.3253173828125, -208.25498962402344, -203.1846466064453, -198.11431884765625, -193.04397583007812, -187.97364807128906, -182.90330505371094, -177.83297729492188, -172.76263427734375, -167.6923065185547, -162.62196350097656, -157.5516357421875, -152.48130798339844, -147.41098022460938, -142.34063720703125, -137.2703094482422, -132.19996643066406, -127.12963104248047, -122.05929565429688, -116.98896789550781, -111.91860961914062, -106.84827423095703, -101.77793884277344, -96.70760345458984, -91.63726806640625, -86.56693267822266, -81.49659729003906, -76.42626953125, -71.3559341430664, -66.28559875488281, -61.21526336669922, -56.144927978515625, -51.07459259033203, -46.00425720214844, -40.93392562866211, -35.863590240478516, -30.793254852294922, -25.722919464111328, -20.652584075927734, -15.582250595092773, -10.51191520690918, -5.441579818725586, -0.371246337890625, 4.699089050292969, 9.769424438476562, 14.839759826660156, 19.91009521484375, 24.98042869567871, 30.050764083862305, 35.12110137939453, 40.19143295288086, 45.26176834106445, 50.33210372924805]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 4.0, 7.0, 6.0, 8.0, 9.0, 12.0, 13.0, 15.0, 18.0, 14.0, 16.0, 23.0, 24.0, 26.0, 27.0, 21.0, 17.0, 36.0, 31.0, 35.0, 35.0, 41.0, 43.0, 40.0, 33.0, 38.0, 36.0, 36.0, 36.0, 27.0, 31.0, 30.0, 29.0, 20.0, 19.0, 19.0, 19.0, 16.0, 8.0, 9.0, 15.0, 6.0, 6.0, 12.0, 7.0, 5.0, 10.0, 3.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-76.9843521118164, -74.50233459472656, -72.02031707763672, -69.53829956054688, -67.05628204345703, -64.57426452636719, -62.09224319458008, -59.61022186279297, -57.128204345703125, -54.64618682861328, -52.16416931152344, -49.682151794433594, -47.200130462646484, -44.71811294555664, -42.2360954284668, -39.75407409667969, -37.27206039428711, -34.790042877197266, -32.30802536010742, -29.826005935668945, -27.34398651123047, -24.861968994140625, -22.37995147705078, -19.897932052612305, -17.41591453552246, -14.9338960647583, -12.45187759399414, -9.969860076904297, -7.487841606140137, -5.005823135375977, -2.523805618286133, -0.04178619384765625, 2.4402313232421875, 4.922249794006348, 7.40426778793335, 9.886285781860352, 12.368304252624512, 14.850322723388672, 17.332340240478516, 19.814359664916992, 22.296377182006836, 24.77839469909668, 27.260414123535156, 29.742431640625, 32.224449157714844, 34.70646667480469, 37.18848419189453, 39.67050552368164, 42.152523040771484, 44.63454055786133, 47.11655807495117, 49.59857940673828, 52.080596923828125, 54.56261444091797, 57.04463195800781, 59.526649475097656, 62.0086669921875, 64.49068450927734, 66.97270202636719, 69.45471954345703, 71.93673706054688, 74.41876220703125, 76.90077209472656, 79.38279724121094, 81.86481475830078]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 9.0, 3.0, 4.0, 12.0, 12.0, 11.0, 19.0, 22.0, 20.0, 21.0, 25.0, 31.0, 29.0, 40.0, 42.0, 32.0, 28.0, 36.0, 55.0, 45.0, 62.0, 30.0, 43.0, 47.0, 35.0, 43.0, 30.0, 37.0, 31.0, 26.0, 15.0, 22.0, 9.0, 24.0, 14.0, 13.0, 11.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-13.359375, -13.0052490234375, -12.651123046875, -12.2969970703125, -11.94287109375, -11.5887451171875, -11.234619140625, -10.8804931640625, -10.5263671875, -10.1722412109375, -9.818115234375, -9.4639892578125, -9.10986328125, -8.7557373046875, -8.401611328125, -8.0474853515625, -7.693359375, -7.3392333984375, -6.985107421875, -6.6309814453125, -6.27685546875, -5.9227294921875, -5.568603515625, -5.2144775390625, -4.8603515625, -4.5062255859375, -4.152099609375, -3.7979736328125, -3.44384765625, -3.0897216796875, -2.735595703125, -2.3814697265625, -2.02734375, -1.6732177734375, -1.319091796875, -0.9649658203125, -0.61083984375, -0.2567138671875, 0.097412109375, 0.4515380859375, 0.8056640625, 1.1597900390625, 1.513916015625, 1.8680419921875, 2.22216796875, 2.5762939453125, 2.930419921875, 3.2845458984375, 3.638671875, 3.9927978515625, 4.346923828125, 4.7010498046875, 5.05517578125, 5.4093017578125, 5.763427734375, 6.1175537109375, 6.4716796875, 6.8258056640625, 7.179931640625, 7.5340576171875, 7.88818359375, 8.2423095703125, 8.596435546875, 8.9505615234375, 9.3046875]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 2.0, 3.0, 6.0, 5.0, 4.0, 15.0, 19.0, 21.0, 14.0, 20.0, 30.0, 42.0, 66.0, 75.0, 108.0, 240.0, 543.0, 1830.0, 9618.0, 219868.0, 3100074.0, 833360.0, 23765.0, 2982.0, 797.0, 271.0, 140.0, 86.0, 56.0, 48.0, 29.0, 24.0, 26.0, 26.0, 13.0, 22.0, 10.0, 10.0, 4.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-33.78125, -32.860107421875, -31.93896484375, -31.017822265625, -30.0966796875, -29.175537109375, -28.25439453125, -27.333251953125, -26.412109375, -25.490966796875, -24.56982421875, -23.648681640625, -22.7275390625, -21.806396484375, -20.88525390625, -19.964111328125, -19.04296875, -18.121826171875, -17.20068359375, -16.279541015625, -15.3583984375, -14.437255859375, -13.51611328125, -12.594970703125, -11.673828125, -10.752685546875, -9.83154296875, -8.910400390625, -7.9892578125, -7.068115234375, -6.14697265625, -5.225830078125, -4.3046875, -3.383544921875, -2.46240234375, -1.541259765625, -0.6201171875, 0.301025390625, 1.22216796875, 2.143310546875, 3.064453125, 3.985595703125, 4.90673828125, 5.827880859375, 6.7490234375, 7.670166015625, 8.59130859375, 9.512451171875, 10.43359375, 11.354736328125, 12.27587890625, 13.197021484375, 14.1181640625, 15.039306640625, 15.96044921875, 16.881591796875, 17.802734375, 18.723876953125, 19.64501953125, 20.566162109375, 21.4873046875, 22.408447265625, 23.32958984375, 24.250732421875, 25.171875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 10.0, 12.0, 12.0, 34.0, 42.0, 55.0, 86.0, 127.0, 202.0, 387.0, 563.0, 781.0, 635.0, 432.0, 260.0, 148.0, 97.0, 81.0, 36.0, 29.0, 22.0, 12.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.921875, -28.035888671875, -27.14990234375, -26.263916015625, -25.3779296875, -24.491943359375, -23.60595703125, -22.719970703125, -21.833984375, -20.947998046875, -20.06201171875, -19.176025390625, -18.2900390625, -17.404052734375, -16.51806640625, -15.632080078125, -14.74609375, -13.860107421875, -12.97412109375, -12.088134765625, -11.2021484375, -10.316162109375, -9.43017578125, -8.544189453125, -7.658203125, -6.772216796875, -5.88623046875, -5.000244140625, -4.1142578125, -3.228271484375, -2.34228515625, -1.456298828125, -0.5703125, 0.315673828125, 1.20166015625, 2.087646484375, 2.9736328125, 3.859619140625, 4.74560546875, 5.631591796875, 6.517578125, 7.403564453125, 8.28955078125, 9.175537109375, 10.0615234375, 10.947509765625, 11.83349609375, 12.719482421875, 13.60546875, 14.491455078125, 15.37744140625, 16.263427734375, 17.1494140625, 18.035400390625, 18.92138671875, 19.807373046875, 20.693359375, 21.579345703125, 22.46533203125, 23.351318359375, 24.2373046875, 25.123291015625, 26.00927734375, 26.895263671875, 27.78125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 8.0, 11.0, 22.0, 29.0, 22.0, 42.0, 48.0, 64.0, 86.0, 133.0, 183.0, 227.0, 409.0, 901.0, 24042.0, 4152006.0, 13948.0, 850.0, 374.0, 227.0, 142.0, 136.0, 82.0, 68.0, 47.0, 41.0, 35.0, 26.0, 19.0, 15.0, 7.0, 7.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-103.875, -100.46484375, -97.0546875, -93.64453125, -90.234375, -86.82421875, -83.4140625, -80.00390625, -76.59375, -73.18359375, -69.7734375, -66.36328125, -62.953125, -59.54296875, -56.1328125, -52.72265625, -49.3125, -45.90234375, -42.4921875, -39.08203125, -35.671875, -32.26171875, -28.8515625, -25.44140625, -22.03125, -18.62109375, -15.2109375, -11.80078125, -8.390625, -4.98046875, -1.5703125, 1.83984375, 5.25, 8.66015625, 12.0703125, 15.48046875, 18.890625, 22.30078125, 25.7109375, 29.12109375, 32.53125, 35.94140625, 39.3515625, 42.76171875, 46.171875, 49.58203125, 52.9921875, 56.40234375, 59.8125, 63.22265625, 66.6328125, 70.04296875, 73.453125, 76.86328125, 80.2734375, 83.68359375, 87.09375, 90.50390625, 93.9140625, 97.32421875, 100.734375, 104.14453125, 107.5546875, 110.96484375, 114.375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 17.0, 92.0, 297.0, 361.0, 182.0, 50.0, 12.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-264.642578125, -258.2316589355469, -251.8207244873047, -245.40980529785156, -238.99887084960938, -232.58795166015625, -226.17703247070312, -219.76609802246094, -213.35516357421875, -206.94424438476562, -200.53330993652344, -194.1223907470703, -187.71145629882812, -181.300537109375, -174.88961791992188, -168.4786834716797, -162.06776428222656, -155.65684509277344, -149.24591064453125, -142.83499145507812, -136.42405700683594, -130.0131378173828, -123.60221099853516, -117.1912841796875, -110.78035736083984, -104.36943054199219, -97.95850372314453, -91.54757690429688, -85.13665771484375, -78.72572326660156, -72.31480407714844, -65.90387725830078, -59.49293518066406, -53.082008361816406, -46.67108154296875, -40.26015853881836, -33.8492317199707, -27.438304901123047, -21.027381896972656, -14.616455078125, -8.205528259277344, -1.794602394104004, 4.616323471069336, 11.02724838256836, 17.438175201416016, 23.849102020263672, 30.260025024414062, 36.67095184326172, 43.081878662109375, 49.49280548095703, 55.90373229980469, 62.31465530395508, 68.7255859375, 75.13650512695312, 81.54743194580078, 87.95835876464844, 94.3692855834961, 100.78021240234375, 107.1911392211914, 113.60206604003906, 120.01298522949219, 126.42391967773438, 132.8348388671875, 139.24575805664062, 145.6566925048828]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 4.0, 5.0, 5.0, 1.0, 10.0, 12.0, 15.0, 17.0, 13.0, 14.0, 13.0, 16.0, 20.0, 17.0, 27.0, 24.0, 41.0, 39.0, 37.0, 41.0, 47.0, 41.0, 36.0, 38.0, 43.0, 59.0, 40.0, 36.0, 36.0, 24.0, 27.0, 30.0, 23.0, 19.0, 19.0, 20.0, 12.0, 16.0, 11.0, 9.0, 9.0, 11.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0], "bins": [-58.656368255615234, -56.8696174621582, -55.08287048339844, -53.296119689941406, -51.509368896484375, -49.722618103027344, -47.93586730957031, -46.14912033081055, -44.362369537353516, -42.575618743896484, -40.78887176513672, -39.00212097167969, -37.215370178222656, -35.428619384765625, -33.641868591308594, -31.855121612548828, -30.068370819091797, -28.281620025634766, -26.494871139526367, -24.70812225341797, -22.921371459960938, -21.134620666503906, -19.347871780395508, -17.56112289428711, -15.774372100830078, -13.987622261047363, -12.200872421264648, -10.414122581481934, -8.627372741699219, -6.840622901916504, -5.053873062133789, -3.267123222351074, -1.4803733825683594, 0.30637645721435547, 2.0931262969970703, 3.879876136779785, 5.6666259765625, 7.453375816345215, 9.24012565612793, 11.026875495910645, 12.81362533569336, 14.600375175476074, 16.38712501525879, 18.173873901367188, 19.96062469482422, 21.74737548828125, 23.53412437438965, 25.320873260498047, 27.107624053955078, 28.89437484741211, 30.681123733520508, 32.467872619628906, 34.25462341308594, 36.04137420654297, 37.828125, 39.614871978759766, 41.4016227722168, 43.18837356567383, 44.975120544433594, 46.761871337890625, 48.548622131347656, 50.33537292480469, 52.12212371826172, 53.908870697021484, 55.695621490478516]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 5.0, 8.0, 9.0, 15.0, 17.0, 20.0, 27.0, 22.0, 28.0, 32.0, 27.0, 40.0, 42.0, 40.0, 44.0, 36.0, 47.0, 59.0, 53.0, 42.0, 55.0, 44.0, 43.0, 47.0, 33.0, 27.0, 26.0, 19.0, 24.0, 23.0, 15.0, 9.0, 6.0, 8.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.921875, -14.5399169921875, -14.157958984375, -13.7760009765625, -13.39404296875, -13.0120849609375, -12.630126953125, -12.2481689453125, -11.8662109375, -11.4842529296875, -11.102294921875, -10.7203369140625, -10.33837890625, -9.9564208984375, -9.574462890625, -9.1925048828125, -8.810546875, -8.4285888671875, -8.046630859375, -7.6646728515625, -7.28271484375, -6.9007568359375, -6.518798828125, -6.1368408203125, -5.7548828125, -5.3729248046875, -4.990966796875, -4.6090087890625, -4.22705078125, -3.8450927734375, -3.463134765625, -3.0811767578125, -2.69921875, -2.3172607421875, -1.935302734375, -1.5533447265625, -1.17138671875, -0.7894287109375, -0.407470703125, -0.0255126953125, 0.3564453125, 0.7384033203125, 1.120361328125, 1.5023193359375, 1.88427734375, 2.2662353515625, 2.648193359375, 3.0301513671875, 3.412109375, 3.7940673828125, 4.176025390625, 4.5579833984375, 4.93994140625, 5.3218994140625, 5.703857421875, 6.0858154296875, 6.4677734375, 6.8497314453125, 7.231689453125, 7.6136474609375, 7.99560546875, 8.3775634765625, 8.759521484375, 9.1414794921875, 9.5234375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 6.0, 6.0, 11.0, 17.0, 28.0, 37.0, 47.0, 78.0, 152.0, 230.0, 367.0, 626.0, 1075.0, 1800.0, 3080.0, 5224.0, 8829.0, 15067.0, 25947.0, 47996.0, 92659.0, 219345.0, 359419.0, 126062.0, 61546.0, 33188.0, 18750.0, 10889.0, 6497.0, 3865.0, 2344.0, 1295.0, 783.0, 452.0, 299.0, 196.0, 117.0, 74.0, 39.0, 34.0, 22.0, 15.0, 11.0, 6.0, 5.0, 6.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.451171875, -2.37261962890625, -2.2940673828125, -2.21551513671875, -2.136962890625, -2.05841064453125, -1.9798583984375, -1.90130615234375, -1.82275390625, -1.74420166015625, -1.6656494140625, -1.58709716796875, -1.508544921875, -1.42999267578125, -1.3514404296875, -1.27288818359375, -1.1943359375, -1.11578369140625, -1.0372314453125, -0.95867919921875, -0.880126953125, -0.80157470703125, -0.7230224609375, -0.64447021484375, -0.56591796875, -0.48736572265625, -0.4088134765625, -0.33026123046875, -0.251708984375, -0.17315673828125, -0.0946044921875, -0.01605224609375, 0.0625, 0.14105224609375, 0.2196044921875, 0.29815673828125, 0.376708984375, 0.45526123046875, 0.5338134765625, 0.61236572265625, 0.69091796875, 0.76947021484375, 0.8480224609375, 0.92657470703125, 1.005126953125, 1.08367919921875, 1.1622314453125, 1.24078369140625, 1.3193359375, 1.39788818359375, 1.4764404296875, 1.55499267578125, 1.633544921875, 1.71209716796875, 1.7906494140625, 1.86920166015625, 1.94775390625, 2.02630615234375, 2.1048583984375, 2.18341064453125, 2.261962890625, 2.34051513671875, 2.4190673828125, 2.49761962890625, 2.576171875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 8.0, 4.0, 2.0, 8.0, 8.0, 17.0, 12.0, 12.0, 18.0, 21.0, 28.0, 26.0, 35.0, 34.0, 37.0, 36.0, 41.0, 52.0, 43.0, 1070.0, 42.0, 38.0, 43.0, 46.0, 44.0, 29.0, 32.0, 31.0, 37.0, 22.0, 25.0, 23.0, 18.0, 22.0, 13.0, 16.0, 14.0, 5.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.82421875, -7.5992431640625, -7.374267578125, -7.1492919921875, -6.92431640625, -6.6993408203125, -6.474365234375, -6.2493896484375, -6.0244140625, -5.7994384765625, -5.574462890625, -5.3494873046875, -5.12451171875, -4.8995361328125, -4.674560546875, -4.4495849609375, -4.224609375, -3.9996337890625, -3.774658203125, -3.5496826171875, -3.32470703125, -3.0997314453125, -2.874755859375, -2.6497802734375, -2.4248046875, -2.1998291015625, -1.974853515625, -1.7498779296875, -1.52490234375, -1.2999267578125, -1.074951171875, -0.8499755859375, -0.625, -0.4000244140625, -0.175048828125, 0.0499267578125, 0.27490234375, 0.4998779296875, 0.724853515625, 0.9498291015625, 1.1748046875, 1.3997802734375, 1.624755859375, 1.8497314453125, 2.07470703125, 2.2996826171875, 2.524658203125, 2.7496337890625, 2.974609375, 3.1995849609375, 3.424560546875, 3.6495361328125, 3.87451171875, 4.0994873046875, 4.324462890625, 4.5494384765625, 4.7744140625, 4.9993896484375, 5.224365234375, 5.4493408203125, 5.67431640625, 5.8992919921875, 6.124267578125, 6.3492431640625, 6.57421875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 5.0, 5.0, 7.0, 13.0, 24.0, 30.0, 46.0, 85.0, 122.0, 156.0, 277.0, 418.0, 690.0, 1045.0, 1692.0, 2882.0, 4665.0, 7412.0, 11890.0, 19220.0, 31172.0, 52487.0, 96992.0, 232892.0, 1367142.0, 115264.0, 59856.0, 35290.0, 21378.0, 13049.0, 8009.0, 5019.0, 2975.0, 1908.0, 1121.0, 686.0, 399.0, 295.0, 170.0, 90.0, 87.0, 69.0, 37.0, 29.0, 13.0, 6.0, 3.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.09765625, -2.02801513671875, -1.9583740234375, -1.88873291015625, -1.819091796875, -1.74945068359375, -1.6798095703125, -1.61016845703125, -1.54052734375, -1.47088623046875, -1.4012451171875, -1.33160400390625, -1.261962890625, -1.19232177734375, -1.1226806640625, -1.05303955078125, -0.9833984375, -0.91375732421875, -0.8441162109375, -0.77447509765625, -0.704833984375, -0.63519287109375, -0.5655517578125, -0.49591064453125, -0.42626953125, -0.35662841796875, -0.2869873046875, -0.21734619140625, -0.147705078125, -0.07806396484375, -0.0084228515625, 0.06121826171875, 0.130859375, 0.20050048828125, 0.2701416015625, 0.33978271484375, 0.409423828125, 0.47906494140625, 0.5487060546875, 0.61834716796875, 0.68798828125, 0.75762939453125, 0.8272705078125, 0.89691162109375, 0.966552734375, 1.03619384765625, 1.1058349609375, 1.17547607421875, 1.2451171875, 1.31475830078125, 1.3843994140625, 1.45404052734375, 1.523681640625, 1.59332275390625, 1.6629638671875, 1.73260498046875, 1.80224609375, 1.87188720703125, 1.9415283203125, 2.01116943359375, 2.080810546875, 2.15045166015625, 2.2200927734375, 2.28973388671875, 2.359375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 7.0, 3.0, 3.0, 7.0, 6.0, 13.0, 13.0, 10.0, 13.0, 20.0, 25.0, 31.0, 45.0, 50.0, 68.0, 62.0, 70.0, 63.0, 70.0, 62.0, 42.0, 50.0, 61.0, 38.0, 30.0, 29.0, 23.0, 22.0, 15.0, 9.0, 9.0, 9.0, 8.0, 6.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012540817260742188, -0.0012154430150985718, -0.0011768043041229248, -0.0011381655931472778, -0.0010995268821716309, -0.0010608881711959839, -0.001022249460220337, -0.00098361074924469, -0.000944972038269043, -0.000906333327293396, -0.000867694616317749, -0.000829055905342102, -0.0007904171943664551, -0.0007517784833908081, -0.0007131397724151611, -0.0006745010614395142, -0.0006358623504638672, -0.0005972236394882202, -0.0005585849285125732, -0.0005199462175369263, -0.0004813075065612793, -0.0004426687955856323, -0.00040403008460998535, -0.0003653913736343384, -0.0003267526626586914, -0.00028811395168304443, -0.00024947524070739746, -0.0002108365297317505, -0.00017219781875610352, -0.00013355910778045654, -9.492039680480957e-05, -5.62816858291626e-05, -1.7642974853515625e-05, 2.0995736122131348e-05, 5.963444709777832e-05, 9.827315807342529e-05, 0.00013691186904907227, 0.00017555058002471924, 0.0002141892910003662, 0.0002528280019760132, 0.00029146671295166016, 0.00033010542392730713, 0.0003687441349029541, 0.0004073828458786011, 0.00044602155685424805, 0.000484660267829895, 0.000523298978805542, 0.000561937689781189, 0.0006005764007568359, 0.0006392151117324829, 0.0006778538227081299, 0.0007164925336837769, 0.0007551312446594238, 0.0007937699556350708, 0.0008324086666107178, 0.0008710473775863647, 0.0009096860885620117, 0.0009483247995376587, 0.0009869635105133057, 0.0010256022214889526, 0.0010642409324645996, 0.0011028796434402466, 0.0011415183544158936, 0.0011801570653915405, 0.0012187957763671875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 6.0, 5.0, 4.0, 13.0, 8.0, 12.0, 20.0, 26.0, 22.0, 41.0, 41.0, 47.0, 92.0, 158.0, 308.0, 962.0, 221296.0, 823215.0, 1297.0, 383.0, 177.0, 120.0, 69.0, 55.0, 39.0, 31.0, 32.0, 20.0, 16.0, 5.0, 9.0, 9.0, 6.0, 6.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0270538330078125, -0.0261232852935791, -0.025192737579345703, -0.024262189865112305, -0.023331642150878906, -0.022401094436645508, -0.02147054672241211, -0.02053999900817871, -0.019609451293945312, -0.018678903579711914, -0.017748355865478516, -0.016817808151245117, -0.01588726043701172, -0.01495671272277832, -0.014026165008544922, -0.013095617294311523, -0.012165069580078125, -0.011234521865844727, -0.010303974151611328, -0.00937342643737793, -0.008442878723144531, -0.007512331008911133, -0.006581783294677734, -0.005651235580444336, -0.0047206878662109375, -0.003790140151977539, -0.0028595924377441406, -0.0019290447235107422, -0.0009984970092773438, -6.794929504394531e-05, 0.0008625984191894531, 0.0017931461334228516, 0.00272369384765625, 0.0036542415618896484, 0.004584789276123047, 0.005515336990356445, 0.006445884704589844, 0.007376432418823242, 0.00830698013305664, 0.009237527847290039, 0.010168075561523438, 0.011098623275756836, 0.012029170989990234, 0.012959718704223633, 0.013890266418457031, 0.01482081413269043, 0.015751361846923828, 0.016681909561157227, 0.017612457275390625, 0.018543004989624023, 0.019473552703857422, 0.02040410041809082, 0.02133464813232422, 0.022265195846557617, 0.023195743560791016, 0.024126291275024414, 0.025056838989257812, 0.02598738670349121, 0.02691793441772461, 0.027848482131958008, 0.028779029846191406, 0.029709577560424805, 0.030640125274658203, 0.0315706729888916, 0.032501220703125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 16.0, 26.0, 35.0, 87.0, 132.0, 177.0, 188.0, 146.0, 95.0, 56.0, 22.0, 12.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004642988496925682, -0.0004353416443336755, -0.0004063844389747828, -0.00037742723361589015, -0.00034847002825699747, -0.00031951285200193524, -0.00029055564664304256, -0.0002615984412841499, -0.00023264122137334198, -0.0002036840160144493, -0.00017472681065555662, -0.00014576961984857917, -0.00011681240721372887, -8.785520913079381e-05, -5.889800377190113e-05, -2.994079841300845e-05, -9.835930541157722e-07, 2.7973610485787503e-05, 5.693081402569078e-05, 8.588801574660465e-05, 0.00011484522110549733, 0.0001438024191884324, 0.00017275962454732507, 0.00020171682990621775, 0.00023067403526511043, 0.0002596312260720879, 0.00028858843143098056, 0.00031754563678987324, 0.0003465028421487659, 0.0003754600475076586, 0.0004044172528665513, 0.00043337445822544396, 0.0004623316344805062, 0.0004912888398393989, 0.0005202460451982915, 0.0005492032505571842, 0.0005781604559160769, 0.0006071176612749696, 0.0006360748666338623, 0.0006650320719927549, 0.0006939892773516476, 0.0007229464827105403, 0.000751903688069433, 0.0007808608934283257, 0.0008098180987872183, 0.000838775304146111, 0.0008677325095050037, 0.0008966897148638964, 0.0009256468620151281, 0.0009546040673740208, 0.0009835612727329135, 0.0010125184198841453, 0.0010414756834506989, 0.0010704328306019306, 0.0010993900941684842, 0.001128347241319716, 0.0011573045048862696, 0.0011862616520375013, 0.001215218915604055, 0.0012441760627552867, 0.0012731333263218403, 0.001302090473473072, 0.0013310477370396256, 0.0013600048841908574, 0.001388962147757411]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 3.0, 7.0, 3.0, 12.0, 10.0, 9.0, 12.0, 12.0, 11.0, 19.0, 16.0, 27.0, 20.0, 22.0, 25.0, 27.0, 36.0, 38.0, 30.0, 39.0, 36.0, 34.0, 36.0, 29.0, 46.0, 45.0, 26.0, 42.0, 30.0, 35.0, 32.0, 28.0, 25.0, 30.0, 24.0, 21.0, 11.0, 14.0, 15.0, 14.0, 12.0, 5.0, 9.0, 5.0, 4.0, 3.0, 0.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.000533759593963623, -0.0005171764642000198, -0.0005005933344364166, -0.0004840102046728134, -0.0004674270749092102, -0.000450843945145607, -0.0004342608153820038, -0.0004176776856184006, -0.00040109455585479736, -0.00038451142609119415, -0.00036792829632759094, -0.00035134516656398773, -0.0003347620368003845, -0.0003181789070367813, -0.0003015957772731781, -0.0002850126475095749, -0.0002684295177459717, -0.00025184638798236847, -0.00023526325821876526, -0.00021868012845516205, -0.00020209699869155884, -0.00018551386892795563, -0.00016893073916435242, -0.0001523476094007492, -0.000135764479637146, -0.00011918134987354279, -0.00010259822010993958, -8.601509034633636e-05, -6.943196058273315e-05, -5.2848830819129944e-05, -3.6265701055526733e-05, -1.9682571291923523e-05, -3.0994415283203125e-06, 1.3483688235282898e-05, 3.006681799888611e-05, 4.664994776248932e-05, 6.323307752609253e-05, 7.981620728969574e-05, 9.639933705329895e-05, 0.00011298246681690216, 0.00012956559658050537, 0.00014614872634410858, 0.0001627318561077118, 0.000179314985871315, 0.0001958981156349182, 0.00021248124539852142, 0.00022906437516212463, 0.00024564750492572784, 0.00026223063468933105, 0.00027881376445293427, 0.0002953968942165375, 0.0003119800239801407, 0.0003285631537437439, 0.0003451462835073471, 0.0003617294132709503, 0.00037831254303455353, 0.00039489567279815674, 0.00041147880256175995, 0.00042806193232536316, 0.00044464506208896637, 0.0004612281918525696, 0.0004778113216161728, 0.000494394451379776, 0.0005109775811433792, 0.0005275607109069824]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 5.0, 8.0, 9.0, 15.0, 17.0, 20.0, 27.0, 22.0, 28.0, 32.0, 27.0, 40.0, 42.0, 40.0, 44.0, 36.0, 47.0, 59.0, 53.0, 42.0, 55.0, 44.0, 43.0, 47.0, 33.0, 27.0, 26.0, 19.0, 24.0, 23.0, 15.0, 9.0, 6.0, 8.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.921875, -14.5399169921875, -14.157958984375, -13.7760009765625, -13.39404296875, -13.0120849609375, -12.630126953125, -12.2481689453125, -11.8662109375, -11.4842529296875, -11.102294921875, -10.7203369140625, -10.33837890625, -9.9564208984375, -9.574462890625, -9.1925048828125, -8.810546875, -8.4285888671875, -8.046630859375, -7.6646728515625, -7.28271484375, -6.9007568359375, -6.518798828125, -6.1368408203125, -5.7548828125, -5.3729248046875, -4.990966796875, -4.6090087890625, -4.22705078125, -3.8450927734375, -3.463134765625, -3.0811767578125, -2.69921875, -2.3172607421875, -1.935302734375, -1.5533447265625, -1.17138671875, -0.7894287109375, -0.407470703125, -0.0255126953125, 0.3564453125, 0.7384033203125, 1.120361328125, 1.5023193359375, 1.88427734375, 2.2662353515625, 2.648193359375, 3.0301513671875, 3.412109375, 3.7940673828125, 4.176025390625, 4.5579833984375, 4.93994140625, 5.3218994140625, 5.703857421875, 6.0858154296875, 6.4677734375, 6.8497314453125, 7.231689453125, 7.6136474609375, 7.99560546875, 8.3775634765625, 8.759521484375, 9.1414794921875, 9.5234375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 6.0, 10.0, 10.0, 26.0, 23.0, 51.0, 55.0, 75.0, 117.0, 222.0, 365.0, 762.0, 1853.0, 6024.0, 25170.0, 178454.0, 720600.0, 91646.0, 16040.0, 4142.0, 1392.0, 605.0, 350.0, 194.0, 111.0, 79.0, 41.0, 47.0, 26.0, 16.0, 15.0, 5.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.5, -14.11181640625, -13.7236328125, -13.33544921875, -12.947265625, -12.55908203125, -12.1708984375, -11.78271484375, -11.39453125, -11.00634765625, -10.6181640625, -10.22998046875, -9.841796875, -9.45361328125, -9.0654296875, -8.67724609375, -8.2890625, -7.90087890625, -7.5126953125, -7.12451171875, -6.736328125, -6.34814453125, -5.9599609375, -5.57177734375, -5.18359375, -4.79541015625, -4.4072265625, -4.01904296875, -3.630859375, -3.24267578125, -2.8544921875, -2.46630859375, -2.078125, -1.68994140625, -1.3017578125, -0.91357421875, -0.525390625, -0.13720703125, 0.2509765625, 0.63916015625, 1.02734375, 1.41552734375, 1.8037109375, 2.19189453125, 2.580078125, 2.96826171875, 3.3564453125, 3.74462890625, 4.1328125, 4.52099609375, 4.9091796875, 5.29736328125, 5.685546875, 6.07373046875, 6.4619140625, 6.85009765625, 7.23828125, 7.62646484375, 8.0146484375, 8.40283203125, 8.791015625, 9.17919921875, 9.5673828125, 9.95556640625, 10.34375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 6.0, 3.0, 4.0, 4.0, 9.0, 7.0, 8.0, 10.0, 12.0, 9.0, 19.0, 17.0, 24.0, 24.0, 20.0, 32.0, 37.0, 34.0, 33.0, 38.0, 49.0, 47.0, 199.0, 1837.0, 106.0, 45.0, 53.0, 39.0, 39.0, 44.0, 26.0, 27.0, 25.0, 24.0, 30.0, 14.0, 15.0, 21.0, 12.0, 8.0, 10.0, 12.0, 7.0, 4.0, 2.0, 6.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.921875, -28.935791015625, -27.94970703125, -26.963623046875, -25.9775390625, -24.991455078125, -24.00537109375, -23.019287109375, -22.033203125, -21.047119140625, -20.06103515625, -19.074951171875, -18.0888671875, -17.102783203125, -16.11669921875, -15.130615234375, -14.14453125, -13.158447265625, -12.17236328125, -11.186279296875, -10.2001953125, -9.214111328125, -8.22802734375, -7.241943359375, -6.255859375, -5.269775390625, -4.28369140625, -3.297607421875, -2.3115234375, -1.325439453125, -0.33935546875, 0.646728515625, 1.6328125, 2.618896484375, 3.60498046875, 4.591064453125, 5.5771484375, 6.563232421875, 7.54931640625, 8.535400390625, 9.521484375, 10.507568359375, 11.49365234375, 12.479736328125, 13.4658203125, 14.451904296875, 15.43798828125, 16.424072265625, 17.41015625, 18.396240234375, 19.38232421875, 20.368408203125, 21.3544921875, 22.340576171875, 23.32666015625, 24.312744140625, 25.298828125, 26.284912109375, 27.27099609375, 28.257080078125, 29.2431640625, 30.229248046875, 31.21533203125, 32.201416015625, 33.1875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 1.0, 4.0, 7.0, 5.0, 7.0, 11.0, 13.0, 8.0, 15.0, 23.0, 22.0, 25.0, 44.0, 42.0, 69.0, 72.0, 114.0, 158.0, 195.0, 317.0, 558.0, 2431.0, 2960596.0, 177900.0, 1632.0, 451.0, 271.0, 172.0, 105.0, 109.0, 71.0, 52.0, 46.0, 41.0, 22.0, 12.0, 21.0, 14.0, 13.0, 9.0, 8.0, 5.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-73.5625, -71.255859375, -68.94921875, -66.642578125, -64.3359375, -62.029296875, -59.72265625, -57.416015625, -55.109375, -52.802734375, -50.49609375, -48.189453125, -45.8828125, -43.576171875, -41.26953125, -38.962890625, -36.65625, -34.349609375, -32.04296875, -29.736328125, -27.4296875, -25.123046875, -22.81640625, -20.509765625, -18.203125, -15.896484375, -13.58984375, -11.283203125, -8.9765625, -6.669921875, -4.36328125, -2.056640625, 0.25, 2.556640625, 4.86328125, 7.169921875, 9.4765625, 11.783203125, 14.08984375, 16.396484375, 18.703125, 21.009765625, 23.31640625, 25.623046875, 27.9296875, 30.236328125, 32.54296875, 34.849609375, 37.15625, 39.462890625, 41.76953125, 44.076171875, 46.3828125, 48.689453125, 50.99609375, 53.302734375, 55.609375, 57.916015625, 60.22265625, 62.529296875, 64.8359375, 67.142578125, 69.44921875, 71.755859375, 74.0625]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 577.0, 430.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-312.56585693359375, -306.5470275878906, -300.5282287597656, -294.5093994140625, -288.4906005859375, -282.4717712402344, -276.45294189453125, -270.43414306640625, -264.4153137207031, -258.396484375, -252.377685546875, -246.35885620117188, -240.3400421142578, -234.32122802734375, -228.30239868164062, -222.28358459472656, -216.2647705078125, -210.24595642089844, -204.22714233398438, -198.20831298828125, -192.1894989013672, -186.17068481445312, -180.15185546875, -174.13304138183594, -168.11422729492188, -162.0954132080078, -156.07659912109375, -150.05776977539062, -144.03895568847656, -138.0201416015625, -132.00131225585938, -125.98249816894531, -119.96369171142578, -113.94486999511719, -107.92605590820312, -101.90724182128906, -95.88842010498047, -89.86959838867188, -83.85078430175781, -77.83197021484375, -71.81314849853516, -65.79432678222656, -59.7755126953125, -53.75669479370117, -47.737876892089844, -41.719058990478516, -35.70024108886719, -29.68142318725586, -23.66260528564453, -17.643787384033203, -11.624969482421875, -5.606151580810547, 0.41266632080078125, 6.431484222412109, 12.450302124023438, 18.469120025634766, 24.487937927246094, 30.506755828857422, 36.52557373046875, 42.54439163208008, 48.563209533691406, 54.582027435302734, 60.60084533691406, 66.61965942382812, 72.63848114013672]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 6.0, 11.0, 2.0, 19.0, 15.0, 15.0, 26.0, 24.0, 20.0, 14.0, 24.0, 20.0, 46.0, 37.0, 39.0, 38.0, 45.0, 48.0, 57.0, 35.0, 38.0, 29.0, 43.0, 43.0, 43.0, 32.0, 27.0, 31.0, 22.0, 20.0, 27.0, 16.0, 19.0, 11.0, 10.0, 12.0, 10.0, 9.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-97.09986114501953, -94.39815521240234, -91.69644927978516, -88.99474334716797, -86.29303741455078, -83.59132385253906, -80.88961791992188, -78.18791198730469, -75.4862060546875, -72.78450012207031, -70.08279418945312, -67.38108825683594, -64.67938232421875, -61.9776725769043, -59.27596664428711, -56.574256896972656, -53.872554779052734, -51.17084884643555, -48.46914291381836, -45.767433166503906, -43.06572723388672, -40.36402130126953, -37.662315368652344, -34.960609436035156, -32.25890350341797, -29.55719757080078, -26.85548973083496, -24.153783798217773, -21.452075958251953, -18.750370025634766, -16.048664093017578, -13.346956253051758, -10.645248413085938, -7.943541526794434, -5.241835117340088, -2.540128707885742, 0.16157817840576172, 2.8632850646972656, 5.564990997314453, 8.266698837280273, 10.968404769897461, 13.670111656188965, 16.37181854248047, 19.073524475097656, 21.775230407714844, 24.476938247680664, 27.17864418029785, 29.880352020263672, 32.58205795288086, 35.28376388549805, 37.985469818115234, 40.68717956542969, 43.388885498046875, 46.09059143066406, 48.79229736328125, 51.49400329589844, 54.195709228515625, 56.89741516113281, 59.59912109375, 62.30082702636719, 65.00253295898438, 67.70423889160156, 70.40594482421875, 73.10765838623047, 75.80936431884766]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 8.0, 11.0, 10.0, 14.0, 12.0, 33.0, 27.0, 25.0, 30.0, 30.0, 33.0, 36.0, 34.0, 48.0, 42.0, 42.0, 55.0, 44.0, 64.0, 40.0, 53.0, 38.0, 40.0, 36.0, 32.0, 29.0, 29.0, 17.0, 24.0, 15.0, 14.0, 8.0, 10.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.2734375, -14.88671875, -14.5, -14.11328125, -13.7265625, -13.33984375, -12.953125, -12.56640625, -12.1796875, -11.79296875, -11.40625, -11.01953125, -10.6328125, -10.24609375, -9.859375, -9.47265625, -9.0859375, -8.69921875, -8.3125, -7.92578125, -7.5390625, -7.15234375, -6.765625, -6.37890625, -5.9921875, -5.60546875, -5.21875, -4.83203125, -4.4453125, -4.05859375, -3.671875, -3.28515625, -2.8984375, -2.51171875, -2.125, -1.73828125, -1.3515625, -0.96484375, -0.578125, -0.19140625, 0.1953125, 0.58203125, 0.96875, 1.35546875, 1.7421875, 2.12890625, 2.515625, 2.90234375, 3.2890625, 3.67578125, 4.0625, 4.44921875, 4.8359375, 5.22265625, 5.609375, 5.99609375, 6.3828125, 6.76953125, 7.15625, 7.54296875, 7.9296875, 8.31640625, 8.703125, 9.08984375, 9.4765625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 4.0, 16.0, 13.0, 15.0, 23.0, 23.0, 21.0, 50.0, 39.0, 68.0, 63.0, 78.0, 139.0, 211.0, 346.0, 654.0, 2029.0, 12411.0, 424626.0, 3289429.0, 445738.0, 14468.0, 2075.0, 642.0, 339.0, 193.0, 106.0, 84.0, 81.0, 73.0, 41.0, 55.0, 31.0, 30.0, 14.0, 14.0, 11.0, 5.0, 4.0, 2.0, 5.0, 2.0, 3.0, 3.0], "bins": [-36.28125, -35.36279296875, -34.4443359375, -33.52587890625, -32.607421875, -31.68896484375, -30.7705078125, -29.85205078125, -28.93359375, -28.01513671875, -27.0966796875, -26.17822265625, -25.259765625, -24.34130859375, -23.4228515625, -22.50439453125, -21.5859375, -20.66748046875, -19.7490234375, -18.83056640625, -17.912109375, -16.99365234375, -16.0751953125, -15.15673828125, -14.23828125, -13.31982421875, -12.4013671875, -11.48291015625, -10.564453125, -9.64599609375, -8.7275390625, -7.80908203125, -6.890625, -5.97216796875, -5.0537109375, -4.13525390625, -3.216796875, -2.29833984375, -1.3798828125, -0.46142578125, 0.45703125, 1.37548828125, 2.2939453125, 3.21240234375, 4.130859375, 5.04931640625, 5.9677734375, 6.88623046875, 7.8046875, 8.72314453125, 9.6416015625, 10.56005859375, 11.478515625, 12.39697265625, 13.3154296875, 14.23388671875, 15.15234375, 16.07080078125, 16.9892578125, 17.90771484375, 18.826171875, 19.74462890625, 20.6630859375, 21.58154296875, 22.5]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 12.0, 17.0, 20.0, 28.0, 36.0, 52.0, 80.0, 106.0, 132.0, 265.0, 373.0, 544.0, 669.0, 582.0, 393.0, 259.0, 173.0, 98.0, 71.0, 47.0, 45.0, 26.0, 10.0, 9.0, 10.0, 5.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.71875, -15.97607421875, -15.2333984375, -14.49072265625, -13.748046875, -13.00537109375, -12.2626953125, -11.52001953125, -10.77734375, -10.03466796875, -9.2919921875, -8.54931640625, -7.806640625, -7.06396484375, -6.3212890625, -5.57861328125, -4.8359375, -4.09326171875, -3.3505859375, -2.60791015625, -1.865234375, -1.12255859375, -0.3798828125, 0.36279296875, 1.10546875, 1.84814453125, 2.5908203125, 3.33349609375, 4.076171875, 4.81884765625, 5.5615234375, 6.30419921875, 7.046875, 7.78955078125, 8.5322265625, 9.27490234375, 10.017578125, 10.76025390625, 11.5029296875, 12.24560546875, 12.98828125, 13.73095703125, 14.4736328125, 15.21630859375, 15.958984375, 16.70166015625, 17.4443359375, 18.18701171875, 18.9296875, 19.67236328125, 20.4150390625, 21.15771484375, 21.900390625, 22.64306640625, 23.3857421875, 24.12841796875, 24.87109375, 25.61376953125, 26.3564453125, 27.09912109375, 27.841796875, 28.58447265625, 29.3271484375, 30.06982421875, 30.8125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 7.0, 15.0, 15.0, 24.0, 32.0, 42.0, 77.0, 86.0, 112.0, 145.0, 210.0, 313.0, 509.0, 1541.0, 2106731.0, 2081325.0, 1550.0, 461.0, 312.0, 180.0, 133.0, 135.0, 87.0, 75.0, 43.0, 36.0, 30.0, 21.0, 12.0, 11.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-157.375, -153.6279296875, -149.880859375, -146.1337890625, -142.38671875, -138.6396484375, -134.892578125, -131.1455078125, -127.3984375, -123.6513671875, -119.904296875, -116.1572265625, -112.41015625, -108.6630859375, -104.916015625, -101.1689453125, -97.421875, -93.6748046875, -89.927734375, -86.1806640625, -82.43359375, -78.6865234375, -74.939453125, -71.1923828125, -67.4453125, -63.6982421875, -59.951171875, -56.2041015625, -52.45703125, -48.7099609375, -44.962890625, -41.2158203125, -37.46875, -33.7216796875, -29.974609375, -26.2275390625, -22.48046875, -18.7333984375, -14.986328125, -11.2392578125, -7.4921875, -3.7451171875, 0.001953125, 3.7490234375, 7.49609375, 11.2431640625, 14.990234375, 18.7373046875, 22.484375, 26.2314453125, 29.978515625, 33.7255859375, 37.47265625, 41.2197265625, 44.966796875, 48.7138671875, 52.4609375, 56.2080078125, 59.955078125, 63.7021484375, 67.44921875, 71.1962890625, 74.943359375, 78.6904296875, 82.4375]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 338.0, 651.0, 26.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-705.5086059570312, -688.3802490234375, -671.2518920898438, -654.12353515625, -636.9951782226562, -619.8668212890625, -602.738525390625, -585.6101684570312, -568.4818115234375, -551.3534545898438, -534.22509765625, -517.0967407226562, -499.9684143066406, -482.8400573730469, -465.7117004394531, -448.5833435058594, -431.4549865722656, -414.3266296386719, -397.1982727050781, -380.0699462890625, -362.94158935546875, -345.813232421875, -328.68487548828125, -311.5565185546875, -294.42816162109375, -277.2998046875, -260.17144775390625, -243.04310607910156, -225.91476440429688, -208.78640747070312, -191.65805053710938, -174.52969360351562, -157.40139770507812, -140.27304077148438, -123.14469909667969, -106.01634216308594, -88.88799285888672, -71.7596435546875, -54.63128662109375, -37.50293731689453, -20.374588012695312, -3.246236801147461, 13.88211441040039, 31.010467529296875, 48.138816833496094, 65.26716613769531, 82.39552307128906, 99.52387237548828, 116.6522216796875, 133.78057861328125, 150.90892028808594, 168.0372772216797, 185.16561889648438, 202.29397583007812, 219.42233276367188, 236.55068969726562, 253.6790313720703, 270.807373046875, 287.93572998046875, 305.0640869140625, 322.19244384765625, 339.32080078125, 356.44915771484375, 373.5774841308594, 390.7058410644531]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 7.0, 5.0, 12.0, 10.0, 17.0, 9.0, 17.0, 25.0, 25.0, 26.0, 24.0, 36.0, 33.0, 37.0, 35.0, 40.0, 39.0, 45.0, 39.0, 49.0, 51.0, 32.0, 43.0, 33.0, 47.0, 28.0, 40.0, 33.0, 22.0, 25.0, 25.0, 16.0, 18.0, 7.0, 3.0, 12.0, 4.0, 3.0, 6.0, 3.0, 6.0, 5.0, 2.0, 1.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.68462371826172, -53.78672409057617, -51.88882064819336, -49.99092102050781, -48.093021392822266, -46.19512176513672, -44.297218322753906, -42.39931869506836, -40.50141906738281, -38.603519439697266, -36.70561599731445, -34.807716369628906, -32.90981674194336, -31.01191520690918, -29.114013671875, -27.216114044189453, -25.31821060180664, -23.42030906677246, -21.522409439086914, -19.624507904052734, -17.726608276367188, -15.828706741333008, -13.930805206298828, -12.032904624938965, -10.135004043579102, -8.237103462219238, -6.339202404022217, -4.441301345825195, -2.543400764465332, -0.6455001831054688, 1.252401351928711, 3.150301933288574, 5.0482025146484375, 6.946103096008301, 8.844003677368164, 10.741905212402344, 12.639805793762207, 14.53770637512207, 16.43560791015625, 18.333507537841797, 20.231409072875977, 22.129310607910156, 24.027210235595703, 25.925111770629883, 27.823013305664062, 29.72091293334961, 31.61881446838379, 33.51671600341797, 35.414615631103516, 37.31251525878906, 39.210418701171875, 41.10831832885742, 43.00621795654297, 44.90412139892578, 46.80202102661133, 48.699920654296875, 50.59782409667969, 52.495723724365234, 54.39362716674805, 56.291526794433594, 58.18942642211914, 60.08732604980469, 61.9852294921875, 63.88312911987305, 65.7810287475586]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 9.0, 13.0, 13.0, 13.0, 16.0, 16.0, 31.0, 20.0, 23.0, 31.0, 39.0, 41.0, 31.0, 38.0, 42.0, 37.0, 32.0, 45.0, 50.0, 52.0, 39.0, 44.0, 39.0, 45.0, 27.0, 32.0, 27.0, 27.0, 30.0, 10.0, 16.0, 15.0, 10.0, 4.0, 8.0, 9.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.4921875, -12.146240234375, -11.80029296875, -11.454345703125, -11.1083984375, -10.762451171875, -10.41650390625, -10.070556640625, -9.724609375, -9.378662109375, -9.03271484375, -8.686767578125, -8.3408203125, -7.994873046875, -7.64892578125, -7.302978515625, -6.95703125, -6.611083984375, -6.26513671875, -5.919189453125, -5.5732421875, -5.227294921875, -4.88134765625, -4.535400390625, -4.189453125, -3.843505859375, -3.49755859375, -3.151611328125, -2.8056640625, -2.459716796875, -2.11376953125, -1.767822265625, -1.421875, -1.075927734375, -0.72998046875, -0.384033203125, -0.0380859375, 0.307861328125, 0.65380859375, 0.999755859375, 1.345703125, 1.691650390625, 2.03759765625, 2.383544921875, 2.7294921875, 3.075439453125, 3.42138671875, 3.767333984375, 4.11328125, 4.459228515625, 4.80517578125, 5.151123046875, 5.4970703125, 5.843017578125, 6.18896484375, 6.534912109375, 6.880859375, 7.226806640625, 7.57275390625, 7.918701171875, 8.2646484375, 8.610595703125, 8.95654296875, 9.302490234375, 9.6484375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 10.0, 10.0, 16.0, 20.0, 18.0, 37.0, 87.0, 113.0, 168.0, 246.0, 363.0, 586.0, 919.0, 1582.0, 2383.0, 3963.0, 6476.0, 10569.0, 18068.0, 31209.0, 56384.0, 108146.0, 269431.0, 288666.0, 111974.0, 58285.0, 31926.0, 18613.0, 10968.0, 6584.0, 4088.0, 2444.0, 1552.0, 940.0, 611.0, 443.0, 238.0, 120.0, 99.0, 78.0, 54.0, 28.0, 13.0, 13.0, 9.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.45703125, -2.38262939453125, -2.3082275390625, -2.23382568359375, -2.159423828125, -2.08502197265625, -2.0106201171875, -1.93621826171875, -1.86181640625, -1.78741455078125, -1.7130126953125, -1.63861083984375, -1.564208984375, -1.48980712890625, -1.4154052734375, -1.34100341796875, -1.2666015625, -1.19219970703125, -1.1177978515625, -1.04339599609375, -0.968994140625, -0.89459228515625, -0.8201904296875, -0.74578857421875, -0.67138671875, -0.59698486328125, -0.5225830078125, -0.44818115234375, -0.373779296875, -0.29937744140625, -0.2249755859375, -0.15057373046875, -0.076171875, -0.00177001953125, 0.0726318359375, 0.14703369140625, 0.221435546875, 0.29583740234375, 0.3702392578125, 0.44464111328125, 0.51904296875, 0.59344482421875, 0.6678466796875, 0.74224853515625, 0.816650390625, 0.89105224609375, 0.9654541015625, 1.03985595703125, 1.1142578125, 1.18865966796875, 1.2630615234375, 1.33746337890625, 1.411865234375, 1.48626708984375, 1.5606689453125, 1.63507080078125, 1.70947265625, 1.78387451171875, 1.8582763671875, 1.93267822265625, 2.007080078125, 2.08148193359375, 2.1558837890625, 2.23028564453125, 2.3046875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 5.0, 6.0, 7.0, 7.0, 15.0, 10.0, 21.0, 15.0, 20.0, 27.0, 29.0, 31.0, 31.0, 28.0, 27.0, 36.0, 29.0, 22.0, 26.0, 32.0, 29.0, 1068.0, 29.0, 42.0, 45.0, 38.0, 32.0, 28.0, 27.0, 30.0, 29.0, 33.0, 24.0, 14.0, 20.0, 23.0, 25.0, 9.0, 9.0, 8.0, 7.0, 4.0, 5.0, 3.0, 5.0, 2.0, 1.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.6875, -5.50244140625, -5.3173828125, -5.13232421875, -4.947265625, -4.76220703125, -4.5771484375, -4.39208984375, -4.20703125, -4.02197265625, -3.8369140625, -3.65185546875, -3.466796875, -3.28173828125, -3.0966796875, -2.91162109375, -2.7265625, -2.54150390625, -2.3564453125, -2.17138671875, -1.986328125, -1.80126953125, -1.6162109375, -1.43115234375, -1.24609375, -1.06103515625, -0.8759765625, -0.69091796875, -0.505859375, -0.32080078125, -0.1357421875, 0.04931640625, 0.234375, 0.41943359375, 0.6044921875, 0.78955078125, 0.974609375, 1.15966796875, 1.3447265625, 1.52978515625, 1.71484375, 1.89990234375, 2.0849609375, 2.27001953125, 2.455078125, 2.64013671875, 2.8251953125, 3.01025390625, 3.1953125, 3.38037109375, 3.5654296875, 3.75048828125, 3.935546875, 4.12060546875, 4.3056640625, 4.49072265625, 4.67578125, 4.86083984375, 5.0458984375, 5.23095703125, 5.416015625, 5.60107421875, 5.7861328125, 5.97119140625, 6.15625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 8.0, 12.0, 26.0, 29.0, 31.0, 55.0, 63.0, 119.0, 169.0, 228.0, 348.0, 516.0, 812.0, 1187.0, 1634.0, 2567.0, 3834.0, 5782.0, 9039.0, 13497.0, 20914.0, 31506.0, 48691.0, 77271.0, 144897.0, 1360276.0, 149579.0, 79068.0, 49606.0, 32399.0, 21341.0, 14107.0, 9112.0, 6103.0, 4000.0, 2684.0, 1781.0, 1221.0, 853.0, 545.0, 398.0, 268.0, 159.0, 104.0, 92.0, 64.0, 36.0, 32.0, 17.0, 17.0, 11.0, 10.0, 4.0, 6.0, 3.0, 2.0], "bins": [-1.87890625, -1.8228607177734375, -1.766815185546875, -1.7107696533203125, -1.65472412109375, -1.5986785888671875, -1.542633056640625, -1.4865875244140625, -1.4305419921875, -1.3744964599609375, -1.318450927734375, -1.2624053955078125, -1.20635986328125, -1.1503143310546875, -1.094268798828125, -1.0382232666015625, -0.982177734375, -0.9261322021484375, -0.870086669921875, -0.8140411376953125, -0.75799560546875, -0.7019500732421875, -0.645904541015625, -0.5898590087890625, -0.5338134765625, -0.4777679443359375, -0.421722412109375, -0.3656768798828125, -0.30963134765625, -0.2535858154296875, -0.197540283203125, -0.1414947509765625, -0.08544921875, -0.0294036865234375, 0.026641845703125, 0.0826873779296875, 0.13873291015625, 0.1947784423828125, 0.250823974609375, 0.3068695068359375, 0.3629150390625, 0.4189605712890625, 0.475006103515625, 0.5310516357421875, 0.58709716796875, 0.6431427001953125, 0.699188232421875, 0.7552337646484375, 0.811279296875, 0.8673248291015625, 0.923370361328125, 0.9794158935546875, 1.03546142578125, 1.0915069580078125, 1.147552490234375, 1.2035980224609375, 1.2596435546875, 1.3156890869140625, 1.371734619140625, 1.4277801513671875, 1.48382568359375, 1.5398712158203125, 1.595916748046875, 1.6519622802734375, 1.7080078125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 8.0, 1.0, 3.0, 7.0, 7.0, 6.0, 5.0, 10.0, 22.0, 24.0, 26.0, 27.0, 23.0, 44.0, 60.0, 84.0, 93.0, 93.0, 91.0, 81.0, 70.0, 40.0, 45.0, 24.0, 19.0, 19.0, 20.0, 8.0, 13.0, 3.0, 8.0, 8.0, 5.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012559890747070312, -0.001208961009979248, -0.0011619329452514648, -0.0011149048805236816, -0.0010678768157958984, -0.0010208487510681152, -0.000973820686340332, -0.0009267926216125488, -0.0008797645568847656, -0.0008327364921569824, -0.0007857084274291992, -0.000738680362701416, -0.0006916522979736328, -0.0006446242332458496, -0.0005975961685180664, -0.0005505681037902832, -0.0005035400390625, -0.0004565119743347168, -0.0004094839096069336, -0.0003624558448791504, -0.0003154277801513672, -0.000268399715423584, -0.00022137165069580078, -0.00017434358596801758, -0.00012731552124023438, -8.028745651245117e-05, -3.325939178466797e-05, 1.3768672943115234e-05, 6.079673767089844e-05, 0.00010782480239868164, 0.00015485286712646484, 0.00020188093185424805, 0.00024890899658203125, 0.00029593706130981445, 0.00034296512603759766, 0.00038999319076538086, 0.00043702125549316406, 0.00048404932022094727, 0.0005310773849487305, 0.0005781054496765137, 0.0006251335144042969, 0.0006721615791320801, 0.0007191896438598633, 0.0007662177085876465, 0.0008132457733154297, 0.0008602738380432129, 0.0009073019027709961, 0.0009543299674987793, 0.0010013580322265625, 0.0010483860969543457, 0.001095414161682129, 0.0011424422264099121, 0.0011894702911376953, 0.0012364983558654785, 0.0012835264205932617, 0.001330554485321045, 0.0013775825500488281, 0.0014246106147766113, 0.0014716386795043945, 0.0015186667442321777, 0.001565694808959961, 0.0016127228736877441, 0.0016597509384155273, 0.0017067790031433105, 0.0017538070678710938]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 5.0, 7.0, 6.0, 8.0, 13.0, 15.0, 9.0, 21.0, 33.0, 29.0, 42.0, 73.0, 108.0, 226.0, 662.0, 15762.0, 1029120.0, 1533.0, 378.0, 158.0, 88.0, 70.0, 43.0, 35.0, 32.0, 23.0, 10.0, 7.0, 7.0, 5.0, 8.0, 5.0, 5.0, 6.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040985107421875, -0.03988528251647949, -0.038785457611083984, -0.03768563270568848, -0.03658580780029297, -0.03548598289489746, -0.03438615798950195, -0.033286333084106445, -0.03218650817871094, -0.03108668327331543, -0.029986858367919922, -0.028887033462524414, -0.027787208557128906, -0.0266873836517334, -0.02558755874633789, -0.024487733840942383, -0.023387908935546875, -0.022288084030151367, -0.02118825912475586, -0.02008843421936035, -0.018988609313964844, -0.017888784408569336, -0.016788959503173828, -0.01568913459777832, -0.014589309692382812, -0.013489484786987305, -0.012389659881591797, -0.011289834976196289, -0.010190010070800781, -0.009090185165405273, -0.007990360260009766, -0.006890535354614258, -0.00579071044921875, -0.004690885543823242, -0.0035910606384277344, -0.0024912357330322266, -0.0013914108276367188, -0.00029158592224121094, 0.0008082389831542969, 0.0019080638885498047, 0.0030078887939453125, 0.00410771369934082, 0.005207538604736328, 0.006307363510131836, 0.007407188415527344, 0.008507013320922852, 0.00960683822631836, 0.010706663131713867, 0.011806488037109375, 0.012906312942504883, 0.01400613784790039, 0.015105962753295898, 0.016205787658691406, 0.017305612564086914, 0.018405437469482422, 0.01950526237487793, 0.020605087280273438, 0.021704912185668945, 0.022804737091064453, 0.02390456199645996, 0.02500438690185547, 0.026104211807250977, 0.027204036712646484, 0.028303861618041992, 0.0294036865234375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 9.0, 18.0, 55.0, 110.0, 190.0, 238.0, 213.0, 118.0, 29.0, 18.0, 3.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001144057372584939, -0.0011051417095586658, -0.0010662261629477143, -0.001027310499921441, -0.0009883948368951678, -0.0009494792320765555, -0.0009105636272579432, -0.0008716479642316699, -0.0008327323594130576, -0.0007938167545944452, -0.000754901091568172, -0.0007159854867495596, -0.0006770698819309473, -0.000638154218904674, -0.0005992386140860617, -0.0005603230092674494, -0.0005214073462411761, -0.00048249171231873333, -0.00044357607839629054, -0.0004046604735776782, -0.0003657448396552354, -0.0003268292057327926, -0.0002879136009141803, -0.0002489979669917375, -0.0002100823330692947, -0.0001711666991468519, -0.00013225107977632433, -9.333545312983915e-05, -5.441982648335397e-05, -1.550419256091118e-05, 2.3411426809616387e-05, 6.232704618014395e-05, 0.00010124279651790857, 0.00014015843044035137, 0.00017907404981087893, 0.0002179896691814065, 0.0002569053031038493, 0.0002958209370262921, 0.0003347365418449044, 0.0003736521757673472, 0.00041256780968979, 0.0004514834436122328, 0.0004903990775346756, 0.0005293146823532879, 0.0005682302871719003, 0.0006071459501981735, 0.0006460615550167859, 0.0006849771598353982, 0.0007238928228616714, 0.0007628084276802838, 0.000801724090706557, 0.0008406396955251694, 0.0008795553585514426, 0.000918470963370055, 0.0009573865681886673, 0.0009963022312149405, 0.0010352178942412138, 0.001074133557267487, 0.0011130491038784385, 0.0011519647669047117, 0.001190880429930985, 0.0012297960929572582, 0.0012687116395682096, 0.001307627302594483, 0.0013465428492054343]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 6.0, 3.0, 7.0, 7.0, 13.0, 13.0, 14.0, 12.0, 13.0, 19.0, 16.0, 11.0, 22.0, 23.0, 33.0, 29.0, 37.0, 40.0, 41.0, 34.0, 39.0, 40.0, 45.0, 41.0, 45.0, 46.0, 49.0, 30.0, 29.0, 28.0, 24.0, 22.0, 28.0, 25.0, 15.0, 16.0, 14.0, 18.0, 11.0, 12.0, 11.0, 6.0, 5.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005917549133300781, -0.0005721943452954292, -0.0005526337772607803, -0.0005330732092261314, -0.0005135126411914825, -0.0004939520731568336, -0.00047439150512218475, -0.00045483093708753586, -0.00043527036905288696, -0.00041570980101823807, -0.00039614923298358917, -0.0003765886649489403, -0.0003570280969142914, -0.0003374675288796425, -0.0003179069608449936, -0.0002983463928103447, -0.0002787858247756958, -0.0002592252567410469, -0.000239664688706398, -0.00022010412067174911, -0.00020054355263710022, -0.00018098298460245132, -0.00016142241656780243, -0.00014186184853315353, -0.00012230128049850464, -0.00010274071246385574, -8.318014442920685e-05, -6.361957639455795e-05, -4.405900835990906e-05, -2.4498440325260162e-05, -4.937872290611267e-06, 1.4622695744037628e-05, 3.4183263778686523e-05, 5.374383181333542e-05, 7.330439984798431e-05, 9.286496788263321e-05, 0.0001124255359172821, 0.000131986103951931, 0.0001515466719865799, 0.0001711072400212288, 0.00019066780805587769, 0.00021022837609052658, 0.00022978894412517548, 0.00024934951215982437, 0.00026891008019447327, 0.00028847064822912216, 0.00030803121626377106, 0.00032759178429841995, 0.00034715235233306885, 0.00036671292036771774, 0.00038627348840236664, 0.00040583405643701553, 0.00042539462447166443, 0.0004449551925063133, 0.0004645157605409622, 0.0004840763285756111, 0.00050363689661026, 0.0005231974646449089, 0.0005427580326795578, 0.0005623186007142067, 0.0005818791687488556, 0.0006014397367835045, 0.0006210003048181534, 0.0006405608728528023, 0.0006601214408874512]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 9.0, 13.0, 13.0, 13.0, 16.0, 16.0, 31.0, 20.0, 23.0, 31.0, 39.0, 41.0, 31.0, 38.0, 42.0, 37.0, 32.0, 45.0, 50.0, 52.0, 39.0, 44.0, 39.0, 45.0, 27.0, 32.0, 27.0, 27.0, 30.0, 10.0, 16.0, 15.0, 10.0, 4.0, 8.0, 9.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.4921875, -12.146240234375, -11.80029296875, -11.454345703125, -11.1083984375, -10.762451171875, -10.41650390625, -10.070556640625, -9.724609375, -9.378662109375, -9.03271484375, -8.686767578125, -8.3408203125, -7.994873046875, -7.64892578125, -7.302978515625, -6.95703125, -6.611083984375, -6.26513671875, -5.919189453125, -5.5732421875, -5.227294921875, -4.88134765625, -4.535400390625, -4.189453125, -3.843505859375, -3.49755859375, -3.151611328125, -2.8056640625, -2.459716796875, -2.11376953125, -1.767822265625, -1.421875, -1.075927734375, -0.72998046875, -0.384033203125, -0.0380859375, 0.307861328125, 0.65380859375, 0.999755859375, 1.345703125, 1.691650390625, 2.03759765625, 2.383544921875, 2.7294921875, 3.075439453125, 3.42138671875, 3.767333984375, 4.11328125, 4.459228515625, 4.80517578125, 5.151123046875, 5.4970703125, 5.843017578125, 6.18896484375, 6.534912109375, 6.880859375, 7.226806640625, 7.57275390625, 7.918701171875, 8.2646484375, 8.610595703125, 8.95654296875, 9.302490234375, 9.6484375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 5.0, 10.0, 20.0, 6.0, 18.0, 36.0, 26.0, 63.0, 102.0, 216.0, 490.0, 1481.0, 4413.0, 16351.0, 66053.0, 385260.0, 467912.0, 79090.0, 18962.0, 5324.0, 1584.0, 582.0, 241.0, 105.0, 61.0, 42.0, 31.0, 21.0, 17.0, 11.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0], "bins": [-13.7421875, -13.42303466796875, -13.1038818359375, -12.78472900390625, -12.465576171875, -12.14642333984375, -11.8272705078125, -11.50811767578125, -11.18896484375, -10.86981201171875, -10.5506591796875, -10.23150634765625, -9.912353515625, -9.59320068359375, -9.2740478515625, -8.95489501953125, -8.6357421875, -8.31658935546875, -7.9974365234375, -7.67828369140625, -7.359130859375, -7.03997802734375, -6.7208251953125, -6.40167236328125, -6.08251953125, -5.76336669921875, -5.4442138671875, -5.12506103515625, -4.805908203125, -4.48675537109375, -4.1676025390625, -3.84844970703125, -3.529296875, -3.21014404296875, -2.8909912109375, -2.57183837890625, -2.252685546875, -1.93353271484375, -1.6143798828125, -1.29522705078125, -0.97607421875, -0.65692138671875, -0.3377685546875, -0.01861572265625, 0.300537109375, 0.61968994140625, 0.9388427734375, 1.25799560546875, 1.5771484375, 1.89630126953125, 2.2154541015625, 2.53460693359375, 2.853759765625, 3.17291259765625, 3.4920654296875, 3.81121826171875, 4.13037109375, 4.44952392578125, 4.7686767578125, 5.08782958984375, 5.406982421875, 5.72613525390625, 6.0452880859375, 6.36444091796875, 6.68359375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 10.0, 9.0, 9.0, 13.0, 26.0, 23.0, 26.0, 28.0, 38.0, 45.0, 48.0, 67.0, 60.0, 134.0, 1885.0, 137.0, 71.0, 70.0, 48.0, 40.0, 37.0, 40.0, 34.0, 35.0, 24.0, 24.0, 11.0, 20.0, 0.0, 9.0, 3.0, 4.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.90625, -42.515625, -41.125, -39.734375, -38.34375, -36.953125, -35.5625, -34.171875, -32.78125, -31.390625, -30.0, -28.609375, -27.21875, -25.828125, -24.4375, -23.046875, -21.65625, -20.265625, -18.875, -17.484375, -16.09375, -14.703125, -13.3125, -11.921875, -10.53125, -9.140625, -7.75, -6.359375, -4.96875, -3.578125, -2.1875, -0.796875, 0.59375, 1.984375, 3.375, 4.765625, 6.15625, 7.546875, 8.9375, 10.328125, 11.71875, 13.109375, 14.5, 15.890625, 17.28125, 18.671875, 20.0625, 21.453125, 22.84375, 24.234375, 25.625, 27.015625, 28.40625, 29.796875, 31.1875, 32.578125, 33.96875, 35.359375, 36.75, 38.140625, 39.53125, 40.921875, 42.3125, 43.703125, 45.09375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 5.0, 5.0, 7.0, 4.0, 19.0, 15.0, 30.0, 43.0, 53.0, 71.0, 91.0, 119.0, 187.0, 252.0, 405.0, 1277.0, 2772244.0, 368688.0, 1045.0, 350.0, 239.0, 164.0, 96.0, 82.0, 53.0, 36.0, 39.0, 20.0, 17.0, 11.0, 12.0, 7.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-118.6875, -115.19140625, -111.6953125, -108.19921875, -104.703125, -101.20703125, -97.7109375, -94.21484375, -90.71875, -87.22265625, -83.7265625, -80.23046875, -76.734375, -73.23828125, -69.7421875, -66.24609375, -62.75, -59.25390625, -55.7578125, -52.26171875, -48.765625, -45.26953125, -41.7734375, -38.27734375, -34.78125, -31.28515625, -27.7890625, -24.29296875, -20.796875, -17.30078125, -13.8046875, -10.30859375, -6.8125, -3.31640625, 0.1796875, 3.67578125, 7.171875, 10.66796875, 14.1640625, 17.66015625, 21.15625, 24.65234375, 28.1484375, 31.64453125, 35.140625, 38.63671875, 42.1328125, 45.62890625, 49.125, 52.62109375, 56.1171875, 59.61328125, 63.109375, 66.60546875, 70.1015625, 73.59765625, 77.09375, 80.58984375, 84.0859375, 87.58203125, 91.078125, 94.57421875, 98.0703125, 101.56640625, 105.0625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 940.0, 71.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-582.8887939453125, -572.5997924804688, -562.310791015625, -552.0217895507812, -541.7327880859375, -531.4437866210938, -521.15478515625, -510.8657531738281, -500.5767517089844, -490.2877502441406, -479.9987487792969, -469.7097473144531, -459.4207458496094, -449.1317138671875, -438.84271240234375, -428.5537109375, -418.26470947265625, -407.9757080078125, -397.68670654296875, -387.397705078125, -377.10870361328125, -366.8197021484375, -356.53070068359375, -346.2416687011719, -335.95269775390625, -325.6636962890625, -315.37469482421875, -305.085693359375, -294.79669189453125, -284.5076904296875, -274.21868896484375, -263.9296569824219, -253.64065551757812, -243.35165405273438, -233.06265258789062, -222.77365112304688, -212.48463439941406, -202.1956329345703, -191.90663146972656, -181.61761474609375, -171.32862854003906, -161.0396270751953, -150.75062561035156, -140.46160888671875, -130.172607421875, -119.88360595703125, -109.5946044921875, -99.30559539794922, -89.01659393310547, -78.72759246826172, -68.43858337402344, -58.14958190917969, -47.86057662963867, -37.571571350097656, -27.282569885253906, -16.993560791015625, -6.704559326171875, 3.584444999694824, 13.873449325561523, 24.162452697753906, 34.45145797729492, 44.74046325683594, 55.02946472167969, 65.31847381591797, 75.60747528076172]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 5.0, 6.0, 6.0, 7.0, 9.0, 10.0, 19.0, 17.0, 13.0, 16.0, 18.0, 22.0, 29.0, 24.0, 30.0, 47.0, 33.0, 38.0, 32.0, 37.0, 36.0, 38.0, 30.0, 48.0, 44.0, 49.0, 32.0, 35.0, 29.0, 29.0, 32.0, 31.0, 15.0, 19.0, 19.0, 22.0, 14.0, 12.0, 10.0, 5.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-96.1603775024414, -93.10614013671875, -90.0519027709961, -86.99766540527344, -83.94342041015625, -80.8891830444336, -77.83494567871094, -74.78070831298828, -71.72647094726562, -68.67223358154297, -65.61799621582031, -62.56375503540039, -59.509517669677734, -56.45527648925781, -53.401039123535156, -50.3468017578125, -47.29256057739258, -44.23832321166992, -41.18408203125, -38.129844665527344, -35.07560729980469, -32.02136993408203, -28.96712875366211, -25.912891387939453, -22.858652114868164, -19.804412841796875, -16.75017547607422, -13.69593620300293, -10.641697883605957, -7.587459564208984, -4.533220291137695, -1.478982925415039, 1.57525634765625, 4.629494667053223, 7.6837334632873535, 10.737972259521484, 13.792210578918457, 16.84644889831543, 19.90068817138672, 22.954925537109375, 26.009164810180664, 29.063404083251953, 32.11764144897461, 35.17188262939453, 38.22611999511719, 41.280357360839844, 44.3345947265625, 47.388832092285156, 50.44307327270508, 53.497310638427734, 56.551551818847656, 59.60578918457031, 62.66002655029297, 65.71426391601562, 68.76850891113281, 71.82273864746094, 74.87698364257812, 77.93122100830078, 80.98545837402344, 84.03970336914062, 87.09394073486328, 90.14817810058594, 93.2024154663086, 96.25665283203125, 99.3108901977539]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 6.0, 2.0, 4.0, 5.0, 3.0, 8.0, 9.0, 10.0, 16.0, 17.0, 9.0, 21.0, 22.0, 31.0, 19.0, 32.0, 32.0, 31.0, 39.0, 33.0, 45.0, 38.0, 33.0, 29.0, 53.0, 54.0, 50.0, 33.0, 38.0, 32.0, 32.0, 34.0, 32.0, 33.0, 20.0, 23.0, 11.0, 9.0, 17.0, 12.0, 9.0, 9.0, 2.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.5703125, -12.2254638671875, -11.880615234375, -11.5357666015625, -11.19091796875, -10.8460693359375, -10.501220703125, -10.1563720703125, -9.8115234375, -9.4666748046875, -9.121826171875, -8.7769775390625, -8.43212890625, -8.0872802734375, -7.742431640625, -7.3975830078125, -7.052734375, -6.7078857421875, -6.363037109375, -6.0181884765625, -5.67333984375, -5.3284912109375, -4.983642578125, -4.6387939453125, -4.2939453125, -3.9490966796875, -3.604248046875, -3.2593994140625, -2.91455078125, -2.5697021484375, -2.224853515625, -1.8800048828125, -1.53515625, -1.1903076171875, -0.845458984375, -0.5006103515625, -0.15576171875, 0.1890869140625, 0.533935546875, 0.8787841796875, 1.2236328125, 1.5684814453125, 1.913330078125, 2.2581787109375, 2.60302734375, 2.9478759765625, 3.292724609375, 3.6375732421875, 3.982421875, 4.3272705078125, 4.672119140625, 5.0169677734375, 5.36181640625, 5.7066650390625, 6.051513671875, 6.3963623046875, 6.7412109375, 7.0860595703125, 7.430908203125, 7.7757568359375, 8.12060546875, 8.4654541015625, 8.810302734375, 9.1551513671875, 9.5]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 7.0, 10.0, 9.0, 7.0, 14.0, 14.0, 17.0, 17.0, 19.0, 25.0, 33.0, 48.0, 44.0, 69.0, 137.0, 257.0, 619.0, 1680.0, 11074.0, 936725.0, 3170821.0, 67487.0, 3311.0, 945.0, 363.0, 151.0, 78.0, 50.0, 44.0, 40.0, 21.0, 28.0, 26.0, 25.0, 12.0, 12.0, 8.0, 5.0, 12.0, 5.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-42.03125, -40.87109375, -39.7109375, -38.55078125, -37.390625, -36.23046875, -35.0703125, -33.91015625, -32.75, -31.58984375, -30.4296875, -29.26953125, -28.109375, -26.94921875, -25.7890625, -24.62890625, -23.46875, -22.30859375, -21.1484375, -19.98828125, -18.828125, -17.66796875, -16.5078125, -15.34765625, -14.1875, -13.02734375, -11.8671875, -10.70703125, -9.546875, -8.38671875, -7.2265625, -6.06640625, -4.90625, -3.74609375, -2.5859375, -1.42578125, -0.265625, 0.89453125, 2.0546875, 3.21484375, 4.375, 5.53515625, 6.6953125, 7.85546875, 9.015625, 10.17578125, 11.3359375, 12.49609375, 13.65625, 14.81640625, 15.9765625, 17.13671875, 18.296875, 19.45703125, 20.6171875, 21.77734375, 22.9375, 24.09765625, 25.2578125, 26.41796875, 27.578125, 28.73828125, 29.8984375, 31.05859375, 32.21875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 1.0, 6.0, 7.0, 8.0, 19.0, 23.0, 47.0, 32.0, 54.0, 60.0, 110.0, 146.0, 193.0, 358.0, 491.0, 599.0, 547.0, 433.0, 267.0, 188.0, 133.0, 89.0, 70.0, 50.0, 42.0, 35.0, 17.0, 14.0, 6.0, 7.0, 3.0, 4.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.484375, -22.845703125, -22.20703125, -21.568359375, -20.9296875, -20.291015625, -19.65234375, -19.013671875, -18.375, -17.736328125, -17.09765625, -16.458984375, -15.8203125, -15.181640625, -14.54296875, -13.904296875, -13.265625, -12.626953125, -11.98828125, -11.349609375, -10.7109375, -10.072265625, -9.43359375, -8.794921875, -8.15625, -7.517578125, -6.87890625, -6.240234375, -5.6015625, -4.962890625, -4.32421875, -3.685546875, -3.046875, -2.408203125, -1.76953125, -1.130859375, -0.4921875, 0.146484375, 0.78515625, 1.423828125, 2.0625, 2.701171875, 3.33984375, 3.978515625, 4.6171875, 5.255859375, 5.89453125, 6.533203125, 7.171875, 7.810546875, 8.44921875, 9.087890625, 9.7265625, 10.365234375, 11.00390625, 11.642578125, 12.28125, 12.919921875, 13.55859375, 14.197265625, 14.8359375, 15.474609375, 16.11328125, 16.751953125, 17.390625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 10.0, 7.0, 10.0, 21.0, 36.0, 44.0, 50.0, 66.0, 110.0, 154.0, 184.0, 257.0, 428.0, 937.0, 26502.0, 4158448.0, 5124.0, 683.0, 357.0, 209.0, 167.0, 117.0, 107.0, 70.0, 48.0, 43.0, 28.0, 14.0, 12.0, 11.0, 11.0, 11.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-145.125, -141.2421875, -137.359375, -133.4765625, -129.59375, -125.7109375, -121.828125, -117.9453125, -114.0625, -110.1796875, -106.296875, -102.4140625, -98.53125, -94.6484375, -90.765625, -86.8828125, -83.0, -79.1171875, -75.234375, -71.3515625, -67.46875, -63.5859375, -59.703125, -55.8203125, -51.9375, -48.0546875, -44.171875, -40.2890625, -36.40625, -32.5234375, -28.640625, -24.7578125, -20.875, -16.9921875, -13.109375, -9.2265625, -5.34375, -1.4609375, 2.421875, 6.3046875, 10.1875, 14.0703125, 17.953125, 21.8359375, 25.71875, 29.6015625, 33.484375, 37.3671875, 41.25, 45.1328125, 49.015625, 52.8984375, 56.78125, 60.6640625, 64.546875, 68.4296875, 72.3125, 76.1953125, 80.078125, 83.9609375, 87.84375, 91.7265625, 95.609375, 99.4921875, 103.375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 56.0, 463.0, 450.0, 45.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-488.7304382324219, -478.0940856933594, -467.4577331542969, -456.8213806152344, -446.18505859375, -435.5487060546875, -424.912353515625, -414.2760009765625, -403.6396484375, -393.0032958984375, -382.366943359375, -371.7305908203125, -361.09423828125, -350.4579162597656, -339.8215637207031, -329.1852111816406, -318.5488586425781, -307.9125061035156, -297.2761535644531, -286.6398010253906, -276.00347900390625, -265.36712646484375, -254.73077392578125, -244.09442138671875, -233.45806884765625, -222.82171630859375, -212.18536376953125, -201.5490264892578, -190.9126739501953, -180.2763214111328, -169.63998413085938, -159.00363159179688, -148.3672637939453, -137.7309112548828, -127.09456634521484, -116.45822143554688, -105.82186889648438, -95.18551635742188, -84.5491714477539, -73.91282653808594, -63.27647399902344, -52.6401252746582, -42.00377655029297, -31.367427825927734, -20.7310791015625, -10.094730377197266, 0.5416183471679688, 11.177963256835938, 21.814315795898438, 32.45066452026367, 43.087013244628906, 53.72336196899414, 64.35971069335938, 74.99606323242188, 85.63240814208984, 96.26875305175781, 106.90510559082031, 117.54145812988281, 128.17779541015625, 138.81414794921875, 149.45050048828125, 160.08685302734375, 170.72320556640625, 181.3595428466797, 191.9958953857422]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 7.0, 5.0, 5.0, 12.0, 5.0, 7.0, 15.0, 12.0, 15.0, 19.0, 25.0, 29.0, 29.0, 29.0, 39.0, 35.0, 37.0, 48.0, 40.0, 45.0, 39.0, 37.0, 38.0, 49.0, 44.0, 35.0, 40.0, 36.0, 28.0, 31.0, 32.0, 26.0, 19.0, 15.0, 9.0, 8.0, 12.0, 13.0, 8.0, 8.0, 4.0, 1.0, 1.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-60.716278076171875, -58.83168029785156, -56.947086334228516, -55.0624885559082, -53.177894592285156, -51.293296813964844, -49.4087028503418, -47.524105072021484, -45.63951110839844, -43.754913330078125, -41.87031936645508, -39.985721588134766, -38.10112762451172, -36.216529846191406, -34.33193588256836, -32.44733810424805, -30.562742233276367, -28.678146362304688, -26.793550491333008, -24.908954620361328, -23.02435874938965, -21.13976287841797, -19.255165100097656, -17.37057113647461, -15.485974311828613, -13.601378440856934, -11.716782569885254, -9.832185745239258, -7.947590351104736, -6.062994003295898, -4.178398132324219, -2.293802261352539, -0.4092063903808594, 1.4753895998001099, 3.359985589981079, 5.244581699371338, 7.129177570343018, 9.013773918151855, 10.898369789123535, 12.782965660095215, 14.667561531066895, 16.55215835571289, 18.43675422668457, 20.32135009765625, 22.20594596862793, 24.09054183959961, 25.97513771057129, 27.85973358154297, 29.74432945251465, 31.628925323486328, 33.51352310180664, 35.39811706542969, 37.28271484375, 39.16730880737305, 41.05190658569336, 42.936500549316406, 44.82109832763672, 46.70569610595703, 48.59029006958008, 50.47488784790039, 52.35948181152344, 54.24407958984375, 56.1286735534668, 58.01327133178711, 59.897865295410156]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 1.0, 11.0, 8.0, 12.0, 14.0, 9.0, 16.0, 15.0, 21.0, 20.0, 32.0, 24.0, 31.0, 34.0, 37.0, 37.0, 33.0, 34.0, 39.0, 46.0, 37.0, 43.0, 52.0, 54.0, 29.0, 44.0, 32.0, 32.0, 23.0, 35.0, 20.0, 24.0, 14.0, 24.0, 14.0, 9.0, 5.0, 5.0, 9.0, 8.0, 5.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.15625, -10.8189697265625, -10.481689453125, -10.1444091796875, -9.80712890625, -9.4698486328125, -9.132568359375, -8.7952880859375, -8.4580078125, -8.1207275390625, -7.783447265625, -7.4461669921875, -7.10888671875, -6.7716064453125, -6.434326171875, -6.0970458984375, -5.759765625, -5.4224853515625, -5.085205078125, -4.7479248046875, -4.41064453125, -4.0733642578125, -3.736083984375, -3.3988037109375, -3.0615234375, -2.7242431640625, -2.386962890625, -2.0496826171875, -1.71240234375, -1.3751220703125, -1.037841796875, -0.7005615234375, -0.36328125, -0.0260009765625, 0.311279296875, 0.6485595703125, 0.98583984375, 1.3231201171875, 1.660400390625, 1.9976806640625, 2.3349609375, 2.6722412109375, 3.009521484375, 3.3468017578125, 3.68408203125, 4.0213623046875, 4.358642578125, 4.6959228515625, 5.033203125, 5.3704833984375, 5.707763671875, 6.0450439453125, 6.38232421875, 6.7196044921875, 7.056884765625, 7.3941650390625, 7.7314453125, 8.0687255859375, 8.406005859375, 8.7432861328125, 9.08056640625, 9.4178466796875, 9.755126953125, 10.0924072265625, 10.4296875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 4.0, 8.0, 13.0, 8.0, 7.0, 23.0, 44.0, 50.0, 71.0, 100.0, 168.0, 267.0, 386.0, 662.0, 1019.0, 1667.0, 2650.0, 4316.0, 6817.0, 11599.0, 19011.0, 32455.0, 56827.0, 107048.0, 266630.0, 283720.0, 111179.0, 58376.0, 33242.0, 19624.0, 11764.0, 7098.0, 4412.0, 2687.0, 1691.0, 1080.0, 633.0, 419.0, 285.0, 150.0, 118.0, 81.0, 51.0, 25.0, 28.0, 19.0, 12.0, 6.0, 2.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.423828125, -2.350433349609375, -2.27703857421875, -2.203643798828125, -2.1302490234375, -2.056854248046875, -1.98345947265625, -1.910064697265625, -1.836669921875, -1.763275146484375, -1.68988037109375, -1.616485595703125, -1.5430908203125, -1.469696044921875, -1.39630126953125, -1.322906494140625, -1.24951171875, -1.176116943359375, -1.10272216796875, -1.029327392578125, -0.9559326171875, -0.882537841796875, -0.80914306640625, -0.735748291015625, -0.662353515625, -0.588958740234375, -0.51556396484375, -0.442169189453125, -0.3687744140625, -0.295379638671875, -0.22198486328125, -0.148590087890625, -0.0751953125, -0.001800537109375, 0.07159423828125, 0.144989013671875, 0.2183837890625, 0.291778564453125, 0.36517333984375, 0.438568115234375, 0.511962890625, 0.585357666015625, 0.65875244140625, 0.732147216796875, 0.8055419921875, 0.878936767578125, 0.95233154296875, 1.025726318359375, 1.09912109375, 1.172515869140625, 1.24591064453125, 1.319305419921875, 1.3927001953125, 1.466094970703125, 1.53948974609375, 1.612884521484375, 1.686279296875, 1.759674072265625, 1.83306884765625, 1.906463623046875, 1.9798583984375, 2.053253173828125, 2.12664794921875, 2.200042724609375, 2.2734375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 6.0, 6.0, 5.0, 4.0, 10.0, 11.0, 13.0, 11.0, 16.0, 16.0, 29.0, 29.0, 30.0, 37.0, 27.0, 33.0, 33.0, 34.0, 45.0, 47.0, 1066.0, 52.0, 52.0, 56.0, 37.0, 36.0, 39.0, 32.0, 33.0, 35.0, 23.0, 27.0, 17.0, 18.0, 12.0, 10.0, 15.0, 9.0, 8.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.16015625, -6.93499755859375, -6.7098388671875, -6.48468017578125, -6.259521484375, -6.03436279296875, -5.8092041015625, -5.58404541015625, -5.35888671875, -5.13372802734375, -4.9085693359375, -4.68341064453125, -4.458251953125, -4.23309326171875, -4.0079345703125, -3.78277587890625, -3.5576171875, -3.33245849609375, -3.1072998046875, -2.88214111328125, -2.656982421875, -2.43182373046875, -2.2066650390625, -1.98150634765625, -1.75634765625, -1.53118896484375, -1.3060302734375, -1.08087158203125, -0.855712890625, -0.63055419921875, -0.4053955078125, -0.18023681640625, 0.044921875, 0.27008056640625, 0.4952392578125, 0.72039794921875, 0.945556640625, 1.17071533203125, 1.3958740234375, 1.62103271484375, 1.84619140625, 2.07135009765625, 2.2965087890625, 2.52166748046875, 2.746826171875, 2.97198486328125, 3.1971435546875, 3.42230224609375, 3.6474609375, 3.87261962890625, 4.0977783203125, 4.32293701171875, 4.548095703125, 4.77325439453125, 4.9984130859375, 5.22357177734375, 5.44873046875, 5.67388916015625, 5.8990478515625, 6.12420654296875, 6.349365234375, 6.57452392578125, 6.7996826171875, 7.02484130859375, 7.25]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 2.0, 8.0, 16.0, 10.0, 15.0, 23.0, 45.0, 70.0, 117.0, 145.0, 212.0, 330.0, 481.0, 726.0, 1129.0, 1827.0, 2997.0, 4568.0, 7390.0, 11829.0, 19234.0, 31479.0, 52726.0, 95184.0, 236532.0, 1366461.0, 112036.0, 59221.0, 35282.0, 21533.0, 13255.0, 8041.0, 5093.0, 3189.0, 2093.0, 1316.0, 848.0, 504.0, 354.0, 281.0, 146.0, 130.0, 86.0, 55.0, 32.0, 27.0, 15.0, 12.0, 11.0, 6.0, 1.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0], "bins": [-2.177734375, -2.10992431640625, -2.0421142578125, -1.97430419921875, -1.906494140625, -1.83868408203125, -1.7708740234375, -1.70306396484375, -1.63525390625, -1.56744384765625, -1.4996337890625, -1.43182373046875, -1.364013671875, -1.29620361328125, -1.2283935546875, -1.16058349609375, -1.0927734375, -1.02496337890625, -0.9571533203125, -0.88934326171875, -0.821533203125, -0.75372314453125, -0.6859130859375, -0.61810302734375, -0.55029296875, -0.48248291015625, -0.4146728515625, -0.34686279296875, -0.279052734375, -0.21124267578125, -0.1434326171875, -0.07562255859375, -0.0078125, 0.05999755859375, 0.1278076171875, 0.19561767578125, 0.263427734375, 0.33123779296875, 0.3990478515625, 0.46685791015625, 0.53466796875, 0.60247802734375, 0.6702880859375, 0.73809814453125, 0.805908203125, 0.87371826171875, 0.9415283203125, 1.00933837890625, 1.0771484375, 1.14495849609375, 1.2127685546875, 1.28057861328125, 1.348388671875, 1.41619873046875, 1.4840087890625, 1.55181884765625, 1.61962890625, 1.68743896484375, 1.7552490234375, 1.82305908203125, 1.890869140625, 1.95867919921875, 2.0264892578125, 2.09429931640625, 2.162109375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 10.0, 12.0, 11.0, 14.0, 26.0, 42.0, 45.0, 55.0, 76.0, 69.0, 98.0, 104.0, 106.0, 72.0, 59.0, 58.0, 37.0, 25.0, 19.0, 14.0, 8.0, 5.0, 5.0, 7.0, 5.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013370513916015625, -0.0012881606817245483, -0.0012392699718475342, -0.00119037926197052, -0.0011414885520935059, -0.0010925978422164917, -0.0010437071323394775, -0.0009948164224624634, -0.0009459257125854492, -0.0008970350027084351, -0.0008481442928314209, -0.0007992535829544067, -0.0007503628730773926, -0.0007014721632003784, -0.0006525814533233643, -0.0006036907434463501, -0.0005548000335693359, -0.0005059093236923218, -0.0004570186138153076, -0.00040812790393829346, -0.0003592371940612793, -0.00031034648418426514, -0.000261455774307251, -0.00021256506443023682, -0.00016367435455322266, -0.0001147836446762085, -6.589293479919434e-05, -1.7002224922180176e-05, 3.1888484954833984e-05, 8.077919483184814e-05, 0.0001296699047088623, 0.00017856061458587646, 0.00022745132446289062, 0.0002763420343399048, 0.00032523274421691895, 0.0003741234540939331, 0.00042301416397094727, 0.0004719048738479614, 0.0005207955837249756, 0.0005696862936019897, 0.0006185770034790039, 0.0006674677133560181, 0.0007163584232330322, 0.0007652491331100464, 0.0008141398429870605, 0.0008630305528640747, 0.0009119212627410889, 0.000960811972618103, 0.0010097026824951172, 0.0010585933923721313, 0.0011074841022491455, 0.0011563748121261597, 0.0012052655220031738, 0.001254156231880188, 0.0013030469417572021, 0.0013519376516342163, 0.0014008283615112305, 0.0014497190713882446, 0.0014986097812652588, 0.001547500491142273, 0.0015963912010192871, 0.0016452819108963013, 0.0016941726207733154, 0.0017430633306503296, 0.0017919540405273438]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 4.0, 6.0, 8.0, 4.0, 7.0, 19.0, 25.0, 38.0, 55.0, 113.0, 153.0, 407.0, 3032.0, 1042206.0, 1676.0, 344.0, 174.0, 89.0, 50.0, 41.0, 32.0, 18.0, 16.0, 12.0, 8.0, 5.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.045074462890625, -0.04383659362792969, -0.042598724365234375, -0.04136085510253906, -0.04012298583984375, -0.03888511657714844, -0.037647247314453125, -0.03640937805175781, -0.0351715087890625, -0.03393363952636719, -0.032695770263671875, -0.03145790100097656, -0.03022003173828125, -0.028982162475585938, -0.027744293212890625, -0.026506423950195312, -0.0252685546875, -0.024030685424804688, -0.022792816162109375, -0.021554946899414062, -0.02031707763671875, -0.019079208374023438, -0.017841339111328125, -0.016603469848632812, -0.0153656005859375, -0.014127731323242188, -0.012889862060546875, -0.011651992797851562, -0.01041412353515625, -0.009176254272460938, -0.007938385009765625, -0.0067005157470703125, -0.005462646484375, -0.0042247772216796875, -0.002986907958984375, -0.0017490386962890625, -0.00051116943359375, 0.0007266998291015625, 0.001964569091796875, 0.0032024383544921875, 0.0044403076171875, 0.0056781768798828125, 0.006916046142578125, 0.008153915405273438, 0.00939178466796875, 0.010629653930664062, 0.011867523193359375, 0.013105392456054688, 0.01434326171875, 0.015581130981445312, 0.016819000244140625, 0.018056869506835938, 0.01929473876953125, 0.020532608032226562, 0.021770477294921875, 0.023008346557617188, 0.0242462158203125, 0.025484085083007812, 0.026721954345703125, 0.027959823608398438, 0.02919769287109375, 0.030435562133789062, 0.031673431396484375, 0.03291130065917969, 0.034149169921875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 8.0, 21.0, 47.0, 143.0, 244.0, 297.0, 171.0, 61.0, 17.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020674681290984154, -0.0020226251799613237, -0.001977782230824232, -0.0019329393981024623, -0.0018880964489653707, -0.0018432536162436008, -0.0017984106671065092, -0.0017535677179694176, -0.001708724768832326, -0.0016638818196952343, -0.0016190389869734645, -0.0015741960378363729, -0.0015293530886992812, -0.0014845102559775114, -0.0014396673068404198, -0.0013948243577033281, -0.0013499815249815583, -0.0013051385758444667, -0.0012602957431226969, -0.0012154527939856052, -0.0011706098448485136, -0.001125766895711422, -0.0010809240629896522, -0.0010360811138525605, -0.0009912382811307907, -0.00094639539020136, -0.0009015524410642684, -0.0008567095501348376, -0.000811866600997746, -0.0007670237100683153, -0.0007221808191388845, -0.0006773378700017929, -0.0006324950372800231, -0.0005876521463505924, -0.0005428091972135007, -0.00049796630628407, -0.00045312338625080884, -0.00040828046621754766, -0.00036343757528811693, -0.00031859465525485575, -0.00027375173522159457, -0.0002289088151883334, -0.00018406590970698744, -0.0001392230042256415, -9.438008419238031e-05, -4.953716415911913e-05, -4.694273229688406e-06, 4.0148646803572774e-05, 8.499156683683395e-05, 0.00012983448687009513, 0.00017467739235144109, 0.00021952029783278704, 0.0002643632178660482, 0.0003092061378993094, 0.0003540490288287401, 0.0003988919488620013, 0.0004437348688952625, 0.0004885777598246932, 0.0005334207089617848, 0.0005782635998912156, 0.0006231064908206463, 0.0006679494399577379, 0.0007127923308871686, 0.0007576352218165994, 0.000802478170953691]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 5.0, 3.0, 3.0, 5.0, 9.0, 7.0, 9.0, 14.0, 22.0, 21.0, 29.0, 15.0, 24.0, 33.0, 37.0, 36.0, 39.0, 43.0, 33.0, 39.0, 44.0, 37.0, 30.0, 44.0, 44.0, 44.0, 47.0, 42.0, 40.0, 22.0, 34.0, 17.0, 30.0, 21.0, 9.0, 17.0, 13.0, 7.0, 8.0, 7.0, 12.0, 4.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005329251289367676, -0.000513705424964428, -0.0004944857209920883, -0.0004752660170197487, -0.00045604631304740906, -0.00043682660907506943, -0.0004176069051027298, -0.00039838720113039017, -0.00037916749715805054, -0.0003599477931857109, -0.0003407280892133713, -0.00032150838524103165, -0.000302288681268692, -0.0002830689772963524, -0.00026384927332401276, -0.0002446295693516731, -0.0002254098653793335, -0.00020619016140699387, -0.00018697045743465424, -0.0001677507534623146, -0.00014853104948997498, -0.00012931134551763535, -0.00011009164154529572, -9.087193757295609e-05, -7.165223360061646e-05, -5.2432529628276825e-05, -3.3212825655937195e-05, -1.3993121683597565e-05, 5.2265822887420654e-06, 2.4446286261081696e-05, 4.3665990233421326e-05, 6.288569420576096e-05, 8.210539817810059e-05, 0.00010132510215044022, 0.00012054480612277985, 0.00013976451009511948, 0.0001589842140674591, 0.00017820391803979874, 0.00019742362201213837, 0.000216643325984478, 0.00023586302995681763, 0.00025508273392915726, 0.0002743024379014969, 0.0002935221418738365, 0.00031274184584617615, 0.0003319615498185158, 0.0003511812537908554, 0.00037040095776319504, 0.00038962066173553467, 0.0004088403657078743, 0.00042806006968021393, 0.00044727977365255356, 0.0004664994776248932, 0.0004857191815972328, 0.0005049388855695724, 0.0005241585895419121, 0.0005433782935142517, 0.0005625979974865913, 0.000581817701458931, 0.0006010374054312706, 0.0006202571094036102, 0.0006394768133759499, 0.0006586965173482895, 0.0006779162213206291, 0.0006971359252929688]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 1.0, 11.0, 8.0, 12.0, 14.0, 9.0, 16.0, 15.0, 21.0, 20.0, 32.0, 24.0, 31.0, 34.0, 37.0, 37.0, 33.0, 34.0, 39.0, 46.0, 37.0, 43.0, 52.0, 54.0, 29.0, 44.0, 32.0, 32.0, 23.0, 35.0, 20.0, 24.0, 14.0, 24.0, 14.0, 9.0, 5.0, 5.0, 9.0, 8.0, 5.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.15625, -10.8189697265625, -10.481689453125, -10.1444091796875, -9.80712890625, -9.4698486328125, -9.132568359375, -8.7952880859375, -8.4580078125, -8.1207275390625, -7.783447265625, -7.4461669921875, -7.10888671875, -6.7716064453125, -6.434326171875, -6.0970458984375, -5.759765625, -5.4224853515625, -5.085205078125, -4.7479248046875, -4.41064453125, -4.0733642578125, -3.736083984375, -3.3988037109375, -3.0615234375, -2.7242431640625, -2.386962890625, -2.0496826171875, -1.71240234375, -1.3751220703125, -1.037841796875, -0.7005615234375, -0.36328125, -0.0260009765625, 0.311279296875, 0.6485595703125, 0.98583984375, 1.3231201171875, 1.660400390625, 1.9976806640625, 2.3349609375, 2.6722412109375, 3.009521484375, 3.3468017578125, 3.68408203125, 4.0213623046875, 4.358642578125, 4.6959228515625, 5.033203125, 5.3704833984375, 5.707763671875, 6.0450439453125, 6.38232421875, 6.7196044921875, 7.056884765625, 7.3941650390625, 7.7314453125, 8.0687255859375, 8.406005859375, 8.7432861328125, 9.08056640625, 9.4178466796875, 9.755126953125, 10.0924072265625, 10.4296875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 10.0, 12.0, 13.0, 22.0, 22.0, 32.0, 37.0, 57.0, 80.0, 85.0, 124.0, 162.0, 274.0, 475.0, 928.0, 2563.0, 8483.0, 33001.0, 144155.0, 597821.0, 199754.0, 43629.0, 10972.0, 3166.0, 1084.0, 510.0, 316.0, 213.0, 148.0, 96.0, 76.0, 49.0, 52.0, 38.0, 24.0, 12.0, 10.0, 17.0, 9.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.921875, -11.55615234375, -11.1904296875, -10.82470703125, -10.458984375, -10.09326171875, -9.7275390625, -9.36181640625, -8.99609375, -8.63037109375, -8.2646484375, -7.89892578125, -7.533203125, -7.16748046875, -6.8017578125, -6.43603515625, -6.0703125, -5.70458984375, -5.3388671875, -4.97314453125, -4.607421875, -4.24169921875, -3.8759765625, -3.51025390625, -3.14453125, -2.77880859375, -2.4130859375, -2.04736328125, -1.681640625, -1.31591796875, -0.9501953125, -0.58447265625, -0.21875, 0.14697265625, 0.5126953125, 0.87841796875, 1.244140625, 1.60986328125, 1.9755859375, 2.34130859375, 2.70703125, 3.07275390625, 3.4384765625, 3.80419921875, 4.169921875, 4.53564453125, 4.9013671875, 5.26708984375, 5.6328125, 5.99853515625, 6.3642578125, 6.72998046875, 7.095703125, 7.46142578125, 7.8271484375, 8.19287109375, 8.55859375, 8.92431640625, 9.2900390625, 9.65576171875, 10.021484375, 10.38720703125, 10.7529296875, 11.11865234375, 11.484375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 3.0, 7.0, 9.0, 10.0, 10.0, 10.0, 17.0, 29.0, 22.0, 16.0, 30.0, 38.0, 35.0, 49.0, 38.0, 52.0, 68.0, 110.0, 1691.0, 311.0, 77.0, 56.0, 46.0, 49.0, 29.0, 33.0, 31.0, 28.0, 11.0, 29.0, 14.0, 19.0, 11.0, 13.0, 14.0, 8.0, 11.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-38.15625, -37.09130859375, -36.0263671875, -34.96142578125, -33.896484375, -32.83154296875, -31.7666015625, -30.70166015625, -29.63671875, -28.57177734375, -27.5068359375, -26.44189453125, -25.376953125, -24.31201171875, -23.2470703125, -22.18212890625, -21.1171875, -20.05224609375, -18.9873046875, -17.92236328125, -16.857421875, -15.79248046875, -14.7275390625, -13.66259765625, -12.59765625, -11.53271484375, -10.4677734375, -9.40283203125, -8.337890625, -7.27294921875, -6.2080078125, -5.14306640625, -4.078125, -3.01318359375, -1.9482421875, -0.88330078125, 0.181640625, 1.24658203125, 2.3115234375, 3.37646484375, 4.44140625, 5.50634765625, 6.5712890625, 7.63623046875, 8.701171875, 9.76611328125, 10.8310546875, 11.89599609375, 12.9609375, 14.02587890625, 15.0908203125, 16.15576171875, 17.220703125, 18.28564453125, 19.3505859375, 20.41552734375, 21.48046875, 22.54541015625, 23.6103515625, 24.67529296875, 25.740234375, 26.80517578125, 27.8701171875, 28.93505859375, 30.0]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 11.0, 19.0, 20.0, 19.0, 27.0, 37.0, 43.0, 57.0, 87.0, 117.0, 153.0, 232.0, 336.0, 840.0, 15082.0, 3121172.0, 5616.0, 681.0, 332.0, 222.0, 131.0, 124.0, 80.0, 59.0, 55.0, 33.0, 16.0, 28.0, 16.0, 17.0, 6.0, 11.0, 6.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.3125, -67.650390625, -64.98828125, -62.326171875, -59.6640625, -57.001953125, -54.33984375, -51.677734375, -49.015625, -46.353515625, -43.69140625, -41.029296875, -38.3671875, -35.705078125, -33.04296875, -30.380859375, -27.71875, -25.056640625, -22.39453125, -19.732421875, -17.0703125, -14.408203125, -11.74609375, -9.083984375, -6.421875, -3.759765625, -1.09765625, 1.564453125, 4.2265625, 6.888671875, 9.55078125, 12.212890625, 14.875, 17.537109375, 20.19921875, 22.861328125, 25.5234375, 28.185546875, 30.84765625, 33.509765625, 36.171875, 38.833984375, 41.49609375, 44.158203125, 46.8203125, 49.482421875, 52.14453125, 54.806640625, 57.46875, 60.130859375, 62.79296875, 65.455078125, 68.1171875, 70.779296875, 73.44140625, 76.103515625, 78.765625, 81.427734375, 84.08984375, 86.751953125, 89.4140625, 92.076171875, 94.73828125, 97.400390625, 100.0625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 59.0, 280.0, 466.0, 177.0, 26.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.5234832763672, -131.73863220214844, -128.9537811279297, -126.1689224243164, -123.38407135009766, -120.5992202758789, -117.81436157226562, -115.02951049804688, -112.24465942382812, -109.45980834960938, -106.6749496459961, -103.89009857177734, -101.1052474975586, -98.32039642333984, -95.53553771972656, -92.75068664550781, -89.96583557128906, -87.18098449707031, -84.39612579345703, -81.61127471923828, -78.82642364501953, -76.04157257080078, -73.2567138671875, -70.47186279296875, -67.68700408935547, -64.90215301513672, -62.1172981262207, -59.33244323730469, -56.54759216308594, -53.76273727416992, -50.977882385253906, -48.193031311035156, -45.408180236816406, -42.62332534790039, -39.83847427368164, -37.053619384765625, -34.268768310546875, -31.48391342163086, -28.699060440063477, -25.914207458496094, -23.12935447692871, -20.344501495361328, -17.559648513793945, -14.774794578552246, -11.989941596984863, -9.20508861541748, -6.420234680175781, -3.6353816986083984, -0.8505287170410156, 1.9343245029449463, 4.719177722930908, 7.504031181335449, 10.288884162902832, 13.073737144470215, 15.858591079711914, 18.643444061279297, 21.42829704284668, 24.213150024414062, 26.998003005981445, 29.782855987548828, 32.567710876464844, 35.352561950683594, 38.13741683959961, 40.922271728515625, 43.707122802734375]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 5.0, 9.0, 8.0, 6.0, 12.0, 16.0, 19.0, 26.0, 18.0, 18.0, 20.0, 32.0, 27.0, 44.0, 30.0, 41.0, 40.0, 39.0, 36.0, 47.0, 43.0, 37.0, 39.0, 50.0, 37.0, 37.0, 30.0, 30.0, 28.0, 19.0, 24.0, 17.0, 16.0, 10.0, 18.0, 9.0, 8.0, 11.0, 4.0, 8.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-88.08821105957031, -85.36933135986328, -82.65045166015625, -79.93157196044922, -77.21269226074219, -74.49382019042969, -71.77494049072266, -69.05606079101562, -66.3371810913086, -63.61830139160156, -60.89942169189453, -58.180545806884766, -55.461666107177734, -52.7427864074707, -50.02391052246094, -47.305030822753906, -44.586151123046875, -41.867271423339844, -39.14839172363281, -36.42951583862305, -33.710636138916016, -30.991756439208984, -28.272878646850586, -25.554000854492188, -22.835121154785156, -20.116241455078125, -17.397363662719727, -14.678484916687012, -11.959606170654297, -9.240727424621582, -6.521848678588867, -3.8029708862304688, -1.0840911865234375, 1.6347875595092773, 4.353666305541992, 7.072545051574707, 9.791423797607422, 12.510302543640137, 15.229181289672852, 17.94805908203125, 20.66693878173828, 23.385818481445312, 26.10469627380371, 28.82357406616211, 31.54245376586914, 34.26133346557617, 36.98020935058594, 39.69908905029297, 42.41796875, 45.13684844970703, 47.85572814941406, 50.57460403442383, 53.29348373413086, 56.01236343383789, 58.731239318847656, 61.45011901855469, 64.16899871826172, 66.88787841796875, 69.60675811767578, 72.32563781738281, 75.04450988769531, 77.76338958740234, 80.48226928710938, 83.2011489868164, 85.92002868652344]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 6.0, 8.0, 11.0, 13.0, 10.0, 13.0, 20.0, 14.0, 17.0, 30.0, 30.0, 27.0, 31.0, 30.0, 40.0, 32.0, 34.0, 49.0, 37.0, 43.0, 36.0, 48.0, 38.0, 33.0, 31.0, 35.0, 44.0, 26.0, 28.0, 38.0, 20.0, 19.0, 18.0, 20.0, 10.0, 8.0, 11.0, 5.0, 7.0, 7.0, 3.0, 9.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.3125, -10.9759521484375, -10.639404296875, -10.3028564453125, -9.96630859375, -9.6297607421875, -9.293212890625, -8.9566650390625, -8.6201171875, -8.2835693359375, -7.947021484375, -7.6104736328125, -7.27392578125, -6.9373779296875, -6.600830078125, -6.2642822265625, -5.927734375, -5.5911865234375, -5.254638671875, -4.9180908203125, -4.58154296875, -4.2449951171875, -3.908447265625, -3.5718994140625, -3.2353515625, -2.8988037109375, -2.562255859375, -2.2257080078125, -1.88916015625, -1.5526123046875, -1.216064453125, -0.8795166015625, -0.54296875, -0.2064208984375, 0.130126953125, 0.4666748046875, 0.80322265625, 1.1397705078125, 1.476318359375, 1.8128662109375, 2.1494140625, 2.4859619140625, 2.822509765625, 3.1590576171875, 3.49560546875, 3.8321533203125, 4.168701171875, 4.5052490234375, 4.841796875, 5.1783447265625, 5.514892578125, 5.8514404296875, 6.18798828125, 6.5245361328125, 6.861083984375, 7.1976318359375, 7.5341796875, 7.8707275390625, 8.207275390625, 8.5438232421875, 8.88037109375, 9.2169189453125, 9.553466796875, 9.8900146484375, 10.2265625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 4.0, 5.0, 10.0, 8.0, 5.0, 13.0, 16.0, 24.0, 27.0, 34.0, 40.0, 50.0, 67.0, 88.0, 118.0, 171.0, 291.0, 503.0, 1469.0, 8192.0, 379326.0, 3599756.0, 195555.0, 5899.0, 1218.0, 483.0, 246.0, 162.0, 93.0, 99.0, 64.0, 65.0, 40.0, 32.0, 13.0, 23.0, 15.0, 12.0, 7.0, 10.0, 5.0, 4.0, 4.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.90625, -35.80224609375, -34.6982421875, -33.59423828125, -32.490234375, -31.38623046875, -30.2822265625, -29.17822265625, -28.07421875, -26.97021484375, -25.8662109375, -24.76220703125, -23.658203125, -22.55419921875, -21.4501953125, -20.34619140625, -19.2421875, -18.13818359375, -17.0341796875, -15.93017578125, -14.826171875, -13.72216796875, -12.6181640625, -11.51416015625, -10.41015625, -9.30615234375, -8.2021484375, -7.09814453125, -5.994140625, -4.89013671875, -3.7861328125, -2.68212890625, -1.578125, -0.47412109375, 0.6298828125, 1.73388671875, 2.837890625, 3.94189453125, 5.0458984375, 6.14990234375, 7.25390625, 8.35791015625, 9.4619140625, 10.56591796875, 11.669921875, 12.77392578125, 13.8779296875, 14.98193359375, 16.0859375, 17.18994140625, 18.2939453125, 19.39794921875, 20.501953125, 21.60595703125, 22.7099609375, 23.81396484375, 24.91796875, 26.02197265625, 27.1259765625, 28.22998046875, 29.333984375, 30.43798828125, 31.5419921875, 32.64599609375, 33.75]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 5.0, 10.0, 24.0, 31.0, 70.0, 157.0, 326.0, 684.0, 1181.0, 857.0, 366.0, 175.0, 88.0, 53.0, 28.0, 13.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.625, -60.331787109375, -59.03857421875, -57.745361328125, -56.4521484375, -55.158935546875, -53.86572265625, -52.572509765625, -51.279296875, -49.986083984375, -48.69287109375, -47.399658203125, -46.1064453125, -44.813232421875, -43.52001953125, -42.226806640625, -40.93359375, -39.640380859375, -38.34716796875, -37.053955078125, -35.7607421875, -34.467529296875, -33.17431640625, -31.881103515625, -30.587890625, -29.294677734375, -28.00146484375, -26.708251953125, -25.4150390625, -24.121826171875, -22.82861328125, -21.535400390625, -20.2421875, -18.948974609375, -17.65576171875, -16.362548828125, -15.0693359375, -13.776123046875, -12.48291015625, -11.189697265625, -9.896484375, -8.603271484375, -7.31005859375, -6.016845703125, -4.7236328125, -3.430419921875, -2.13720703125, -0.843994140625, 0.44921875, 1.742431640625, 3.03564453125, 4.328857421875, 5.6220703125, 6.915283203125, 8.20849609375, 9.501708984375, 10.794921875, 12.088134765625, 13.38134765625, 14.674560546875, 15.9677734375, 17.260986328125, 18.55419921875, 19.847412109375, 21.140625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 9.0, 18.0, 23.0, 71.0, 115.0, 168.0, 261.0, 605.0, 5006.0, 4185254.0, 1621.0, 494.0, 279.0, 155.0, 93.0, 50.0, 33.0, 15.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.1875, -115.6611328125, -108.134765625, -100.6083984375, -93.08203125, -85.5556640625, -78.029296875, -70.5029296875, -62.9765625, -55.4501953125, -47.923828125, -40.3974609375, -32.87109375, -25.3447265625, -17.818359375, -10.2919921875, -2.765625, 4.7607421875, 12.287109375, 19.8134765625, 27.33984375, 34.8662109375, 42.392578125, 49.9189453125, 57.4453125, 64.9716796875, 72.498046875, 80.0244140625, 87.55078125, 95.0771484375, 102.603515625, 110.1298828125, 117.65625, 125.1826171875, 132.708984375, 140.2353515625, 147.76171875, 155.2880859375, 162.814453125, 170.3408203125, 177.8671875, 185.3935546875, 192.919921875, 200.4462890625, 207.97265625, 215.4990234375, 223.025390625, 230.5517578125, 238.078125, 245.6044921875, 253.130859375, 260.6572265625, 268.18359375, 275.7099609375, 283.236328125, 290.7626953125, 298.2890625, 305.8154296875, 313.341796875, 320.8681640625, 328.39453125, 335.9208984375, 343.447265625, 350.9736328125, 358.5]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 10.0, 22.0, 33.0, 63.0, 114.0, 162.0, 170.0, 161.0, 130.0, 69.0, 39.0, 21.0, 8.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-105.78638458251953, -103.0548324584961, -100.32328033447266, -97.59172821044922, -94.86017608642578, -92.12862396240234, -89.3970718383789, -86.66551971435547, -83.93396759033203, -81.2024154663086, -78.47086334228516, -75.73931121826172, -73.00775909423828, -70.27620697021484, -67.5446548461914, -64.81310272216797, -62.08155059814453, -59.349998474121094, -56.618446350097656, -53.88689422607422, -51.15534210205078, -48.423789978027344, -45.692237854003906, -42.96068572998047, -40.22913360595703, -37.497581481933594, -34.766029357910156, -32.03447723388672, -29.30292510986328, -26.571372985839844, -23.839820861816406, -21.10826873779297, -18.37671661376953, -15.645164489746094, -12.913612365722656, -10.182060241699219, -7.450508117675781, -4.718955993652344, -1.9874038696289062, 0.7441482543945312, 3.4757003784179688, 6.207252502441406, 8.938804626464844, 11.670356750488281, 14.401908874511719, 17.133460998535156, 19.865013122558594, 22.59656524658203, 25.32811737060547, 28.059669494628906, 30.791221618652344, 33.52277374267578, 36.25432586669922, 38.985877990722656, 41.717430114746094, 44.44898223876953, 47.18053436279297, 49.912086486816406, 52.643638610839844, 55.37519073486328, 58.10674285888672, 60.838294982910156, 63.569847106933594, 66.30139923095703, 69.03295135498047]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 4.0, 10.0, 3.0, 7.0, 8.0, 11.0, 20.0, 19.0, 18.0, 17.0, 23.0, 28.0, 36.0, 29.0, 37.0, 39.0, 26.0, 38.0, 40.0, 42.0, 40.0, 36.0, 35.0, 37.0, 43.0, 35.0, 39.0, 26.0, 37.0, 32.0, 26.0, 19.0, 23.0, 14.0, 21.0, 14.0, 15.0, 10.0, 7.0, 6.0, 9.0, 2.0, 2.0, 7.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.13151550292969, -53.29866409301758, -51.4658088684082, -49.632957458496094, -47.80010223388672, -45.96725082397461, -44.1343994140625, -42.301544189453125, -40.46868896484375, -38.63583755493164, -36.802982330322266, -34.970130920410156, -33.13727569580078, -31.304424285888672, -29.47157096862793, -27.638717651367188, -25.805866241455078, -23.973012924194336, -22.140159606933594, -20.307308197021484, -18.47445297241211, -16.6416015625, -14.808748245239258, -12.975894927978516, -11.143041610717773, -9.310188293457031, -7.477335453033447, -5.644482612609863, -3.811629295349121, -1.978775978088379, -0.14592361450195312, 1.686929702758789, 3.5197792053222656, 5.352632522583008, 7.185485363006592, 9.018338203430176, 10.851191520690918, 12.68404483795166, 14.516897201538086, 16.349750518798828, 18.18260383605957, 20.015457153320312, 21.848310470581055, 23.681163787841797, 25.514015197753906, 27.34687042236328, 29.17972183227539, 31.012575149536133, 32.845428466796875, 34.678279876708984, 36.51113510131836, 38.34398651123047, 40.176841735839844, 42.00969314575195, 43.84254455566406, 45.67539978027344, 47.50825500488281, 49.34110641479492, 51.1739616394043, 53.006813049316406, 54.83966827392578, 56.67251968383789, 58.50537109375, 60.338226318359375, 62.171077728271484]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 4.0, 1.0, 2.0, 4.0, 10.0, 8.0, 11.0, 15.0, 16.0, 19.0, 17.0, 26.0, 23.0, 21.0, 27.0, 33.0, 31.0, 39.0, 38.0, 52.0, 43.0, 48.0, 45.0, 49.0, 39.0, 35.0, 34.0, 32.0, 32.0, 33.0, 32.0, 30.0, 24.0, 26.0, 14.0, 13.0, 13.0, 19.0, 13.0, 7.0, 6.0, 5.0, 5.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.7265625, -11.384765625, -11.04296875, -10.701171875, -10.359375, -10.017578125, -9.67578125, -9.333984375, -8.9921875, -8.650390625, -8.30859375, -7.966796875, -7.625, -7.283203125, -6.94140625, -6.599609375, -6.2578125, -5.916015625, -5.57421875, -5.232421875, -4.890625, -4.548828125, -4.20703125, -3.865234375, -3.5234375, -3.181640625, -2.83984375, -2.498046875, -2.15625, -1.814453125, -1.47265625, -1.130859375, -0.7890625, -0.447265625, -0.10546875, 0.236328125, 0.578125, 0.919921875, 1.26171875, 1.603515625, 1.9453125, 2.287109375, 2.62890625, 2.970703125, 3.3125, 3.654296875, 3.99609375, 4.337890625, 4.6796875, 5.021484375, 5.36328125, 5.705078125, 6.046875, 6.388671875, 6.73046875, 7.072265625, 7.4140625, 7.755859375, 8.09765625, 8.439453125, 8.78125, 9.123046875, 9.46484375, 9.806640625, 10.1484375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 7.0, 4.0, 11.0, 15.0, 33.0, 35.0, 53.0, 71.0, 118.0, 137.0, 292.0, 351.0, 544.0, 863.0, 1167.0, 1862.0, 2862.0, 4274.0, 6603.0, 10524.0, 16338.0, 25713.0, 41219.0, 68990.0, 125888.0, 311599.0, 193206.0, 92015.0, 53531.0, 32524.0, 20528.0, 12970.0, 8436.0, 5357.0, 3585.0, 2247.0, 1468.0, 1069.0, 634.0, 454.0, 290.0, 208.0, 139.0, 103.0, 67.0, 52.0, 29.0, 30.0, 15.0, 6.0, 9.0, 7.0, 2.0, 5.0, 1.0, 1.0, 1.0], "bins": [-2.158203125, -2.092315673828125, -2.02642822265625, -1.960540771484375, -1.8946533203125, -1.828765869140625, -1.76287841796875, -1.696990966796875, -1.631103515625, -1.565216064453125, -1.49932861328125, -1.433441162109375, -1.3675537109375, -1.301666259765625, -1.23577880859375, -1.169891357421875, -1.10400390625, -1.038116455078125, -0.97222900390625, -0.906341552734375, -0.8404541015625, -0.774566650390625, -0.70867919921875, -0.642791748046875, -0.576904296875, -0.511016845703125, -0.44512939453125, -0.379241943359375, -0.3133544921875, -0.247467041015625, -0.18157958984375, -0.115692138671875, -0.0498046875, 0.016082763671875, 0.08197021484375, 0.147857666015625, 0.2137451171875, 0.279632568359375, 0.34552001953125, 0.411407470703125, 0.477294921875, 0.543182373046875, 0.60906982421875, 0.674957275390625, 0.7408447265625, 0.806732177734375, 0.87261962890625, 0.938507080078125, 1.00439453125, 1.070281982421875, 1.13616943359375, 1.202056884765625, 1.2679443359375, 1.333831787109375, 1.39971923828125, 1.465606689453125, 1.531494140625, 1.597381591796875, 1.66326904296875, 1.729156494140625, 1.7950439453125, 1.860931396484375, 1.92681884765625, 1.992706298828125, 2.05859375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 5.0, 5.0, 6.0, 3.0, 11.0, 12.0, 14.0, 10.0, 16.0, 26.0, 18.0, 25.0, 32.0, 27.0, 40.0, 37.0, 51.0, 51.0, 49.0, 50.0, 1059.0, 42.0, 40.0, 32.0, 41.0, 35.0, 31.0, 37.0, 41.0, 27.0, 24.0, 20.0, 18.0, 16.0, 15.0, 14.0, 10.0, 8.0, 8.0, 7.0, 1.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.71484375, -6.49041748046875, -6.2659912109375, -6.04156494140625, -5.817138671875, -5.59271240234375, -5.3682861328125, -5.14385986328125, -4.91943359375, -4.69500732421875, -4.4705810546875, -4.24615478515625, -4.021728515625, -3.79730224609375, -3.5728759765625, -3.34844970703125, -3.1240234375, -2.89959716796875, -2.6751708984375, -2.45074462890625, -2.226318359375, -2.00189208984375, -1.7774658203125, -1.55303955078125, -1.32861328125, -1.10418701171875, -0.8797607421875, -0.65533447265625, -0.430908203125, -0.20648193359375, 0.0179443359375, 0.24237060546875, 0.466796875, 0.69122314453125, 0.9156494140625, 1.14007568359375, 1.364501953125, 1.58892822265625, 1.8133544921875, 2.03778076171875, 2.26220703125, 2.48663330078125, 2.7110595703125, 2.93548583984375, 3.159912109375, 3.38433837890625, 3.6087646484375, 3.83319091796875, 4.0576171875, 4.28204345703125, 4.5064697265625, 4.73089599609375, 4.955322265625, 5.17974853515625, 5.4041748046875, 5.62860107421875, 5.85302734375, 6.07745361328125, 6.3018798828125, 6.52630615234375, 6.750732421875, 6.97515869140625, 7.1995849609375, 7.42401123046875, 7.6484375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 8.0, 17.0, 22.0, 32.0, 57.0, 67.0, 94.0, 144.0, 234.0, 356.0, 571.0, 867.0, 1378.0, 2187.0, 3287.0, 5285.0, 8260.0, 12947.0, 20671.0, 34262.0, 58619.0, 110895.0, 1336706.0, 253414.0, 104041.0, 55950.0, 32510.0, 19817.0, 12380.0, 7818.0, 5070.0, 3215.0, 2060.0, 1441.0, 859.0, 552.0, 348.0, 226.0, 155.0, 88.0, 65.0, 50.0, 40.0, 32.0, 17.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.3125, -2.244384765625, -2.17626953125, -2.108154296875, -2.0400390625, -1.971923828125, -1.90380859375, -1.835693359375, -1.767578125, -1.699462890625, -1.63134765625, -1.563232421875, -1.4951171875, -1.427001953125, -1.35888671875, -1.290771484375, -1.22265625, -1.154541015625, -1.08642578125, -1.018310546875, -0.9501953125, -0.882080078125, -0.81396484375, -0.745849609375, -0.677734375, -0.609619140625, -0.54150390625, -0.473388671875, -0.4052734375, -0.337158203125, -0.26904296875, -0.200927734375, -0.1328125, -0.064697265625, 0.00341796875, 0.071533203125, 0.1396484375, 0.207763671875, 0.27587890625, 0.343994140625, 0.412109375, 0.480224609375, 0.54833984375, 0.616455078125, 0.6845703125, 0.752685546875, 0.82080078125, 0.888916015625, 0.95703125, 1.025146484375, 1.09326171875, 1.161376953125, 1.2294921875, 1.297607421875, 1.36572265625, 1.433837890625, 1.501953125, 1.570068359375, 1.63818359375, 1.706298828125, 1.7744140625, 1.842529296875, 1.91064453125, 1.978759765625, 2.046875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 8.0, 6.0, 5.0, 10.0, 2.0, 8.0, 2.0, 5.0, 9.0, 10.0, 16.0, 10.0, 30.0, 25.0, 34.0, 34.0, 31.0, 40.0, 61.0, 57.0, 63.0, 85.0, 72.0, 53.0, 55.0, 45.0, 34.0, 43.0, 25.0, 23.0, 23.0, 12.0, 14.0, 8.0, 7.0, 5.0, 8.0, 2.0, 10.0, 3.0, 5.0, 3.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0009737014770507812, -0.0009406507015228271, -0.000907599925994873, -0.0008745491504669189, -0.0008414983749389648, -0.0008084475994110107, -0.0007753968238830566, -0.0007423460483551025, -0.0007092952728271484, -0.0006762444972991943, -0.0006431937217712402, -0.0006101429462432861, -0.000577092170715332, -0.0005440413951873779, -0.0005109906196594238, -0.0004779398441314697, -0.0004448890686035156, -0.0004118382930755615, -0.0003787875175476074, -0.0003457367420196533, -0.0003126859664916992, -0.0002796351909637451, -0.000246584415435791, -0.00021353363990783691, -0.0001804828643798828, -0.0001474320888519287, -0.00011438131332397461, -8.133053779602051e-05, -4.8279762268066406e-05, -1.5228986740112305e-05, 1.7821788787841797e-05, 5.08725643157959e-05, 8.392333984375e-05, 0.0001169741153717041, 0.0001500248908996582, 0.0001830756664276123, 0.0002161264419555664, 0.0002491772174835205, 0.0002822279930114746, 0.0003152787685394287, 0.0003483295440673828, 0.0003813803195953369, 0.000414431095123291, 0.0004474818706512451, 0.0004805326461791992, 0.0005135834217071533, 0.0005466341972351074, 0.0005796849727630615, 0.0006127357482910156, 0.0006457865238189697, 0.0006788372993469238, 0.0007118880748748779, 0.000744938850402832, 0.0007779896259307861, 0.0008110404014587402, 0.0008440911769866943, 0.0008771419525146484, 0.0009101927280426025, 0.0009432435035705566, 0.0009762942790985107, 0.0010093450546264648, 0.001042395830154419, 0.001075446605682373, 0.0011084973812103271, 0.0011415481567382812]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 3.0, 4.0, 2.0, 5.0, 4.0, 14.0, 12.0, 11.0, 24.0, 19.0, 39.0, 59.0, 80.0, 137.0, 205.0, 459.0, 1725.0, 1024660.0, 19561.0, 751.0, 277.0, 143.0, 104.0, 63.0, 46.0, 42.0, 20.0, 18.0, 9.0, 13.0, 10.0, 10.0, 6.0, 4.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.03326416015625, -0.03230595588684082, -0.03134775161743164, -0.03038954734802246, -0.02943134307861328, -0.0284731388092041, -0.027514934539794922, -0.026556730270385742, -0.025598526000976562, -0.024640321731567383, -0.023682117462158203, -0.022723913192749023, -0.021765708923339844, -0.020807504653930664, -0.019849300384521484, -0.018891096115112305, -0.017932891845703125, -0.016974687576293945, -0.016016483306884766, -0.015058279037475586, -0.014100074768066406, -0.013141870498657227, -0.012183666229248047, -0.011225461959838867, -0.010267257690429688, -0.009309053421020508, -0.008350849151611328, -0.0073926448822021484, -0.006434440612792969, -0.005476236343383789, -0.004518032073974609, -0.0035598278045654297, -0.00260162353515625, -0.0016434192657470703, -0.0006852149963378906, 0.00027298927307128906, 0.0012311935424804688, 0.0021893978118896484, 0.003147602081298828, 0.004105806350708008, 0.0050640106201171875, 0.006022214889526367, 0.006980419158935547, 0.007938623428344727, 0.008896827697753906, 0.009855031967163086, 0.010813236236572266, 0.011771440505981445, 0.012729644775390625, 0.013687849044799805, 0.014646053314208984, 0.015604257583618164, 0.016562461853027344, 0.017520666122436523, 0.018478870391845703, 0.019437074661254883, 0.020395278930664062, 0.021353483200073242, 0.022311687469482422, 0.0232698917388916, 0.02422809600830078, 0.02518630027770996, 0.02614450454711914, 0.02710270881652832, 0.0280609130859375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 45.0, 173.0, 428.0, 283.0, 64.0, 10.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014867241261526942, -0.001414787257090211, -0.0013428505044430494, -0.0012709136353805661, -0.0011989767663180828, -0.0011270400136709213, -0.001055103144608438, -0.0009831662755459547, -0.0009112295228987932, -0.0008392927120439708, -0.0007673559011891484, -0.0006954190321266651, -0.0006234822212718427, -0.0005515454104170203, -0.00047960857045836747, -0.0004076717304997146, -0.0003357349196448922, -0.0002637981087900698, -0.00019186126883141696, -0.00011992444342467934, -4.798761801794171e-05, 2.3949192836880684e-05, 9.588603279553354e-05, 0.0001678228727541864, 0.0002397596836090088, 0.0003116964944638312, 0.00038363333442248404, 0.0004555701743811369, 0.0005275069852359593, 0.0005994437960907817, 0.000671380665153265, 0.0007433174760080874, 0.000815254170447588, 0.0008871909813024104, 0.0009591277921572328, 0.001031064661219716, 0.0011030014138668776, 0.0011749382829293609, 0.0012468751519918442, 0.0013188119046390057, 0.001390748773701489, 0.0014626856427639723, 0.0015346223954111338, 0.001606559264473617, 0.0016784961335361004, 0.0017504328861832619, 0.0018223697552457452, 0.0018943066243082285, 0.00196624337695539, 0.0020381801296025515, 0.0021101171150803566, 0.002182053867727518, 0.0022539906203746796, 0.002325927373021841, 0.002397864358499646, 0.0024698011111468077, 0.002541738096624613, 0.0026136748492717743, 0.0026856118347495794, 0.002757548587396741, 0.0028294853400439024, 0.0029014223255217075, 0.002973359078168869, 0.0030452958308160305, 0.003117232583463192]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 0.0, 2.0, 4.0, 8.0, 6.0, 12.0, 13.0, 12.0, 9.0, 21.0, 20.0, 18.0, 27.0, 16.0, 32.0, 40.0, 35.0, 42.0, 41.0, 27.0, 31.0, 32.0, 36.0, 50.0, 44.0, 32.0, 40.0, 40.0, 47.0, 35.0, 23.0, 28.0, 32.0, 22.0, 21.0, 19.0, 15.0, 14.0, 18.0, 6.0, 10.0, 4.0, 5.0, 5.0, 3.0, 7.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0005573034286499023, -0.000540412962436676, -0.0005235224962234497, -0.0005066320300102234, -0.0004897415637969971, -0.00047285109758377075, -0.00045596063137054443, -0.0004390701651573181, -0.0004221796989440918, -0.0004052892327308655, -0.00038839876651763916, -0.00037150830030441284, -0.0003546178340911865, -0.0003377273678779602, -0.0003208369016647339, -0.00030394643545150757, -0.00028705596923828125, -0.00027016550302505493, -0.0002532750368118286, -0.0002363845705986023, -0.00021949410438537598, -0.00020260363817214966, -0.00018571317195892334, -0.00016882270574569702, -0.0001519322395324707, -0.00013504177331924438, -0.00011815130710601807, -0.00010126084089279175, -8.437037467956543e-05, -6.747990846633911e-05, -5.058944225311279e-05, -3.3698976039886475e-05, -1.6808509826660156e-05, 8.195638656616211e-08, 1.697242259979248e-05, 3.38628888130188e-05, 5.075335502624512e-05, 6.764382123947144e-05, 8.453428745269775e-05, 0.00010142475366592407, 0.00011831521987915039, 0.0001352056860923767, 0.00015209615230560303, 0.00016898661851882935, 0.00018587708473205566, 0.00020276755094528198, 0.0002196580171585083, 0.00023654848337173462, 0.00025343894958496094, 0.00027032941579818726, 0.0002872198820114136, 0.0003041103482246399, 0.0003210008144378662, 0.00033789128065109253, 0.00035478174686431885, 0.00037167221307754517, 0.0003885626792907715, 0.0004054531455039978, 0.0004223436117172241, 0.00043923407793045044, 0.00045612454414367676, 0.0004730150103569031, 0.0004899054765701294, 0.0005067959427833557, 0.000523686408996582]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 4.0, 1.0, 2.0, 4.0, 10.0, 8.0, 11.0, 15.0, 16.0, 19.0, 17.0, 26.0, 23.0, 21.0, 27.0, 33.0, 31.0, 39.0, 38.0, 52.0, 43.0, 48.0, 45.0, 49.0, 39.0, 35.0, 34.0, 32.0, 32.0, 33.0, 32.0, 30.0, 24.0, 26.0, 14.0, 13.0, 13.0, 19.0, 13.0, 7.0, 6.0, 5.0, 5.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.7265625, -11.384765625, -11.04296875, -10.701171875, -10.359375, -10.017578125, -9.67578125, -9.333984375, -8.9921875, -8.650390625, -8.30859375, -7.966796875, -7.625, -7.283203125, -6.94140625, -6.599609375, -6.2578125, -5.916015625, -5.57421875, -5.232421875, -4.890625, -4.548828125, -4.20703125, -3.865234375, -3.5234375, -3.181640625, -2.83984375, -2.498046875, -2.15625, -1.814453125, -1.47265625, -1.130859375, -0.7890625, -0.447265625, -0.10546875, 0.236328125, 0.578125, 0.919921875, 1.26171875, 1.603515625, 1.9453125, 2.287109375, 2.62890625, 2.970703125, 3.3125, 3.654296875, 3.99609375, 4.337890625, 4.6796875, 5.021484375, 5.36328125, 5.705078125, 6.046875, 6.388671875, 6.73046875, 7.072265625, 7.4140625, 7.755859375, 8.09765625, 8.439453125, 8.78125, 9.123046875, 9.46484375, 9.806640625, 10.1484375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 9.0, 5.0, 2.0, 3.0, 5.0, 12.0, 10.0, 10.0, 38.0, 17.0, 32.0, 42.0, 59.0, 83.0, 98.0, 130.0, 213.0, 319.0, 539.0, 905.0, 2307.0, 11214.0, 139013.0, 816944.0, 65737.0, 6900.0, 1688.0, 759.0, 455.0, 282.0, 198.0, 123.0, 105.0, 69.0, 62.0, 31.0, 27.0, 34.0, 24.0, 19.0, 8.0, 8.0, 8.0, 5.0, 7.0, 0.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.625, -20.995849609375, -20.36669921875, -19.737548828125, -19.1083984375, -18.479248046875, -17.85009765625, -17.220947265625, -16.591796875, -15.962646484375, -15.33349609375, -14.704345703125, -14.0751953125, -13.446044921875, -12.81689453125, -12.187744140625, -11.55859375, -10.929443359375, -10.30029296875, -9.671142578125, -9.0419921875, -8.412841796875, -7.78369140625, -7.154541015625, -6.525390625, -5.896240234375, -5.26708984375, -4.637939453125, -4.0087890625, -3.379638671875, -2.75048828125, -2.121337890625, -1.4921875, -0.863037109375, -0.23388671875, 0.395263671875, 1.0244140625, 1.653564453125, 2.28271484375, 2.911865234375, 3.541015625, 4.170166015625, 4.79931640625, 5.428466796875, 6.0576171875, 6.686767578125, 7.31591796875, 7.945068359375, 8.57421875, 9.203369140625, 9.83251953125, 10.461669921875, 11.0908203125, 11.719970703125, 12.34912109375, 12.978271484375, 13.607421875, 14.236572265625, 14.86572265625, 15.494873046875, 16.1240234375, 16.753173828125, 17.38232421875, 18.011474609375, 18.640625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 1.0, 6.0, 7.0, 11.0, 13.0, 24.0, 31.0, 39.0, 29.0, 46.0, 57.0, 60.0, 96.0, 287.0, 1821.0, 100.0, 79.0, 64.0, 65.0, 55.0, 40.0, 35.0, 24.0, 13.0, 17.0, 8.0, 5.0, 5.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.0, -53.3896484375, -51.779296875, -50.1689453125, -48.55859375, -46.9482421875, -45.337890625, -43.7275390625, -42.1171875, -40.5068359375, -38.896484375, -37.2861328125, -35.67578125, -34.0654296875, -32.455078125, -30.8447265625, -29.234375, -27.6240234375, -26.013671875, -24.4033203125, -22.79296875, -21.1826171875, -19.572265625, -17.9619140625, -16.3515625, -14.7412109375, -13.130859375, -11.5205078125, -9.91015625, -8.2998046875, -6.689453125, -5.0791015625, -3.46875, -1.8583984375, -0.248046875, 1.3623046875, 2.97265625, 4.5830078125, 6.193359375, 7.8037109375, 9.4140625, 11.0244140625, 12.634765625, 14.2451171875, 15.85546875, 17.4658203125, 19.076171875, 20.6865234375, 22.296875, 23.9072265625, 25.517578125, 27.1279296875, 28.73828125, 30.3486328125, 31.958984375, 33.5693359375, 35.1796875, 36.7900390625, 38.400390625, 40.0107421875, 41.62109375, 43.2314453125, 44.841796875, 46.4521484375, 48.0625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 6.0, 6.0, 16.0, 18.0, 26.0, 41.0, 44.0, 72.0, 97.0, 150.0, 358.0, 1225.0, 3121940.0, 20514.0, 562.0, 241.0, 125.0, 68.0, 40.0, 37.0, 33.0, 23.0, 18.0, 13.0, 6.0, 7.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-143.875, -139.046875, -134.21875, -129.390625, -124.5625, -119.734375, -114.90625, -110.078125, -105.25, -100.421875, -95.59375, -90.765625, -85.9375, -81.109375, -76.28125, -71.453125, -66.625, -61.796875, -56.96875, -52.140625, -47.3125, -42.484375, -37.65625, -32.828125, -28.0, -23.171875, -18.34375, -13.515625, -8.6875, -3.859375, 0.96875, 5.796875, 10.625, 15.453125, 20.28125, 25.109375, 29.9375, 34.765625, 39.59375, 44.421875, 49.25, 54.078125, 58.90625, 63.734375, 68.5625, 73.390625, 78.21875, 83.046875, 87.875, 92.703125, 97.53125, 102.359375, 107.1875, 112.015625, 116.84375, 121.671875, 126.5, 131.328125, 136.15625, 140.984375, 145.8125, 150.640625, 155.46875, 160.296875, 165.125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 11.0, 27.0, 71.0, 142.0, 175.0, 227.0, 162.0, 114.0, 52.0, 24.0, 6.0, 1.0, 1.0], "bins": [-73.5364990234375, -72.2325210571289, -70.92853546142578, -69.62455749511719, -68.3205795288086, -67.01659393310547, -65.71261596679688, -64.40863800048828, -63.104652404785156, -61.8006706237793, -60.4966926574707, -59.192710876464844, -57.888729095458984, -56.584747314453125, -55.28076934814453, -53.97678756713867, -52.67280960083008, -51.36882781982422, -50.064849853515625, -48.760868072509766, -47.456886291503906, -46.15290832519531, -44.84892654418945, -43.544944763183594, -42.240966796875, -40.93698501586914, -39.63300704956055, -38.32902526855469, -37.02504348754883, -35.72106170654297, -34.417083740234375, -33.113101959228516, -31.80912208557129, -30.505142211914062, -29.201160430908203, -27.897180557250977, -26.59320068359375, -25.28921890258789, -23.985239028930664, -22.681259155273438, -21.377277374267578, -20.07329750061035, -18.769315719604492, -17.465335845947266, -16.161354064941406, -14.85737419128418, -13.553394317626953, -12.24941349029541, -10.945432662963867, -9.641451835632324, -8.337471008300781, -7.033491134643555, -5.729510307312012, -4.425529479980469, -3.121549129486084, -1.8175687789916992, -0.5135879516601562, 0.7903926372528076, 2.0943732261657715, 3.3983538150787354, 4.702334403991699, 6.006315231323242, 7.310295581817627, 8.614275932312012, 9.918256759643555]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 4.0, 3.0, 2.0, 5.0, 15.0, 10.0, 13.0, 13.0, 13.0, 14.0, 24.0, 32.0, 36.0, 30.0, 37.0, 32.0, 40.0, 42.0, 41.0, 34.0, 37.0, 52.0, 36.0, 45.0, 35.0, 38.0, 34.0, 33.0, 41.0, 21.0, 27.0, 26.0, 21.0, 28.0, 13.0, 12.0, 13.0, 13.0, 9.0, 7.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0], "bins": [-139.5255584716797, -135.69566345214844, -131.86575317382812, -128.03585815429688, -124.2059555053711, -120.37605285644531, -116.54615783691406, -112.71625518798828, -108.8863525390625, -105.05644989013672, -101.22655487060547, -97.39665222167969, -93.5667495727539, -89.73684692382812, -85.90695190429688, -82.0770492553711, -78.24714660644531, -74.41724395751953, -70.58734893798828, -66.7574462890625, -62.92754364013672, -59.0976448059082, -55.26774597167969, -51.437843322753906, -47.607948303222656, -43.77804946899414, -39.94814682006836, -36.118247985839844, -32.28834533691406, -28.458446502685547, -24.6285457611084, -20.79864501953125, -16.96874237060547, -13.13884162902832, -9.308940887451172, -5.47904109954834, -1.6491403579711914, 2.1807594299316406, 6.010660171508789, 9.840560913085938, 13.670461654663086, 17.500362396240234, 21.330263137817383, 25.16016387939453, 28.990062713623047, 32.81996154785156, 36.649864196777344, 40.479766845703125, 44.30966567993164, 48.139564514160156, 51.96946716308594, 55.79936599731445, 59.629268646240234, 63.45916748046875, 67.28907012939453, 71.11897277832031, 74.94886779785156, 78.77877044677734, 82.6086654663086, 86.43856811523438, 90.26847076416016, 94.09837341308594, 97.92826843261719, 101.75817108154297, 105.58807373046875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 1.0, 9.0, 8.0, 12.0, 13.0, 10.0, 9.0, 19.0, 27.0, 20.0, 18.0, 34.0, 26.0, 32.0, 30.0, 44.0, 33.0, 41.0, 44.0, 36.0, 58.0, 47.0, 37.0, 34.0, 29.0, 33.0, 36.0, 31.0, 36.0, 32.0, 26.0, 17.0, 13.0, 14.0, 20.0, 13.0, 10.0, 8.0, 11.0, 8.0, 5.0, 3.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.7890625, -11.4364013671875, -11.083740234375, -10.7310791015625, -10.37841796875, -10.0257568359375, -9.673095703125, -9.3204345703125, -8.9677734375, -8.6151123046875, -8.262451171875, -7.9097900390625, -7.55712890625, -7.2044677734375, -6.851806640625, -6.4991455078125, -6.146484375, -5.7938232421875, -5.441162109375, -5.0885009765625, -4.73583984375, -4.3831787109375, -4.030517578125, -3.6778564453125, -3.3251953125, -2.9725341796875, -2.619873046875, -2.2672119140625, -1.91455078125, -1.5618896484375, -1.209228515625, -0.8565673828125, -0.50390625, -0.1512451171875, 0.201416015625, 0.5540771484375, 0.90673828125, 1.2593994140625, 1.612060546875, 1.9647216796875, 2.3173828125, 2.6700439453125, 3.022705078125, 3.3753662109375, 3.72802734375, 4.0806884765625, 4.433349609375, 4.7860107421875, 5.138671875, 5.4913330078125, 5.843994140625, 6.1966552734375, 6.54931640625, 6.9019775390625, 7.254638671875, 7.6072998046875, 7.9599609375, 8.3126220703125, 8.665283203125, 9.0179443359375, 9.37060546875, 9.7232666015625, 10.075927734375, 10.4285888671875, 10.78125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 9.0, 9.0, 5.0, 13.0, 16.0, 17.0, 24.0, 27.0, 46.0, 55.0, 71.0, 114.0, 143.0, 218.0, 301.0, 557.0, 1016.0, 2241.0, 5392.0, 17074.0, 80368.0, 419722.0, 1346241.0, 1578917.0, 586520.0, 118140.0, 24449.0, 6953.0, 2555.0, 1231.0, 686.0, 328.0, 218.0, 158.0, 115.0, 78.0, 62.0, 52.0, 41.0, 24.0, 11.0, 21.0, 12.0, 5.0, 8.0, 4.0, 6.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 4.0], "bins": [-13.7734375, -13.3575439453125, -12.941650390625, -12.5257568359375, -12.10986328125, -11.6939697265625, -11.278076171875, -10.8621826171875, -10.4462890625, -10.0303955078125, -9.614501953125, -9.1986083984375, -8.78271484375, -8.3668212890625, -7.950927734375, -7.5350341796875, -7.119140625, -6.7032470703125, -6.287353515625, -5.8714599609375, -5.45556640625, -5.0396728515625, -4.623779296875, -4.2078857421875, -3.7919921875, -3.3760986328125, -2.960205078125, -2.5443115234375, -2.12841796875, -1.7125244140625, -1.296630859375, -0.8807373046875, -0.46484375, -0.0489501953125, 0.366943359375, 0.7828369140625, 1.19873046875, 1.6146240234375, 2.030517578125, 2.4464111328125, 2.8623046875, 3.2781982421875, 3.694091796875, 4.1099853515625, 4.52587890625, 4.9417724609375, 5.357666015625, 5.7735595703125, 6.189453125, 6.6053466796875, 7.021240234375, 7.4371337890625, 7.85302734375, 8.2689208984375, 8.684814453125, 9.1007080078125, 9.5166015625, 9.9324951171875, 10.348388671875, 10.7642822265625, 11.18017578125, 11.5960693359375, 12.011962890625, 12.4278564453125, 12.84375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 0.0, 4.0, 5.0, 19.0, 17.0, 36.0, 66.0, 125.0, 165.0, 287.0, 496.0, 855.0, 757.0, 497.0, 302.0, 168.0, 125.0, 69.0, 32.0, 24.0, 15.0, 10.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.0, -16.875, -15.75, -14.625, -13.5, -12.375, -11.25, -10.125, -9.0, -7.875, -6.75, -5.625, -4.5, -3.375, -2.25, -1.125, 0.0, 1.125, 2.25, 3.375, 4.5, 5.625, 6.75, 7.875, 9.0, 10.125, 11.25, 12.375, 13.5, 14.625, 15.75, 16.875, 18.0, 19.125, 20.25, 21.375, 22.5, 23.625, 24.75, 25.875, 27.0, 28.125, 29.25, 30.375, 31.5, 32.625, 33.75, 34.875, 36.0, 37.125, 38.25, 39.375, 40.5, 41.625, 42.75, 43.875, 45.0, 46.125, 47.25, 48.375, 49.5, 50.625, 51.75, 52.875, 54.0]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 14.0, 22.0, 25.0, 38.0, 51.0, 91.0, 153.0, 149.0, 217.0, 303.0, 509.0, 1248.0, 37144.0, 4146563.0, 5472.0, 889.0, 446.0, 273.0, 188.0, 129.0, 120.0, 81.0, 55.0, 41.0, 24.0, 18.0, 4.0, 10.0, 6.0, 2.0, 3.0], "bins": [-192.75, -188.58984375, -184.4296875, -180.26953125, -176.109375, -171.94921875, -167.7890625, -163.62890625, -159.46875, -155.30859375, -151.1484375, -146.98828125, -142.828125, -138.66796875, -134.5078125, -130.34765625, -126.1875, -122.02734375, -117.8671875, -113.70703125, -109.546875, -105.38671875, -101.2265625, -97.06640625, -92.90625, -88.74609375, -84.5859375, -80.42578125, -76.265625, -72.10546875, -67.9453125, -63.78515625, -59.625, -55.46484375, -51.3046875, -47.14453125, -42.984375, -38.82421875, -34.6640625, -30.50390625, -26.34375, -22.18359375, -18.0234375, -13.86328125, -9.703125, -5.54296875, -1.3828125, 2.77734375, 6.9375, 11.09765625, 15.2578125, 19.41796875, 23.578125, 27.73828125, 31.8984375, 36.05859375, 40.21875, 44.37890625, 48.5390625, 52.69921875, 56.859375, 61.01953125, 65.1796875, 69.33984375, 73.5]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 919.0, 94.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-629.6895141601562, -600.6205444335938, -571.5516357421875, -542.482666015625, -513.4137573242188, -484.34478759765625, -455.2758483886719, -426.2069091796875, -397.1379699707031, -368.06903076171875, -339.0000915527344, -309.93115234375, -280.8621826171875, -251.7932586669922, -222.72430419921875, -193.65536499023438, -164.58642578125, -135.51748657226562, -106.44853973388672, -77.37959289550781, -48.31065368652344, -19.241714477539062, 9.827239990234375, 38.89617919921875, 67.96511840820312, 97.0340576171875, 126.1030044555664, 155.1719512939453, 184.2408905029297, 213.30982971191406, 242.3787841796875, 271.4477233886719, 300.5166015625, 329.5855407714844, 358.65447998046875, 387.72344970703125, 416.7923583984375, 445.861328125, 474.9302673339844, 503.99920654296875, 533.068115234375, 562.1370849609375, 591.2059936523438, 620.2749633789062, 649.3438720703125, 678.412841796875, 707.4818115234375, 736.5507202148438, 765.6196899414062, 794.6886596679688, 823.757568359375, 852.8265380859375, 881.8954467773438, 910.9644165039062, 940.0333251953125, 969.102294921875, 998.1712646484375, 1027.240234375, 1056.3092041015625, 1085.3780517578125, 1114.447021484375, 1143.5159912109375, 1172.5849609375, 1201.65380859375, 1230.7227783203125]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 3.0, 7.0, 5.0, 6.0, 13.0, 14.0, 13.0, 23.0, 19.0, 29.0, 22.0, 25.0, 40.0, 41.0, 35.0, 51.0, 51.0, 47.0, 48.0, 51.0, 42.0, 33.0, 52.0, 41.0, 44.0, 35.0, 35.0, 23.0, 26.0, 23.0, 21.0, 11.0, 15.0, 15.0, 8.0, 6.0, 4.0, 3.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-80.765380859375, -78.41329193115234, -76.06121063232422, -73.70912170410156, -71.35704040527344, -69.00495147705078, -66.65286254882812, -64.30078125, -61.948692321777344, -59.59660720825195, -57.24452209472656, -54.892433166503906, -52.540348052978516, -50.188262939453125, -47.83617401123047, -45.48408889770508, -43.13200378417969, -40.7799186706543, -38.427833557128906, -36.07574462890625, -33.72365951538086, -31.37157440185547, -29.019487380981445, -26.667400360107422, -24.31531524658203, -21.96323013305664, -19.611143112182617, -17.259056091308594, -14.906970977783203, -12.554884910583496, -10.202798843383789, -7.850711822509766, -5.498634338378906, -3.146548271179199, -0.7944622039794922, 1.5576238632202148, 3.909709930419922, 6.261795997619629, 8.613882064819336, 10.96596908569336, 13.31805419921875, 15.670140266418457, 18.022226333618164, 20.374313354492188, 22.726398468017578, 25.07848358154297, 27.430570602416992, 29.782657623291016, 32.134742736816406, 34.4868278503418, 36.83891296386719, 39.191001892089844, 41.543087005615234, 43.895172119140625, 46.24726104736328, 48.59934616088867, 50.95143127441406, 53.30351638793945, 55.655601501464844, 58.0076904296875, 60.35977554321289, 62.71186065673828, 65.06394958496094, 67.41603088378906, 69.76811981201172]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 0.0, 2.0, 4.0, 7.0, 17.0, 14.0, 10.0, 14.0, 15.0, 18.0, 23.0, 22.0, 28.0, 26.0, 38.0, 38.0, 25.0, 31.0, 40.0, 45.0, 36.0, 43.0, 35.0, 49.0, 36.0, 42.0, 31.0, 40.0, 11.0, 37.0, 38.0, 29.0, 25.0, 14.0, 15.0, 14.0, 19.0, 8.0, 9.0, 9.0, 13.0, 5.0, 4.0, 5.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-11.3125, -10.970458984375, -10.62841796875, -10.286376953125, -9.9443359375, -9.602294921875, -9.26025390625, -8.918212890625, -8.576171875, -8.234130859375, -7.89208984375, -7.550048828125, -7.2080078125, -6.865966796875, -6.52392578125, -6.181884765625, -5.83984375, -5.497802734375, -5.15576171875, -4.813720703125, -4.4716796875, -4.129638671875, -3.78759765625, -3.445556640625, -3.103515625, -2.761474609375, -2.41943359375, -2.077392578125, -1.7353515625, -1.393310546875, -1.05126953125, -0.709228515625, -0.3671875, -0.025146484375, 0.31689453125, 0.658935546875, 1.0009765625, 1.343017578125, 1.68505859375, 2.027099609375, 2.369140625, 2.711181640625, 3.05322265625, 3.395263671875, 3.7373046875, 4.079345703125, 4.42138671875, 4.763427734375, 5.10546875, 5.447509765625, 5.78955078125, 6.131591796875, 6.4736328125, 6.815673828125, 7.15771484375, 7.499755859375, 7.841796875, 8.183837890625, 8.52587890625, 8.867919921875, 9.2099609375, 9.552001953125, 9.89404296875, 10.236083984375, 10.578125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 4.0, 8.0, 8.0, 19.0, 25.0, 54.0, 69.0, 78.0, 101.0, 164.0, 279.0, 317.0, 404.0, 641.0, 960.0, 1288.0, 1845.0, 2593.0, 3776.0, 5178.0, 7642.0, 11025.0, 16213.0, 24786.0, 37541.0, 58603.0, 100827.0, 236228.0, 254693.0, 104379.0, 61047.0, 38455.0, 25122.0, 16952.0, 11239.0, 7674.0, 5385.0, 3675.0, 2723.0, 1896.0, 1328.0, 1010.0, 672.0, 503.0, 350.0, 260.0, 160.0, 105.0, 78.0, 66.0, 39.0, 27.0, 16.0, 9.0, 8.0, 6.0, 3.0, 3.0, 4.0, 0.0, 2.0], "bins": [-1.939453125, -1.876953125, -1.814453125, -1.751953125, -1.689453125, -1.626953125, -1.564453125, -1.501953125, -1.439453125, -1.376953125, -1.314453125, -1.251953125, -1.189453125, -1.126953125, -1.064453125, -1.001953125, -0.939453125, -0.876953125, -0.814453125, -0.751953125, -0.689453125, -0.626953125, -0.564453125, -0.501953125, -0.439453125, -0.376953125, -0.314453125, -0.251953125, -0.189453125, -0.126953125, -0.064453125, -0.001953125, 0.060546875, 0.123046875, 0.185546875, 0.248046875, 0.310546875, 0.373046875, 0.435546875, 0.498046875, 0.560546875, 0.623046875, 0.685546875, 0.748046875, 0.810546875, 0.873046875, 0.935546875, 0.998046875, 1.060546875, 1.123046875, 1.185546875, 1.248046875, 1.310546875, 1.373046875, 1.435546875, 1.498046875, 1.560546875, 1.623046875, 1.685546875, 1.748046875, 1.810546875, 1.873046875, 1.935546875, 1.998046875, 2.060546875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 2.0, 5.0, 9.0, 10.0, 6.0, 21.0, 25.0, 19.0, 22.0, 23.0, 28.0, 34.0, 33.0, 41.0, 36.0, 36.0, 48.0, 52.0, 1076.0, 46.0, 35.0, 42.0, 34.0, 42.0, 29.0, 45.0, 25.0, 31.0, 22.0, 26.0, 20.0, 23.0, 22.0, 13.0, 12.0, 8.0, 2.0, 8.0, 0.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.8828125, -8.62664794921875, -8.3704833984375, -8.11431884765625, -7.858154296875, -7.60198974609375, -7.3458251953125, -7.08966064453125, -6.83349609375, -6.57733154296875, -6.3211669921875, -6.06500244140625, -5.808837890625, -5.55267333984375, -5.2965087890625, -5.04034423828125, -4.7841796875, -4.52801513671875, -4.2718505859375, -4.01568603515625, -3.759521484375, -3.50335693359375, -3.2471923828125, -2.99102783203125, -2.73486328125, -2.47869873046875, -2.2225341796875, -1.96636962890625, -1.710205078125, -1.45404052734375, -1.1978759765625, -0.94171142578125, -0.685546875, -0.42938232421875, -0.1732177734375, 0.08294677734375, 0.339111328125, 0.59527587890625, 0.8514404296875, 1.10760498046875, 1.36376953125, 1.61993408203125, 1.8760986328125, 2.13226318359375, 2.388427734375, 2.64459228515625, 2.9007568359375, 3.15692138671875, 3.4130859375, 3.66925048828125, 3.9254150390625, 4.18157958984375, 4.437744140625, 4.69390869140625, 4.9500732421875, 5.20623779296875, 5.46240234375, 5.71856689453125, 5.9747314453125, 6.23089599609375, 6.487060546875, 6.74322509765625, 6.9993896484375, 7.25555419921875, 7.51171875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 6.0, 9.0, 16.0, 15.0, 29.0, 54.0, 52.0, 87.0, 142.0, 184.0, 337.0, 499.0, 818.0, 1104.0, 1850.0, 2882.0, 4843.0, 7793.0, 12762.0, 20211.0, 33655.0, 56386.0, 103280.0, 1213296.0, 391581.0, 102822.0, 56142.0, 33417.0, 20209.0, 12471.0, 7601.0, 4641.0, 2830.0, 1786.0, 1123.0, 749.0, 486.0, 336.0, 206.0, 125.0, 89.0, 68.0, 51.0, 28.0, 17.0, 11.0, 11.0, 11.0, 5.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.369140625, -2.2901611328125, -2.211181640625, -2.1322021484375, -2.05322265625, -1.9742431640625, -1.895263671875, -1.8162841796875, -1.7373046875, -1.6583251953125, -1.579345703125, -1.5003662109375, -1.42138671875, -1.3424072265625, -1.263427734375, -1.1844482421875, -1.10546875, -1.0264892578125, -0.947509765625, -0.8685302734375, -0.78955078125, -0.7105712890625, -0.631591796875, -0.5526123046875, -0.4736328125, -0.3946533203125, -0.315673828125, -0.2366943359375, -0.15771484375, -0.0787353515625, 0.000244140625, 0.0792236328125, 0.158203125, 0.2371826171875, 0.316162109375, 0.3951416015625, 0.47412109375, 0.5531005859375, 0.632080078125, 0.7110595703125, 0.7900390625, 0.8690185546875, 0.947998046875, 1.0269775390625, 1.10595703125, 1.1849365234375, 1.263916015625, 1.3428955078125, 1.421875, 1.5008544921875, 1.579833984375, 1.6588134765625, 1.73779296875, 1.8167724609375, 1.895751953125, 1.9747314453125, 2.0537109375, 2.1326904296875, 2.211669921875, 2.2906494140625, 2.36962890625, 2.4486083984375, 2.527587890625, 2.6065673828125, 2.685546875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 7.0, 10.0, 16.0, 18.0, 24.0, 21.0, 44.0, 46.0, 46.0, 50.0, 63.0, 78.0, 85.0, 72.0, 76.0, 75.0, 62.0, 49.0, 34.0, 29.0, 23.0, 15.0, 12.0, 9.0, 11.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013637542724609375, -0.0013212859630584717, -0.0012788176536560059, -0.00123634934425354, -0.0011938810348510742, -0.0011514127254486084, -0.0011089444160461426, -0.0010664761066436768, -0.001024007797241211, -0.0009815394878387451, -0.0009390711784362793, -0.0008966028690338135, -0.0008541345596313477, -0.0008116662502288818, -0.000769197940826416, -0.0007267296314239502, -0.0006842613220214844, -0.0006417930126190186, -0.0005993247032165527, -0.0005568563938140869, -0.0005143880844116211, -0.0004719197750091553, -0.00042945146560668945, -0.00038698315620422363, -0.0003445148468017578, -0.000302046537399292, -0.00025957822799682617, -0.00021710991859436035, -0.00017464160919189453, -0.0001321732997894287, -8.970499038696289e-05, -4.723668098449707e-05, -4.76837158203125e-06, 3.769993782043457e-05, 8.016824722290039e-05, 0.0001226365566253662, 0.00016510486602783203, 0.00020757317543029785, 0.00025004148483276367, 0.0002925097942352295, 0.0003349781036376953, 0.00037744641304016113, 0.00041991472244262695, 0.0004623830318450928, 0.0005048513412475586, 0.0005473196506500244, 0.0005897879600524902, 0.0006322562694549561, 0.0006747245788574219, 0.0007171928882598877, 0.0007596611976623535, 0.0008021295070648193, 0.0008445978164672852, 0.000887066125869751, 0.0009295344352722168, 0.0009720027446746826, 0.0010144710540771484, 0.0010569393634796143, 0.00109940767288208, 0.001141875982284546, 0.0011843442916870117, 0.0012268126010894775, 0.0012692809104919434, 0.0013117492198944092, 0.001354217529296875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 5.0, 6.0, 12.0, 10.0, 11.0, 22.0, 20.0, 37.0, 29.0, 66.0, 70.0, 124.0, 186.0, 409.0, 2424.0, 1033775.0, 9945.0, 597.0, 266.0, 139.0, 90.0, 73.0, 59.0, 42.0, 23.0, 20.0, 25.0, 19.0, 18.0, 6.0, 7.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.031280517578125, -0.030402660369873047, -0.029524803161621094, -0.02864694595336914, -0.027769088745117188, -0.026891231536865234, -0.02601337432861328, -0.025135517120361328, -0.024257659912109375, -0.023379802703857422, -0.02250194549560547, -0.021624088287353516, -0.020746231079101562, -0.01986837387084961, -0.018990516662597656, -0.018112659454345703, -0.01723480224609375, -0.016356945037841797, -0.015479087829589844, -0.01460123062133789, -0.013723373413085938, -0.012845516204833984, -0.011967658996582031, -0.011089801788330078, -0.010211944580078125, -0.009334087371826172, -0.008456230163574219, -0.007578372955322266, -0.0067005157470703125, -0.005822658538818359, -0.004944801330566406, -0.004066944122314453, -0.0031890869140625, -0.002311229705810547, -0.0014333724975585938, -0.0005555152893066406, 0.0003223419189453125, 0.0012001991271972656, 0.0020780563354492188, 0.002955913543701172, 0.003833770751953125, 0.004711627960205078, 0.005589485168457031, 0.006467342376708984, 0.0073451995849609375, 0.00822305679321289, 0.009100914001464844, 0.009978771209716797, 0.01085662841796875, 0.011734485626220703, 0.012612342834472656, 0.01349020004272461, 0.014368057250976562, 0.015245914459228516, 0.01612377166748047, 0.017001628875732422, 0.017879486083984375, 0.018757343292236328, 0.01963520050048828, 0.020513057708740234, 0.021390914916992188, 0.02226877212524414, 0.023146629333496094, 0.024024486541748047, 0.02490234375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 16.0, 293.0, 606.0, 93.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002163088647648692, -0.0020445517729967833, -0.0019260148983448744, -0.0018074781401082873, -0.0016889412654563785, -0.0015704043908044696, -0.0014518676325678825, -0.0013333307579159737, -0.0012147938832640648, -0.001096257008612156, -0.000977720133960247, -0.00085918337572366, -0.0007406465010717511, -0.0006221096264198422, -0.0005035728099755943, -0.0003850359935313463, -0.00026649911887943745, -0.00014796227333135903, -2.942542778328061e-05, 8.91114177647978e-05, 0.00020764826331287622, 0.0003261851379647851, 0.00044472195440903306, 0.000563258770853281, 0.0006817956455051899, 0.0008003325201570988, 0.0009188693366013467, 0.0010374061530455947, 0.0011559430276975036, 0.0012744799023494124, 0.0013930166605859995, 0.0015115535352379084, 0.0016300901770591736, 0.0017486270517110825, 0.0018671639263629913, 0.0019857008010149, 0.002104237675666809, 0.002222774550318718, 0.002341311192139983, 0.002459848066791892, 0.002578384941443801, 0.00269692181609571, 0.0028154586907476187, 0.0029339955653995275, 0.0030525322072207928, 0.0031710690818727016, 0.0032896059565246105, 0.0034081428311765194, 0.0035266797058284283, 0.003645216580480337, 0.003763753455132246, 0.003882290329784155, 0.004000827204436064, 0.004119364079087973, 0.0042379009537398815, 0.004356437362730503, 0.004474974237382412, 0.004593511112034321, 0.00471204798668623, 0.004830584861338139, 0.0049491217359900475, 0.005067658610641956, 0.005186195485293865, 0.005304732359945774, 0.005423269234597683]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 3.0, 5.0, 5.0, 8.0, 5.0, 10.0, 13.0, 14.0, 17.0, 11.0, 23.0, 22.0, 23.0, 21.0, 23.0, 30.0, 31.0, 53.0, 35.0, 32.0, 41.0, 44.0, 43.0, 23.0, 37.0, 41.0, 41.0, 48.0, 31.0, 31.0, 29.0, 20.0, 20.0, 27.0, 21.0, 11.0, 18.0, 13.0, 8.0, 18.0, 13.0, 9.0, 4.0, 4.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0005220770835876465, -0.0005059316754341125, -0.0004897862672805786, -0.0004736408591270447, -0.00045749545097351074, -0.0004413500428199768, -0.00042520463466644287, -0.00040905922651290894, -0.000392913818359375, -0.00037676841020584106, -0.00036062300205230713, -0.0003444775938987732, -0.00032833218574523926, -0.0003121867775917053, -0.0002960413694381714, -0.00027989596128463745, -0.0002637505531311035, -0.0002476051449775696, -0.00023145973682403564, -0.0002153143286705017, -0.00019916892051696777, -0.00018302351236343384, -0.0001668781042098999, -0.00015073269605636597, -0.00013458728790283203, -0.0001184418797492981, -0.00010229647159576416, -8.615106344223022e-05, -7.000565528869629e-05, -5.3860247135162354e-05, -3.771483898162842e-05, -2.1569430828094482e-05, -5.424022674560547e-06, 1.0721385478973389e-05, 2.6866793632507324e-05, 4.301220178604126e-05, 5.9157609939575195e-05, 7.530301809310913e-05, 9.144842624664307e-05, 0.000107593834400177, 0.00012373924255371094, 0.00013988465070724487, 0.0001560300588607788, 0.00017217546701431274, 0.00018832087516784668, 0.00020446628332138062, 0.00022061169147491455, 0.00023675709962844849, 0.0002529025077819824, 0.00026904791593551636, 0.0002851933240890503, 0.00030133873224258423, 0.00031748414039611816, 0.0003336295485496521, 0.00034977495670318604, 0.00036592036485671997, 0.0003820657730102539, 0.00039821118116378784, 0.0004143565893173218, 0.0004305019974708557, 0.00044664740562438965, 0.0004627928137779236, 0.0004789382219314575, 0.0004950836300849915, 0.0005112290382385254]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 0.0, 2.0, 4.0, 7.0, 17.0, 14.0, 10.0, 14.0, 15.0, 18.0, 23.0, 22.0, 28.0, 26.0, 38.0, 38.0, 25.0, 31.0, 40.0, 45.0, 36.0, 43.0, 35.0, 49.0, 36.0, 42.0, 31.0, 40.0, 11.0, 37.0, 38.0, 29.0, 25.0, 14.0, 15.0, 14.0, 19.0, 8.0, 9.0, 9.0, 13.0, 5.0, 4.0, 5.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-11.3125, -10.970458984375, -10.62841796875, -10.286376953125, -9.9443359375, -9.602294921875, -9.26025390625, -8.918212890625, -8.576171875, -8.234130859375, -7.89208984375, -7.550048828125, -7.2080078125, -6.865966796875, -6.52392578125, -6.181884765625, -5.83984375, -5.497802734375, -5.15576171875, -4.813720703125, -4.4716796875, -4.129638671875, -3.78759765625, -3.445556640625, -3.103515625, -2.761474609375, -2.41943359375, -2.077392578125, -1.7353515625, -1.393310546875, -1.05126953125, -0.709228515625, -0.3671875, -0.025146484375, 0.31689453125, 0.658935546875, 1.0009765625, 1.343017578125, 1.68505859375, 2.027099609375, 2.369140625, 2.711181640625, 3.05322265625, 3.395263671875, 3.7373046875, 4.079345703125, 4.42138671875, 4.763427734375, 5.10546875, 5.447509765625, 5.78955078125, 6.131591796875, 6.4736328125, 6.815673828125, 7.15771484375, 7.499755859375, 7.841796875, 8.183837890625, 8.52587890625, 8.867919921875, 9.2099609375, 9.552001953125, 9.89404296875, 10.236083984375, 10.578125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 1.0, 6.0, 5.0, 6.0, 11.0, 8.0, 13.0, 24.0, 29.0, 40.0, 53.0, 66.0, 109.0, 177.0, 315.0, 556.0, 1079.0, 2375.0, 5026.0, 12157.0, 30827.0, 87100.0, 270066.0, 406933.0, 148277.0, 50240.0, 18710.0, 7692.0, 3352.0, 1516.0, 727.0, 385.0, 222.0, 130.0, 88.0, 62.0, 39.0, 28.0, 23.0, 21.0, 18.0, 14.0, 9.0, 8.0, 9.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.375, -10.0628662109375, -9.750732421875, -9.4385986328125, -9.12646484375, -8.8143310546875, -8.502197265625, -8.1900634765625, -7.8779296875, -7.5657958984375, -7.253662109375, -6.9415283203125, -6.62939453125, -6.3172607421875, -6.005126953125, -5.6929931640625, -5.380859375, -5.0687255859375, -4.756591796875, -4.4444580078125, -4.13232421875, -3.8201904296875, -3.508056640625, -3.1959228515625, -2.8837890625, -2.5716552734375, -2.259521484375, -1.9473876953125, -1.63525390625, -1.3231201171875, -1.010986328125, -0.6988525390625, -0.38671875, -0.0745849609375, 0.237548828125, 0.5496826171875, 0.86181640625, 1.1739501953125, 1.486083984375, 1.7982177734375, 2.1103515625, 2.4224853515625, 2.734619140625, 3.0467529296875, 3.35888671875, 3.6710205078125, 3.983154296875, 4.2952880859375, 4.607421875, 4.9195556640625, 5.231689453125, 5.5438232421875, 5.85595703125, 6.1680908203125, 6.480224609375, 6.7923583984375, 7.1044921875, 7.4166259765625, 7.728759765625, 8.0408935546875, 8.35302734375, 8.6651611328125, 8.977294921875, 9.2894287109375, 9.6015625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 2.0, 6.0, 5.0, 10.0, 16.0, 8.0, 8.0, 21.0, 21.0, 23.0, 32.0, 28.0, 47.0, 45.0, 69.0, 58.0, 95.0, 1677.0, 426.0, 68.0, 61.0, 55.0, 44.0, 31.0, 28.0, 28.0, 25.0, 25.0, 14.0, 16.0, 16.0, 13.0, 11.0, 3.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.59375, -52.09912109375, -50.6044921875, -49.10986328125, -47.615234375, -46.12060546875, -44.6259765625, -43.13134765625, -41.63671875, -40.14208984375, -38.6474609375, -37.15283203125, -35.658203125, -34.16357421875, -32.6689453125, -31.17431640625, -29.6796875, -28.18505859375, -26.6904296875, -25.19580078125, -23.701171875, -22.20654296875, -20.7119140625, -19.21728515625, -17.72265625, -16.22802734375, -14.7333984375, -13.23876953125, -11.744140625, -10.24951171875, -8.7548828125, -7.26025390625, -5.765625, -4.27099609375, -2.7763671875, -1.28173828125, 0.212890625, 1.70751953125, 3.2021484375, 4.69677734375, 6.19140625, 7.68603515625, 9.1806640625, 10.67529296875, 12.169921875, 13.66455078125, 15.1591796875, 16.65380859375, 18.1484375, 19.64306640625, 21.1376953125, 22.63232421875, 24.126953125, 25.62158203125, 27.1162109375, 28.61083984375, 30.10546875, 31.60009765625, 33.0947265625, 34.58935546875, 36.083984375, 37.57861328125, 39.0732421875, 40.56787109375, 42.0625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 6.0, 8.0, 16.0, 21.0, 15.0, 23.0, 38.0, 41.0, 79.0, 98.0, 91.0, 126.0, 242.0, 415.0, 1156.0, 59207.0, 3076920.0, 5456.0, 728.0, 296.0, 189.0, 138.0, 108.0, 74.0, 54.0, 33.0, 32.0, 21.0, 12.0, 16.0, 13.0, 5.0, 9.0, 4.0, 8.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.625, -66.2001953125, -63.775390625, -61.3505859375, -58.92578125, -56.5009765625, -54.076171875, -51.6513671875, -49.2265625, -46.8017578125, -44.376953125, -41.9521484375, -39.52734375, -37.1025390625, -34.677734375, -32.2529296875, -29.828125, -27.4033203125, -24.978515625, -22.5537109375, -20.12890625, -17.7041015625, -15.279296875, -12.8544921875, -10.4296875, -8.0048828125, -5.580078125, -3.1552734375, -0.73046875, 1.6943359375, 4.119140625, 6.5439453125, 8.96875, 11.3935546875, 13.818359375, 16.2431640625, 18.66796875, 21.0927734375, 23.517578125, 25.9423828125, 28.3671875, 30.7919921875, 33.216796875, 35.6416015625, 38.06640625, 40.4912109375, 42.916015625, 45.3408203125, 47.765625, 50.1904296875, 52.615234375, 55.0400390625, 57.46484375, 59.8896484375, 62.314453125, 64.7392578125, 67.1640625, 69.5888671875, 72.013671875, 74.4384765625, 76.86328125, 79.2880859375, 81.712890625, 84.1376953125, 86.5625]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 238.0, 773.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-577.455078125, -567.178466796875, -556.9019165039062, -546.6253662109375, -536.3487548828125, -526.0721435546875, -515.7955932617188, -505.5190124511719, -495.242431640625, -484.9658508300781, -474.68927001953125, -464.4126892089844, -454.1361083984375, -443.8595275878906, -433.58294677734375, -423.3063659667969, -413.02978515625, -402.7532043457031, -392.47662353515625, -382.2000427246094, -371.9234619140625, -361.6468811035156, -351.37030029296875, -341.0937194824219, -330.817138671875, -320.5405578613281, -310.26397705078125, -299.9873962402344, -289.7108154296875, -279.4342346191406, -269.15765380859375, -258.8810729980469, -248.6044921875, -238.32791137695312, -228.05133056640625, -217.77474975585938, -207.4981689453125, -197.22158813476562, -186.94500732421875, -176.66842651367188, -166.391845703125, -156.11526489257812, -145.83868408203125, -135.56210327148438, -125.2855224609375, -115.00894165039062, -104.73236083984375, -94.45578002929688, -84.17919158935547, -73.9026107788086, -63.62602996826172, -53.349449157714844, -43.07286834716797, -32.796287536621094, -22.51970672607422, -12.243125915527344, -1.9665451049804688, 8.310035705566406, 18.58661651611328, 28.863197326660156, 39.13977813720703, 49.416358947753906, 59.69293975830078, 69.96952056884766, 80.24610137939453]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 6.0, 2.0, 6.0, 4.0, 8.0, 17.0, 16.0, 9.0, 26.0, 28.0, 17.0, 34.0, 35.0, 35.0, 37.0, 48.0, 35.0, 46.0, 50.0, 55.0, 56.0, 52.0, 38.0, 45.0, 44.0, 19.0, 34.0, 34.0, 38.0, 24.0, 27.0, 15.0, 14.0, 11.0, 7.0, 6.0, 11.0, 4.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.9784698486328, -130.09603881835938, -126.21360778808594, -122.3311767578125, -118.44874572753906, -114.56631469726562, -110.68389129638672, -106.80146026611328, -102.91902923583984, -99.0365982055664, -95.15416717529297, -91.27173614501953, -87.38931274414062, -83.50688171386719, -79.62445068359375, -75.74201965332031, -71.85958862304688, -67.97715759277344, -64.0947265625, -60.21229934692383, -56.32986831665039, -52.44743728637695, -48.56501007080078, -44.682579040527344, -40.800148010253906, -36.91771697998047, -33.03528594970703, -29.15285873413086, -25.270427703857422, -21.387996673583984, -17.50556755065918, -13.623138427734375, -9.740715026855469, -5.858284950256348, -1.9758548736572266, 1.9065752029418945, 5.789005279541016, 9.671436309814453, 13.553865432739258, 17.436294555664062, 21.3187255859375, 25.201156616210938, 29.083585739135742, 32.96601486206055, 36.848445892333984, 40.73087692260742, 44.613304138183594, 48.49573516845703, 52.37816619873047, 56.260597229003906, 60.143028259277344, 64.02545928955078, 67.90788269042969, 71.79031372070312, 75.67274475097656, 79.55517578125, 83.43760681152344, 87.32003784179688, 91.20246887207031, 95.08489990234375, 98.96733093261719, 102.84976196289062, 106.73218536376953, 110.61461639404297, 114.4970474243164]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 1.0, 5.0, 12.0, 5.0, 7.0, 20.0, 16.0, 18.0, 24.0, 19.0, 21.0, 32.0, 29.0, 37.0, 33.0, 32.0, 35.0, 45.0, 46.0, 40.0, 47.0, 35.0, 42.0, 41.0, 41.0, 40.0, 32.0, 24.0, 28.0, 35.0, 21.0, 13.0, 21.0, 17.0, 18.0, 16.0, 7.0, 5.0, 10.0, 9.0, 4.0, 5.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-12.0, -11.6309814453125, -11.261962890625, -10.8929443359375, -10.52392578125, -10.1549072265625, -9.785888671875, -9.4168701171875, -9.0478515625, -8.6788330078125, -8.309814453125, -7.9407958984375, -7.57177734375, -7.2027587890625, -6.833740234375, -6.4647216796875, -6.095703125, -5.7266845703125, -5.357666015625, -4.9886474609375, -4.61962890625, -4.2506103515625, -3.881591796875, -3.5125732421875, -3.1435546875, -2.7745361328125, -2.405517578125, -2.0364990234375, -1.66748046875, -1.2984619140625, -0.929443359375, -0.5604248046875, -0.19140625, 0.1776123046875, 0.546630859375, 0.9156494140625, 1.28466796875, 1.6536865234375, 2.022705078125, 2.3917236328125, 2.7607421875, 3.1297607421875, 3.498779296875, 3.8677978515625, 4.23681640625, 4.6058349609375, 4.974853515625, 5.3438720703125, 5.712890625, 6.0819091796875, 6.450927734375, 6.8199462890625, 7.18896484375, 7.5579833984375, 7.927001953125, 8.2960205078125, 8.6650390625, 9.0340576171875, 9.403076171875, 9.7720947265625, 10.14111328125, 10.5101318359375, 10.879150390625, 11.2481689453125, 11.6171875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 7.0, 6.0, 11.0, 17.0, 13.0, 10.0, 16.0, 28.0, 33.0, 37.0, 50.0, 57.0, 66.0, 121.0, 168.0, 381.0, 1312.0, 14974.0, 1863339.0, 2292811.0, 18259.0, 1486.0, 432.0, 150.0, 95.0, 87.0, 49.0, 49.0, 29.0, 36.0, 26.0, 23.0, 14.0, 15.0, 21.0, 2.0, 11.0, 6.0, 9.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-48.46875, -47.04443359375, -45.6201171875, -44.19580078125, -42.771484375, -41.34716796875, -39.9228515625, -38.49853515625, -37.07421875, -35.64990234375, -34.2255859375, -32.80126953125, -31.376953125, -29.95263671875, -28.5283203125, -27.10400390625, -25.6796875, -24.25537109375, -22.8310546875, -21.40673828125, -19.982421875, -18.55810546875, -17.1337890625, -15.70947265625, -14.28515625, -12.86083984375, -11.4365234375, -10.01220703125, -8.587890625, -7.16357421875, -5.7392578125, -4.31494140625, -2.890625, -1.46630859375, -0.0419921875, 1.38232421875, 2.806640625, 4.23095703125, 5.6552734375, 7.07958984375, 8.50390625, 9.92822265625, 11.3525390625, 12.77685546875, 14.201171875, 15.62548828125, 17.0498046875, 18.47412109375, 19.8984375, 21.32275390625, 22.7470703125, 24.17138671875, 25.595703125, 27.02001953125, 28.4443359375, 29.86865234375, 31.29296875, 32.71728515625, 34.1416015625, 35.56591796875, 36.990234375, 38.41455078125, 39.8388671875, 41.26318359375, 42.6875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 14.0, 11.0, 16.0, 19.0, 31.0, 29.0, 40.0, 44.0, 62.0, 75.0, 111.0, 124.0, 182.0, 212.0, 318.0, 388.0, 458.0, 436.0, 359.0, 252.0, 183.0, 170.0, 98.0, 97.0, 75.0, 55.0, 42.0, 32.0, 27.0, 24.0, 18.0, 15.0, 7.0, 12.0, 5.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-16.046875, -15.54052734375, -15.0341796875, -14.52783203125, -14.021484375, -13.51513671875, -13.0087890625, -12.50244140625, -11.99609375, -11.48974609375, -10.9833984375, -10.47705078125, -9.970703125, -9.46435546875, -8.9580078125, -8.45166015625, -7.9453125, -7.43896484375, -6.9326171875, -6.42626953125, -5.919921875, -5.41357421875, -4.9072265625, -4.40087890625, -3.89453125, -3.38818359375, -2.8818359375, -2.37548828125, -1.869140625, -1.36279296875, -0.8564453125, -0.35009765625, 0.15625, 0.66259765625, 1.1689453125, 1.67529296875, 2.181640625, 2.68798828125, 3.1943359375, 3.70068359375, 4.20703125, 4.71337890625, 5.2197265625, 5.72607421875, 6.232421875, 6.73876953125, 7.2451171875, 7.75146484375, 8.2578125, 8.76416015625, 9.2705078125, 9.77685546875, 10.283203125, 10.78955078125, 11.2958984375, 11.80224609375, 12.30859375, 12.81494140625, 13.3212890625, 13.82763671875, 14.333984375, 14.84033203125, 15.3466796875, 15.85302734375, 16.359375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 4.0, 9.0, 12.0, 13.0, 11.0, 17.0, 15.0, 32.0, 25.0, 50.0, 72.0, 65.0, 93.0, 88.0, 153.0, 221.0, 278.0, 477.0, 1382.0, 100097.0, 4078125.0, 10900.0, 732.0, 349.0, 218.0, 161.0, 132.0, 117.0, 104.0, 73.0, 52.0, 40.0, 37.0, 23.0, 21.0, 18.0, 18.0, 11.0, 7.0, 4.0, 10.0, 3.0, 2.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.0, -95.734375, -92.46875, -89.203125, -85.9375, -82.671875, -79.40625, -76.140625, -72.875, -69.609375, -66.34375, -63.078125, -59.8125, -56.546875, -53.28125, -50.015625, -46.75, -43.484375, -40.21875, -36.953125, -33.6875, -30.421875, -27.15625, -23.890625, -20.625, -17.359375, -14.09375, -10.828125, -7.5625, -4.296875, -1.03125, 2.234375, 5.5, 8.765625, 12.03125, 15.296875, 18.5625, 21.828125, 25.09375, 28.359375, 31.625, 34.890625, 38.15625, 41.421875, 44.6875, 47.953125, 51.21875, 54.484375, 57.75, 61.015625, 64.28125, 67.546875, 70.8125, 74.078125, 77.34375, 80.609375, 83.875, 87.140625, 90.40625, 93.671875, 96.9375, 100.203125, 103.46875, 106.734375, 110.0]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 13.0, 765.0, 236.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-816.59521484375, -797.9414672851562, -779.2877197265625, -760.6339721679688, -741.980224609375, -723.3264770507812, -704.6727294921875, -686.0189819335938, -667.365234375, -648.7114868164062, -630.0577392578125, -611.4039916992188, -592.750244140625, -574.0964965820312, -555.4427490234375, -536.7890014648438, -518.13525390625, -499.48150634765625, -480.8277587890625, -462.17401123046875, -443.520263671875, -424.86651611328125, -406.2127685546875, -387.55902099609375, -368.9052734375, -350.25152587890625, -331.5977783203125, -312.94403076171875, -294.290283203125, -275.63653564453125, -256.9827880859375, -238.32904052734375, -219.67523193359375, -201.021484375, -182.36773681640625, -163.7139892578125, -145.06024169921875, -126.406494140625, -107.75274658203125, -89.0989990234375, -70.44525146484375, -51.79150390625, -33.13775634765625, -14.4840087890625, 4.16973876953125, 22.823486328125, 41.47723388671875, 60.1309814453125, 78.78472900390625, 97.4384765625, 116.09222412109375, 134.7459716796875, 153.39971923828125, 172.053466796875, 190.70721435546875, 209.3609619140625, 228.01470947265625, 246.66845703125, 265.32220458984375, 283.9759521484375, 302.62969970703125, 321.283447265625, 339.93719482421875, 358.5909423828125, 377.24468994140625]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 7.0, 2.0, 2.0, 8.0, 6.0, 15.0, 15.0, 15.0, 17.0, 19.0, 24.0, 18.0, 22.0, 35.0, 29.0, 33.0, 27.0, 30.0, 42.0, 33.0, 45.0, 40.0, 41.0, 28.0, 50.0, 39.0, 38.0, 41.0, 34.0, 30.0, 26.0, 23.0, 30.0, 17.0, 24.0, 27.0, 14.0, 13.0, 7.0, 5.0, 10.0, 6.0, 4.0, 3.0, 5.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-61.996986389160156, -59.94422149658203, -57.89146041870117, -55.83869552612305, -53.78593444824219, -51.73316955566406, -49.68040466308594, -47.62763977050781, -45.57487869262695, -43.52211380004883, -41.46935272216797, -39.416587829589844, -37.36382293701172, -35.31106185913086, -33.258296966552734, -31.205533981323242, -29.15277099609375, -27.100008010864258, -25.047245025634766, -22.99448013305664, -20.94171714782715, -18.888954162597656, -16.83618927001953, -14.783426284790039, -12.730663299560547, -10.677900314331055, -8.625136375427246, -6.572372913360596, -4.519609451293945, -2.466846466064453, -0.41408252716064453, 1.638681411743164, 3.6914443969726562, 5.744207859039307, 7.796971321105957, 9.849735260009766, 11.902498245239258, 13.95526123046875, 16.008026123046875, 18.060789108276367, 20.11355209350586, 22.16631507873535, 24.219078063964844, 26.27184295654297, 28.32460594177246, 30.377368927001953, 32.43013381958008, 34.48289489746094, 36.53565979003906, 38.58842468261719, 40.64118576049805, 42.69395065307617, 44.74671173095703, 46.799476623535156, 48.85224151611328, 50.905006408691406, 52.957767486572266, 55.01053237915039, 57.06329345703125, 59.116058349609375, 61.1688232421875, 63.22158432006836, 65.27434539794922, 67.32711029052734, 69.37987518310547]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 7.0, 7.0, 12.0, 7.0, 11.0, 16.0, 16.0, 11.0, 20.0, 22.0, 23.0, 18.0, 37.0, 35.0, 35.0, 38.0, 40.0, 32.0, 37.0, 49.0, 37.0, 49.0, 36.0, 38.0, 31.0, 34.0, 33.0, 35.0, 26.0, 28.0, 25.0, 19.0, 27.0, 17.0, 14.0, 20.0, 9.0, 11.0, 9.0, 9.0, 5.0, 4.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.6484375, -11.29248046875, -10.9365234375, -10.58056640625, -10.224609375, -9.86865234375, -9.5126953125, -9.15673828125, -8.80078125, -8.44482421875, -8.0888671875, -7.73291015625, -7.376953125, -7.02099609375, -6.6650390625, -6.30908203125, -5.953125, -5.59716796875, -5.2412109375, -4.88525390625, -4.529296875, -4.17333984375, -3.8173828125, -3.46142578125, -3.10546875, -2.74951171875, -2.3935546875, -2.03759765625, -1.681640625, -1.32568359375, -0.9697265625, -0.61376953125, -0.2578125, 0.09814453125, 0.4541015625, 0.81005859375, 1.166015625, 1.52197265625, 1.8779296875, 2.23388671875, 2.58984375, 2.94580078125, 3.3017578125, 3.65771484375, 4.013671875, 4.36962890625, 4.7255859375, 5.08154296875, 5.4375, 5.79345703125, 6.1494140625, 6.50537109375, 6.861328125, 7.21728515625, 7.5732421875, 7.92919921875, 8.28515625, 8.64111328125, 8.9970703125, 9.35302734375, 9.708984375, 10.06494140625, 10.4208984375, 10.77685546875, 11.1328125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 7.0, 7.0, 5.0, 7.0, 12.0, 28.0, 37.0, 71.0, 64.0, 120.0, 175.0, 270.0, 405.0, 629.0, 954.0, 1473.0, 2278.0, 3495.0, 5524.0, 8903.0, 14192.0, 23367.0, 39098.0, 68347.0, 127959.0, 345019.0, 188257.0, 90010.0, 50286.0, 29638.0, 17837.0, 11012.0, 6829.0, 4314.0, 2778.0, 1785.0, 1169.0, 739.0, 491.0, 329.0, 230.0, 124.0, 101.0, 63.0, 46.0, 30.0, 17.0, 13.0, 11.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.62890625, -2.548583984375, -2.46826171875, -2.387939453125, -2.3076171875, -2.227294921875, -2.14697265625, -2.066650390625, -1.986328125, -1.906005859375, -1.82568359375, -1.745361328125, -1.6650390625, -1.584716796875, -1.50439453125, -1.424072265625, -1.34375, -1.263427734375, -1.18310546875, -1.102783203125, -1.0224609375, -0.942138671875, -0.86181640625, -0.781494140625, -0.701171875, -0.620849609375, -0.54052734375, -0.460205078125, -0.3798828125, -0.299560546875, -0.21923828125, -0.138916015625, -0.05859375, 0.021728515625, 0.10205078125, 0.182373046875, 0.2626953125, 0.343017578125, 0.42333984375, 0.503662109375, 0.583984375, 0.664306640625, 0.74462890625, 0.824951171875, 0.9052734375, 0.985595703125, 1.06591796875, 1.146240234375, 1.2265625, 1.306884765625, 1.38720703125, 1.467529296875, 1.5478515625, 1.628173828125, 1.70849609375, 1.788818359375, 1.869140625, 1.949462890625, 2.02978515625, 2.110107421875, 2.1904296875, 2.270751953125, 2.35107421875, 2.431396484375, 2.51171875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 4.0, 3.0, 8.0, 2.0, 4.0, 6.0, 11.0, 6.0, 10.0, 13.0, 14.0, 8.0, 16.0, 18.0, 27.0, 21.0, 30.0, 30.0, 30.0, 44.0, 39.0, 33.0, 31.0, 44.0, 32.0, 1058.0, 48.0, 33.0, 44.0, 32.0, 23.0, 23.0, 33.0, 33.0, 27.0, 23.0, 30.0, 12.0, 23.0, 20.0, 15.0, 20.0, 7.0, 10.0, 4.0, 4.0, 5.0, 3.0, 6.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-6.76953125, -6.56085205078125, -6.3521728515625, -6.14349365234375, -5.934814453125, -5.72613525390625, -5.5174560546875, -5.30877685546875, -5.10009765625, -4.89141845703125, -4.6827392578125, -4.47406005859375, -4.265380859375, -4.05670166015625, -3.8480224609375, -3.63934326171875, -3.4306640625, -3.22198486328125, -3.0133056640625, -2.80462646484375, -2.595947265625, -2.38726806640625, -2.1785888671875, -1.96990966796875, -1.76123046875, -1.55255126953125, -1.3438720703125, -1.13519287109375, -0.926513671875, -0.71783447265625, -0.5091552734375, -0.30047607421875, -0.091796875, 0.11688232421875, 0.3255615234375, 0.53424072265625, 0.742919921875, 0.95159912109375, 1.1602783203125, 1.36895751953125, 1.57763671875, 1.78631591796875, 1.9949951171875, 2.20367431640625, 2.412353515625, 2.62103271484375, 2.8297119140625, 3.03839111328125, 3.2470703125, 3.45574951171875, 3.6644287109375, 3.87310791015625, 4.081787109375, 4.29046630859375, 4.4991455078125, 4.70782470703125, 4.91650390625, 5.12518310546875, 5.3338623046875, 5.54254150390625, 5.751220703125, 5.95989990234375, 6.1685791015625, 6.37725830078125, 6.5859375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 10.0, 10.0, 7.0, 26.0, 32.0, 29.0, 46.0, 71.0, 91.0, 127.0, 194.0, 313.0, 457.0, 701.0, 907.0, 1398.0, 1940.0, 2844.0, 4216.0, 6351.0, 9311.0, 13652.0, 20728.0, 31632.0, 49666.0, 83351.0, 165927.0, 1366199.0, 134773.0, 72377.0, 44523.0, 28494.0, 18453.0, 12332.0, 7995.0, 5619.0, 3825.0, 2628.0, 1813.0, 1270.0, 865.0, 606.0, 391.0, 297.0, 200.0, 123.0, 92.0, 59.0, 43.0, 35.0, 36.0, 18.0, 12.0, 11.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.9736328125, -1.9107208251953125, -1.847808837890625, -1.7848968505859375, -1.72198486328125, -1.6590728759765625, -1.596160888671875, -1.5332489013671875, -1.4703369140625, -1.4074249267578125, -1.344512939453125, -1.2816009521484375, -1.21868896484375, -1.1557769775390625, -1.092864990234375, -1.0299530029296875, -0.967041015625, -0.9041290283203125, -0.841217041015625, -0.7783050537109375, -0.71539306640625, -0.6524810791015625, -0.589569091796875, -0.5266571044921875, -0.4637451171875, -0.4008331298828125, -0.337921142578125, -0.2750091552734375, -0.21209716796875, -0.1491851806640625, -0.086273193359375, -0.0233612060546875, 0.03955078125, 0.1024627685546875, 0.165374755859375, 0.2282867431640625, 0.29119873046875, 0.3541107177734375, 0.417022705078125, 0.4799346923828125, 0.5428466796875, 0.6057586669921875, 0.668670654296875, 0.7315826416015625, 0.79449462890625, 0.8574066162109375, 0.920318603515625, 0.9832305908203125, 1.046142578125, 1.1090545654296875, 1.171966552734375, 1.2348785400390625, 1.29779052734375, 1.3607025146484375, 1.423614501953125, 1.4865264892578125, 1.5494384765625, 1.6123504638671875, 1.675262451171875, 1.7381744384765625, 1.80108642578125, 1.8639984130859375, 1.926910400390625, 1.9898223876953125, 2.052734375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 5.0, 6.0, 13.0, 11.0, 17.0, 25.0, 24.0, 42.0, 44.0, 54.0, 82.0, 78.0, 88.0, 95.0, 71.0, 56.0, 65.0, 50.0, 39.0, 24.0, 29.0, 12.0, 10.0, 14.0, 4.0, 9.0, 9.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015087127685546875, -0.0014614611864089966, -0.0014142096042633057, -0.0013669580221176147, -0.0013197064399719238, -0.001272454857826233, -0.001225203275680542, -0.001177951693534851, -0.0011307001113891602, -0.0010834485292434692, -0.0010361969470977783, -0.0009889453649520874, -0.0009416937828063965, -0.0008944422006607056, -0.0008471906185150146, -0.0007999390363693237, -0.0007526874542236328, -0.0007054358720779419, -0.000658184289932251, -0.0006109327077865601, -0.0005636811256408691, -0.0005164295434951782, -0.0004691779613494873, -0.0004219263792037964, -0.00037467479705810547, -0.00032742321491241455, -0.00028017163276672363, -0.00023292005062103271, -0.0001856684684753418, -0.00013841688632965088, -9.116530418395996e-05, -4.391372203826904e-05, 3.337860107421875e-06, 5.058944225311279e-05, 9.784102439880371e-05, 0.00014509260654449463, 0.00019234418869018555, 0.00023959577083587646, 0.0002868473529815674, 0.0003340989351272583, 0.0003813505172729492, 0.00042860209941864014, 0.00047585368156433105, 0.000523105263710022, 0.0005703568458557129, 0.0006176084280014038, 0.0006648600101470947, 0.0007121115922927856, 0.0007593631744384766, 0.0008066147565841675, 0.0008538663387298584, 0.0009011179208755493, 0.0009483695030212402, 0.0009956210851669312, 0.001042872667312622, 0.001090124249458313, 0.001137375831604004, 0.0011846274137496948, 0.0012318789958953857, 0.0012791305780410767, 0.0013263821601867676, 0.0013736337423324585, 0.0014208853244781494, 0.0014681369066238403, 0.0015153884887695312]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 6.0, 6.0, 13.0, 8.0, 13.0, 18.0, 19.0, 34.0, 47.0, 46.0, 68.0, 109.0, 157.0, 364.0, 1057.0, 886079.0, 158896.0, 828.0, 301.0, 122.0, 100.0, 75.0, 43.0, 33.0, 26.0, 12.0, 19.0, 16.0, 10.0, 8.0, 3.0, 6.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.03411865234375, -0.033082008361816406, -0.03204536437988281, -0.03100872039794922, -0.029972076416015625, -0.02893543243408203, -0.027898788452148438, -0.026862144470214844, -0.02582550048828125, -0.024788856506347656, -0.023752212524414062, -0.02271556854248047, -0.021678924560546875, -0.02064228057861328, -0.019605636596679688, -0.018568992614746094, -0.0175323486328125, -0.016495704650878906, -0.015459060668945312, -0.014422416687011719, -0.013385772705078125, -0.012349128723144531, -0.011312484741210938, -0.010275840759277344, -0.00923919677734375, -0.008202552795410156, -0.0071659088134765625, -0.006129264831542969, -0.005092620849609375, -0.004055976867675781, -0.0030193328857421875, -0.0019826889038085938, -0.000946044921875, 9.059906005859375e-05, 0.0011272430419921875, 0.0021638870239257812, 0.003200531005859375, 0.004237174987792969, 0.0052738189697265625, 0.006310462951660156, 0.00734710693359375, 0.008383750915527344, 0.009420394897460938, 0.010457038879394531, 0.011493682861328125, 0.012530326843261719, 0.013566970825195312, 0.014603614807128906, 0.0156402587890625, 0.016676902770996094, 0.017713546752929688, 0.01875019073486328, 0.019786834716796875, 0.02082347869873047, 0.021860122680664062, 0.022896766662597656, 0.02393341064453125, 0.024970054626464844, 0.026006698608398438, 0.02704334259033203, 0.028079986572265625, 0.02911663055419922, 0.030153274536132812, 0.031189918518066406, 0.0322265625]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 14.0, 50.0, 139.0, 267.0, 268.0, 173.0, 70.0, 20.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007206786540336907, -0.0006731952307745814, -0.0006257118075154722, -0.0005782283842563629, -0.0005307449027895927, -0.00048326150863431394, -0.0004357780562713742, -0.00038829463301226497, -0.0003408112097531557, -0.00029332778649404645, -0.0002458443632349372, -0.00019836091087199748, -0.00015087748761288822, -0.00010339406435377896, -5.591061199083924e-05, -8.427188731729984e-06, 3.9056234527379274e-05, 8.653966506244615e-05, 0.00013402309559751302, 0.0001815065334085375, 0.00022898995666764677, 0.000276473379926756, 0.00032395683228969574, 0.000371440255548805, 0.00041892367880791426, 0.0004664071020670235, 0.0005138905253261328, 0.000561374006792903, 0.0006088573718443513, 0.0006563408533111215, 0.0007038242765702307, 0.00075130769982934, 0.0007987911812961102, 0.0008462746045552194, 0.0008937580278143287, 0.0009412415092810988, 0.0009887248743325472, 0.0010362083557993174, 0.0010836918372660875, 0.0011311752023175359, 0.0011786585673689842, 0.0012261420488357544, 0.0012736254138872027, 0.001321108895353973, 0.0013685922604054213, 0.0014160757418721914, 0.0014635592233389616, 0.00151104258839041, 0.0015585260698571801, 0.0016060095513239503, 0.0016534929163753986, 0.0017009763978421688, 0.0017484597628936172, 0.0017959432443603873, 0.0018434266094118357, 0.0018909100908786058, 0.001938393572345376, 0.001985877053812146, 0.0020333605352789164, 0.002080843783915043, 0.002128327265381813, 0.0021758107468485832, 0.0022232942283153534, 0.0022707777097821236, 0.00231826095841825]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 3.0, 8.0, 5.0, 10.0, 10.0, 8.0, 14.0, 13.0, 12.0, 27.0, 19.0, 23.0, 21.0, 27.0, 34.0, 38.0, 38.0, 42.0, 32.0, 56.0, 39.0, 38.0, 40.0, 42.0, 36.0, 37.0, 37.0, 33.0, 39.0, 28.0, 22.0, 29.0, 15.0, 25.0, 24.0, 13.0, 14.0, 18.0, 6.0, 4.0, 4.0, 6.0, 4.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.000668942928314209, -0.0006496105343103409, -0.0006302781403064728, -0.0006109457463026047, -0.0005916133522987366, -0.0005722809582948685, -0.0005529485642910004, -0.0005336161702871323, -0.0005142837762832642, -0.0004949513822793961, -0.00047561898827552795, -0.00045628659427165985, -0.00043695420026779175, -0.00041762180626392365, -0.00039828941226005554, -0.00037895701825618744, -0.00035962462425231934, -0.00034029223024845123, -0.00032095983624458313, -0.000301627442240715, -0.0002822950482368469, -0.0002629626542329788, -0.00024363026022911072, -0.00022429786622524261, -0.0002049654722213745, -0.0001856330782175064, -0.0001663006842136383, -0.0001469682902097702, -0.0001276358962059021, -0.000108303502202034, -8.89711081981659e-05, -6.963871419429779e-05, -5.030632019042969e-05, -3.0973926186561584e-05, -1.1641532182693481e-05, 7.690861821174622e-06, 2.7023255825042725e-05, 4.635564982891083e-05, 6.568804383277893e-05, 8.502043783664703e-05, 0.00010435283184051514, 0.00012368522584438324, 0.00014301761984825134, 0.00016235001385211945, 0.00018168240785598755, 0.00020101480185985565, 0.00022034719586372375, 0.00023967958986759186, 0.00025901198387145996, 0.00027834437787532806, 0.00029767677187919617, 0.00031700916588306427, 0.0003363415598869324, 0.0003556739538908005, 0.0003750063478946686, 0.0003943387418985367, 0.0004136711359024048, 0.0004330035299062729, 0.000452335923910141, 0.0004716683179140091, 0.0004910007119178772, 0.0005103331059217453, 0.0005296654999256134, 0.0005489978939294815, 0.0005683302879333496]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 7.0, 7.0, 12.0, 7.0, 11.0, 16.0, 16.0, 11.0, 20.0, 22.0, 23.0, 18.0, 37.0, 35.0, 35.0, 38.0, 40.0, 32.0, 37.0, 49.0, 37.0, 49.0, 36.0, 38.0, 31.0, 34.0, 33.0, 35.0, 26.0, 28.0, 25.0, 19.0, 27.0, 17.0, 14.0, 20.0, 9.0, 11.0, 9.0, 9.0, 5.0, 4.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.6484375, -11.29248046875, -10.9365234375, -10.58056640625, -10.224609375, -9.86865234375, -9.5126953125, -9.15673828125, -8.80078125, -8.44482421875, -8.0888671875, -7.73291015625, -7.376953125, -7.02099609375, -6.6650390625, -6.30908203125, -5.953125, -5.59716796875, -5.2412109375, -4.88525390625, -4.529296875, -4.17333984375, -3.8173828125, -3.46142578125, -3.10546875, -2.74951171875, -2.3935546875, -2.03759765625, -1.681640625, -1.32568359375, -0.9697265625, -0.61376953125, -0.2578125, 0.09814453125, 0.4541015625, 0.81005859375, 1.166015625, 1.52197265625, 1.8779296875, 2.23388671875, 2.58984375, 2.94580078125, 3.3017578125, 3.65771484375, 4.013671875, 4.36962890625, 4.7255859375, 5.08154296875, 5.4375, 5.79345703125, 6.1494140625, 6.50537109375, 6.861328125, 7.21728515625, 7.5732421875, 7.92919921875, 8.28515625, 8.64111328125, 8.9970703125, 9.35302734375, 9.708984375, 10.06494140625, 10.4208984375, 10.77685546875, 11.1328125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 7.0, 7.0, 12.0, 8.0, 11.0, 24.0, 23.0, 17.0, 26.0, 39.0, 54.0, 74.0, 117.0, 164.0, 225.0, 315.0, 590.0, 1494.0, 7526.0, 58859.0, 665810.0, 281025.0, 25754.0, 3883.0, 1045.0, 428.0, 294.0, 192.0, 132.0, 94.0, 73.0, 46.0, 43.0, 31.0, 17.0, 28.0, 10.0, 12.0, 8.0, 13.0, 6.0, 4.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.765625, -22.07177734375, -21.3779296875, -20.68408203125, -19.990234375, -19.29638671875, -18.6025390625, -17.90869140625, -17.21484375, -16.52099609375, -15.8271484375, -15.13330078125, -14.439453125, -13.74560546875, -13.0517578125, -12.35791015625, -11.6640625, -10.97021484375, -10.2763671875, -9.58251953125, -8.888671875, -8.19482421875, -7.5009765625, -6.80712890625, -6.11328125, -5.41943359375, -4.7255859375, -4.03173828125, -3.337890625, -2.64404296875, -1.9501953125, -1.25634765625, -0.5625, 0.13134765625, 0.8251953125, 1.51904296875, 2.212890625, 2.90673828125, 3.6005859375, 4.29443359375, 4.98828125, 5.68212890625, 6.3759765625, 7.06982421875, 7.763671875, 8.45751953125, 9.1513671875, 9.84521484375, 10.5390625, 11.23291015625, 11.9267578125, 12.62060546875, 13.314453125, 14.00830078125, 14.7021484375, 15.39599609375, 16.08984375, 16.78369140625, 17.4775390625, 18.17138671875, 18.865234375, 19.55908203125, 20.2529296875, 20.94677734375, 21.640625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 3.0, 7.0, 8.0, 12.0, 10.0, 12.0, 19.0, 20.0, 28.0, 39.0, 35.0, 45.0, 61.0, 69.0, 73.0, 122.0, 1723.0, 280.0, 96.0, 67.0, 64.0, 41.0, 41.0, 32.0, 34.0, 20.0, 20.0, 18.0, 16.0, 13.0, 3.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.625, -43.01806640625, -41.4111328125, -39.80419921875, -38.197265625, -36.59033203125, -34.9833984375, -33.37646484375, -31.76953125, -30.16259765625, -28.5556640625, -26.94873046875, -25.341796875, -23.73486328125, -22.1279296875, -20.52099609375, -18.9140625, -17.30712890625, -15.7001953125, -14.09326171875, -12.486328125, -10.87939453125, -9.2724609375, -7.66552734375, -6.05859375, -4.45166015625, -2.8447265625, -1.23779296875, 0.369140625, 1.97607421875, 3.5830078125, 5.18994140625, 6.796875, 8.40380859375, 10.0107421875, 11.61767578125, 13.224609375, 14.83154296875, 16.4384765625, 18.04541015625, 19.65234375, 21.25927734375, 22.8662109375, 24.47314453125, 26.080078125, 27.68701171875, 29.2939453125, 30.90087890625, 32.5078125, 34.11474609375, 35.7216796875, 37.32861328125, 38.935546875, 40.54248046875, 42.1494140625, 43.75634765625, 45.36328125, 46.97021484375, 48.5771484375, 50.18408203125, 51.791015625, 53.39794921875, 55.0048828125, 56.61181640625, 58.21875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 8.0, 6.0, 11.0, 16.0, 17.0, 17.0, 36.0, 34.0, 69.0, 63.0, 125.0, 162.0, 415.0, 1181.0, 49074.0, 3089976.0, 3199.0, 554.0, 235.0, 153.0, 98.0, 61.0, 54.0, 27.0, 25.0, 17.0, 12.0, 15.0, 12.0, 10.0, 9.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-134.625, -130.9091796875, -127.193359375, -123.4775390625, -119.76171875, -116.0458984375, -112.330078125, -108.6142578125, -104.8984375, -101.1826171875, -97.466796875, -93.7509765625, -90.03515625, -86.3193359375, -82.603515625, -78.8876953125, -75.171875, -71.4560546875, -67.740234375, -64.0244140625, -60.30859375, -56.5927734375, -52.876953125, -49.1611328125, -45.4453125, -41.7294921875, -38.013671875, -34.2978515625, -30.58203125, -26.8662109375, -23.150390625, -19.4345703125, -15.71875, -12.0029296875, -8.287109375, -4.5712890625, -0.85546875, 2.8603515625, 6.576171875, 10.2919921875, 14.0078125, 17.7236328125, 21.439453125, 25.1552734375, 28.87109375, 32.5869140625, 36.302734375, 40.0185546875, 43.734375, 47.4501953125, 51.166015625, 54.8818359375, 58.59765625, 62.3134765625, 66.029296875, 69.7451171875, 73.4609375, 77.1767578125, 80.892578125, 84.6083984375, 88.32421875, 92.0400390625, 95.755859375, 99.4716796875, 103.1875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 16.0, 102.0, 503.0, 342.0, 49.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.08769607543945, -37.3053092956543, -32.52292251586914, -27.740535736083984, -22.958148956298828, -18.175762176513672, -13.393375396728516, -8.61098861694336, -3.828601837158203, 0.9537849426269531, 5.736171722412109, 10.518558502197266, 15.300945281982422, 20.083332061767578, 24.865718841552734, 29.64810562133789, 34.43049240112305, 39.2128791809082, 43.99526596069336, 48.777652740478516, 53.56003952026367, 58.34242630004883, 63.124813079833984, 67.90719604492188, 72.68959045410156, 77.47197723388672, 82.25436401367188, 87.03675079345703, 91.81913757324219, 96.60152435302734, 101.3839111328125, 106.16629791259766, 110.94866943359375, 115.7310562133789, 120.51344299316406, 125.29582977294922, 130.07821655273438, 134.860595703125, 139.6429901123047, 144.42538452148438, 149.207763671875, 153.99014282226562, 158.7725372314453, 163.554931640625, 168.33731079101562, 173.11968994140625, 177.90208435058594, 182.68447875976562, 187.46685791015625, 192.24923706054688, 197.03163146972656, 201.81402587890625, 206.59640502929688, 211.3787841796875, 216.1611785888672, 220.94357299804688, 225.7259521484375, 230.50833129882812, 235.2907257080078, 240.0731201171875, 244.85549926757812, 249.63787841796875, 254.42027282714844, 259.2026672363281, 263.98504638671875]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 7.0, 3.0, 7.0, 3.0, 8.0, 7.0, 11.0, 12.0, 15.0, 21.0, 17.0, 19.0, 23.0, 28.0, 29.0, 33.0, 47.0, 35.0, 37.0, 32.0, 37.0, 34.0, 28.0, 51.0, 36.0, 37.0, 36.0, 45.0, 33.0, 33.0, 35.0, 23.0, 21.0, 23.0, 22.0, 15.0, 18.0, 15.0, 6.0, 7.0, 13.0, 4.0, 8.0, 6.0, 6.0, 3.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-101.98184204101562, -98.71770477294922, -95.45356750488281, -92.1894302368164, -88.92529296875, -85.6611557006836, -82.39701843261719, -79.13288116455078, -75.86874389648438, -72.60460662841797, -69.34046936035156, -66.07633209228516, -62.81219482421875, -59.548057556152344, -56.28392028808594, -53.01978302001953, -49.75564193725586, -46.49150466918945, -43.22736740112305, -39.96323013305664, -36.699092864990234, -33.43495178222656, -30.17081642150879, -26.906679153442383, -23.642541885375977, -20.37840461730957, -17.114267349243164, -13.850129127502441, -10.585991859436035, -7.3218536376953125, -4.057716369628906, -0.7935791015625, 2.4705581665039062, 5.7346954345703125, 8.998832702636719, 12.262970924377441, 15.527108192443848, 18.79124641418457, 22.055383682250977, 25.319520950317383, 28.58365821838379, 31.847795486450195, 35.111934661865234, 38.37607192993164, 41.64020919799805, 44.90434646606445, 48.16848373413086, 51.432621002197266, 54.69675827026367, 57.96089553833008, 61.225032806396484, 64.48917388916016, 67.75331115722656, 71.01744842529297, 74.28158569335938, 77.54572296142578, 80.80986022949219, 84.0739974975586, 87.338134765625, 90.6022720336914, 93.86640930175781, 97.13054656982422, 100.39468383789062, 103.65882110595703, 106.92295837402344]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 6.0, 5.0, 6.0, 8.0, 9.0, 11.0, 22.0, 19.0, 17.0, 23.0, 19.0, 29.0, 33.0, 28.0, 44.0, 43.0, 39.0, 47.0, 50.0, 38.0, 41.0, 31.0, 39.0, 40.0, 41.0, 48.0, 30.0, 25.0, 27.0, 29.0, 22.0, 29.0, 20.0, 13.0, 18.0, 16.0, 8.0, 7.0, 5.0, 6.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.765625, -11.3648681640625, -10.964111328125, -10.5633544921875, -10.16259765625, -9.7618408203125, -9.361083984375, -8.9603271484375, -8.5595703125, -8.1588134765625, -7.758056640625, -7.3572998046875, -6.95654296875, -6.5557861328125, -6.155029296875, -5.7542724609375, -5.353515625, -4.9527587890625, -4.552001953125, -4.1512451171875, -3.75048828125, -3.3497314453125, -2.948974609375, -2.5482177734375, -2.1474609375, -1.7467041015625, -1.345947265625, -0.9451904296875, -0.54443359375, -0.1436767578125, 0.257080078125, 0.6578369140625, 1.05859375, 1.4593505859375, 1.860107421875, 2.2608642578125, 2.66162109375, 3.0623779296875, 3.463134765625, 3.8638916015625, 4.2646484375, 4.6654052734375, 5.066162109375, 5.4669189453125, 5.86767578125, 6.2684326171875, 6.669189453125, 7.0699462890625, 7.470703125, 7.8714599609375, 8.272216796875, 8.6729736328125, 9.07373046875, 9.4744873046875, 9.875244140625, 10.2760009765625, 10.6767578125, 11.0775146484375, 11.478271484375, 11.8790283203125, 12.27978515625, 12.6805419921875, 13.081298828125, 13.4820556640625, 13.8828125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 3.0, 6.0, 4.0, 9.0, 11.0, 12.0, 10.0, 9.0, 19.0, 21.0, 24.0, 49.0, 42.0, 65.0, 107.0, 162.0, 237.0, 627.0, 2287.0, 20660.0, 1454666.0, 2665415.0, 44948.0, 3231.0, 750.0, 320.0, 160.0, 107.0, 72.0, 54.0, 43.0, 23.0, 30.0, 26.0, 17.0, 17.0, 8.0, 6.0, 7.0, 5.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.125, -38.87548828125, -37.6259765625, -36.37646484375, -35.126953125, -33.87744140625, -32.6279296875, -31.37841796875, -30.12890625, -28.87939453125, -27.6298828125, -26.38037109375, -25.130859375, -23.88134765625, -22.6318359375, -21.38232421875, -20.1328125, -18.88330078125, -17.6337890625, -16.38427734375, -15.134765625, -13.88525390625, -12.6357421875, -11.38623046875, -10.13671875, -8.88720703125, -7.6376953125, -6.38818359375, -5.138671875, -3.88916015625, -2.6396484375, -1.39013671875, -0.140625, 1.10888671875, 2.3583984375, 3.60791015625, 4.857421875, 6.10693359375, 7.3564453125, 8.60595703125, 9.85546875, 11.10498046875, 12.3544921875, 13.60400390625, 14.853515625, 16.10302734375, 17.3525390625, 18.60205078125, 19.8515625, 21.10107421875, 22.3505859375, 23.60009765625, 24.849609375, 26.09912109375, 27.3486328125, 28.59814453125, 29.84765625, 31.09716796875, 32.3466796875, 33.59619140625, 34.845703125, 36.09521484375, 37.3447265625, 38.59423828125, 39.84375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 4.0, 18.0, 23.0, 44.0, 58.0, 98.0, 177.0, 272.0, 426.0, 695.0, 800.0, 561.0, 330.0, 217.0, 135.0, 84.0, 52.0, 21.0, 19.0, 13.0, 6.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-41.9375, -40.989013671875, -40.04052734375, -39.092041015625, -38.1435546875, -37.195068359375, -36.24658203125, -35.298095703125, -34.349609375, -33.401123046875, -32.45263671875, -31.504150390625, -30.5556640625, -29.607177734375, -28.65869140625, -27.710205078125, -26.76171875, -25.813232421875, -24.86474609375, -23.916259765625, -22.9677734375, -22.019287109375, -21.07080078125, -20.122314453125, -19.173828125, -18.225341796875, -17.27685546875, -16.328369140625, -15.3798828125, -14.431396484375, -13.48291015625, -12.534423828125, -11.5859375, -10.637451171875, -9.68896484375, -8.740478515625, -7.7919921875, -6.843505859375, -5.89501953125, -4.946533203125, -3.998046875, -3.049560546875, -2.10107421875, -1.152587890625, -0.2041015625, 0.744384765625, 1.69287109375, 2.641357421875, 3.58984375, 4.538330078125, 5.48681640625, 6.435302734375, 7.3837890625, 8.332275390625, 9.28076171875, 10.229248046875, 11.177734375, 12.126220703125, 13.07470703125, 14.023193359375, 14.9716796875, 15.920166015625, 16.86865234375, 17.817138671875, 18.765625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 11.0, 12.0, 19.0, 20.0, 36.0, 38.0, 29.0, 45.0, 88.0, 81.0, 124.0, 186.0, 307.0, 559.0, 1460.0, 24900.0, 4115203.0, 48004.0, 1609.0, 497.0, 308.0, 168.0, 144.0, 85.0, 76.0, 75.0, 42.0, 36.0, 21.0, 22.0, 16.0, 13.0, 5.0, 10.0, 5.0, 4.0, 3.0, 5.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.75, -91.6494140625, -88.548828125, -85.4482421875, -82.34765625, -79.2470703125, -76.146484375, -73.0458984375, -69.9453125, -66.8447265625, -63.744140625, -60.6435546875, -57.54296875, -54.4423828125, -51.341796875, -48.2412109375, -45.140625, -42.0400390625, -38.939453125, -35.8388671875, -32.73828125, -29.6376953125, -26.537109375, -23.4365234375, -20.3359375, -17.2353515625, -14.134765625, -11.0341796875, -7.93359375, -4.8330078125, -1.732421875, 1.3681640625, 4.46875, 7.5693359375, 10.669921875, 13.7705078125, 16.87109375, 19.9716796875, 23.072265625, 26.1728515625, 29.2734375, 32.3740234375, 35.474609375, 38.5751953125, 41.67578125, 44.7763671875, 47.876953125, 50.9775390625, 54.078125, 57.1787109375, 60.279296875, 63.3798828125, 66.48046875, 69.5810546875, 72.681640625, 75.7822265625, 78.8828125, 81.9833984375, 85.083984375, 88.1845703125, 91.28515625, 94.3857421875, 97.486328125, 100.5869140625, 103.6875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 125.0, 738.0, 147.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-667.907470703125, -655.1900024414062, -642.4725952148438, -629.755126953125, -617.0377197265625, -604.3202514648438, -591.602783203125, -578.8853759765625, -566.1679077148438, -553.450439453125, -540.7330322265625, -528.0155639648438, -515.2981567382812, -502.5806884765625, -489.8632507324219, -477.14581298828125, -464.4283752441406, -451.7109375, -438.9934997558594, -426.27606201171875, -413.55859375, -400.8411560058594, -388.12371826171875, -375.4062805175781, -362.6888427734375, -349.9714050292969, -337.25396728515625, -324.5364990234375, -311.8190612792969, -299.10162353515625, -286.3841857910156, -273.666748046875, -260.94927978515625, -248.23184204101562, -235.51438903808594, -222.7969512939453, -210.07949829101562, -197.362060546875, -184.64462280273438, -171.92718505859375, -159.209716796875, -146.49227905273438, -133.7748260498047, -121.05738830566406, -108.3399429321289, -95.62249755859375, -82.90505981445312, -70.18761444091797, -57.47016906738281, -44.752723693847656, -32.035282135009766, -19.317840576171875, -6.600395202636719, 6.1170501708984375, 18.834487915039062, 31.55193328857422, 44.269378662109375, 56.98682403564453, 69.70426940917969, 82.42170715332031, 95.13915252685547, 107.85659790039062, 120.57403564453125, 133.29147338867188, 146.00892639160156]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 6.0, 7.0, 7.0, 5.0, 14.0, 6.0, 5.0, 10.0, 12.0, 23.0, 21.0, 24.0, 28.0, 30.0, 37.0, 34.0, 37.0, 31.0, 49.0, 47.0, 54.0, 59.0, 53.0, 49.0, 44.0, 37.0, 37.0, 45.0, 36.0, 25.0, 18.0, 18.0, 21.0, 20.0, 11.0, 12.0, 7.0, 7.0, 8.0, 6.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.1439208984375, -62.992645263671875, -60.841373443603516, -58.690101623535156, -56.53882598876953, -54.387550354003906, -52.23627853393555, -50.08500671386719, -47.93373107910156, -45.78245544433594, -43.63118362426758, -41.47991180419922, -39.328636169433594, -37.17736053466797, -35.02608871459961, -32.87481689453125, -30.723541259765625, -28.572267532348633, -26.42099380493164, -24.26972007751465, -22.118446350097656, -19.967172622680664, -17.815898895263672, -15.66462516784668, -13.513351440429688, -11.362077713012695, -9.210803985595703, -7.059530258178711, -4.908256530761719, -2.7569828033447266, -0.6057090759277344, 1.5455646514892578, 3.6968460083007812, 5.848119735717773, 7.999393463134766, 10.150667190551758, 12.30194091796875, 14.453214645385742, 16.604488372802734, 18.755762100219727, 20.90703582763672, 23.05830955505371, 25.209583282470703, 27.360857009887695, 29.512130737304688, 31.66340446472168, 33.81467819213867, 35.96595001220703, 38.117225646972656, 40.26850128173828, 42.41977310180664, 44.571044921875, 46.722320556640625, 48.87359619140625, 51.02486801147461, 53.17613983154297, 55.327415466308594, 57.47869110107422, 59.62996292114258, 61.78123474121094, 63.93251037597656, 66.08378601074219, 68.23506164550781, 70.3863296508789, 72.53760528564453]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 5.0, 2.0, 1.0, 5.0, 11.0, 6.0, 10.0, 10.0, 16.0, 22.0, 27.0, 23.0, 25.0, 18.0, 35.0, 36.0, 30.0, 34.0, 35.0, 43.0, 45.0, 40.0, 29.0, 38.0, 49.0, 42.0, 35.0, 39.0, 37.0, 35.0, 27.0, 26.0, 30.0, 17.0, 25.0, 19.0, 25.0, 8.0, 13.0, 7.0, 8.0, 4.0, 2.0, 4.0, 8.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.171875, -9.7777099609375, -9.383544921875, -8.9893798828125, -8.59521484375, -8.2010498046875, -7.806884765625, -7.4127197265625, -7.0185546875, -6.6243896484375, -6.230224609375, -5.8360595703125, -5.44189453125, -5.0477294921875, -4.653564453125, -4.2593994140625, -3.865234375, -3.4710693359375, -3.076904296875, -2.6827392578125, -2.28857421875, -1.8944091796875, -1.500244140625, -1.1060791015625, -0.7119140625, -0.3177490234375, 0.076416015625, 0.4705810546875, 0.86474609375, 1.2589111328125, 1.653076171875, 2.0472412109375, 2.44140625, 2.8355712890625, 3.229736328125, 3.6239013671875, 4.01806640625, 4.4122314453125, 4.806396484375, 5.2005615234375, 5.5947265625, 5.9888916015625, 6.383056640625, 6.7772216796875, 7.17138671875, 7.5655517578125, 7.959716796875, 8.3538818359375, 8.748046875, 9.1422119140625, 9.536376953125, 9.9305419921875, 10.32470703125, 10.7188720703125, 11.113037109375, 11.5072021484375, 11.9013671875, 12.2955322265625, 12.689697265625, 13.0838623046875, 13.47802734375, 13.8721923828125, 14.266357421875, 14.6605224609375, 15.0546875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 5.0, 2.0, 5.0, 6.0, 3.0, 6.0, 21.0, 43.0, 54.0, 93.0, 134.0, 231.0, 330.0, 488.0, 683.0, 1058.0, 1715.0, 2632.0, 4011.0, 6103.0, 9436.0, 14734.0, 23056.0, 36756.0, 60831.0, 109294.0, 257957.0, 250728.0, 107502.0, 60219.0, 36220.0, 22913.0, 14595.0, 9185.0, 6081.0, 4038.0, 2571.0, 1627.0, 1080.0, 741.0, 477.0, 304.0, 229.0, 118.0, 96.0, 54.0, 48.0, 22.0, 11.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.330078125, -2.2548828125, -2.1796875, -2.1044921875, -2.029296875, -1.9541015625, -1.87890625, -1.8037109375, -1.728515625, -1.6533203125, -1.578125, -1.5029296875, -1.427734375, -1.3525390625, -1.27734375, -1.2021484375, -1.126953125, -1.0517578125, -0.9765625, -0.9013671875, -0.826171875, -0.7509765625, -0.67578125, -0.6005859375, -0.525390625, -0.4501953125, -0.375, -0.2998046875, -0.224609375, -0.1494140625, -0.07421875, 0.0009765625, 0.076171875, 0.1513671875, 0.2265625, 0.3017578125, 0.376953125, 0.4521484375, 0.52734375, 0.6025390625, 0.677734375, 0.7529296875, 0.828125, 0.9033203125, 0.978515625, 1.0537109375, 1.12890625, 1.2041015625, 1.279296875, 1.3544921875, 1.4296875, 1.5048828125, 1.580078125, 1.6552734375, 1.73046875, 1.8056640625, 1.880859375, 1.9560546875, 2.03125, 2.1064453125, 2.181640625, 2.2568359375, 2.33203125, 2.4072265625, 2.482421875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 1.0, 2.0, 7.0, 9.0, 7.0, 9.0, 15.0, 9.0, 16.0, 21.0, 19.0, 22.0, 25.0, 22.0, 35.0, 44.0, 36.0, 33.0, 48.0, 48.0, 47.0, 1056.0, 44.0, 41.0, 46.0, 44.0, 25.0, 44.0, 34.0, 27.0, 24.0, 21.0, 20.0, 16.0, 21.0, 9.0, 16.0, 19.0, 10.0, 7.0, 7.0, 2.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.359375, -8.1033935546875, -7.847412109375, -7.5914306640625, -7.33544921875, -7.0794677734375, -6.823486328125, -6.5675048828125, -6.3115234375, -6.0555419921875, -5.799560546875, -5.5435791015625, -5.28759765625, -5.0316162109375, -4.775634765625, -4.5196533203125, -4.263671875, -4.0076904296875, -3.751708984375, -3.4957275390625, -3.23974609375, -2.9837646484375, -2.727783203125, -2.4718017578125, -2.2158203125, -1.9598388671875, -1.703857421875, -1.4478759765625, -1.19189453125, -0.9359130859375, -0.679931640625, -0.4239501953125, -0.16796875, 0.0880126953125, 0.343994140625, 0.5999755859375, 0.85595703125, 1.1119384765625, 1.367919921875, 1.6239013671875, 1.8798828125, 2.1358642578125, 2.391845703125, 2.6478271484375, 2.90380859375, 3.1597900390625, 3.415771484375, 3.6717529296875, 3.927734375, 4.1837158203125, 4.439697265625, 4.6956787109375, 4.95166015625, 5.2076416015625, 5.463623046875, 5.7196044921875, 5.9755859375, 6.2315673828125, 6.487548828125, 6.7435302734375, 6.99951171875, 7.2554931640625, 7.511474609375, 7.7674560546875, 8.0234375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 8.0, 9.0, 9.0, 21.0, 28.0, 41.0, 53.0, 66.0, 101.0, 189.0, 271.0, 402.0, 581.0, 812.0, 1309.0, 1915.0, 2945.0, 4511.0, 6827.0, 10535.0, 15868.0, 24817.0, 40615.0, 69651.0, 138108.0, 1392971.0, 175968.0, 81839.0, 46402.0, 28395.0, 17961.0, 11589.0, 7656.0, 4929.0, 3298.0, 2139.0, 1430.0, 919.0, 663.0, 432.0, 264.0, 190.0, 132.0, 71.0, 57.0, 41.0, 32.0, 22.0, 20.0, 10.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.439453125, -2.362335205078125, -2.28521728515625, -2.208099365234375, -2.1309814453125, -2.053863525390625, -1.97674560546875, -1.899627685546875, -1.822509765625, -1.745391845703125, -1.66827392578125, -1.591156005859375, -1.5140380859375, -1.436920166015625, -1.35980224609375, -1.282684326171875, -1.20556640625, -1.128448486328125, -1.05133056640625, -0.974212646484375, -0.8970947265625, -0.819976806640625, -0.74285888671875, -0.665740966796875, -0.588623046875, -0.511505126953125, -0.43438720703125, -0.357269287109375, -0.2801513671875, -0.203033447265625, -0.12591552734375, -0.048797607421875, 0.0283203125, 0.105438232421875, 0.18255615234375, 0.259674072265625, 0.3367919921875, 0.413909912109375, 0.49102783203125, 0.568145751953125, 0.645263671875, 0.722381591796875, 0.79949951171875, 0.876617431640625, 0.9537353515625, 1.030853271484375, 1.10797119140625, 1.185089111328125, 1.26220703125, 1.339324951171875, 1.41644287109375, 1.493560791015625, 1.5706787109375, 1.647796630859375, 1.72491455078125, 1.802032470703125, 1.879150390625, 1.956268310546875, 2.03338623046875, 2.110504150390625, 2.1876220703125, 2.264739990234375, 2.34185791015625, 2.418975830078125, 2.49609375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 1.0, 7.0, 8.0, 6.0, 9.0, 8.0, 9.0, 14.0, 20.0, 19.0, 30.0, 49.0, 53.0, 65.0, 82.0, 96.0, 102.0, 86.0, 81.0, 58.0, 46.0, 30.0, 28.0, 20.0, 27.0, 10.0, 9.0, 4.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0016241073608398438, -0.0015690773725509644, -0.001514047384262085, -0.0014590173959732056, -0.0014039874076843262, -0.0013489574193954468, -0.0012939274311065674, -0.001238897442817688, -0.0011838674545288086, -0.0011288374662399292, -0.0010738074779510498, -0.0010187774896621704, -0.000963747501373291, -0.0009087175130844116, -0.0008536875247955322, -0.0007986575365066528, -0.0007436275482177734, -0.000688597559928894, -0.0006335675716400146, -0.0005785375833511353, -0.0005235075950622559, -0.00046847760677337646, -0.00041344761848449707, -0.0003584176301956177, -0.0003033876419067383, -0.0002483576536178589, -0.0001933276653289795, -0.0001382976770401001, -8.32676887512207e-05, -2.823770046234131e-05, 2.6792287826538086e-05, 8.182227611541748e-05, 0.00013685226440429688, 0.00019188225269317627, 0.00024691224098205566, 0.00030194222927093506, 0.00035697221755981445, 0.00041200220584869385, 0.00046703219413757324, 0.0005220621824264526, 0.000577092170715332, 0.0006321221590042114, 0.0006871521472930908, 0.0007421821355819702, 0.0007972121238708496, 0.000852242112159729, 0.0009072721004486084, 0.0009623020887374878, 0.0010173320770263672, 0.0010723620653152466, 0.001127392053604126, 0.0011824220418930054, 0.0012374520301818848, 0.0012924820184707642, 0.0013475120067596436, 0.001402541995048523, 0.0014575719833374023, 0.0015126019716262817, 0.0015676319599151611, 0.0016226619482040405, 0.00167769193649292, 0.0017327219247817993, 0.0017877519130706787, 0.001842781901359558, 0.0018978118896484375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 2.0, 3.0, 2.0, 5.0, 0.0, 6.0, 7.0, 8.0, 10.0, 17.0, 21.0, 20.0, 32.0, 52.0, 65.0, 121.0, 190.0, 436.0, 2117.0, 1040988.0, 3244.0, 543.0, 234.0, 135.0, 77.0, 53.0, 39.0, 38.0, 19.0, 15.0, 14.0, 3.0, 12.0, 10.0, 8.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.04144287109375, -0.0402073860168457, -0.038971900939941406, -0.03773641586303711, -0.03650093078613281, -0.035265445709228516, -0.03402996063232422, -0.03279447555541992, -0.031558990478515625, -0.030323505401611328, -0.02908802032470703, -0.027852535247802734, -0.026617050170898438, -0.02538156509399414, -0.024146080017089844, -0.022910594940185547, -0.02167510986328125, -0.020439624786376953, -0.019204139709472656, -0.01796865463256836, -0.016733169555664062, -0.015497684478759766, -0.014262199401855469, -0.013026714324951172, -0.011791229248046875, -0.010555744171142578, -0.009320259094238281, -0.008084774017333984, -0.0068492889404296875, -0.005613803863525391, -0.004378318786621094, -0.003142833709716797, -0.0019073486328125, -0.0006718635559082031, 0.0005636215209960938, 0.0017991065979003906, 0.0030345916748046875, 0.004270076751708984, 0.005505561828613281, 0.006741046905517578, 0.007976531982421875, 0.009212017059326172, 0.010447502136230469, 0.011682987213134766, 0.012918472290039062, 0.01415395736694336, 0.015389442443847656, 0.016624927520751953, 0.01786041259765625, 0.019095897674560547, 0.020331382751464844, 0.02156686782836914, 0.022802352905273438, 0.024037837982177734, 0.02527332305908203, 0.026508808135986328, 0.027744293212890625, 0.028979778289794922, 0.03021526336669922, 0.031450748443603516, 0.03268623352050781, 0.03392171859741211, 0.035157203674316406, 0.0363926887512207, 0.037628173828125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 42.0, 277.0, 516.0, 149.0, 19.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002594602294266224, -0.0024960734881460667, -0.0023975444491952658, -0.0022990156430751085, -0.0022004868369549513, -0.0021019577980041504, -0.002003428991883993, -0.001904900185763836, -0.0018063713796436787, -0.0017078424571081996, -0.0016093136509880424, -0.0015107847284525633, -0.001412255922332406, -0.001313726999796927, -0.001215198077261448, -0.0011166692711412907, -0.0010181403486058116, -0.0009196114842779934, -0.0008210826199501753, -0.0007225536974146962, -0.000624024891294539, -0.0005254959687590599, -0.00042696710443124175, -0.0003284382401034236, -0.00022990937577560544, -0.00013138051144778728, -3.28516325680539e-05, 6.567724631167948e-05, 0.00016420611063949764, 0.00026273500407114625, 0.0003612638683989644, 0.00045979273272678256, 0.0005583215970546007, 0.0006568504613824189, 0.000755379325710237, 0.0008539082482457161, 0.0009524370543658733, 0.0010509659769013524, 0.0011494948994368315, 0.0012480237055569887, 0.001346552511677146, 0.001445081434212625, 0.0015436102403327823, 0.0016421391628682613, 0.0017406679689884186, 0.0018391968915238976, 0.0019377258140593767, 0.002036254620179534, 0.002134783659130335, 0.002233312465250492, 0.002331841504201293, 0.0024303703103214502, 0.0025288991164416075, 0.0026274281553924084, 0.0027259569615125656, 0.002824485767632723, 0.00292301457375288, 0.0030215433798730373, 0.0031200724188238382, 0.0032186012249439955, 0.0033171300310641527, 0.0034156590700149536, 0.003514187876135111, 0.003612716682255268, 0.0037112454883754253]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 2.0, 3.0, 2.0, 4.0, 5.0, 4.0, 11.0, 7.0, 11.0, 17.0, 19.0, 11.0, 21.0, 34.0, 22.0, 22.0, 22.0, 33.0, 33.0, 33.0, 43.0, 41.0, 37.0, 33.0, 28.0, 46.0, 44.0, 33.0, 44.0, 36.0, 29.0, 33.0, 29.0, 18.0, 26.0, 22.0, 25.0, 20.0, 23.0, 21.0, 10.0, 5.0, 11.0, 8.0, 5.0, 0.0, 5.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0007055401802062988, -0.0006841942667961121, -0.0006628483533859253, -0.0006415024399757385, -0.0006201565265655518, -0.000598810613155365, -0.0005774646997451782, -0.0005561187863349915, -0.0005347728729248047, -0.0005134269595146179, -0.0004920810461044312, -0.0004707351326942444, -0.0004493892192840576, -0.00042804330587387085, -0.0004066973924636841, -0.0003853514790534973, -0.00036400556564331055, -0.0003426596522331238, -0.000321313738822937, -0.00029996782541275024, -0.0002786219120025635, -0.0002572759985923767, -0.00023593008518218994, -0.00021458417177200317, -0.0001932382583618164, -0.00017189234495162964, -0.00015054643154144287, -0.0001292005181312561, -0.00010785460472106934, -8.650869131088257e-05, -6.51627779006958e-05, -4.381686449050903e-05, -2.2470951080322266e-05, -1.125037670135498e-06, 2.022087574005127e-05, 4.156678915023804e-05, 6.29127025604248e-05, 8.425861597061157e-05, 0.00010560452938079834, 0.0001269504427909851, 0.00014829635620117188, 0.00016964226961135864, 0.0001909881830215454, 0.00021233409643173218, 0.00023368000984191895, 0.0002550259232521057, 0.0002763718366622925, 0.00029771775007247925, 0.000319063663482666, 0.0003404095768928528, 0.00036175549030303955, 0.0003831014037132263, 0.0004044473171234131, 0.00042579323053359985, 0.0004471391439437866, 0.0004684850573539734, 0.0004898309707641602, 0.0005111768841743469, 0.0005325227975845337, 0.0005538687109947205, 0.0005752146244049072, 0.000596560537815094, 0.0006179064512252808, 0.0006392523646354675, 0.0006605982780456543]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 5.0, 2.0, 1.0, 5.0, 11.0, 6.0, 10.0, 10.0, 16.0, 22.0, 27.0, 23.0, 25.0, 18.0, 35.0, 36.0, 30.0, 34.0, 35.0, 43.0, 45.0, 40.0, 29.0, 38.0, 49.0, 42.0, 35.0, 39.0, 37.0, 35.0, 27.0, 26.0, 30.0, 18.0, 24.0, 19.0, 25.0, 8.0, 13.0, 7.0, 8.0, 4.0, 2.0, 4.0, 8.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.171875, -9.7777099609375, -9.383544921875, -8.9893798828125, -8.59521484375, -8.2010498046875, -7.806884765625, -7.4127197265625, -7.0185546875, -6.6243896484375, -6.230224609375, -5.8360595703125, -5.44189453125, -5.0477294921875, -4.653564453125, -4.2593994140625, -3.865234375, -3.4710693359375, -3.076904296875, -2.6827392578125, -2.28857421875, -1.8944091796875, -1.500244140625, -1.1060791015625, -0.7119140625, -0.3177490234375, 0.076416015625, 0.4705810546875, 0.86474609375, 1.2589111328125, 1.653076171875, 2.0472412109375, 2.44140625, 2.8355712890625, 3.229736328125, 3.6239013671875, 4.01806640625, 4.4122314453125, 4.806396484375, 5.2005615234375, 5.5947265625, 5.9888916015625, 6.383056640625, 6.7772216796875, 7.17138671875, 7.5655517578125, 7.959716796875, 8.3538818359375, 8.748046875, 9.1422119140625, 9.536376953125, 9.9305419921875, 10.32470703125, 10.7188720703125, 11.113037109375, 11.5072021484375, 11.9013671875, 12.2955322265625, 12.689697265625, 13.0838623046875, 13.47802734375, 13.8721923828125, 14.266357421875, 14.6605224609375, 15.0546875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 8.0, 2.0, 7.0, 8.0, 13.0, 18.0, 22.0, 21.0, 34.0, 38.0, 71.0, 79.0, 100.0, 125.0, 162.0, 265.0, 378.0, 449.0, 611.0, 884.0, 2042.0, 13498.0, 346526.0, 657180.0, 20027.0, 2447.0, 984.0, 674.0, 468.0, 394.0, 256.0, 188.0, 149.0, 94.0, 85.0, 73.0, 44.0, 32.0, 21.0, 20.0, 12.0, 11.0, 10.0, 7.0, 10.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.765625, -24.777587890625, -23.78955078125, -22.801513671875, -21.8134765625, -20.825439453125, -19.83740234375, -18.849365234375, -17.861328125, -16.873291015625, -15.88525390625, -14.897216796875, -13.9091796875, -12.921142578125, -11.93310546875, -10.945068359375, -9.95703125, -8.968994140625, -7.98095703125, -6.992919921875, -6.0048828125, -5.016845703125, -4.02880859375, -3.040771484375, -2.052734375, -1.064697265625, -0.07666015625, 0.911376953125, 1.8994140625, 2.887451171875, 3.87548828125, 4.863525390625, 5.8515625, 6.839599609375, 7.82763671875, 8.815673828125, 9.8037109375, 10.791748046875, 11.77978515625, 12.767822265625, 13.755859375, 14.743896484375, 15.73193359375, 16.719970703125, 17.7080078125, 18.696044921875, 19.68408203125, 20.672119140625, 21.66015625, 22.648193359375, 23.63623046875, 24.624267578125, 25.6123046875, 26.600341796875, 27.58837890625, 28.576416015625, 29.564453125, 30.552490234375, 31.54052734375, 32.528564453125, 33.5166015625, 34.504638671875, 35.49267578125, 36.480712890625, 37.46875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 5.0, 7.0, 7.0, 6.0, 10.0, 10.0, 11.0, 25.0, 24.0, 26.0, 47.0, 34.0, 35.0, 58.0, 60.0, 81.0, 206.0, 1843.0, 125.0, 73.0, 70.0, 45.0, 46.0, 41.0, 31.0, 27.0, 25.0, 16.0, 19.0, 10.0, 9.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.46875, -47.93798828125, -46.4072265625, -44.87646484375, -43.345703125, -41.81494140625, -40.2841796875, -38.75341796875, -37.22265625, -35.69189453125, -34.1611328125, -32.63037109375, -31.099609375, -29.56884765625, -28.0380859375, -26.50732421875, -24.9765625, -23.44580078125, -21.9150390625, -20.38427734375, -18.853515625, -17.32275390625, -15.7919921875, -14.26123046875, -12.73046875, -11.19970703125, -9.6689453125, -8.13818359375, -6.607421875, -5.07666015625, -3.5458984375, -2.01513671875, -0.484375, 1.04638671875, 2.5771484375, 4.10791015625, 5.638671875, 7.16943359375, 8.7001953125, 10.23095703125, 11.76171875, 13.29248046875, 14.8232421875, 16.35400390625, 17.884765625, 19.41552734375, 20.9462890625, 22.47705078125, 24.0078125, 25.53857421875, 27.0693359375, 28.60009765625, 30.130859375, 31.66162109375, 33.1923828125, 34.72314453125, 36.25390625, 37.78466796875, 39.3154296875, 40.84619140625, 42.376953125, 43.90771484375, 45.4384765625, 46.96923828125, 48.5]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 12.0, 14.0, 18.0, 20.0, 35.0, 35.0, 41.0, 62.0, 83.0, 150.0, 362.0, 1357.0, 3099360.0, 42771.0, 704.0, 239.0, 117.0, 66.0, 48.0, 50.0, 27.0, 31.0, 20.0, 17.0, 11.0, 9.0, 7.0, 7.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.75, -133.421875, -129.09375, -124.765625, -120.4375, -116.109375, -111.78125, -107.453125, -103.125, -98.796875, -94.46875, -90.140625, -85.8125, -81.484375, -77.15625, -72.828125, -68.5, -64.171875, -59.84375, -55.515625, -51.1875, -46.859375, -42.53125, -38.203125, -33.875, -29.546875, -25.21875, -20.890625, -16.5625, -12.234375, -7.90625, -3.578125, 0.75, 5.078125, 9.40625, 13.734375, 18.0625, 22.390625, 26.71875, 31.046875, 35.375, 39.703125, 44.03125, 48.359375, 52.6875, 57.015625, 61.34375, 65.671875, 70.0, 74.328125, 78.65625, 82.984375, 87.3125, 91.640625, 95.96875, 100.296875, 104.625, 108.953125, 113.28125, 117.609375, 121.9375, 126.265625, 130.59375, 134.921875, 139.25]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 271.0, 651.0, 89.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.67513275146484, -101.88948059082031, -97.10383605957031, -92.31818389892578, -87.53253173828125, -82.74687957763672, -77.96122741699219, -73.17558288574219, -68.38993072509766, -63.604278564453125, -58.81863021850586, -54.032981872558594, -49.24732971191406, -44.46167755126953, -39.676029205322266, -34.890380859375, -30.10472869873047, -25.31907844543457, -20.533428192138672, -15.747777938842773, -10.962127685546875, -6.176477432250977, -1.3908271789550781, 3.3948211669921875, 8.180473327636719, 12.966123580932617, 17.751773834228516, 22.537424087524414, 27.323074340820312, 32.108726501464844, 36.89437484741211, 41.680023193359375, 46.465667724609375, 51.251319885253906, 56.03696823120117, 60.82261657714844, 65.60826873779297, 70.3939208984375, 75.1795654296875, 79.96521759033203, 84.75086975097656, 89.5365219116211, 94.32217407226562, 99.10781860351562, 103.89347076416016, 108.67912292480469, 113.46476745605469, 118.25041961669922, 123.03607177734375, 127.82172393798828, 132.6073760986328, 137.3930206298828, 142.17868041992188, 146.96432495117188, 151.74996948242188, 156.53561401367188, 161.32127380371094, 166.10691833496094, 170.892578125, 175.67822265625, 180.4638671875, 185.24952697753906, 190.03517150878906, 194.82083129882812, 199.60647583007812]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 5.0, 2.0, 5.0, 9.0, 6.0, 8.0, 15.0, 15.0, 17.0, 19.0, 23.0, 20.0, 21.0, 19.0, 32.0, 30.0, 30.0, 29.0, 39.0, 38.0, 36.0, 37.0, 41.0, 47.0, 35.0, 32.0, 43.0, 27.0, 40.0, 24.0, 34.0, 28.0, 28.0, 26.0, 17.0, 23.0, 14.0, 15.0, 13.0, 8.0, 3.0, 16.0, 6.0, 3.0, 6.0, 3.0, 3.0, 2.0, 5.0, 3.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-85.07910919189453, -82.22688293457031, -79.37466430664062, -76.52244567871094, -73.67021942138672, -70.8179931640625, -67.96577453613281, -65.11355590820312, -62.261329650878906, -59.40910720825195, -56.556884765625, -53.70466232299805, -50.852439880371094, -48.00021743774414, -45.14799499511719, -42.295772552490234, -39.44355010986328, -36.59132766723633, -33.739105224609375, -30.886882781982422, -28.03466033935547, -25.182437896728516, -22.330215454101562, -19.47799301147461, -16.625770568847656, -13.773548126220703, -10.92132568359375, -8.069103240966797, -5.216880798339844, -2.3646583557128906, 0.4875640869140625, 3.3397865295410156, 6.192008972167969, 9.044231414794922, 11.896453857421875, 14.748676300048828, 17.60089874267578, 20.453121185302734, 23.305343627929688, 26.15756607055664, 29.009788513183594, 31.862010955810547, 34.7142333984375, 37.56645584106445, 40.418678283691406, 43.27090072631836, 46.12312316894531, 48.975345611572266, 51.82756805419922, 54.67979049682617, 57.532012939453125, 60.38423538208008, 63.23645782470703, 66.08868408203125, 68.94090270996094, 71.79312133789062, 74.64534759521484, 77.49757385253906, 80.34979248046875, 83.20201110839844, 86.05423736572266, 88.90646362304688, 91.75868225097656, 94.61090087890625, 97.46312713623047]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 0.0, 4.0, 3.0, 3.0, 9.0, 9.0, 14.0, 13.0, 15.0, 20.0, 19.0, 25.0, 25.0, 22.0, 37.0, 39.0, 31.0, 44.0, 34.0, 36.0, 34.0, 38.0, 39.0, 52.0, 36.0, 50.0, 28.0, 39.0, 31.0, 32.0, 31.0, 35.0, 23.0, 20.0, 23.0, 18.0, 14.0, 14.0, 10.0, 10.0, 8.0, 5.0, 1.0, 8.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.734375, -10.330322265625, -9.92626953125, -9.522216796875, -9.1181640625, -8.714111328125, -8.31005859375, -7.906005859375, -7.501953125, -7.097900390625, -6.69384765625, -6.289794921875, -5.8857421875, -5.481689453125, -5.07763671875, -4.673583984375, -4.26953125, -3.865478515625, -3.46142578125, -3.057373046875, -2.6533203125, -2.249267578125, -1.84521484375, -1.441162109375, -1.037109375, -0.633056640625, -0.22900390625, 0.175048828125, 0.5791015625, 0.983154296875, 1.38720703125, 1.791259765625, 2.1953125, 2.599365234375, 3.00341796875, 3.407470703125, 3.8115234375, 4.215576171875, 4.61962890625, 5.023681640625, 5.427734375, 5.831787109375, 6.23583984375, 6.639892578125, 7.0439453125, 7.447998046875, 7.85205078125, 8.256103515625, 8.66015625, 9.064208984375, 9.46826171875, 9.872314453125, 10.2763671875, 10.680419921875, 11.08447265625, 11.488525390625, 11.892578125, 12.296630859375, 12.70068359375, 13.104736328125, 13.5087890625, 13.912841796875, 14.31689453125, 14.720947265625, 15.125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 1.0, 6.0, 7.0, 9.0, 13.0, 22.0, 21.0, 37.0, 31.0, 47.0, 43.0, 77.0, 87.0, 132.0, 129.0, 222.0, 322.0, 446.0, 763.0, 1634.0, 4907.0, 31119.0, 779987.0, 2978562.0, 371039.0, 17360.0, 3684.0, 1404.0, 656.0, 430.0, 256.0, 169.0, 148.0, 123.0, 75.0, 75.0, 49.0, 48.0, 32.0, 32.0, 19.0, 14.0, 11.0, 8.0, 10.0, 3.0, 9.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.140625, -25.2509765625, -24.361328125, -23.4716796875, -22.58203125, -21.6923828125, -20.802734375, -19.9130859375, -19.0234375, -18.1337890625, -17.244140625, -16.3544921875, -15.46484375, -14.5751953125, -13.685546875, -12.7958984375, -11.90625, -11.0166015625, -10.126953125, -9.2373046875, -8.34765625, -7.4580078125, -6.568359375, -5.6787109375, -4.7890625, -3.8994140625, -3.009765625, -2.1201171875, -1.23046875, -0.3408203125, 0.548828125, 1.4384765625, 2.328125, 3.2177734375, 4.107421875, 4.9970703125, 5.88671875, 6.7763671875, 7.666015625, 8.5556640625, 9.4453125, 10.3349609375, 11.224609375, 12.1142578125, 13.00390625, 13.8935546875, 14.783203125, 15.6728515625, 16.5625, 17.4521484375, 18.341796875, 19.2314453125, 20.12109375, 21.0107421875, 21.900390625, 22.7900390625, 23.6796875, 24.5693359375, 25.458984375, 26.3486328125, 27.23828125, 28.1279296875, 29.017578125, 29.9072265625, 30.796875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 8.0, 7.0, 12.0, 19.0, 49.0, 61.0, 112.0, 170.0, 332.0, 625.0, 881.0, 752.0, 470.0, 247.0, 134.0, 79.0, 43.0, 32.0, 14.0, 15.0, 9.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.328125, -30.341796875, -29.35546875, -28.369140625, -27.3828125, -26.396484375, -25.41015625, -24.423828125, -23.4375, -22.451171875, -21.46484375, -20.478515625, -19.4921875, -18.505859375, -17.51953125, -16.533203125, -15.546875, -14.560546875, -13.57421875, -12.587890625, -11.6015625, -10.615234375, -9.62890625, -8.642578125, -7.65625, -6.669921875, -5.68359375, -4.697265625, -3.7109375, -2.724609375, -1.73828125, -0.751953125, 0.234375, 1.220703125, 2.20703125, 3.193359375, 4.1796875, 5.166015625, 6.15234375, 7.138671875, 8.125, 9.111328125, 10.09765625, 11.083984375, 12.0703125, 13.056640625, 14.04296875, 15.029296875, 16.015625, 17.001953125, 17.98828125, 18.974609375, 19.9609375, 20.947265625, 21.93359375, 22.919921875, 23.90625, 24.892578125, 25.87890625, 26.865234375, 27.8515625, 28.837890625, 29.82421875, 30.810546875, 31.796875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 6.0, 14.0, 21.0, 21.0, 33.0, 45.0, 71.0, 93.0, 161.0, 236.0, 454.0, 1319.0, 10852.0, 4028516.0, 148210.0, 2575.0, 688.0, 311.0, 195.0, 127.0, 91.0, 56.0, 44.0, 40.0, 26.0, 22.0, 12.0, 5.0, 10.0, 7.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.8125, -88.6181640625, -85.423828125, -82.2294921875, -79.03515625, -75.8408203125, -72.646484375, -69.4521484375, -66.2578125, -63.0634765625, -59.869140625, -56.6748046875, -53.48046875, -50.2861328125, -47.091796875, -43.8974609375, -40.703125, -37.5087890625, -34.314453125, -31.1201171875, -27.92578125, -24.7314453125, -21.537109375, -18.3427734375, -15.1484375, -11.9541015625, -8.759765625, -5.5654296875, -2.37109375, 0.8232421875, 4.017578125, 7.2119140625, 10.40625, 13.6005859375, 16.794921875, 19.9892578125, 23.18359375, 26.3779296875, 29.572265625, 32.7666015625, 35.9609375, 39.1552734375, 42.349609375, 45.5439453125, 48.73828125, 51.9326171875, 55.126953125, 58.3212890625, 61.515625, 64.7099609375, 67.904296875, 71.0986328125, 74.29296875, 77.4873046875, 80.681640625, 83.8759765625, 87.0703125, 90.2646484375, 93.458984375, 96.6533203125, 99.84765625, 103.0419921875, 106.236328125, 109.4306640625, 112.625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 261.0, 729.0, 22.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1005.7844848632812, -987.8919067382812, -969.9993896484375, -952.1068115234375, -934.2142944335938, -916.3217163085938, -898.42919921875, -880.53662109375, -862.6441040039062, -844.7515258789062, -826.8590087890625, -808.9664306640625, -791.0739135742188, -773.1813354492188, -755.288818359375, -737.396240234375, -719.503662109375, -701.611083984375, -683.7185668945312, -665.8259887695312, -647.9334716796875, -630.0408935546875, -612.1483764648438, -594.2557983398438, -576.36328125, -558.470703125, -540.5781860351562, -522.6856079101562, -504.7930908203125, -486.9005432128906, -469.00799560546875, -451.11541748046875, -433.222900390625, -415.3303527832031, -397.43780517578125, -379.5452575683594, -361.6527099609375, -343.7601623535156, -325.86761474609375, -307.97503662109375, -290.08251953125, -272.1899719238281, -254.29742431640625, -236.40487670898438, -218.5123291015625, -200.61978149414062, -182.7272186279297, -164.8346710205078, -146.94212341308594, -129.04957580566406, -111.15702819824219, -93.26447296142578, -75.3719253540039, -57.47937774658203, -39.586822509765625, -21.69427490234375, -3.801727294921875, 14.090822219848633, 31.98337173461914, 49.87592315673828, 67.76847076416016, 85.66101837158203, 103.55357360839844, 121.44612121582031, 139.3386688232422]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 7.0, 8.0, 9.0, 9.0, 14.0, 12.0, 8.0, 16.0, 23.0, 22.0, 24.0, 26.0, 24.0, 34.0, 33.0, 31.0, 30.0, 26.0, 32.0, 39.0, 46.0, 50.0, 42.0, 38.0, 44.0, 35.0, 34.0, 30.0, 24.0, 32.0, 33.0, 36.0, 24.0, 27.0, 10.0, 10.0, 7.0, 7.0, 7.0, 10.0, 5.0, 8.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-52.92021942138672, -51.162864685058594, -49.40550994873047, -47.648155212402344, -45.89080047607422, -44.133445739746094, -42.37609100341797, -40.618736267089844, -38.86138153076172, -37.104026794433594, -35.34667205810547, -33.589317321777344, -31.83196258544922, -30.074607849121094, -28.3172550201416, -26.559900283813477, -24.802547454833984, -23.04519271850586, -21.287837982177734, -19.53048324584961, -17.773128509521484, -16.01577377319336, -14.258420944213867, -12.501066207885742, -10.743711471557617, -8.986356735229492, -7.229002475738525, -5.471648216247559, -3.7142934799194336, -1.9569387435913086, -0.1995849609375, 1.557769775390625, 3.31512451171875, 5.072479248046875, 6.829833507537842, 8.587187767028809, 10.344542503356934, 12.101897239685059, 13.859251022338867, 15.616605758666992, 17.373960494995117, 19.131315231323242, 20.888669967651367, 22.64602279663086, 24.403377532958984, 26.16073226928711, 27.918087005615234, 29.67544174194336, 31.432796478271484, 33.19015121459961, 34.947505950927734, 36.70486068725586, 38.462215423583984, 40.21957015991211, 41.97692108154297, 43.734275817871094, 45.49163055419922, 47.248985290527344, 49.00634002685547, 50.763694763183594, 52.52104949951172, 54.278404235839844, 56.03575897216797, 57.793113708496094, 59.55046844482422]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 10.0, 7.0, 9.0, 10.0, 9.0, 17.0, 12.0, 16.0, 20.0, 18.0, 25.0, 26.0, 32.0, 38.0, 36.0, 39.0, 35.0, 45.0, 41.0, 48.0, 38.0, 38.0, 42.0, 34.0, 35.0, 43.0, 20.0, 39.0, 38.0, 30.0, 29.0, 23.0, 11.0, 23.0, 12.0, 12.0, 11.0, 5.0, 12.0, 6.0, 5.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.984375, -12.58544921875, -12.1865234375, -11.78759765625, -11.388671875, -10.98974609375, -10.5908203125, -10.19189453125, -9.79296875, -9.39404296875, -8.9951171875, -8.59619140625, -8.197265625, -7.79833984375, -7.3994140625, -7.00048828125, -6.6015625, -6.20263671875, -5.8037109375, -5.40478515625, -5.005859375, -4.60693359375, -4.2080078125, -3.80908203125, -3.41015625, -3.01123046875, -2.6123046875, -2.21337890625, -1.814453125, -1.41552734375, -1.0166015625, -0.61767578125, -0.21875, 0.18017578125, 0.5791015625, 0.97802734375, 1.376953125, 1.77587890625, 2.1748046875, 2.57373046875, 2.97265625, 3.37158203125, 3.7705078125, 4.16943359375, 4.568359375, 4.96728515625, 5.3662109375, 5.76513671875, 6.1640625, 6.56298828125, 6.9619140625, 7.36083984375, 7.759765625, 8.15869140625, 8.5576171875, 8.95654296875, 9.35546875, 9.75439453125, 10.1533203125, 10.55224609375, 10.951171875, 11.35009765625, 11.7490234375, 12.14794921875, 12.546875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 9.0, 7.0, 12.0, 27.0, 42.0, 76.0, 91.0, 129.0, 227.0, 309.0, 483.0, 751.0, 1168.0, 1826.0, 2838.0, 4373.0, 6671.0, 10304.0, 16442.0, 26572.0, 42677.0, 72549.0, 139915.0, 338662.0, 170837.0, 83165.0, 48303.0, 29452.0, 18116.0, 11519.0, 7389.0, 4790.0, 3135.0, 2035.0, 1275.0, 830.0, 532.0, 325.0, 226.0, 182.0, 100.0, 73.0, 39.0, 34.0, 15.0, 6.0, 5.0, 4.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.48828125, -2.409576416015625, -2.33087158203125, -2.252166748046875, -2.1734619140625, -2.094757080078125, -2.01605224609375, -1.937347412109375, -1.858642578125, -1.779937744140625, -1.70123291015625, -1.622528076171875, -1.5438232421875, -1.465118408203125, -1.38641357421875, -1.307708740234375, -1.22900390625, -1.150299072265625, -1.07159423828125, -0.992889404296875, -0.9141845703125, -0.835479736328125, -0.75677490234375, -0.678070068359375, -0.599365234375, -0.520660400390625, -0.44195556640625, -0.363250732421875, -0.2845458984375, -0.205841064453125, -0.12713623046875, -0.048431396484375, 0.0302734375, 0.108978271484375, 0.18768310546875, 0.266387939453125, 0.3450927734375, 0.423797607421875, 0.50250244140625, 0.581207275390625, 0.659912109375, 0.738616943359375, 0.81732177734375, 0.896026611328125, 0.9747314453125, 1.053436279296875, 1.13214111328125, 1.210845947265625, 1.28955078125, 1.368255615234375, 1.44696044921875, 1.525665283203125, 1.6043701171875, 1.683074951171875, 1.76177978515625, 1.840484619140625, 1.919189453125, 1.997894287109375, 2.07659912109375, 2.155303955078125, 2.2340087890625, 2.312713623046875, 2.39141845703125, 2.470123291015625, 2.548828125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 4.0, 8.0, 5.0, 12.0, 11.0, 18.0, 21.0, 23.0, 19.0, 32.0, 36.0, 33.0, 30.0, 45.0, 31.0, 45.0, 46.0, 39.0, 1052.0, 51.0, 29.0, 34.0, 42.0, 39.0, 46.0, 33.0, 29.0, 31.0, 31.0, 19.0, 18.0, 21.0, 24.0, 22.0, 10.0, 8.0, 7.0, 6.0, 5.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1953125, -7.9306640625, -7.666015625, -7.4013671875, -7.13671875, -6.8720703125, -6.607421875, -6.3427734375, -6.078125, -5.8134765625, -5.548828125, -5.2841796875, -5.01953125, -4.7548828125, -4.490234375, -4.2255859375, -3.9609375, -3.6962890625, -3.431640625, -3.1669921875, -2.90234375, -2.6376953125, -2.373046875, -2.1083984375, -1.84375, -1.5791015625, -1.314453125, -1.0498046875, -0.78515625, -0.5205078125, -0.255859375, 0.0087890625, 0.2734375, 0.5380859375, 0.802734375, 1.0673828125, 1.33203125, 1.5966796875, 1.861328125, 2.1259765625, 2.390625, 2.6552734375, 2.919921875, 3.1845703125, 3.44921875, 3.7138671875, 3.978515625, 4.2431640625, 4.5078125, 4.7724609375, 5.037109375, 5.3017578125, 5.56640625, 5.8310546875, 6.095703125, 6.3603515625, 6.625, 6.8896484375, 7.154296875, 7.4189453125, 7.68359375, 7.9482421875, 8.212890625, 8.4775390625, 8.7421875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 8.0, 6.0, 23.0, 21.0, 34.0, 48.0, 87.0, 105.0, 164.0, 239.0, 371.0, 618.0, 843.0, 1324.0, 2153.0, 3404.0, 5530.0, 8746.0, 13695.0, 22179.0, 36101.0, 60632.0, 110214.0, 1315875.0, 254130.0, 108095.0, 58819.0, 35406.0, 22000.0, 13650.0, 8447.0, 5158.0, 3250.0, 1995.0, 1251.0, 869.0, 554.0, 347.0, 255.0, 155.0, 103.0, 61.0, 56.0, 38.0, 20.0, 13.0, 16.0, 7.0, 1.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-2.62890625, -2.5491943359375, -2.469482421875, -2.3897705078125, -2.31005859375, -2.2303466796875, -2.150634765625, -2.0709228515625, -1.9912109375, -1.9114990234375, -1.831787109375, -1.7520751953125, -1.67236328125, -1.5926513671875, -1.512939453125, -1.4332275390625, -1.353515625, -1.2738037109375, -1.194091796875, -1.1143798828125, -1.03466796875, -0.9549560546875, -0.875244140625, -0.7955322265625, -0.7158203125, -0.6361083984375, -0.556396484375, -0.4766845703125, -0.39697265625, -0.3172607421875, -0.237548828125, -0.1578369140625, -0.078125, 0.0015869140625, 0.081298828125, 0.1610107421875, 0.24072265625, 0.3204345703125, 0.400146484375, 0.4798583984375, 0.5595703125, 0.6392822265625, 0.718994140625, 0.7987060546875, 0.87841796875, 0.9581298828125, 1.037841796875, 1.1175537109375, 1.197265625, 1.2769775390625, 1.356689453125, 1.4364013671875, 1.51611328125, 1.5958251953125, 1.675537109375, 1.7552490234375, 1.8349609375, 1.9146728515625, 1.994384765625, 2.0740966796875, 2.15380859375, 2.2335205078125, 2.313232421875, 2.3929443359375, 2.47265625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 3.0, 4.0, 6.0, 9.0, 6.0, 7.0, 8.0, 7.0, 8.0, 16.0, 18.0, 20.0, 24.0, 30.0, 26.0, 29.0, 51.0, 43.0, 56.0, 73.0, 57.0, 55.0, 58.0, 61.0, 48.0, 35.0, 40.0, 22.0, 21.0, 20.0, 21.0, 20.0, 22.0, 14.0, 8.0, 11.0, 12.0, 9.0, 0.0, 9.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008940696716308594, -0.0008653402328491211, -0.0008366107940673828, -0.0008078813552856445, -0.0007791519165039062, -0.000750422477722168, -0.0007216930389404297, -0.0006929636001586914, -0.0006642341613769531, -0.0006355047225952148, -0.0006067752838134766, -0.0005780458450317383, -0.00054931640625, -0.0005205869674682617, -0.0004918575286865234, -0.00046312808990478516, -0.0004343986511230469, -0.0004056692123413086, -0.0003769397735595703, -0.00034821033477783203, -0.00031948089599609375, -0.00029075145721435547, -0.0002620220184326172, -0.0002332925796508789, -0.00020456314086914062, -0.00017583370208740234, -0.00014710426330566406, -0.00011837482452392578, -8.96453857421875e-05, -6.091594696044922e-05, -3.218650817871094e-05, -3.4570693969726562e-06, 2.5272369384765625e-05, 5.4001808166503906e-05, 8.273124694824219e-05, 0.00011146068572998047, 0.00014019012451171875, 0.00016891956329345703, 0.0001976490020751953, 0.0002263784408569336, 0.0002551078796386719, 0.00028383731842041016, 0.00031256675720214844, 0.0003412961959838867, 0.000370025634765625, 0.0003987550735473633, 0.00042748451232910156, 0.00045621395111083984, 0.0004849433898925781, 0.0005136728286743164, 0.0005424022674560547, 0.000571131706237793, 0.0005998611450195312, 0.0006285905838012695, 0.0006573200225830078, 0.0006860494613647461, 0.0007147789001464844, 0.0007435083389282227, 0.0007722377777099609, 0.0008009672164916992, 0.0008296966552734375, 0.0008584260940551758, 0.0008871555328369141, 0.0009158849716186523, 0.0009446144104003906]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 9.0, 18.0, 11.0, 14.0, 15.0, 19.0, 20.0, 36.0, 41.0, 54.0, 73.0, 129.0, 153.0, 312.0, 679.0, 10232.0, 1028770.0, 6427.0, 631.0, 273.0, 187.0, 125.0, 75.0, 58.0, 31.0, 26.0, 27.0, 14.0, 11.0, 21.0, 12.0, 10.0, 6.0, 4.0, 9.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0229644775390625, -0.02221059799194336, -0.02145671844482422, -0.020702838897705078, -0.019948959350585938, -0.019195079803466797, -0.018441200256347656, -0.017687320709228516, -0.016933441162109375, -0.016179561614990234, -0.015425682067871094, -0.014671802520751953, -0.013917922973632812, -0.013164043426513672, -0.012410163879394531, -0.01165628433227539, -0.01090240478515625, -0.01014852523803711, -0.009394645690917969, -0.008640766143798828, -0.007886886596679688, -0.007133007049560547, -0.006379127502441406, -0.005625247955322266, -0.004871368408203125, -0.004117488861083984, -0.0033636093139648438, -0.002609729766845703, -0.0018558502197265625, -0.0011019706726074219, -0.00034809112548828125, 0.0004057884216308594, 0.00115966796875, 0.0019135475158691406, 0.0026674270629882812, 0.003421306610107422, 0.0041751861572265625, 0.004929065704345703, 0.005682945251464844, 0.006436824798583984, 0.007190704345703125, 0.007944583892822266, 0.008698463439941406, 0.009452342987060547, 0.010206222534179688, 0.010960102081298828, 0.011713981628417969, 0.01246786117553711, 0.01322174072265625, 0.01397562026977539, 0.014729499816894531, 0.015483379364013672, 0.016237258911132812, 0.016991138458251953, 0.017745018005371094, 0.018498897552490234, 0.019252777099609375, 0.020006656646728516, 0.020760536193847656, 0.021514415740966797, 0.022268295288085938, 0.023022174835205078, 0.02377605438232422, 0.02452993392944336, 0.0252838134765625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 159.0, 767.0, 80.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00251849670894444, -0.002354952972382307, -0.0021914090029895306, -0.0020278652664273977, -0.001864321529865265, -0.001700777793303132, -0.0015372339403256774, -0.0013736900873482227, -0.00121014635078609, -0.001046602614223957, -0.0008830587612465024, -0.0007195149664767087, -0.0005559711717069149, -0.00039242737693712115, -0.0002288835821673274, -6.533972918987274e-05, 9.82040073722601e-05, 0.00026174780214205384, 0.0004252915969118476, 0.0005888353916816413, 0.0007523791864514351, 0.0009159229812212288, 0.0010794667759910226, 0.0012430106289684772, 0.00140655436553061, 0.001570098102092743, 0.0017336419550701976, 0.0018971858080476522, 0.002060729544609785, 0.002224273281171918, 0.0023878170177340508, 0.0025513609871268272, 0.0027149049565196037, 0.0028784486930817366, 0.0030419924296438694, 0.003205536399036646, 0.0033690801355987787, 0.0035326238721609116, 0.003696167841553688, 0.003859711578115821, 0.004023255314677954, 0.00418679928407073, 0.004350342787802219, 0.004513886757194996, 0.004677430726587772, 0.0048409742303192616, 0.005004518199712038, 0.005168061703443527, 0.005331605672836304, 0.00549514964222908, 0.005658693145960569, 0.005822237115353346, 0.005985780619084835, 0.0061493245884776115, 0.006312868557870388, 0.0064764125272631645, 0.006639956030994654, 0.00680350000038743, 0.006967043504118919, 0.007130587473511696, 0.007294131442904472, 0.0074576749466359615, 0.007621218916028738, 0.007784762419760227, 0.007948306389153004]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 5.0, 7.0, 5.0, 3.0, 5.0, 7.0, 20.0, 15.0, 12.0, 16.0, 27.0, 23.0, 24.0, 20.0, 27.0, 21.0, 39.0, 29.0, 40.0, 33.0, 42.0, 42.0, 43.0, 53.0, 39.0, 41.0, 30.0, 31.0, 32.0, 34.0, 38.0, 30.0, 27.0, 19.0, 21.0, 24.0, 8.0, 11.0, 15.0, 14.0, 7.0, 4.0, 6.0, 4.0, 0.0, 1.0, 4.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.000576317310333252, -0.0005602911114692688, -0.0005442649126052856, -0.0005282387137413025, -0.0005122125148773193, -0.0004961863160133362, -0.00048016011714935303, -0.0004641339182853699, -0.0004481077194213867, -0.00043208152055740356, -0.0004160553216934204, -0.00040002912282943726, -0.0003840029239654541, -0.00036797672510147095, -0.0003519505262374878, -0.00033592432737350464, -0.0003198981285095215, -0.00030387192964553833, -0.0002878457307815552, -0.000271819531917572, -0.00025579333305358887, -0.0002397671341896057, -0.00022374093532562256, -0.0002077147364616394, -0.00019168853759765625, -0.0001756623387336731, -0.00015963613986968994, -0.0001436099410057068, -0.00012758374214172363, -0.00011155754327774048, -9.553134441375732e-05, -7.950514554977417e-05, -6.347894668579102e-05, -4.745274782180786e-05, -3.142654895782471e-05, -1.5400350093841553e-05, 6.258487701416016e-07, 1.6652047634124756e-05, 3.267824649810791e-05, 4.8704445362091064e-05, 6.473064422607422e-05, 8.075684309005737e-05, 9.678304195404053e-05, 0.00011280924081802368, 0.00012883543968200684, 0.00014486163854599, 0.00016088783740997314, 0.0001769140362739563, 0.00019294023513793945, 0.0002089664340019226, 0.00022499263286590576, 0.00024101883172988892, 0.00025704503059387207, 0.0002730712294578552, 0.0002890974283218384, 0.00030512362718582153, 0.0003211498260498047, 0.00033717602491378784, 0.000353202223777771, 0.00036922842264175415, 0.0003852546215057373, 0.00040128082036972046, 0.0004173070192337036, 0.00043333321809768677, 0.0004493594169616699]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 10.0, 7.0, 9.0, 10.0, 9.0, 17.0, 12.0, 16.0, 20.0, 18.0, 25.0, 26.0, 32.0, 38.0, 36.0, 39.0, 35.0, 45.0, 41.0, 48.0, 38.0, 38.0, 42.0, 34.0, 35.0, 43.0, 20.0, 39.0, 38.0, 30.0, 29.0, 23.0, 11.0, 23.0, 12.0, 12.0, 11.0, 5.0, 12.0, 6.0, 5.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.984375, -12.58544921875, -12.1865234375, -11.78759765625, -11.388671875, -10.98974609375, -10.5908203125, -10.19189453125, -9.79296875, -9.39404296875, -8.9951171875, -8.59619140625, -8.197265625, -7.79833984375, -7.3994140625, -7.00048828125, -6.6015625, -6.20263671875, -5.8037109375, -5.40478515625, -5.005859375, -4.60693359375, -4.2080078125, -3.80908203125, -3.41015625, -3.01123046875, -2.6123046875, -2.21337890625, -1.814453125, -1.41552734375, -1.0166015625, -0.61767578125, -0.21875, 0.18017578125, 0.5791015625, 0.97802734375, 1.376953125, 1.77587890625, 2.1748046875, 2.57373046875, 2.97265625, 3.37158203125, 3.7705078125, 4.16943359375, 4.568359375, 4.96728515625, 5.3662109375, 5.76513671875, 6.1640625, 6.56298828125, 6.9619140625, 7.36083984375, 7.759765625, 8.15869140625, 8.5576171875, 8.95654296875, 9.35546875, 9.75439453125, 10.1533203125, 10.55224609375, 10.951171875, 11.35009765625, 11.7490234375, 12.14794921875, 12.546875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 12.0, 11.0, 16.0, 12.0, 30.0, 34.0, 37.0, 61.0, 69.0, 88.0, 103.0, 179.0, 265.0, 392.0, 735.0, 1573.0, 3930.0, 11128.0, 37735.0, 170652.0, 580925.0, 181653.0, 39478.0, 11630.0, 4050.0, 1615.0, 761.0, 439.0, 294.0, 165.0, 121.0, 86.0, 65.0, 52.0, 36.0, 35.0, 25.0, 15.0, 19.0, 11.0, 8.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.65625, -16.14404296875, -15.6318359375, -15.11962890625, -14.607421875, -14.09521484375, -13.5830078125, -13.07080078125, -12.55859375, -12.04638671875, -11.5341796875, -11.02197265625, -10.509765625, -9.99755859375, -9.4853515625, -8.97314453125, -8.4609375, -7.94873046875, -7.4365234375, -6.92431640625, -6.412109375, -5.89990234375, -5.3876953125, -4.87548828125, -4.36328125, -3.85107421875, -3.3388671875, -2.82666015625, -2.314453125, -1.80224609375, -1.2900390625, -0.77783203125, -0.265625, 0.24658203125, 0.7587890625, 1.27099609375, 1.783203125, 2.29541015625, 2.8076171875, 3.31982421875, 3.83203125, 4.34423828125, 4.8564453125, 5.36865234375, 5.880859375, 6.39306640625, 6.9052734375, 7.41748046875, 7.9296875, 8.44189453125, 8.9541015625, 9.46630859375, 9.978515625, 10.49072265625, 11.0029296875, 11.51513671875, 12.02734375, 12.53955078125, 13.0517578125, 13.56396484375, 14.076171875, 14.58837890625, 15.1005859375, 15.61279296875, 16.125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 8.0, 15.0, 10.0, 11.0, 24.0, 28.0, 17.0, 20.0, 21.0, 40.0, 43.0, 56.0, 57.0, 76.0, 106.0, 365.0, 1525.0, 136.0, 88.0, 63.0, 52.0, 38.0, 36.0, 39.0, 28.0, 22.0, 22.0, 19.0, 21.0, 15.0, 12.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.8125, -31.599609375, -30.38671875, -29.173828125, -27.9609375, -26.748046875, -25.53515625, -24.322265625, -23.109375, -21.896484375, -20.68359375, -19.470703125, -18.2578125, -17.044921875, -15.83203125, -14.619140625, -13.40625, -12.193359375, -10.98046875, -9.767578125, -8.5546875, -7.341796875, -6.12890625, -4.916015625, -3.703125, -2.490234375, -1.27734375, -0.064453125, 1.1484375, 2.361328125, 3.57421875, 4.787109375, 6.0, 7.212890625, 8.42578125, 9.638671875, 10.8515625, 12.064453125, 13.27734375, 14.490234375, 15.703125, 16.916015625, 18.12890625, 19.341796875, 20.5546875, 21.767578125, 22.98046875, 24.193359375, 25.40625, 26.619140625, 27.83203125, 29.044921875, 30.2578125, 31.470703125, 32.68359375, 33.896484375, 35.109375, 36.322265625, 37.53515625, 38.748046875, 39.9609375, 41.173828125, 42.38671875, 43.599609375, 44.8125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 5.0, 10.0, 9.0, 16.0, 16.0, 26.0, 43.0, 55.0, 62.0, 76.0, 121.0, 171.0, 238.0, 395.0, 906.0, 5953.0, 626308.0, 2498915.0, 10065.0, 1056.0, 429.0, 230.0, 165.0, 109.0, 87.0, 62.0, 50.0, 35.0, 21.0, 20.0, 19.0, 13.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.21875, -49.51611328125, -47.8134765625, -46.11083984375, -44.408203125, -42.70556640625, -41.0029296875, -39.30029296875, -37.59765625, -35.89501953125, -34.1923828125, -32.48974609375, -30.787109375, -29.08447265625, -27.3818359375, -25.67919921875, -23.9765625, -22.27392578125, -20.5712890625, -18.86865234375, -17.166015625, -15.46337890625, -13.7607421875, -12.05810546875, -10.35546875, -8.65283203125, -6.9501953125, -5.24755859375, -3.544921875, -1.84228515625, -0.1396484375, 1.56298828125, 3.265625, 4.96826171875, 6.6708984375, 8.37353515625, 10.076171875, 11.77880859375, 13.4814453125, 15.18408203125, 16.88671875, 18.58935546875, 20.2919921875, 21.99462890625, 23.697265625, 25.39990234375, 27.1025390625, 28.80517578125, 30.5078125, 32.21044921875, 33.9130859375, 35.61572265625, 37.318359375, 39.02099609375, 40.7236328125, 42.42626953125, 44.12890625, 45.83154296875, 47.5341796875, 49.23681640625, 50.939453125, 52.64208984375, 54.3447265625, 56.04736328125, 57.75]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 58.0, 440.0, 438.0, 67.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.07611083984375, -163.00210571289062, -158.9281005859375, -154.8540802001953, -150.7800750732422, -146.70606994628906, -142.63206481933594, -138.55804443359375, -134.48403930664062, -130.4100341796875, -126.33602142333984, -122.26201629638672, -118.18800354003906, -114.11399841308594, -110.03999328613281, -105.96598052978516, -101.89197540283203, -97.8179702758789, -93.74395751953125, -89.66995239257812, -85.59593963623047, -81.52193450927734, -77.44792175292969, -73.37391662597656, -69.29991149902344, -65.22590637207031, -61.151893615722656, -57.07788848876953, -53.003875732421875, -48.92987060546875, -44.85586166381836, -40.78185272216797, -36.70783233642578, -32.63382339477539, -28.559814453125, -24.485807418823242, -20.41179847717285, -16.33778953552246, -12.263782501220703, -8.189773559570312, -4.115764617919922, -0.04175615310668945, 4.032252311706543, 8.106260299682617, 12.180269241333008, 16.2542781829834, 20.328285217285156, 24.402294158935547, 28.476303100585938, 32.55031204223633, 36.62432098388672, 40.698326110839844, 44.7723388671875, 48.846343994140625, 52.920352935791016, 56.994361877441406, 61.0683708190918, 65.14237976074219, 69.21638488769531, 73.29039764404297, 77.3644027709961, 81.43841552734375, 85.51242065429688, 89.58642578125, 93.66043853759766]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 10.0, 8.0, 16.0, 8.0, 20.0, 16.0, 21.0, 24.0, 19.0, 31.0, 22.0, 19.0, 41.0, 47.0, 37.0, 35.0, 35.0, 38.0, 45.0, 38.0, 45.0, 35.0, 31.0, 35.0, 33.0, 32.0, 26.0, 33.0, 19.0, 25.0, 18.0, 17.0, 15.0, 16.0, 11.0, 20.0, 16.0, 9.0, 8.0, 6.0, 6.0, 6.0, 4.0, 3.0, 3.0, 4.0], "bins": [-85.65505981445312, -83.41960144042969, -81.18414306640625, -78.94868469238281, -76.7132339477539, -74.47777557373047, -72.24231719970703, -70.0068588256836, -67.77140045166016, -65.53594207763672, -63.30048751831055, -61.06502914428711, -58.82957077026367, -56.5941162109375, -54.35865783691406, -52.123199462890625, -49.88774490356445, -47.652286529541016, -45.416831970214844, -43.181373596191406, -40.94591522216797, -38.71045684814453, -36.47500228881836, -34.23954391479492, -32.00408935546875, -29.768632888793945, -27.533174514770508, -25.297718048095703, -23.062259674072266, -20.82680320739746, -18.591346740722656, -16.35588836669922, -14.120433807373047, -11.884976387023926, -9.649518966674805, -7.4140625, -5.178605079650879, -2.943147659301758, -0.7076911926269531, 1.527766227722168, 3.763223648071289, 5.99868106842041, 8.234138488769531, 10.469594955444336, 12.705052375793457, 14.940509796142578, 17.175966262817383, 19.411422729492188, 21.646881103515625, 23.88233757019043, 26.117795944213867, 28.353252410888672, 30.58871078491211, 32.82416534423828, 35.05962371826172, 37.295082092285156, 39.530540466308594, 41.76599884033203, 44.0014533996582, 46.23691177368164, 48.47237014770508, 50.70782470703125, 52.94328308105469, 55.178741455078125, 57.4141960144043]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 4.0, 8.0, 5.0, 14.0, 8.0, 10.0, 8.0, 19.0, 19.0, 16.0, 24.0, 24.0, 29.0, 28.0, 36.0, 40.0, 37.0, 35.0, 39.0, 39.0, 49.0, 35.0, 35.0, 38.0, 37.0, 47.0, 26.0, 29.0, 36.0, 32.0, 25.0, 21.0, 20.0, 17.0, 19.0, 27.0, 10.0, 9.0, 10.0, 11.0, 11.0, 3.0, 7.0, 3.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8203125, -11.433837890625, -11.04736328125, -10.660888671875, -10.2744140625, -9.887939453125, -9.50146484375, -9.114990234375, -8.728515625, -8.342041015625, -7.95556640625, -7.569091796875, -7.1826171875, -6.796142578125, -6.40966796875, -6.023193359375, -5.63671875, -5.250244140625, -4.86376953125, -4.477294921875, -4.0908203125, -3.704345703125, -3.31787109375, -2.931396484375, -2.544921875, -2.158447265625, -1.77197265625, -1.385498046875, -0.9990234375, -0.612548828125, -0.22607421875, 0.160400390625, 0.546875, 0.933349609375, 1.31982421875, 1.706298828125, 2.0927734375, 2.479248046875, 2.86572265625, 3.252197265625, 3.638671875, 4.025146484375, 4.41162109375, 4.798095703125, 5.1845703125, 5.571044921875, 5.95751953125, 6.343994140625, 6.73046875, 7.116943359375, 7.50341796875, 7.889892578125, 8.2763671875, 8.662841796875, 9.04931640625, 9.435791015625, 9.822265625, 10.208740234375, 10.59521484375, 10.981689453125, 11.3681640625, 11.754638671875, 12.14111328125, 12.527587890625, 12.9140625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 7.0, 5.0, 10.0, 9.0, 12.0, 10.0, 12.0, 9.0, 14.0, 18.0, 26.0, 24.0, 24.0, 29.0, 32.0, 53.0, 95.0, 123.0, 287.0, 685.0, 3163.0, 38401.0, 2055788.0, 2052705.0, 37960.0, 3187.0, 765.0, 283.0, 122.0, 105.0, 62.0, 42.0, 24.0, 32.0, 20.0, 19.0, 20.0, 14.0, 16.0, 9.0, 13.0, 6.0, 9.0, 10.0, 8.0, 1.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0], "bins": [-39.25, -38.060546875, -36.87109375, -35.681640625, -34.4921875, -33.302734375, -32.11328125, -30.923828125, -29.734375, -28.544921875, -27.35546875, -26.166015625, -24.9765625, -23.787109375, -22.59765625, -21.408203125, -20.21875, -19.029296875, -17.83984375, -16.650390625, -15.4609375, -14.271484375, -13.08203125, -11.892578125, -10.703125, -9.513671875, -8.32421875, -7.134765625, -5.9453125, -4.755859375, -3.56640625, -2.376953125, -1.1875, 0.001953125, 1.19140625, 2.380859375, 3.5703125, 4.759765625, 5.94921875, 7.138671875, 8.328125, 9.517578125, 10.70703125, 11.896484375, 13.0859375, 14.275390625, 15.46484375, 16.654296875, 17.84375, 19.033203125, 20.22265625, 21.412109375, 22.6015625, 23.791015625, 24.98046875, 26.169921875, 27.359375, 28.548828125, 29.73828125, 30.927734375, 32.1171875, 33.306640625, 34.49609375, 35.685546875, 36.875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 9.0, 12.0, 15.0, 11.0, 27.0, 55.0, 47.0, 57.0, 92.0, 162.0, 278.0, 365.0, 493.0, 558.0, 553.0, 436.0, 280.0, 181.0, 117.0, 84.0, 56.0, 42.0, 36.0, 16.0, 17.0, 19.0, 16.0, 12.0, 4.0, 4.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.78125, -16.252197265625, -15.72314453125, -15.194091796875, -14.6650390625, -14.135986328125, -13.60693359375, -13.077880859375, -12.548828125, -12.019775390625, -11.49072265625, -10.961669921875, -10.4326171875, -9.903564453125, -9.37451171875, -8.845458984375, -8.31640625, -7.787353515625, -7.25830078125, -6.729248046875, -6.2001953125, -5.671142578125, -5.14208984375, -4.613037109375, -4.083984375, -3.554931640625, -3.02587890625, -2.496826171875, -1.9677734375, -1.438720703125, -0.90966796875, -0.380615234375, 0.1484375, 0.677490234375, 1.20654296875, 1.735595703125, 2.2646484375, 2.793701171875, 3.32275390625, 3.851806640625, 4.380859375, 4.909912109375, 5.43896484375, 5.968017578125, 6.4970703125, 7.026123046875, 7.55517578125, 8.084228515625, 8.61328125, 9.142333984375, 9.67138671875, 10.200439453125, 10.7294921875, 11.258544921875, 11.78759765625, 12.316650390625, 12.845703125, 13.374755859375, 13.90380859375, 14.432861328125, 14.9619140625, 15.490966796875, 16.02001953125, 16.549072265625, 17.078125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 6.0, 11.0, 10.0, 17.0, 16.0, 36.0, 37.0, 79.0, 140.0, 216.0, 580.0, 2057.0, 29225.0, 3606772.0, 543098.0, 9882.0, 1251.0, 375.0, 176.0, 93.0, 61.0, 35.0, 35.0, 20.0, 10.0, 8.0, 13.0, 9.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-66.8125, -64.947265625, -63.08203125, -61.216796875, -59.3515625, -57.486328125, -55.62109375, -53.755859375, -51.890625, -50.025390625, -48.16015625, -46.294921875, -44.4296875, -42.564453125, -40.69921875, -38.833984375, -36.96875, -35.103515625, -33.23828125, -31.373046875, -29.5078125, -27.642578125, -25.77734375, -23.912109375, -22.046875, -20.181640625, -18.31640625, -16.451171875, -14.5859375, -12.720703125, -10.85546875, -8.990234375, -7.125, -5.259765625, -3.39453125, -1.529296875, 0.3359375, 2.201171875, 4.06640625, 5.931640625, 7.796875, 9.662109375, 11.52734375, 13.392578125, 15.2578125, 17.123046875, 18.98828125, 20.853515625, 22.71875, 24.583984375, 26.44921875, 28.314453125, 30.1796875, 32.044921875, 33.91015625, 35.775390625, 37.640625, 39.505859375, 41.37109375, 43.236328125, 45.1015625, 46.966796875, 48.83203125, 50.697265625, 52.5625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 141.0, 668.0, 194.0, 10.0, 0.0, 0.0, 1.0], "bins": [-630.7893676757812, -620.00732421875, -609.2252197265625, -598.4431762695312, -587.6611328125, -576.8790893554688, -566.0969848632812, -555.31494140625, -544.5328979492188, -533.7508544921875, -522.96875, -512.1867065429688, -501.4046630859375, -490.6225891113281, -479.84051513671875, -469.0584716796875, -458.2763977050781, -447.49432373046875, -436.7122802734375, -425.9302062988281, -415.1481628417969, -404.3660888671875, -393.58404541015625, -382.8019714355469, -372.0198974609375, -361.2378234863281, -350.4557800292969, -339.6737060546875, -328.89166259765625, -318.1095886230469, -307.3275146484375, -296.54547119140625, -285.763427734375, -274.9813537597656, -264.1993103027344, -253.417236328125, -242.63519287109375, -231.85311889648438, -221.07106018066406, -210.28900146484375, -199.5069580078125, -188.7248992919922, -177.94284057617188, -167.1607666015625, -156.37872314453125, -145.59664916992188, -134.81459045410156, -124.03253173828125, -113.25047302246094, -102.46841430664062, -91.68635559082031, -80.90428924560547, -70.12223052978516, -59.340171813964844, -48.55810546875, -37.77604675292969, -26.99398422241211, -16.211923599243164, -5.429862976074219, 5.352199554443359, 16.134258270263672, 26.916316986083984, 37.69838333129883, 48.48044204711914, 59.26250076293945]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 4.0, 4.0, 9.0, 6.0, 5.0, 25.0, 12.0, 18.0, 14.0, 22.0, 20.0, 22.0, 27.0, 32.0, 36.0, 26.0, 39.0, 34.0, 45.0, 45.0, 41.0, 28.0, 44.0, 34.0, 31.0, 39.0, 42.0, 33.0, 33.0, 31.0, 29.0, 24.0, 29.0, 14.0, 20.0, 13.0, 15.0, 12.0, 18.0, 5.0, 4.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-52.5272102355957, -50.97853469848633, -49.42985916137695, -47.88118362426758, -46.3325080871582, -44.78383255004883, -43.23515701293945, -41.68648147583008, -40.1378059387207, -38.58913040161133, -37.04045486450195, -35.49177932739258, -33.9431037902832, -32.39442825317383, -30.845752716064453, -29.297077178955078, -27.748401641845703, -26.199726104736328, -24.651050567626953, -23.102375030517578, -21.553699493408203, -20.005023956298828, -18.456348419189453, -16.907672882080078, -15.358997344970703, -13.810321807861328, -12.261646270751953, -10.712970733642578, -9.164295196533203, -7.615619659423828, -6.066944122314453, -4.518268585205078, -2.969593048095703, -1.4209175109863281, 0.12775802612304688, 1.6764335632324219, 3.225109100341797, 4.773784637451172, 6.322460174560547, 7.871135711669922, 9.419811248779297, 10.968486785888672, 12.517162322998047, 14.065837860107422, 15.614513397216797, 17.163188934326172, 18.711864471435547, 20.260540008544922, 21.809215545654297, 23.357891082763672, 24.906566619873047, 26.455242156982422, 28.003917694091797, 29.552593231201172, 31.101268768310547, 32.64994430541992, 34.1986198425293, 35.74729537963867, 37.29597091674805, 38.84464645385742, 40.3933219909668, 41.94199752807617, 43.49067306518555, 45.03934860229492, 46.5880241394043]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 8.0, 7.0, 13.0, 9.0, 11.0, 16.0, 13.0, 12.0, 25.0, 23.0, 16.0, 35.0, 26.0, 25.0, 37.0, 39.0, 28.0, 38.0, 35.0, 40.0, 40.0, 38.0, 33.0, 38.0, 47.0, 37.0, 33.0, 31.0, 23.0, 25.0, 24.0, 25.0, 19.0, 17.0, 16.0, 19.0, 13.0, 11.0, 15.0, 17.0, 5.0, 3.0, 8.0, 6.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.6953125, -11.3194580078125, -10.943603515625, -10.5677490234375, -10.19189453125, -9.8160400390625, -9.440185546875, -9.0643310546875, -8.6884765625, -8.3126220703125, -7.936767578125, -7.5609130859375, -7.18505859375, -6.8092041015625, -6.433349609375, -6.0574951171875, -5.681640625, -5.3057861328125, -4.929931640625, -4.5540771484375, -4.17822265625, -3.8023681640625, -3.426513671875, -3.0506591796875, -2.6748046875, -2.2989501953125, -1.923095703125, -1.5472412109375, -1.17138671875, -0.7955322265625, -0.419677734375, -0.0438232421875, 0.33203125, 0.7078857421875, 1.083740234375, 1.4595947265625, 1.83544921875, 2.2113037109375, 2.587158203125, 2.9630126953125, 3.3388671875, 3.7147216796875, 4.090576171875, 4.4664306640625, 4.84228515625, 5.2181396484375, 5.593994140625, 5.9698486328125, 6.345703125, 6.7215576171875, 7.097412109375, 7.4732666015625, 7.84912109375, 8.2249755859375, 8.600830078125, 8.9766845703125, 9.3525390625, 9.7283935546875, 10.104248046875, 10.4801025390625, 10.85595703125, 11.2318115234375, 11.607666015625, 11.9835205078125, 12.359375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 9.0, 9.0, 13.0, 16.0, 35.0, 41.0, 64.0, 90.0, 146.0, 199.0, 278.0, 459.0, 649.0, 940.0, 1456.0, 1996.0, 2924.0, 4207.0, 6195.0, 9092.0, 13000.0, 19051.0, 28719.0, 44578.0, 73205.0, 139180.0, 321608.0, 158518.0, 79679.0, 47152.0, 30108.0, 20501.0, 13797.0, 9522.0, 6638.0, 4602.0, 3134.0, 2156.0, 1449.0, 1000.0, 704.0, 459.0, 298.0, 246.0, 164.0, 82.0, 66.0, 49.0, 34.0, 16.0, 10.0, 7.0, 9.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-2.17578125, -2.10687255859375, -2.0379638671875, -1.96905517578125, -1.900146484375, -1.83123779296875, -1.7623291015625, -1.69342041015625, -1.62451171875, -1.55560302734375, -1.4866943359375, -1.41778564453125, -1.348876953125, -1.27996826171875, -1.2110595703125, -1.14215087890625, -1.0732421875, -1.00433349609375, -0.9354248046875, -0.86651611328125, -0.797607421875, -0.72869873046875, -0.6597900390625, -0.59088134765625, -0.52197265625, -0.45306396484375, -0.3841552734375, -0.31524658203125, -0.246337890625, -0.17742919921875, -0.1085205078125, -0.03961181640625, 0.029296875, 0.09820556640625, 0.1671142578125, 0.23602294921875, 0.304931640625, 0.37384033203125, 0.4427490234375, 0.51165771484375, 0.58056640625, 0.64947509765625, 0.7183837890625, 0.78729248046875, 0.856201171875, 0.92510986328125, 0.9940185546875, 1.06292724609375, 1.1318359375, 1.20074462890625, 1.2696533203125, 1.33856201171875, 1.407470703125, 1.47637939453125, 1.5452880859375, 1.61419677734375, 1.68310546875, 1.75201416015625, 1.8209228515625, 1.88983154296875, 1.958740234375, 2.02764892578125, 2.0965576171875, 2.16546630859375, 2.234375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 5.0, 0.0, 1.0, 2.0, 5.0, 8.0, 7.0, 2.0, 1.0, 7.0, 11.0, 15.0, 17.0, 17.0, 19.0, 13.0, 20.0, 18.0, 18.0, 16.0, 20.0, 32.0, 32.0, 36.0, 44.0, 19.0, 46.0, 35.0, 47.0, 1057.0, 37.0, 39.0, 32.0, 35.0, 24.0, 30.0, 34.0, 26.0, 19.0, 35.0, 21.0, 29.0, 13.0, 12.0, 20.0, 14.0, 10.0, 6.0, 13.0, 5.0, 1.0, 2.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.9140625, -6.68603515625, -6.4580078125, -6.22998046875, -6.001953125, -5.77392578125, -5.5458984375, -5.31787109375, -5.08984375, -4.86181640625, -4.6337890625, -4.40576171875, -4.177734375, -3.94970703125, -3.7216796875, -3.49365234375, -3.265625, -3.03759765625, -2.8095703125, -2.58154296875, -2.353515625, -2.12548828125, -1.8974609375, -1.66943359375, -1.44140625, -1.21337890625, -0.9853515625, -0.75732421875, -0.529296875, -0.30126953125, -0.0732421875, 0.15478515625, 0.3828125, 0.61083984375, 0.8388671875, 1.06689453125, 1.294921875, 1.52294921875, 1.7509765625, 1.97900390625, 2.20703125, 2.43505859375, 2.6630859375, 2.89111328125, 3.119140625, 3.34716796875, 3.5751953125, 3.80322265625, 4.03125, 4.25927734375, 4.4873046875, 4.71533203125, 4.943359375, 5.17138671875, 5.3994140625, 5.62744140625, 5.85546875, 6.08349609375, 6.3115234375, 6.53955078125, 6.767578125, 6.99560546875, 7.2236328125, 7.45166015625, 7.6796875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 6.0, 1.0, 6.0, 11.0, 11.0, 17.0, 19.0, 33.0, 62.0, 58.0, 77.0, 119.0, 228.0, 303.0, 409.0, 677.0, 894.0, 1301.0, 2010.0, 2915.0, 4396.0, 6627.0, 9666.0, 14236.0, 21046.0, 31121.0, 47735.0, 79779.0, 154003.0, 1367792.0, 139782.0, 74128.0, 46009.0, 29680.0, 19620.0, 13367.0, 9292.0, 6292.0, 4327.0, 2780.0, 2034.0, 1332.0, 920.0, 631.0, 440.0, 295.0, 225.0, 110.0, 72.0, 81.0, 60.0, 29.0, 19.0, 20.0, 16.0, 13.0, 3.0, 5.0, 4.0, 2.0], "bins": [-2.291015625, -2.222503662109375, -2.15399169921875, -2.085479736328125, -2.0169677734375, -1.948455810546875, -1.87994384765625, -1.811431884765625, -1.742919921875, -1.674407958984375, -1.60589599609375, -1.537384033203125, -1.4688720703125, -1.400360107421875, -1.33184814453125, -1.263336181640625, -1.19482421875, -1.126312255859375, -1.05780029296875, -0.989288330078125, -0.9207763671875, -0.852264404296875, -0.78375244140625, -0.715240478515625, -0.646728515625, -0.578216552734375, -0.50970458984375, -0.441192626953125, -0.3726806640625, -0.304168701171875, -0.23565673828125, -0.167144775390625, -0.0986328125, -0.030120849609375, 0.03839111328125, 0.106903076171875, 0.1754150390625, 0.243927001953125, 0.31243896484375, 0.380950927734375, 0.449462890625, 0.517974853515625, 0.58648681640625, 0.654998779296875, 0.7235107421875, 0.792022705078125, 0.86053466796875, 0.929046630859375, 0.99755859375, 1.066070556640625, 1.13458251953125, 1.203094482421875, 1.2716064453125, 1.340118408203125, 1.40863037109375, 1.477142333984375, 1.545654296875, 1.614166259765625, 1.68267822265625, 1.751190185546875, 1.8197021484375, 1.888214111328125, 1.95672607421875, 2.025238037109375, 2.09375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 1.0, 2.0, 2.0, 5.0, 4.0, 10.0, 6.0, 9.0, 8.0, 9.0, 19.0, 24.0, 22.0, 20.0, 28.0, 28.0, 47.0, 46.0, 42.0, 61.0, 80.0, 75.0, 74.0, 48.0, 58.0, 48.0, 45.0, 31.0, 25.0, 21.0, 20.0, 15.0, 18.0, 11.0, 8.0, 4.0, 10.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0013227462768554688, -0.001277923583984375, -0.0012331008911132812, -0.0011882781982421875, -0.0011434555053710938, -0.0010986328125, -0.0010538101196289062, -0.0010089874267578125, -0.0009641647338867188, -0.000919342041015625, -0.0008745193481445312, -0.0008296966552734375, -0.0007848739624023438, -0.00074005126953125, -0.0006952285766601562, -0.0006504058837890625, -0.0006055831909179688, -0.000560760498046875, -0.0005159378051757812, -0.0004711151123046875, -0.00042629241943359375, -0.0003814697265625, -0.00033664703369140625, -0.0002918243408203125, -0.00024700164794921875, -0.000202178955078125, -0.00015735626220703125, -0.0001125335693359375, -6.771087646484375e-05, -2.288818359375e-05, 2.193450927734375e-05, 6.67572021484375e-05, 0.00011157989501953125, 0.000156402587890625, 0.00020122528076171875, 0.0002460479736328125, 0.00029087066650390625, 0.000335693359375, 0.00038051605224609375, 0.0004253387451171875, 0.00047016143798828125, 0.000514984130859375, 0.0005598068237304688, 0.0006046295166015625, 0.0006494522094726562, 0.00069427490234375, 0.0007390975952148438, 0.0007839202880859375, 0.0008287429809570312, 0.000873565673828125, 0.0009183883666992188, 0.0009632110595703125, 0.0010080337524414062, 0.0010528564453125, 0.0010976791381835938, 0.0011425018310546875, 0.0011873245239257812, 0.001232147216796875, 0.0012769699096679688, 0.0013217926025390625, 0.0013666152954101562, 0.00141143798828125, 0.0014562606811523438, 0.0015010833740234375, 0.0015459060668945312]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 6.0, 5.0, 7.0, 9.0, 8.0, 13.0, 12.0, 22.0, 22.0, 17.0, 44.0, 55.0, 53.0, 101.0, 136.0, 196.0, 349.0, 816.0, 36485.0, 1006810.0, 1947.0, 528.0, 294.0, 129.0, 99.0, 82.0, 61.0, 44.0, 34.0, 38.0, 29.0, 14.0, 16.0, 16.0, 10.0, 9.0, 7.0, 9.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0], "bins": [-0.033050537109375, -0.032138824462890625, -0.03122711181640625, -0.030315399169921875, -0.0294036865234375, -0.028491973876953125, -0.02758026123046875, -0.026668548583984375, -0.0257568359375, -0.024845123291015625, -0.02393341064453125, -0.023021697998046875, -0.0221099853515625, -0.021198272705078125, -0.02028656005859375, -0.019374847412109375, -0.018463134765625, -0.017551422119140625, -0.01663970947265625, -0.015727996826171875, -0.0148162841796875, -0.013904571533203125, -0.01299285888671875, -0.012081146240234375, -0.01116943359375, -0.010257720947265625, -0.00934600830078125, -0.008434295654296875, -0.0075225830078125, -0.006610870361328125, -0.00569915771484375, -0.004787445068359375, -0.003875732421875, -0.002964019775390625, -0.00205230712890625, -0.001140594482421875, -0.0002288818359375, 0.000682830810546875, 0.00159454345703125, 0.002506256103515625, 0.00341796875, 0.004329681396484375, 0.00524139404296875, 0.006153106689453125, 0.0070648193359375, 0.007976531982421875, 0.00888824462890625, 0.009799957275390625, 0.010711669921875, 0.011623382568359375, 0.01253509521484375, 0.013446807861328125, 0.0143585205078125, 0.015270233154296875, 0.01618194580078125, 0.017093658447265625, 0.01800537109375, 0.018917083740234375, 0.01982879638671875, 0.020740509033203125, 0.0216522216796875, 0.022563934326171875, 0.02347564697265625, 0.024387359619140625, 0.025299072265625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 49.0, 474.0, 419.0, 60.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004267726559191942, -0.00415235897526145, -0.004036991391330957, -0.003921623807400465, -0.0038062562234699726, -0.00369088863953948, -0.0035755212884396315, -0.003460153704509139, -0.0033447861205786467, -0.0032294185366481543, -0.003114050952717662, -0.0029986833687871695, -0.0028833160176873207, -0.0027679484337568283, -0.002652580849826336, -0.0025372132658958435, -0.002421845681965351, -0.0023064780980348587, -0.0021911105141043663, -0.002075742930173874, -0.0019603753462433815, -0.001845007878728211, -0.0017296404112130404, -0.001614272827282548, -0.0014989052433520555, -0.0013835376594215631, -0.0012681700754910707, -0.0011528026079759002, -0.0010374350240454078, -0.0009220674401149154, -0.0008066999143920839, -0.0006913323886692524, -0.00057596480473876, -0.00046059724991209805, -0.0003452296950854361, -0.00022986214025877416, -0.00011449458543211222, 8.729984983801842e-07, 0.00011624052422121167, 0.00023160804994404316, 0.00034697563387453556, 0.0004623431887011975, 0.0005777107435278594, 0.0006930782692506909, 0.0008084458531811833, 0.0009238134371116757, 0.0010391809046268463, 0.0011545484885573387, 0.0012699160724878311, 0.0013852836564183235, 0.001500651240348816, 0.0016160187078639865, 0.001731386291794479, 0.0018467538757249713, 0.001962121343240142, 0.0020774889271706343, 0.0021928565111011267, 0.002308224095031619, 0.0024235916789621115, 0.002538959262892604, 0.0026543266139924526, 0.002769694197922945, 0.0028850617818534374, 0.00300042936578393, 0.0031157969497144222]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 3.0, 5.0, 12.0, 7.0, 7.0, 11.0, 13.0, 16.0, 13.0, 18.0, 22.0, 19.0, 20.0, 28.0, 20.0, 35.0, 34.0, 25.0, 36.0, 37.0, 29.0, 36.0, 29.0, 31.0, 36.0, 45.0, 36.0, 33.0, 34.0, 33.0, 33.0, 30.0, 23.0, 29.0, 23.0, 25.0, 24.0, 12.0, 13.0, 10.0, 10.0, 9.0, 8.0, 4.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0], "bins": [-0.000674903392791748, -0.0006539048627018929, -0.0006329063326120377, -0.0006119078025221825, -0.0005909092724323273, -0.0005699107423424721, -0.0005489122122526169, -0.0005279136821627617, -0.0005069151520729065, -0.0004859166219830513, -0.0004649180918931961, -0.0004439195618033409, -0.0004229210317134857, -0.0004019225016236305, -0.00038092397153377533, -0.00035992544144392014, -0.00033892691135406494, -0.00031792838126420975, -0.00029692985117435455, -0.00027593132108449936, -0.00025493279099464417, -0.00023393426090478897, -0.00021293573081493378, -0.00019193720072507858, -0.0001709386706352234, -0.0001499401405453682, -0.000128941610455513, -0.0001079430803656578, -8.694455027580261e-05, -6.594602018594742e-05, -4.4947490096092224e-05, -2.394896000623703e-05, -2.950429916381836e-06, 1.8048100173473358e-05, 3.904663026332855e-05, 6.0045160353183746e-05, 8.104369044303894e-05, 0.00010204222053289413, 0.00012304075062274933, 0.00014403928071260452, 0.00016503781080245972, 0.0001860363408923149, 0.0002070348709821701, 0.0002280334010720253, 0.0002490319311618805, 0.0002700304612517357, 0.0002910289913415909, 0.0003120275214314461, 0.00033302605152130127, 0.00035402458161115646, 0.00037502311170101166, 0.00039602164179086685, 0.00041702017188072205, 0.00043801870197057724, 0.00045901723206043243, 0.00048001576215028763, 0.0005010142922401428, 0.000522012822329998, 0.0005430113524198532, 0.0005640098825097084, 0.0005850084125995636, 0.0006060069426894188, 0.000627005472779274, 0.0006480040028691292, 0.0006690025329589844]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 8.0, 7.0, 13.0, 9.0, 11.0, 16.0, 13.0, 12.0, 25.0, 23.0, 16.0, 35.0, 26.0, 25.0, 37.0, 39.0, 28.0, 38.0, 35.0, 40.0, 40.0, 38.0, 33.0, 38.0, 47.0, 37.0, 33.0, 31.0, 23.0, 25.0, 24.0, 25.0, 19.0, 17.0, 16.0, 19.0, 13.0, 11.0, 15.0, 17.0, 5.0, 3.0, 8.0, 6.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.6953125, -11.3194580078125, -10.943603515625, -10.5677490234375, -10.19189453125, -9.8160400390625, -9.440185546875, -9.0643310546875, -8.6884765625, -8.3126220703125, -7.936767578125, -7.5609130859375, -7.18505859375, -6.8092041015625, -6.433349609375, -6.0574951171875, -5.681640625, -5.3057861328125, -4.929931640625, -4.5540771484375, -4.17822265625, -3.8023681640625, -3.426513671875, -3.0506591796875, -2.6748046875, -2.2989501953125, -1.923095703125, -1.5472412109375, -1.17138671875, -0.7955322265625, -0.419677734375, -0.0438232421875, 0.33203125, 0.7078857421875, 1.083740234375, 1.4595947265625, 1.83544921875, 2.2113037109375, 2.587158203125, 2.9630126953125, 3.3388671875, 3.7147216796875, 4.090576171875, 4.4664306640625, 4.84228515625, 5.2181396484375, 5.593994140625, 5.9698486328125, 6.345703125, 6.7215576171875, 7.097412109375, 7.4732666015625, 7.84912109375, 8.2249755859375, 8.600830078125, 8.9766845703125, 9.3525390625, 9.7283935546875, 10.104248046875, 10.4801025390625, 10.85595703125, 11.2318115234375, 11.607666015625, 11.9835205078125, 12.359375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 8.0, 9.0, 12.0, 16.0, 21.0, 34.0, 35.0, 68.0, 84.0, 95.0, 143.0, 149.0, 250.0, 322.0, 426.0, 669.0, 1001.0, 1949.0, 3897.0, 8741.0, 23006.0, 74724.0, 289277.0, 452425.0, 129059.0, 37299.0, 12913.0, 5349.0, 2549.0, 1384.0, 780.0, 485.0, 341.0, 267.0, 181.0, 155.0, 114.0, 76.0, 67.0, 48.0, 40.0, 19.0, 26.0, 11.0, 13.0, 10.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.96875, -12.55322265625, -12.1376953125, -11.72216796875, -11.306640625, -10.89111328125, -10.4755859375, -10.06005859375, -9.64453125, -9.22900390625, -8.8134765625, -8.39794921875, -7.982421875, -7.56689453125, -7.1513671875, -6.73583984375, -6.3203125, -5.90478515625, -5.4892578125, -5.07373046875, -4.658203125, -4.24267578125, -3.8271484375, -3.41162109375, -2.99609375, -2.58056640625, -2.1650390625, -1.74951171875, -1.333984375, -0.91845703125, -0.5029296875, -0.08740234375, 0.328125, 0.74365234375, 1.1591796875, 1.57470703125, 1.990234375, 2.40576171875, 2.8212890625, 3.23681640625, 3.65234375, 4.06787109375, 4.4833984375, 4.89892578125, 5.314453125, 5.72998046875, 6.1455078125, 6.56103515625, 6.9765625, 7.39208984375, 7.8076171875, 8.22314453125, 8.638671875, 9.05419921875, 9.4697265625, 9.88525390625, 10.30078125, 10.71630859375, 11.1318359375, 11.54736328125, 11.962890625, 12.37841796875, 12.7939453125, 13.20947265625, 13.625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 12.0, 16.0, 9.0, 17.0, 12.0, 19.0, 25.0, 17.0, 35.0, 34.0, 48.0, 50.0, 61.0, 102.0, 188.0, 1554.0, 284.0, 110.0, 71.0, 41.0, 41.0, 41.0, 38.0, 25.0, 27.0, 27.0, 27.0, 23.0, 11.0, 16.0, 9.0, 8.0, 5.0, 4.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0], "bins": [-36.15625, -35.08349609375, -34.0107421875, -32.93798828125, -31.865234375, -30.79248046875, -29.7197265625, -28.64697265625, -27.57421875, -26.50146484375, -25.4287109375, -24.35595703125, -23.283203125, -22.21044921875, -21.1376953125, -20.06494140625, -18.9921875, -17.91943359375, -16.8466796875, -15.77392578125, -14.701171875, -13.62841796875, -12.5556640625, -11.48291015625, -10.41015625, -9.33740234375, -8.2646484375, -7.19189453125, -6.119140625, -5.04638671875, -3.9736328125, -2.90087890625, -1.828125, -0.75537109375, 0.3173828125, 1.39013671875, 2.462890625, 3.53564453125, 4.6083984375, 5.68115234375, 6.75390625, 7.82666015625, 8.8994140625, 9.97216796875, 11.044921875, 12.11767578125, 13.1904296875, 14.26318359375, 15.3359375, 16.40869140625, 17.4814453125, 18.55419921875, 19.626953125, 20.69970703125, 21.7724609375, 22.84521484375, 23.91796875, 24.99072265625, 26.0634765625, 27.13623046875, 28.208984375, 29.28173828125, 30.3544921875, 31.42724609375, 32.5]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 3.0, 2.0, 3.0, 6.0, 5.0, 11.0, 14.0, 8.0, 19.0, 15.0, 21.0, 35.0, 38.0, 65.0, 70.0, 70.0, 124.0, 168.0, 251.0, 343.0, 732.0, 2991.0, 68261.0, 3010023.0, 57685.0, 2875.0, 677.0, 332.0, 220.0, 174.0, 116.0, 72.0, 56.0, 39.0, 53.0, 31.0, 27.0, 17.0, 9.0, 14.0, 14.0, 9.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-54.125, -52.55517578125, -50.9853515625, -49.41552734375, -47.845703125, -46.27587890625, -44.7060546875, -43.13623046875, -41.56640625, -39.99658203125, -38.4267578125, -36.85693359375, -35.287109375, -33.71728515625, -32.1474609375, -30.57763671875, -29.0078125, -27.43798828125, -25.8681640625, -24.29833984375, -22.728515625, -21.15869140625, -19.5888671875, -18.01904296875, -16.44921875, -14.87939453125, -13.3095703125, -11.73974609375, -10.169921875, -8.60009765625, -7.0302734375, -5.46044921875, -3.890625, -2.32080078125, -0.7509765625, 0.81884765625, 2.388671875, 3.95849609375, 5.5283203125, 7.09814453125, 8.66796875, 10.23779296875, 11.8076171875, 13.37744140625, 14.947265625, 16.51708984375, 18.0869140625, 19.65673828125, 21.2265625, 22.79638671875, 24.3662109375, 25.93603515625, 27.505859375, 29.07568359375, 30.6455078125, 32.21533203125, 33.78515625, 35.35498046875, 36.9248046875, 38.49462890625, 40.064453125, 41.63427734375, 43.2041015625, 44.77392578125, 46.34375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 594.0, 422.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-301.8596496582031, -289.7641906738281, -277.668701171875, -265.5732421875, -253.47776794433594, -241.38229370117188, -229.28683471679688, -217.1913604736328, -205.09588623046875, -193.0004119873047, -180.90493774414062, -168.80947875976562, -156.71400451660156, -144.6185302734375, -132.5230712890625, -120.42759704589844, -108.33212280273438, -96.23664855957031, -84.14118194580078, -72.04571533203125, -59.95024108886719, -47.85477066040039, -35.759300231933594, -23.663833618164062, -11.568359375, 0.5271110534667969, 12.622581481933594, 24.71805191040039, 36.81352233886719, 48.908992767333984, 61.00446319580078, 73.09992980957031, 85.1954345703125, 97.29090881347656, 109.3863754272461, 121.48184204101562, 133.5773162841797, 145.67279052734375, 157.76824951171875, 169.8637237548828, 181.95919799804688, 194.05467224121094, 206.150146484375, 218.24560546875, 230.34107971191406, 242.43655395507812, 254.53201293945312, 266.62750244140625, 278.72296142578125, 290.81842041015625, 302.9139099121094, 315.0093688964844, 327.1048583984375, 339.2003173828125, 351.2957763671875, 363.3912353515625, 375.4867248535156, 387.5821838378906, 399.67767333984375, 411.77313232421875, 423.86859130859375, 435.9640808105469, 448.0595397949219, 460.155029296875, 472.25048828125]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 10.0, 7.0, 8.0, 13.0, 15.0, 21.0, 23.0, 25.0, 23.0, 33.0, 27.0, 40.0, 41.0, 39.0, 47.0, 54.0, 43.0, 43.0, 43.0, 43.0, 38.0, 56.0, 36.0, 35.0, 46.0, 35.0, 27.0, 26.0, 18.0, 12.0, 15.0, 12.0, 3.0, 11.0, 7.0, 11.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-81.05384826660156, -78.62247467041016, -76.19110107421875, -73.75971984863281, -71.3283462524414, -68.89697265625, -66.4655990600586, -64.03422546386719, -61.60285186767578, -59.171478271484375, -56.7401008605957, -54.3087272644043, -51.87735366821289, -49.44597625732422, -47.01460266113281, -44.583229064941406, -42.151851654052734, -39.72047805786133, -37.289100646972656, -34.85772705078125, -32.426353454589844, -29.994977951049805, -27.563602447509766, -25.13222885131836, -22.70085334777832, -20.26947784423828, -17.838104248046875, -15.406728744506836, -12.975354194641113, -10.54397964477539, -8.112604141235352, -5.681230545043945, -3.2498550415039062, -0.8184802532196045, 1.6128945350646973, 4.044269561767578, 6.475644111633301, 8.907018661499023, 11.338394165039062, 13.769767761230469, 16.201143264770508, 18.632518768310547, 21.063892364501953, 23.495267868041992, 25.92664337158203, 28.358016967773438, 30.789392471313477, 33.22076416015625, 35.65214157104492, 38.08351516723633, 40.514892578125, 42.946266174316406, 45.37763977050781, 47.80901336669922, 50.24039077758789, 52.6717643737793, 55.10314178466797, 57.534515380859375, 59.96589279174805, 62.39726638793945, 64.82864379882812, 67.26001739501953, 69.69139099121094, 72.12276458740234, 74.55413818359375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 6.0, 6.0, 7.0, 13.0, 5.0, 16.0, 17.0, 17.0, 16.0, 20.0, 19.0, 18.0, 29.0, 29.0, 30.0, 41.0, 37.0, 31.0, 24.0, 40.0, 40.0, 36.0, 43.0, 44.0, 35.0, 26.0, 44.0, 35.0, 28.0, 22.0, 31.0, 22.0, 19.0, 18.0, 21.0, 17.0, 15.0, 11.0, 15.0, 13.0, 11.0, 11.0, 7.0, 5.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.2890625, -11.913818359375, -11.53857421875, -11.163330078125, -10.7880859375, -10.412841796875, -10.03759765625, -9.662353515625, -9.287109375, -8.911865234375, -8.53662109375, -8.161376953125, -7.7861328125, -7.410888671875, -7.03564453125, -6.660400390625, -6.28515625, -5.909912109375, -5.53466796875, -5.159423828125, -4.7841796875, -4.408935546875, -4.03369140625, -3.658447265625, -3.283203125, -2.907958984375, -2.53271484375, -2.157470703125, -1.7822265625, -1.406982421875, -1.03173828125, -0.656494140625, -0.28125, 0.093994140625, 0.46923828125, 0.844482421875, 1.2197265625, 1.594970703125, 1.97021484375, 2.345458984375, 2.720703125, 3.095947265625, 3.47119140625, 3.846435546875, 4.2216796875, 4.596923828125, 4.97216796875, 5.347412109375, 5.72265625, 6.097900390625, 6.47314453125, 6.848388671875, 7.2236328125, 7.598876953125, 7.97412109375, 8.349365234375, 8.724609375, 9.099853515625, 9.47509765625, 9.850341796875, 10.2255859375, 10.600830078125, 10.97607421875, 11.351318359375, 11.7265625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 7.0, 5.0, 4.0, 14.0, 8.0, 12.0, 9.0, 19.0, 16.0, 21.0, 31.0, 42.0, 39.0, 52.0, 56.0, 83.0, 122.0, 152.0, 189.0, 260.0, 300.0, 372.0, 913.0, 4173360.0, 15851.0, 588.0, 413.0, 277.0, 262.0, 178.0, 149.0, 104.0, 82.0, 54.0, 40.0, 40.0, 31.0, 31.0, 16.0, 15.0, 13.0, 12.0, 9.0, 12.0, 5.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0], "bins": [-345.5, -335.28515625, -325.0703125, -314.85546875, -304.640625, -294.42578125, -284.2109375, -273.99609375, -263.78125, -253.56640625, -243.3515625, -233.13671875, -222.921875, -212.70703125, -202.4921875, -192.27734375, -182.0625, -171.84765625, -161.6328125, -151.41796875, -141.203125, -130.98828125, -120.7734375, -110.55859375, -100.34375, -90.12890625, -79.9140625, -69.69921875, -59.484375, -49.26953125, -39.0546875, -28.83984375, -18.625, -8.41015625, 1.8046875, 12.01953125, 22.234375, 32.44921875, 42.6640625, 52.87890625, 63.09375, 73.30859375, 83.5234375, 93.73828125, 103.953125, 114.16796875, 124.3828125, 134.59765625, 144.8125, 155.02734375, 165.2421875, 175.45703125, 185.671875, 195.88671875, 206.1015625, 216.31640625, 226.53125, 236.74609375, 246.9609375, 257.17578125, 267.390625, 277.60546875, 287.8203125, 298.03515625, 308.25]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 7.0, 3.0, 7.0, 17.0, 18.0, 21.0, 20.0, 50.0, 41.0, 62.0, 96.0, 118.0, 163.0, 253.0, 407.0, 579.0, 632.0, 514.0, 333.0, 222.0, 129.0, 84.0, 67.0, 50.0, 33.0, 38.0, 32.0, 24.0, 11.0, 7.0, 7.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.859375, -18.23583984375, -17.6123046875, -16.98876953125, -16.365234375, -15.74169921875, -15.1181640625, -14.49462890625, -13.87109375, -13.24755859375, -12.6240234375, -12.00048828125, -11.376953125, -10.75341796875, -10.1298828125, -9.50634765625, -8.8828125, -8.25927734375, -7.6357421875, -7.01220703125, -6.388671875, -5.76513671875, -5.1416015625, -4.51806640625, -3.89453125, -3.27099609375, -2.6474609375, -2.02392578125, -1.400390625, -0.77685546875, -0.1533203125, 0.47021484375, 1.09375, 1.71728515625, 2.3408203125, 2.96435546875, 3.587890625, 4.21142578125, 4.8349609375, 5.45849609375, 6.08203125, 6.70556640625, 7.3291015625, 7.95263671875, 8.576171875, 9.19970703125, 9.8232421875, 10.44677734375, 11.0703125, 11.69384765625, 12.3173828125, 12.94091796875, 13.564453125, 14.18798828125, 14.8115234375, 15.43505859375, 16.05859375, 16.68212890625, 17.3056640625, 17.92919921875, 18.552734375, 19.17626953125, 19.7998046875, 20.42333984375, 21.046875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 4.0, 7.0, 11.0, 13.0, 11.0, 18.0, 16.0, 33.0, 33.0, 43.0, 44.0, 53.0, 73.0, 138.0, 483.0, 1669488.0, 2522745.0, 488.0, 152.0, 78.0, 62.0, 53.0, 48.0, 40.0, 27.0, 25.0, 26.0, 16.0, 12.0, 7.0, 10.0, 3.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-257.25, -250.298828125, -243.34765625, -236.396484375, -229.4453125, -222.494140625, -215.54296875, -208.591796875, -201.640625, -194.689453125, -187.73828125, -180.787109375, -173.8359375, -166.884765625, -159.93359375, -152.982421875, -146.03125, -139.080078125, -132.12890625, -125.177734375, -118.2265625, -111.275390625, -104.32421875, -97.373046875, -90.421875, -83.470703125, -76.51953125, -69.568359375, -62.6171875, -55.666015625, -48.71484375, -41.763671875, -34.8125, -27.861328125, -20.91015625, -13.958984375, -7.0078125, -0.056640625, 6.89453125, 13.845703125, 20.796875, 27.748046875, 34.69921875, 41.650390625, 48.6015625, 55.552734375, 62.50390625, 69.455078125, 76.40625, 83.357421875, 90.30859375, 97.259765625, 104.2109375, 111.162109375, 118.11328125, 125.064453125, 132.015625, 138.966796875, 145.91796875, 152.869140625, 159.8203125, 166.771484375, 173.72265625, 180.673828125, 187.625]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 32.0, 292.0, 537.0, 140.0, 12.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-294.3432312011719, -286.2338562011719, -278.12445068359375, -270.01507568359375, -261.90570068359375, -253.7963104248047, -245.68692016601562, -237.57754516601562, -229.46817016601562, -221.35877990722656, -213.24940490722656, -205.1400146484375, -197.0306396484375, -188.92124938964844, -180.81185913085938, -172.70248413085938, -164.5930938720703, -156.48370361328125, -148.37432861328125, -140.2649383544922, -132.1555633544922, -124.04617309570312, -115.9367904663086, -107.82740783691406, -99.71802520751953, -91.608642578125, -83.49925994873047, -75.38987731933594, -67.28048706054688, -59.17110824584961, -51.06172180175781, -42.95233917236328, -34.84294128417969, -26.733558654785156, -18.624174118041992, -10.514789581298828, -2.405406951904297, 5.703975677490234, 13.813362121582031, 21.922744750976562, 30.032127380371094, 38.141510009765625, 46.250892639160156, 54.36027908325195, 62.469661712646484, 70.57904052734375, 78.68843078613281, 86.79781341552734, 94.90719604492188, 103.0165786743164, 111.12596130371094, 119.2353515625, 127.3447265625, 135.45411682128906, 143.56350708007812, 151.67288208007812, 159.78225708007812, 167.8916473388672, 176.0010223388672, 184.11041259765625, 192.21978759765625, 200.3291778564453, 208.43856811523438, 216.54794311523438, 224.65733337402344]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 5.0, 6.0, 7.0, 18.0, 17.0, 19.0, 25.0, 29.0, 30.0, 26.0, 31.0, 34.0, 42.0, 39.0, 35.0, 45.0, 40.0, 51.0, 45.0, 47.0, 33.0, 46.0, 41.0, 32.0, 37.0, 35.0, 16.0, 22.0, 15.0, 19.0, 21.0, 14.0, 12.0, 18.0, 12.0, 3.0, 7.0, 5.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.878536224365234, -61.82505798339844, -59.771575927734375, -57.71809387207031, -55.664615631103516, -53.61113739013672, -51.557655334472656, -49.504173278808594, -47.4506950378418, -45.397216796875, -43.34373474121094, -41.290252685546875, -39.23677444458008, -37.18329620361328, -35.12981414794922, -33.076332092285156, -31.02285385131836, -28.96937370300293, -26.9158935546875, -24.86241340637207, -22.80893325805664, -20.75545310974121, -18.70197296142578, -16.64849281311035, -14.595012664794922, -12.541532516479492, -10.488052368164062, -8.434572219848633, -6.381092071533203, -4.327611923217773, -2.2741317749023438, -0.22065162658691406, 1.8328323364257812, 3.886312484741211, 5.939792633056641, 7.99327278137207, 10.0467529296875, 12.10023307800293, 14.15371322631836, 16.20719337463379, 18.26067352294922, 20.31415367126465, 22.367633819580078, 24.421113967895508, 26.474594116210938, 28.528074264526367, 30.581554412841797, 32.635032653808594, 34.688514709472656, 36.74199676513672, 38.795475006103516, 40.84895324707031, 42.902435302734375, 44.95591735839844, 47.009395599365234, 49.06287384033203, 51.116355895996094, 53.169837951660156, 55.22331619262695, 57.27679443359375, 59.33027648925781, 61.383758544921875, 63.43723678588867, 65.49071502685547, 67.54419708251953]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 6.0, 7.0, 13.0, 17.0, 16.0, 21.0, 26.0, 28.0, 27.0, 29.0, 30.0, 38.0, 38.0, 35.0, 31.0, 38.0, 42.0, 50.0, 49.0, 45.0, 48.0, 34.0, 39.0, 28.0, 29.0, 26.0, 31.0, 34.0, 26.0, 13.0, 18.0, 16.0, 16.0, 8.0, 8.0, 5.0, 8.0, 5.0, 4.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.4609375, -13.0391845703125, -12.617431640625, -12.1956787109375, -11.77392578125, -11.3521728515625, -10.930419921875, -10.5086669921875, -10.0869140625, -9.6651611328125, -9.243408203125, -8.8216552734375, -8.39990234375, -7.9781494140625, -7.556396484375, -7.1346435546875, -6.712890625, -6.2911376953125, -5.869384765625, -5.4476318359375, -5.02587890625, -4.6041259765625, -4.182373046875, -3.7606201171875, -3.3388671875, -2.9171142578125, -2.495361328125, -2.0736083984375, -1.65185546875, -1.2301025390625, -0.808349609375, -0.3865966796875, 0.03515625, 0.4569091796875, 0.878662109375, 1.3004150390625, 1.72216796875, 2.1439208984375, 2.565673828125, 2.9874267578125, 3.4091796875, 3.8309326171875, 4.252685546875, 4.6744384765625, 5.09619140625, 5.5179443359375, 5.939697265625, 6.3614501953125, 6.783203125, 7.2049560546875, 7.626708984375, 8.0484619140625, 8.47021484375, 8.8919677734375, 9.313720703125, 9.7354736328125, 10.1572265625, 10.5789794921875, 11.000732421875, 11.4224853515625, 11.84423828125, 12.2659912109375, 12.687744140625, 13.1094970703125, 13.53125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 19.0, 16.0, 28.0, 41.0, 52.0, 72.0, 112.0, 185.0, 297.0, 478.0, 714.0, 1068.0, 1795.0, 2819.0, 4597.0, 7303.0, 12090.0, 19563.0, 33786.0, 58588.0, 112933.0, 336270.0, 233337.0, 95506.0, 51418.0, 29475.0, 17690.0, 10607.0, 6587.0, 4107.0, 2546.0, 1595.0, 984.0, 703.0, 424.0, 274.0, 168.0, 94.0, 60.0, 49.0, 31.0, 29.0, 12.0, 15.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.962890625, -2.869964599609375, -2.77703857421875, -2.684112548828125, -2.5911865234375, -2.498260498046875, -2.40533447265625, -2.312408447265625, -2.219482421875, -2.126556396484375, -2.03363037109375, -1.940704345703125, -1.8477783203125, -1.754852294921875, -1.66192626953125, -1.569000244140625, -1.47607421875, -1.383148193359375, -1.29022216796875, -1.197296142578125, -1.1043701171875, -1.011444091796875, -0.91851806640625, -0.825592041015625, -0.732666015625, -0.639739990234375, -0.54681396484375, -0.453887939453125, -0.3609619140625, -0.268035888671875, -0.17510986328125, -0.082183837890625, 0.0107421875, 0.103668212890625, 0.19659423828125, 0.289520263671875, 0.3824462890625, 0.475372314453125, 0.56829833984375, 0.661224365234375, 0.754150390625, 0.847076416015625, 0.94000244140625, 1.032928466796875, 1.1258544921875, 1.218780517578125, 1.31170654296875, 1.404632568359375, 1.49755859375, 1.590484619140625, 1.68341064453125, 1.776336669921875, 1.8692626953125, 1.962188720703125, 2.05511474609375, 2.148040771484375, 2.240966796875, 2.333892822265625, 2.42681884765625, 2.519744873046875, 2.6126708984375, 2.705596923828125, 2.79852294921875, 2.891448974609375, 2.984375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 5.0, 8.0, 8.0, 11.0, 8.0, 17.0, 13.0, 17.0, 26.0, 26.0, 23.0, 28.0, 35.0, 29.0, 28.0, 30.0, 50.0, 42.0, 41.0, 54.0, 1065.0, 37.0, 44.0, 35.0, 29.0, 35.0, 36.0, 36.0, 22.0, 23.0, 26.0, 21.0, 26.0, 22.0, 12.0, 11.0, 13.0, 4.0, 5.0, 8.0, 6.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.3671875, -8.1060791015625, -7.844970703125, -7.5838623046875, -7.32275390625, -7.0616455078125, -6.800537109375, -6.5394287109375, -6.2783203125, -6.0172119140625, -5.756103515625, -5.4949951171875, -5.23388671875, -4.9727783203125, -4.711669921875, -4.4505615234375, -4.189453125, -3.9283447265625, -3.667236328125, -3.4061279296875, -3.14501953125, -2.8839111328125, -2.622802734375, -2.3616943359375, -2.1005859375, -1.8394775390625, -1.578369140625, -1.3172607421875, -1.05615234375, -0.7950439453125, -0.533935546875, -0.2728271484375, -0.01171875, 0.2493896484375, 0.510498046875, 0.7716064453125, 1.03271484375, 1.2938232421875, 1.554931640625, 1.8160400390625, 2.0771484375, 2.3382568359375, 2.599365234375, 2.8604736328125, 3.12158203125, 3.3826904296875, 3.643798828125, 3.9049072265625, 4.166015625, 4.4271240234375, 4.688232421875, 4.9493408203125, 5.21044921875, 5.4715576171875, 5.732666015625, 5.9937744140625, 6.2548828125, 6.5159912109375, 6.777099609375, 7.0382080078125, 7.29931640625, 7.5604248046875, 7.821533203125, 8.0826416015625, 8.34375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 13.0, 17.0, 20.0, 20.0, 41.0, 55.0, 69.0, 117.0, 176.0, 231.0, 372.0, 551.0, 792.0, 1246.0, 1818.0, 2777.0, 4244.0, 6544.0, 10389.0, 16038.0, 24988.0, 40006.0, 65387.0, 123352.0, 1379817.0, 191602.0, 88135.0, 50459.0, 31502.0, 20035.0, 12860.0, 8249.0, 5224.0, 3349.0, 2263.0, 1413.0, 953.0, 634.0, 454.0, 288.0, 195.0, 149.0, 80.0, 72.0, 39.0, 24.0, 16.0, 16.0, 17.0, 5.0, 6.0, 4.0, 7.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.494140625, -2.41558837890625, -2.3370361328125, -2.25848388671875, -2.179931640625, -2.10137939453125, -2.0228271484375, -1.94427490234375, -1.86572265625, -1.78717041015625, -1.7086181640625, -1.63006591796875, -1.551513671875, -1.47296142578125, -1.3944091796875, -1.31585693359375, -1.2373046875, -1.15875244140625, -1.0802001953125, -1.00164794921875, -0.923095703125, -0.84454345703125, -0.7659912109375, -0.68743896484375, -0.60888671875, -0.53033447265625, -0.4517822265625, -0.37322998046875, -0.294677734375, -0.21612548828125, -0.1375732421875, -0.05902099609375, 0.01953125, 0.09808349609375, 0.1766357421875, 0.25518798828125, 0.333740234375, 0.41229248046875, 0.4908447265625, 0.56939697265625, 0.64794921875, 0.72650146484375, 0.8050537109375, 0.88360595703125, 0.962158203125, 1.04071044921875, 1.1192626953125, 1.19781494140625, 1.2763671875, 1.35491943359375, 1.4334716796875, 1.51202392578125, 1.590576171875, 1.66912841796875, 1.7476806640625, 1.82623291015625, 1.90478515625, 1.98333740234375, 2.0618896484375, 2.14044189453125, 2.218994140625, 2.29754638671875, 2.3760986328125, 2.45465087890625, 2.533203125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 7.0, 5.0, 4.0, 5.0, 8.0, 12.0, 10.0, 9.0, 5.0, 11.0, 21.0, 12.0, 26.0, 28.0, 27.0, 40.0, 54.0, 53.0, 65.0, 55.0, 54.0, 66.0, 60.0, 36.0, 52.0, 41.0, 43.0, 29.0, 22.0, 21.0, 25.0, 17.0, 18.0, 14.0, 6.0, 5.0, 4.0, 11.0, 6.0, 5.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0], "bins": [-0.0014677047729492188, -0.0014258027076721191, -0.0013839006423950195, -0.00134199857711792, -0.0013000965118408203, -0.0012581944465637207, -0.001216292381286621, -0.0011743903160095215, -0.0011324882507324219, -0.0010905861854553223, -0.0010486841201782227, -0.001006782054901123, -0.0009648799896240234, -0.0009229779243469238, -0.0008810758590698242, -0.0008391737937927246, -0.000797271728515625, -0.0007553696632385254, -0.0007134675979614258, -0.0006715655326843262, -0.0006296634674072266, -0.000587761402130127, -0.0005458593368530273, -0.0005039572715759277, -0.0004620552062988281, -0.0004201531410217285, -0.0003782510757446289, -0.0003363490104675293, -0.0002944469451904297, -0.0002525448799133301, -0.00021064281463623047, -0.00016874074935913086, -0.00012683868408203125, -8.493661880493164e-05, -4.303455352783203e-05, -1.1324882507324219e-06, 4.076957702636719e-05, 8.26716423034668e-05, 0.0001245737075805664, 0.00016647577285766602, 0.00020837783813476562, 0.00025027990341186523, 0.00029218196868896484, 0.00033408403396606445, 0.00037598609924316406, 0.00041788816452026367, 0.0004597902297973633, 0.0005016922950744629, 0.0005435943603515625, 0.0005854964256286621, 0.0006273984909057617, 0.0006693005561828613, 0.0007112026214599609, 0.0007531046867370605, 0.0007950067520141602, 0.0008369088172912598, 0.0008788108825683594, 0.000920712947845459, 0.0009626150131225586, 0.0010045170783996582, 0.0010464191436767578, 0.0010883212089538574, 0.001130223274230957, 0.0011721253395080566, 0.0012140274047851562]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 6.0, 3.0, 6.0, 3.0, 4.0, 9.0, 10.0, 7.0, 11.0, 15.0, 19.0, 15.0, 27.0, 35.0, 48.0, 64.0, 68.0, 90.0, 115.0, 167.0, 235.0, 395.0, 564.0, 1151.0, 96227.0, 944431.0, 2537.0, 726.0, 456.0, 282.0, 190.0, 140.0, 122.0, 73.0, 53.0, 46.0, 39.0, 31.0, 24.0, 20.0, 20.0, 19.0, 15.0, 9.0, 6.0, 6.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.0233917236328125, -0.02266526222229004, -0.021938800811767578, -0.021212339401245117, -0.020485877990722656, -0.019759416580200195, -0.019032955169677734, -0.018306493759155273, -0.017580032348632812, -0.01685357093811035, -0.01612710952758789, -0.01540064811706543, -0.014674186706542969, -0.013947725296020508, -0.013221263885498047, -0.012494802474975586, -0.011768341064453125, -0.011041879653930664, -0.010315418243408203, -0.009588956832885742, -0.008862495422363281, -0.00813603401184082, -0.007409572601318359, -0.0066831111907958984, -0.0059566497802734375, -0.0052301883697509766, -0.004503726959228516, -0.0037772655487060547, -0.0030508041381835938, -0.002324342727661133, -0.0015978813171386719, -0.0008714199066162109, -0.00014495849609375, 0.0005815029144287109, 0.0013079643249511719, 0.002034425735473633, 0.0027608871459960938, 0.0034873485565185547, 0.004213809967041016, 0.0049402713775634766, 0.0056667327880859375, 0.0063931941986083984, 0.007119655609130859, 0.00784611701965332, 0.008572578430175781, 0.009299039840698242, 0.010025501251220703, 0.010751962661743164, 0.011478424072265625, 0.012204885482788086, 0.012931346893310547, 0.013657808303833008, 0.014384269714355469, 0.01511073112487793, 0.01583719253540039, 0.01656365394592285, 0.017290115356445312, 0.018016576766967773, 0.018743038177490234, 0.019469499588012695, 0.020195960998535156, 0.020922422409057617, 0.021648883819580078, 0.02237534523010254, 0.023101806640625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 56.0, 345.0, 465.0, 117.0, 20.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001998190302401781, -0.0018990898970514536, -0.0017999893752858043, -0.0017008889699354768, -0.0016017884481698275, -0.0015026880428195, -0.0014035876374691725, -0.0013044871157035232, -0.0012053865939378738, -0.0011062861885875463, -0.001007185666821897, -0.0009080852614715695, -0.0008089847397059202, -0.0007098843343555927, -0.0006107838707976043, -0.0005116834072396159, -0.0004125830018892884, -0.0003134825383313, -0.00021438208932522684, -0.00011528164031915367, -1.618117676116526e-05, 8.291925769299269e-05, 0.0001820197212509811, 0.0002811201848089695, 0.0003802206483669579, 0.0004793211119249463, 0.0005784215754829347, 0.0006775220390409231, 0.0007766224443912506, 0.000875722907949239, 0.0009748233715072274, 0.0010739238932728767, 0.0011730242986232042, 0.0012721247039735317, 0.001371225225739181, 0.0014703256310895085, 0.0015694261528551579, 0.0016685265582054853, 0.0017676269635558128, 0.0018667274853214622, 0.0019658280070871115, 0.002064928412437439, 0.0021640288177877665, 0.0022631294559687376, 0.002362229861319065, 0.0024613302666693926, 0.00256043067201972, 0.0026595313102006912, 0.002758631482720375, 0.0028577318880707026, 0.00295683229342103, 0.003055932931602001, 0.0031550333369523287, 0.003254133742302656, 0.0033532341476529837, 0.003452334553003311, 0.0035514351911842823, 0.00365053559653461, 0.0037496360018849373, 0.0038487366400659084, 0.003947836812585592, 0.004046937450766563, 0.0041460380889475346, 0.004245138261467218, 0.0043442388996481895]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 10.0, 2.0, 6.0, 10.0, 12.0, 10.0, 22.0, 15.0, 10.0, 19.0, 17.0, 28.0, 34.0, 34.0, 31.0, 24.0, 33.0, 19.0, 39.0, 31.0, 34.0, 32.0, 36.0, 31.0, 27.0, 43.0, 39.0, 29.0, 35.0, 25.0, 29.0, 28.0, 30.0, 33.0, 23.0, 15.0, 13.0, 17.0, 8.0, 6.0, 11.0, 6.0, 9.0, 5.0, 7.0, 7.0, 3.0, 4.0, 7.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0006529688835144043, -0.0006329845637083054, -0.0006130002439022064, -0.0005930159240961075, -0.0005730316042900085, -0.0005530472844839096, -0.0005330629646778107, -0.0005130786448717117, -0.0004930943250656128, -0.00047311000525951385, -0.0004531256854534149, -0.000433141365647316, -0.00041315704584121704, -0.0003931727260351181, -0.00037318840622901917, -0.0003532040864229202, -0.0003332197666168213, -0.00031323544681072235, -0.0002932511270046234, -0.0002732668071985245, -0.00025328248739242554, -0.0002332981675863266, -0.00021331384778022766, -0.00019332952797412872, -0.00017334520816802979, -0.00015336088836193085, -0.0001333765685558319, -0.00011339224874973297, -9.340792894363403e-05, -7.34236091375351e-05, -5.343928933143616e-05, -3.345496952533722e-05, -1.3470649719238281e-05, 6.513670086860657e-06, 2.6497989892959595e-05, 4.648230969905853e-05, 6.646662950515747e-05, 8.645094931125641e-05, 0.00010643526911735535, 0.00012641958892345428, 0.00014640390872955322, 0.00016638822853565216, 0.0001863725483417511, 0.00020635686814785004, 0.00022634118795394897, 0.0002463255077600479, 0.00026630982756614685, 0.0002862941473722458, 0.0003062784671783447, 0.00032626278698444366, 0.0003462471067905426, 0.00036623142659664154, 0.0003862157464027405, 0.0004062000662088394, 0.00042618438601493835, 0.0004461687058210373, 0.00046615302562713623, 0.00048613734543323517, 0.0005061216652393341, 0.000526105985045433, 0.000546090304851532, 0.0005660746246576309, 0.0005860589444637299, 0.0006060432642698288, 0.0006260275840759277]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 6.0, 7.0, 13.0, 17.0, 16.0, 21.0, 26.0, 28.0, 27.0, 29.0, 30.0, 38.0, 38.0, 35.0, 31.0, 38.0, 42.0, 50.0, 49.0, 45.0, 48.0, 34.0, 39.0, 28.0, 29.0, 26.0, 31.0, 34.0, 26.0, 13.0, 18.0, 16.0, 16.0, 8.0, 8.0, 5.0, 8.0, 5.0, 4.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.4609375, -13.0391845703125, -12.617431640625, -12.1956787109375, -11.77392578125, -11.3521728515625, -10.930419921875, -10.5086669921875, -10.0869140625, -9.6651611328125, -9.243408203125, -8.8216552734375, -8.39990234375, -7.9781494140625, -7.556396484375, -7.1346435546875, -6.712890625, -6.2911376953125, -5.869384765625, -5.4476318359375, -5.02587890625, -4.6041259765625, -4.182373046875, -3.7606201171875, -3.3388671875, -2.9171142578125, -2.495361328125, -2.0736083984375, -1.65185546875, -1.2301025390625, -0.808349609375, -0.3865966796875, 0.03515625, 0.4569091796875, 0.878662109375, 1.3004150390625, 1.72216796875, 2.1439208984375, 2.565673828125, 2.9874267578125, 3.4091796875, 3.8309326171875, 4.252685546875, 4.6744384765625, 5.09619140625, 5.5179443359375, 5.939697265625, 6.3614501953125, 6.783203125, 7.2049560546875, 7.626708984375, 8.0484619140625, 8.47021484375, 8.8919677734375, 9.313720703125, 9.7354736328125, 10.1572265625, 10.5789794921875, 11.000732421875, 11.4224853515625, 11.84423828125, 12.2659912109375, 12.687744140625, 13.1094970703125, 13.53125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 7.0, 8.0, 12.0, 18.0, 29.0, 37.0, 61.0, 80.0, 107.0, 127.0, 187.0, 232.0, 347.0, 436.0, 516.0, 681.0, 896.0, 1230.0, 1804.0, 3614.0, 12813.0, 79449.0, 509099.0, 367149.0, 51140.0, 9089.0, 3097.0, 1607.0, 1082.0, 852.0, 682.0, 505.0, 399.0, 308.0, 222.0, 164.0, 127.0, 84.0, 71.0, 60.0, 27.0, 36.0, 23.0, 14.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.390625, -19.751220703125, -19.11181640625, -18.472412109375, -17.8330078125, -17.193603515625, -16.55419921875, -15.914794921875, -15.275390625, -14.635986328125, -13.99658203125, -13.357177734375, -12.7177734375, -12.078369140625, -11.43896484375, -10.799560546875, -10.16015625, -9.520751953125, -8.88134765625, -8.241943359375, -7.6025390625, -6.963134765625, -6.32373046875, -5.684326171875, -5.044921875, -4.405517578125, -3.76611328125, -3.126708984375, -2.4873046875, -1.847900390625, -1.20849609375, -0.569091796875, 0.0703125, 0.709716796875, 1.34912109375, 1.988525390625, 2.6279296875, 3.267333984375, 3.90673828125, 4.546142578125, 5.185546875, 5.824951171875, 6.46435546875, 7.103759765625, 7.7431640625, 8.382568359375, 9.02197265625, 9.661376953125, 10.30078125, 10.940185546875, 11.57958984375, 12.218994140625, 12.8583984375, 13.497802734375, 14.13720703125, 14.776611328125, 15.416015625, 16.055419921875, 16.69482421875, 17.334228515625, 17.9736328125, 18.613037109375, 19.25244140625, 19.891845703125, 20.53125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 9.0, 6.0, 8.0, 9.0, 12.0, 23.0, 30.0, 40.0, 36.0, 56.0, 62.0, 61.0, 84.0, 289.0, 1798.0, 126.0, 75.0, 68.0, 62.0, 47.0, 27.0, 34.0, 22.0, 17.0, 10.0, 13.0, 9.0, 6.0, 3.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.53125, -49.93359375, -48.3359375, -46.73828125, -45.140625, -43.54296875, -41.9453125, -40.34765625, -38.75, -37.15234375, -35.5546875, -33.95703125, -32.359375, -30.76171875, -29.1640625, -27.56640625, -25.96875, -24.37109375, -22.7734375, -21.17578125, -19.578125, -17.98046875, -16.3828125, -14.78515625, -13.1875, -11.58984375, -9.9921875, -8.39453125, -6.796875, -5.19921875, -3.6015625, -2.00390625, -0.40625, 1.19140625, 2.7890625, 4.38671875, 5.984375, 7.58203125, 9.1796875, 10.77734375, 12.375, 13.97265625, 15.5703125, 17.16796875, 18.765625, 20.36328125, 21.9609375, 23.55859375, 25.15625, 26.75390625, 28.3515625, 29.94921875, 31.546875, 33.14453125, 34.7421875, 36.33984375, 37.9375, 39.53515625, 41.1328125, 42.73046875, 44.328125, 45.92578125, 47.5234375, 49.12109375, 50.71875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 4.0, 10.0, 12.0, 11.0, 20.0, 15.0, 32.0, 32.0, 50.0, 82.0, 152.0, 229.0, 514.0, 1711.0, 3092134.0, 48682.0, 1053.0, 366.0, 217.0, 119.0, 84.0, 54.0, 33.0, 25.0, 14.0, 15.0, 13.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.375, -134.99609375, -130.6171875, -126.23828125, -121.859375, -117.48046875, -113.1015625, -108.72265625, -104.34375, -99.96484375, -95.5859375, -91.20703125, -86.828125, -82.44921875, -78.0703125, -73.69140625, -69.3125, -64.93359375, -60.5546875, -56.17578125, -51.796875, -47.41796875, -43.0390625, -38.66015625, -34.28125, -29.90234375, -25.5234375, -21.14453125, -16.765625, -12.38671875, -8.0078125, -3.62890625, 0.75, 5.12890625, 9.5078125, 13.88671875, 18.265625, 22.64453125, 27.0234375, 31.40234375, 35.78125, 40.16015625, 44.5390625, 48.91796875, 53.296875, 57.67578125, 62.0546875, 66.43359375, 70.8125, 75.19140625, 79.5703125, 83.94921875, 88.328125, 92.70703125, 97.0859375, 101.46484375, 105.84375, 110.22265625, 114.6015625, 118.98046875, 123.359375, 127.73828125, 132.1171875, 136.49609375, 140.875]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 8.0, 87.0, 678.0, 225.0, 18.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.0487823486328, -147.89520263671875, -140.7416229248047, -133.58804321289062, -126.43445587158203, -119.28087615966797, -112.12728881835938, -104.97370910644531, -97.82012939453125, -90.66654968261719, -83.51296997070312, -76.35938262939453, -69.20580291748047, -62.052223205566406, -54.89863967895508, -47.74505615234375, -40.59147644042969, -33.437896728515625, -26.284313201904297, -19.1307315826416, -11.977149963378906, -4.823570251464844, 2.3300132751464844, 9.483596801757812, 16.637176513671875, 23.79075813293457, 30.944339752197266, 38.097923278808594, 45.251502990722656, 52.40508270263672, 59.55866622924805, 66.71224975585938, 73.8658447265625, 81.01942443847656, 88.17300415039062, 95.32659149169922, 102.48017120361328, 109.63375091552734, 116.78733825683594, 123.94091796875, 131.09449768066406, 138.24807739257812, 145.4016571044922, 152.55523681640625, 159.70883178710938, 166.86239624023438, 174.0159912109375, 181.16957092285156, 188.32315063476562, 195.4767303466797, 202.63031005859375, 209.7838897705078, 216.93746948242188, 224.091064453125, 231.24464416503906, 238.39822387695312, 245.5518035888672, 252.70538330078125, 259.8589782714844, 267.0125427246094, 274.1661376953125, 281.3197021484375, 288.4732971191406, 295.62689208984375, 302.78045654296875]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 4.0, 3.0, 4.0, 5.0, 7.0, 8.0, 4.0, 8.0, 16.0, 20.0, 17.0, 19.0, 21.0, 28.0, 42.0, 40.0, 33.0, 41.0, 53.0, 56.0, 70.0, 57.0, 58.0, 47.0, 50.0, 37.0, 31.0, 40.0, 44.0, 23.0, 18.0, 18.0, 21.0, 12.0, 8.0, 11.0, 10.0, 7.0, 7.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.5247802734375, -89.72315216064453, -85.9215316772461, -82.11990356445312, -78.31828308105469, -74.51665496826172, -70.71502685546875, -66.91340637207031, -63.111778259277344, -59.31015396118164, -55.50852966308594, -51.70690155029297, -47.905277252197266, -44.10365295410156, -40.30202865600586, -36.500404357910156, -32.69878005981445, -28.89715576171875, -25.095529556274414, -21.29390525817871, -17.492279052734375, -13.690654754638672, -9.889030456542969, -6.087404251098633, -2.2857799530029297, 1.5158450603485107, 5.317470073699951, 9.119094848632812, 12.920720100402832, 16.72234535217285, 20.523969650268555, 24.32559585571289, 28.127220153808594, 31.928844451904297, 35.73046875, 39.53209686279297, 43.33372116088867, 47.135345458984375, 50.93696975708008, 54.73859405517578, 58.54022216796875, 62.34184646606445, 66.14347076416016, 69.94509887695312, 73.74671936035156, 77.54834747314453, 81.3499755859375, 85.15159606933594, 88.95321655273438, 92.75484466552734, 96.55646514892578, 100.35809326171875, 104.15971374511719, 107.96134185791016, 111.76296997070312, 115.56459045410156, 119.36621856689453, 123.1678466796875, 126.96946716308594, 130.77108764648438, 134.57272338867188, 138.3743438720703, 142.17596435546875, 145.97760009765625, 149.7792205810547]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 5.0, 4.0, 5.0, 9.0, 11.0, 12.0, 14.0, 13.0, 26.0, 17.0, 27.0, 35.0, 27.0, 30.0, 27.0, 34.0, 40.0, 31.0, 35.0, 45.0, 32.0, 51.0, 40.0, 34.0, 38.0, 45.0, 27.0, 28.0, 33.0, 31.0, 26.0, 25.0, 27.0, 23.0, 17.0, 16.0, 14.0, 6.0, 6.0, 6.0, 8.0, 3.0, 5.0, 4.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6640625, -13.2530517578125, -12.842041015625, -12.4310302734375, -12.02001953125, -11.6090087890625, -11.197998046875, -10.7869873046875, -10.3759765625, -9.9649658203125, -9.553955078125, -9.1429443359375, -8.73193359375, -8.3209228515625, -7.909912109375, -7.4989013671875, -7.087890625, -6.6768798828125, -6.265869140625, -5.8548583984375, -5.44384765625, -5.0328369140625, -4.621826171875, -4.2108154296875, -3.7998046875, -3.3887939453125, -2.977783203125, -2.5667724609375, -2.15576171875, -1.7447509765625, -1.333740234375, -0.9227294921875, -0.51171875, -0.1007080078125, 0.310302734375, 0.7213134765625, 1.13232421875, 1.5433349609375, 1.954345703125, 2.3653564453125, 2.7763671875, 3.1873779296875, 3.598388671875, 4.0093994140625, 4.42041015625, 4.8314208984375, 5.242431640625, 5.6534423828125, 6.064453125, 6.4754638671875, 6.886474609375, 7.2974853515625, 7.70849609375, 8.1195068359375, 8.530517578125, 8.9415283203125, 9.3525390625, 9.7635498046875, 10.174560546875, 10.5855712890625, 10.99658203125, 11.4075927734375, 11.818603515625, 12.2296142578125, 12.640625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 8.0, 6.0, 11.0, 11.0, 18.0, 18.0, 14.0, 29.0, 33.0, 30.0, 48.0, 61.0, 78.0, 93.0, 107.0, 129.0, 143.0, 248.0, 449.0, 1141.0, 4030.0, 29149.0, 1191278.0, 2856364.0, 100072.0, 7146.0, 1715.0, 657.0, 288.0, 211.0, 126.0, 115.0, 95.0, 67.0, 54.0, 48.0, 36.0, 32.0, 25.0, 23.0, 11.0, 13.0, 18.0, 13.0, 5.0, 5.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-40.59375, -39.33251953125, -38.0712890625, -36.81005859375, -35.548828125, -34.28759765625, -33.0263671875, -31.76513671875, -30.50390625, -29.24267578125, -27.9814453125, -26.72021484375, -25.458984375, -24.19775390625, -22.9365234375, -21.67529296875, -20.4140625, -19.15283203125, -17.8916015625, -16.63037109375, -15.369140625, -14.10791015625, -12.8466796875, -11.58544921875, -10.32421875, -9.06298828125, -7.8017578125, -6.54052734375, -5.279296875, -4.01806640625, -2.7568359375, -1.49560546875, -0.234375, 1.02685546875, 2.2880859375, 3.54931640625, 4.810546875, 6.07177734375, 7.3330078125, 8.59423828125, 9.85546875, 11.11669921875, 12.3779296875, 13.63916015625, 14.900390625, 16.16162109375, 17.4228515625, 18.68408203125, 19.9453125, 21.20654296875, 22.4677734375, 23.72900390625, 24.990234375, 26.25146484375, 27.5126953125, 28.77392578125, 30.03515625, 31.29638671875, 32.5576171875, 33.81884765625, 35.080078125, 36.34130859375, 37.6025390625, 38.86376953125, 40.125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 6.0, 14.0, 24.0, 24.0, 50.0, 120.0, 192.0, 336.0, 700.0, 1182.0, 683.0, 299.0, 211.0, 105.0, 51.0, 38.0, 15.0, 13.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.3125, -61.856689453125, -60.40087890625, -58.945068359375, -57.4892578125, -56.033447265625, -54.57763671875, -53.121826171875, -51.666015625, -50.210205078125, -48.75439453125, -47.298583984375, -45.8427734375, -44.386962890625, -42.93115234375, -41.475341796875, -40.01953125, -38.563720703125, -37.10791015625, -35.652099609375, -34.1962890625, -32.740478515625, -31.28466796875, -29.828857421875, -28.373046875, -26.917236328125, -25.46142578125, -24.005615234375, -22.5498046875, -21.093994140625, -19.63818359375, -18.182373046875, -16.7265625, -15.270751953125, -13.81494140625, -12.359130859375, -10.9033203125, -9.447509765625, -7.99169921875, -6.535888671875, -5.080078125, -3.624267578125, -2.16845703125, -0.712646484375, 0.7431640625, 2.198974609375, 3.65478515625, 5.110595703125, 6.56640625, 8.022216796875, 9.47802734375, 10.933837890625, 12.3896484375, 13.845458984375, 15.30126953125, 16.757080078125, 18.212890625, 19.668701171875, 21.12451171875, 22.580322265625, 24.0361328125, 25.491943359375, 26.94775390625, 28.403564453125, 29.859375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 5.0, 7.0, 10.0, 24.0, 32.0, 46.0, 85.0, 158.0, 367.0, 863.0, 4157.0, 1642452.0, 2539963.0, 4474.0, 918.0, 310.0, 155.0, 97.0, 64.0, 34.0, 15.0, 17.0, 14.0, 6.0, 2.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.375, -104.021484375, -100.66796875, -97.314453125, -93.9609375, -90.607421875, -87.25390625, -83.900390625, -80.546875, -77.193359375, -73.83984375, -70.486328125, -67.1328125, -63.779296875, -60.42578125, -57.072265625, -53.71875, -50.365234375, -47.01171875, -43.658203125, -40.3046875, -36.951171875, -33.59765625, -30.244140625, -26.890625, -23.537109375, -20.18359375, -16.830078125, -13.4765625, -10.123046875, -6.76953125, -3.416015625, -0.0625, 3.291015625, 6.64453125, 9.998046875, 13.3515625, 16.705078125, 20.05859375, 23.412109375, 26.765625, 30.119140625, 33.47265625, 36.826171875, 40.1796875, 43.533203125, 46.88671875, 50.240234375, 53.59375, 56.947265625, 60.30078125, 63.654296875, 67.0078125, 70.361328125, 73.71484375, 77.068359375, 80.421875, 83.775390625, 87.12890625, 90.482421875, 93.8359375, 97.189453125, 100.54296875, 103.896484375, 107.25]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 12.0, 863.0, 139.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-204.4566650390625, -177.9335174560547, -151.41038513183594, -124.88723754882812, -98.36409759521484, -71.84095764160156, -45.31781005859375, -18.794677734375, 7.7284698486328125, 34.251609802246094, 60.77475357055664, 87.29789733886719, 113.82103729248047, 140.34417724609375, 166.86732482910156, 193.3904571533203, 219.91360473632812, 246.43675231933594, 272.95989990234375, 299.4830322265625, 326.00616455078125, 352.529296875, 379.0524597167969, 405.5755920410156, 432.0987548828125, 458.62188720703125, 485.1450500488281, 511.6681823730469, 538.1913452148438, 564.7144775390625, 591.2376098632812, 617.7607421875, 644.2838745117188, 670.8070068359375, 697.3301391601562, 723.853271484375, 750.37646484375, 776.8995971679688, 803.4227294921875, 829.9458618164062, 856.468994140625, 882.9921264648438, 909.5152587890625, 936.0384521484375, 962.5615844726562, 989.084716796875, 1015.6078491210938, 1042.1309814453125, 1068.6541748046875, 1095.1773681640625, 1121.700439453125, 1148.2236328125, 1174.7467041015625, 1201.2698974609375, 1227.79296875, 1254.316162109375, 1280.8392333984375, 1307.3624267578125, 1333.885498046875, 1360.40869140625, 1386.9317626953125, 1413.4549560546875, 1439.97802734375, 1466.501220703125, 1493.0244140625]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 1.0, 4.0, 11.0, 8.0, 8.0, 7.0, 14.0, 11.0, 15.0, 24.0, 29.0, 30.0, 31.0, 30.0, 35.0, 35.0, 42.0, 45.0, 43.0, 35.0, 46.0, 34.0, 43.0, 34.0, 38.0, 35.0, 37.0, 32.0, 32.0, 35.0, 29.0, 22.0, 24.0, 17.0, 18.0, 11.0, 10.0, 8.0, 5.0, 10.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-84.82231140136719, -82.17188262939453, -79.5214614868164, -76.87103271484375, -74.2206039428711, -71.57017517089844, -68.91975402832031, -66.26932525634766, -63.618900299072266, -60.968475341796875, -58.31804656982422, -55.66762161254883, -53.01719665527344, -50.36676788330078, -47.71634292602539, -45.06591796875, -42.415489196777344, -39.76506423950195, -37.1146354675293, -34.464210510253906, -31.813783645629883, -29.16335678100586, -26.51293182373047, -23.862504959106445, -21.212078094482422, -18.5616512298584, -15.911225318908691, -13.260799407958984, -10.610372543334961, -7.9599456787109375, -5.3095197677612305, -2.6590938568115234, -0.0086669921875, 2.6417593955993652, 5.2921857833862305, 7.942612171173096, 10.593038558959961, 13.243465423583984, 15.893891334533691, 18.5443172454834, 21.194744110107422, 23.845170974731445, 26.49559783935547, 29.14602279663086, 31.796449661254883, 34.446876525878906, 37.0973014831543, 39.74772644042969, 42.398155212402344, 45.048580169677734, 47.69900894165039, 50.34943389892578, 52.99986267089844, 55.65028762817383, 58.30071258544922, 60.951141357421875, 63.601566314697266, 66.25199127197266, 68.90242004394531, 71.55284881591797, 74.2032699584961, 76.85369873046875, 79.5041275024414, 82.15454864501953, 84.80497741699219]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 5.0, 7.0, 11.0, 16.0, 14.0, 10.0, 20.0, 25.0, 33.0, 23.0, 24.0, 33.0, 25.0, 32.0, 35.0, 37.0, 72.0, 41.0, 43.0, 49.0, 43.0, 40.0, 38.0, 40.0, 38.0, 35.0, 34.0, 34.0, 18.0, 15.0, 18.0, 17.0, 9.0, 14.0, 7.0, 13.0, 6.0, 6.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.34375, -11.965087890625, -11.58642578125, -11.207763671875, -10.8291015625, -10.450439453125, -10.07177734375, -9.693115234375, -9.314453125, -8.935791015625, -8.55712890625, -8.178466796875, -7.7998046875, -7.421142578125, -7.04248046875, -6.663818359375, -6.28515625, -5.906494140625, -5.52783203125, -5.149169921875, -4.7705078125, -4.391845703125, -4.01318359375, -3.634521484375, -3.255859375, -2.877197265625, -2.49853515625, -2.119873046875, -1.7412109375, -1.362548828125, -0.98388671875, -0.605224609375, -0.2265625, 0.152099609375, 0.53076171875, 0.909423828125, 1.2880859375, 1.666748046875, 2.04541015625, 2.424072265625, 2.802734375, 3.181396484375, 3.56005859375, 3.938720703125, 4.3173828125, 4.696044921875, 5.07470703125, 5.453369140625, 5.83203125, 6.210693359375, 6.58935546875, 6.968017578125, 7.3466796875, 7.725341796875, 8.10400390625, 8.482666015625, 8.861328125, 9.239990234375, 9.61865234375, 9.997314453125, 10.3759765625, 10.754638671875, 11.13330078125, 11.511962890625, 11.890625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 11.0, 9.0, 15.0, 23.0, 25.0, 46.0, 70.0, 109.0, 121.0, 212.0, 334.0, 465.0, 637.0, 1000.0, 1535.0, 2172.0, 3256.0, 5005.0, 7647.0, 11525.0, 17651.0, 27400.0, 42393.0, 69644.0, 135442.0, 331393.0, 170693.0, 82145.0, 48672.0, 30882.0, 19987.0, 12667.0, 8475.0, 5623.0, 3669.0, 2452.0, 1686.0, 1135.0, 757.0, 498.0, 351.0, 237.0, 162.0, 110.0, 84.0, 41.0, 30.0, 24.0, 20.0, 10.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-2.24609375, -2.177276611328125, -2.10845947265625, -2.039642333984375, -1.9708251953125, -1.902008056640625, -1.83319091796875, -1.764373779296875, -1.695556640625, -1.626739501953125, -1.55792236328125, -1.489105224609375, -1.4202880859375, -1.351470947265625, -1.28265380859375, -1.213836669921875, -1.14501953125, -1.076202392578125, -1.00738525390625, -0.938568115234375, -0.8697509765625, -0.800933837890625, -0.73211669921875, -0.663299560546875, -0.594482421875, -0.525665283203125, -0.45684814453125, -0.388031005859375, -0.3192138671875, -0.250396728515625, -0.18157958984375, -0.112762451171875, -0.0439453125, 0.024871826171875, 0.09368896484375, 0.162506103515625, 0.2313232421875, 0.300140380859375, 0.36895751953125, 0.437774658203125, 0.506591796875, 0.575408935546875, 0.64422607421875, 0.713043212890625, 0.7818603515625, 0.850677490234375, 0.91949462890625, 0.988311767578125, 1.05712890625, 1.125946044921875, 1.19476318359375, 1.263580322265625, 1.3323974609375, 1.401214599609375, 1.47003173828125, 1.538848876953125, 1.607666015625, 1.676483154296875, 1.74530029296875, 1.814117431640625, 1.8829345703125, 1.951751708984375, 2.02056884765625, 2.089385986328125, 2.158203125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 6.0, 6.0, 8.0, 6.0, 8.0, 15.0, 14.0, 21.0, 21.0, 16.0, 28.0, 31.0, 18.0, 45.0, 27.0, 27.0, 33.0, 38.0, 31.0, 41.0, 1064.0, 45.0, 51.0, 41.0, 43.0, 34.0, 28.0, 25.0, 27.0, 33.0, 26.0, 25.0, 27.0, 15.0, 15.0, 15.0, 13.0, 8.0, 11.0, 6.0, 7.0, 4.0, 4.0, 6.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.1171875, -6.893310546875, -6.66943359375, -6.445556640625, -6.2216796875, -5.997802734375, -5.77392578125, -5.550048828125, -5.326171875, -5.102294921875, -4.87841796875, -4.654541015625, -4.4306640625, -4.206787109375, -3.98291015625, -3.759033203125, -3.53515625, -3.311279296875, -3.08740234375, -2.863525390625, -2.6396484375, -2.415771484375, -2.19189453125, -1.968017578125, -1.744140625, -1.520263671875, -1.29638671875, -1.072509765625, -0.8486328125, -0.624755859375, -0.40087890625, -0.177001953125, 0.046875, 0.270751953125, 0.49462890625, 0.718505859375, 0.9423828125, 1.166259765625, 1.39013671875, 1.614013671875, 1.837890625, 2.061767578125, 2.28564453125, 2.509521484375, 2.7333984375, 2.957275390625, 3.18115234375, 3.405029296875, 3.62890625, 3.852783203125, 4.07666015625, 4.300537109375, 4.5244140625, 4.748291015625, 4.97216796875, 5.196044921875, 5.419921875, 5.643798828125, 5.86767578125, 6.091552734375, 6.3154296875, 6.539306640625, 6.76318359375, 6.987060546875, 7.2109375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 9.0, 8.0, 12.0, 27.0, 31.0, 39.0, 59.0, 81.0, 115.0, 177.0, 274.0, 404.0, 568.0, 839.0, 1294.0, 1860.0, 2737.0, 4190.0, 6131.0, 9343.0, 14398.0, 22216.0, 34182.0, 53880.0, 93927.0, 217621.0, 1349603.0, 111080.0, 61696.0, 38367.0, 24707.0, 16098.0, 10467.0, 6910.0, 4611.0, 2966.0, 2086.0, 1352.0, 915.0, 598.0, 400.0, 282.0, 178.0, 116.0, 94.0, 52.0, 36.0, 29.0, 30.0, 16.0, 7.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.166015625, -2.098602294921875, -2.03118896484375, -1.963775634765625, -1.8963623046875, -1.828948974609375, -1.76153564453125, -1.694122314453125, -1.626708984375, -1.559295654296875, -1.49188232421875, -1.424468994140625, -1.3570556640625, -1.289642333984375, -1.22222900390625, -1.154815673828125, -1.08740234375, -1.019989013671875, -0.95257568359375, -0.885162353515625, -0.8177490234375, -0.750335693359375, -0.68292236328125, -0.615509033203125, -0.548095703125, -0.480682373046875, -0.41326904296875, -0.345855712890625, -0.2784423828125, -0.211029052734375, -0.14361572265625, -0.076202392578125, -0.0087890625, 0.058624267578125, 0.12603759765625, 0.193450927734375, 0.2608642578125, 0.328277587890625, 0.39569091796875, 0.463104248046875, 0.530517578125, 0.597930908203125, 0.66534423828125, 0.732757568359375, 0.8001708984375, 0.867584228515625, 0.93499755859375, 1.002410888671875, 1.06982421875, 1.137237548828125, 1.20465087890625, 1.272064208984375, 1.3394775390625, 1.406890869140625, 1.47430419921875, 1.541717529296875, 1.609130859375, 1.676544189453125, 1.74395751953125, 1.811370849609375, 1.8787841796875, 1.946197509765625, 2.01361083984375, 2.081024169921875, 2.1484375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 6.0, 6.0, 8.0, 8.0, 19.0, 24.0, 29.0, 38.0, 70.0, 97.0, 109.0, 122.0, 123.0, 104.0, 75.0, 61.0, 36.0, 23.0, 8.0, 9.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0020465850830078125, -0.00198577344417572, -0.001924961805343628, -0.0018641501665115356, -0.0018033385276794434, -0.001742526888847351, -0.0016817152500152588, -0.0016209036111831665, -0.0015600919723510742, -0.001499280333518982, -0.0014384686946868896, -0.0013776570558547974, -0.001316845417022705, -0.0012560337781906128, -0.0011952221393585205, -0.0011344105005264282, -0.001073598861694336, -0.0010127872228622437, -0.0009519755840301514, -0.0008911639451980591, -0.0008303523063659668, -0.0007695406675338745, -0.0007087290287017822, -0.0006479173898696899, -0.0005871057510375977, -0.0005262941122055054, -0.0004654824733734131, -0.0004046708345413208, -0.0003438591957092285, -0.00028304755687713623, -0.00022223591804504395, -0.00016142427921295166, -0.00010061264038085938, -3.980100154876709e-05, 2.1010637283325195e-05, 8.182227611541748e-05, 0.00014263391494750977, 0.00020344555377960205, 0.00026425719261169434, 0.0003250688314437866, 0.0003858804702758789, 0.0004466921091079712, 0.0005075037479400635, 0.0005683153867721558, 0.000629127025604248, 0.0006899386644363403, 0.0007507503032684326, 0.0008115619421005249, 0.0008723735809326172, 0.0009331852197647095, 0.0009939968585968018, 0.001054808497428894, 0.0011156201362609863, 0.0011764317750930786, 0.001237243413925171, 0.0012980550527572632, 0.0013588666915893555, 0.0014196783304214478, 0.00148048996925354, 0.0015413016080856323, 0.0016021132469177246, 0.001662924885749817, 0.0017237365245819092, 0.0017845481634140015, 0.0018453598022460938]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 14.0, 8.0, 17.0, 19.0, 30.0, 46.0, 85.0, 158.0, 232.0, 382.0, 934.0, 36550.0, 1007330.0, 1378.0, 549.0, 306.0, 181.0, 96.0, 72.0, 41.0, 30.0, 17.0, 15.0, 13.0, 8.0, 11.0, 6.0, 5.0, 6.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03118896484375, -0.030155658721923828, -0.029122352600097656, -0.028089046478271484, -0.027055740356445312, -0.02602243423461914, -0.02498912811279297, -0.023955821990966797, -0.022922515869140625, -0.021889209747314453, -0.02085590362548828, -0.01982259750366211, -0.018789291381835938, -0.017755985260009766, -0.016722679138183594, -0.015689373016357422, -0.01465606689453125, -0.013622760772705078, -0.012589454650878906, -0.011556148529052734, -0.010522842407226562, -0.00948953628540039, -0.008456230163574219, -0.007422924041748047, -0.006389617919921875, -0.005356311798095703, -0.004323005676269531, -0.0032896995544433594, -0.0022563934326171875, -0.0012230873107910156, -0.00018978118896484375, 0.0008435249328613281, 0.0018768310546875, 0.002910137176513672, 0.003943443298339844, 0.004976749420166016, 0.0060100555419921875, 0.007043361663818359, 0.008076667785644531, 0.009109973907470703, 0.010143280029296875, 0.011176586151123047, 0.012209892272949219, 0.01324319839477539, 0.014276504516601562, 0.015309810638427734, 0.016343116760253906, 0.017376422882080078, 0.01840972900390625, 0.019443035125732422, 0.020476341247558594, 0.021509647369384766, 0.022542953491210938, 0.02357625961303711, 0.02460956573486328, 0.025642871856689453, 0.026676177978515625, 0.027709484100341797, 0.02874279022216797, 0.02977609634399414, 0.030809402465820312, 0.031842708587646484, 0.032876014709472656, 0.03390932083129883, 0.034942626953125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 128.0, 801.0, 84.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015713725006207824, -0.0014209036016836762, -0.0012704345863312483, -0.0011199656873941422, -0.0009694967302493751, -0.0008190277731046081, -0.0006685588741675019, -0.000518089858815074, -0.00036762095987796783, -0.00021715201728511602, -6.66830746922642e-05, 8.378585334867239e-05, 0.00023425481049343944, 0.0003847237676382065, 0.0005351926665753126, 0.0006856616819277406, 0.0008361305808648467, 0.0009865994798019528, 0.0011370684951543808, 0.001287537394091487, 0.001438006293028593, 0.001588475308381021, 0.0017389442073181272, 0.0018894132226705551, 0.0020398821216076612, 0.0021903510205447674, 0.0023408199194818735, 0.0024912888184189796, 0.0026417579501867294, 0.0027922268491238356, 0.0029426957480609417, 0.0030931648798286915, 0.0032436340115964413, 0.0033941029105335474, 0.0035445718094706535, 0.0036950409412384033, 0.0038455098401755095, 0.003995978739112616, 0.004146447405219078, 0.004296916536986828, 0.004447385668754578, 0.004597854800522327, 0.00474832346662879, 0.00489879259839654, 0.005049261264503002, 0.005199730396270752, 0.005350199528038502, 0.005500668194144964, 0.005651136860251427, 0.0058016059920191765, 0.005952074658125639, 0.006102543789893389, 0.006253012455999851, 0.006403481587767601, 0.006553950719535351, 0.006704419385641813, 0.006854888517409563, 0.007005357649177313, 0.007155826315283775, 0.007306295447051525, 0.007456764113157988, 0.007607233244925737, 0.0077577019110322, 0.00790817104279995, 0.0080586401745677]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 8.0, 5.0, 4.0, 6.0, 2.0, 8.0, 5.0, 6.0, 15.0, 13.0, 19.0, 15.0, 27.0, 36.0, 32.0, 28.0, 38.0, 36.0, 45.0, 36.0, 44.0, 38.0, 55.0, 49.0, 40.0, 28.0, 35.0, 38.0, 33.0, 49.0, 35.0, 20.0, 32.0, 31.0, 25.0, 20.0, 10.0, 11.0, 8.0, 8.0, 7.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.0007399916648864746, -0.0007201842963695526, -0.0007003769278526306, -0.0006805695593357086, -0.0006607621908187866, -0.0006409548223018646, -0.0006211474537849426, -0.0006013400852680206, -0.0005815327167510986, -0.0005617253482341766, -0.0005419179797172546, -0.0005221106112003326, -0.0005023032426834106, -0.00048249587416648865, -0.00046268850564956665, -0.00044288113713264465, -0.00042307376861572266, -0.00040326640009880066, -0.00038345903158187866, -0.00036365166306495667, -0.00034384429454803467, -0.00032403692603111267, -0.0003042295575141907, -0.0002844221889972687, -0.0002646148204803467, -0.0002448074519634247, -0.00022500008344650269, -0.0002051927149295807, -0.0001853853464126587, -0.0001655779778957367, -0.0001457706093788147, -0.0001259632408618927, -0.0001061558723449707, -8.63485038280487e-05, -6.654113531112671e-05, -4.673376679420471e-05, -2.6926398277282715e-05, -7.119029760360718e-06, 1.268833875656128e-05, 3.2495707273483276e-05, 5.2303075790405273e-05, 7.211044430732727e-05, 9.191781282424927e-05, 0.00011172518134117126, 0.00013153254985809326, 0.00015133991837501526, 0.00017114728689193726, 0.00019095465540885925, 0.00021076202392578125, 0.00023056939244270325, 0.00025037676095962524, 0.00027018412947654724, 0.00028999149799346924, 0.00030979886651039124, 0.00032960623502731323, 0.00034941360354423523, 0.0003692209720611572, 0.0003890283405780792, 0.0004088357090950012, 0.0004286430776119232, 0.0004484504461288452, 0.0004682578146457672, 0.0004880651831626892, 0.0005078725516796112, 0.0005276799201965332]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 5.0, 7.0, 11.0, 16.0, 14.0, 10.0, 20.0, 25.0, 33.0, 23.0, 24.0, 33.0, 25.0, 32.0, 35.0, 37.0, 72.0, 41.0, 43.0, 49.0, 43.0, 40.0, 38.0, 40.0, 38.0, 35.0, 34.0, 34.0, 18.0, 15.0, 18.0, 17.0, 9.0, 14.0, 7.0, 13.0, 6.0, 6.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.34375, -11.965087890625, -11.58642578125, -11.207763671875, -10.8291015625, -10.450439453125, -10.07177734375, -9.693115234375, -9.314453125, -8.935791015625, -8.55712890625, -8.178466796875, -7.7998046875, -7.421142578125, -7.04248046875, -6.663818359375, -6.28515625, -5.906494140625, -5.52783203125, -5.149169921875, -4.7705078125, -4.391845703125, -4.01318359375, -3.634521484375, -3.255859375, -2.877197265625, -2.49853515625, -2.119873046875, -1.7412109375, -1.362548828125, -0.98388671875, -0.605224609375, -0.2265625, 0.152099609375, 0.53076171875, 0.909423828125, 1.2880859375, 1.666748046875, 2.04541015625, 2.424072265625, 2.802734375, 3.181396484375, 3.56005859375, 3.938720703125, 4.3173828125, 4.696044921875, 5.07470703125, 5.453369140625, 5.83203125, 6.210693359375, 6.58935546875, 6.968017578125, 7.3466796875, 7.725341796875, 8.10400390625, 8.482666015625, 8.861328125, 9.239990234375, 9.61865234375, 9.997314453125, 10.3759765625, 10.754638671875, 11.13330078125, 11.511962890625, 11.890625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 3.0, 1.0, 6.0, 10.0, 9.0, 15.0, 27.0, 33.0, 49.0, 71.0, 85.0, 132.0, 187.0, 289.0, 373.0, 574.0, 879.0, 1289.0, 2114.0, 4025.0, 12751.0, 111367.0, 782249.0, 109257.0, 12656.0, 3947.0, 2062.0, 1318.0, 880.0, 610.0, 378.0, 271.0, 194.0, 124.0, 95.0, 63.0, 53.0, 28.0, 20.0, 21.0, 13.0, 12.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.28125, -30.2880859375, -29.294921875, -28.3017578125, -27.30859375, -26.3154296875, -25.322265625, -24.3291015625, -23.3359375, -22.3427734375, -21.349609375, -20.3564453125, -19.36328125, -18.3701171875, -17.376953125, -16.3837890625, -15.390625, -14.3974609375, -13.404296875, -12.4111328125, -11.41796875, -10.4248046875, -9.431640625, -8.4384765625, -7.4453125, -6.4521484375, -5.458984375, -4.4658203125, -3.47265625, -2.4794921875, -1.486328125, -0.4931640625, 0.5, 1.4931640625, 2.486328125, 3.4794921875, 4.47265625, 5.4658203125, 6.458984375, 7.4521484375, 8.4453125, 9.4384765625, 10.431640625, 11.4248046875, 12.41796875, 13.4111328125, 14.404296875, 15.3974609375, 16.390625, 17.3837890625, 18.376953125, 19.3701171875, 20.36328125, 21.3564453125, 22.349609375, 23.3427734375, 24.3359375, 25.3291015625, 26.322265625, 27.3154296875, 28.30859375, 29.3017578125, 30.294921875, 31.2880859375, 32.28125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 9.0, 13.0, 15.0, 19.0, 23.0, 27.0, 32.0, 42.0, 49.0, 70.0, 135.0, 359.0, 1757.0, 119.0, 87.0, 58.0, 59.0, 34.0, 34.0, 29.0, 16.0, 18.0, 10.0, 11.0, 6.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-54.21875, -52.4765625, -50.734375, -48.9921875, -47.25, -45.5078125, -43.765625, -42.0234375, -40.28125, -38.5390625, -36.796875, -35.0546875, -33.3125, -31.5703125, -29.828125, -28.0859375, -26.34375, -24.6015625, -22.859375, -21.1171875, -19.375, -17.6328125, -15.890625, -14.1484375, -12.40625, -10.6640625, -8.921875, -7.1796875, -5.4375, -3.6953125, -1.953125, -0.2109375, 1.53125, 3.2734375, 5.015625, 6.7578125, 8.5, 10.2421875, 11.984375, 13.7265625, 15.46875, 17.2109375, 18.953125, 20.6953125, 22.4375, 24.1796875, 25.921875, 27.6640625, 29.40625, 31.1484375, 32.890625, 34.6328125, 36.375, 38.1171875, 39.859375, 41.6015625, 43.34375, 45.0859375, 46.828125, 48.5703125, 50.3125, 52.0546875, 53.796875, 55.5390625, 57.28125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 9.0, 13.0, 14.0, 15.0, 49.0, 56.0, 82.0, 128.0, 226.0, 523.0, 2063.0, 3133531.0, 7569.0, 739.0, 251.0, 157.0, 99.0, 68.0, 39.0, 28.0, 16.0, 12.0, 8.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-186.0, -180.478515625, -174.95703125, -169.435546875, -163.9140625, -158.392578125, -152.87109375, -147.349609375, -141.828125, -136.306640625, -130.78515625, -125.263671875, -119.7421875, -114.220703125, -108.69921875, -103.177734375, -97.65625, -92.134765625, -86.61328125, -81.091796875, -75.5703125, -70.048828125, -64.52734375, -59.005859375, -53.484375, -47.962890625, -42.44140625, -36.919921875, -31.3984375, -25.876953125, -20.35546875, -14.833984375, -9.3125, -3.791015625, 1.73046875, 7.251953125, 12.7734375, 18.294921875, 23.81640625, 29.337890625, 34.859375, 40.380859375, 45.90234375, 51.423828125, 56.9453125, 62.466796875, 67.98828125, 73.509765625, 79.03125, 84.552734375, 90.07421875, 95.595703125, 101.1171875, 106.638671875, 112.16015625, 117.681640625, 123.203125, 128.724609375, 134.24609375, 139.767578125, 145.2890625, 150.810546875, 156.33203125, 161.853515625, 167.375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 98.0, 817.0, 95.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-659.046142578125, -645.7333984375, -632.4207153320312, -619.1079711914062, -605.7952270507812, -592.4825439453125, -579.1697998046875, -565.8570556640625, -552.5443725585938, -539.2316284179688, -525.9189453125, -512.606201171875, -499.2934875488281, -485.9807434082031, -472.66802978515625, -459.35528564453125, -446.04254150390625, -432.7298278808594, -419.4170837402344, -406.1043701171875, -392.7916564941406, -379.4789123535156, -366.16619873046875, -352.85345458984375, -339.540771484375, -326.2280578613281, -312.9153137207031, -299.60260009765625, -286.2898864746094, -272.9771423339844, -259.6644287109375, -246.35169982910156, -233.0389862060547, -219.72625732421875, -206.41354370117188, -193.10081481933594, -179.7880859375, -166.47537231445312, -153.1626434326172, -139.84991455078125, -126.53719329833984, -113.22447204589844, -99.9117431640625, -86.5990219116211, -73.28630065917969, -59.97357177734375, -46.660850524902344, -33.348121643066406, -20.035400390625, -6.7226762771606445, 6.590047836303711, 19.90277099609375, 33.21549606323242, 46.528221130371094, 59.8409423828125, 73.15367126464844, 86.46639251708984, 99.77911376953125, 113.09184265136719, 126.4045639038086, 139.71728515625, 153.03001403808594, 166.34274291992188, 179.65545654296875, 192.9681854248047]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 6.0, 2.0, 3.0, 6.0, 10.0, 7.0, 12.0, 15.0, 20.0, 18.0, 17.0, 22.0, 23.0, 25.0, 30.0, 34.0, 29.0, 27.0, 33.0, 27.0, 34.0, 45.0, 42.0, 47.0, 40.0, 45.0, 36.0, 33.0, 28.0, 38.0, 28.0, 30.0, 34.0, 34.0, 26.0, 18.0, 14.0, 14.0, 13.0, 10.0, 10.0, 5.0, 6.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-111.92774963378906, -108.70206451416016, -105.47638702392578, -102.25070190429688, -99.02501678466797, -95.79933166503906, -92.57365417480469, -89.34796905517578, -86.12228393554688, -82.89659881591797, -79.6709213256836, -76.44523620605469, -73.21955108642578, -69.99386596679688, -66.7681884765625, -63.542503356933594, -60.31682586669922, -57.09114456176758, -53.86545944213867, -50.63977813720703, -47.414093017578125, -44.188411712646484, -40.962730407714844, -37.73704528808594, -34.5113639831543, -31.285680770874023, -28.05999755859375, -24.83431625366211, -21.608633041381836, -18.382949829101562, -15.157268524169922, -11.931585311889648, -8.705902099609375, -5.48021936416626, -2.2545366287231445, 0.9711456298828125, 4.196828842163086, 7.422512054443359, 10.648193359375, 13.873876571655273, 17.099559783935547, 20.32524299621582, 23.550926208496094, 26.776607513427734, 30.002290725708008, 33.22797393798828, 36.45365524291992, 39.67933654785156, 42.90502166748047, 46.13070297241211, 49.356388092041016, 52.582069396972656, 55.80775451660156, 59.0334358215332, 62.259117126464844, 65.48480224609375, 68.71047973632812, 71.93616485595703, 75.1618423461914, 78.38752746582031, 81.61321258544922, 84.83889770507812, 88.0645751953125, 91.2902603149414, 94.51594543457031]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 7.0, 12.0, 11.0, 14.0, 14.0, 16.0, 21.0, 19.0, 18.0, 27.0, 42.0, 34.0, 26.0, 61.0, 55.0, 51.0, 49.0, 50.0, 51.0, 47.0, 46.0, 43.0, 41.0, 44.0, 36.0, 23.0, 27.0, 23.0, 16.0, 13.0, 16.0, 15.0, 5.0, 3.0, 5.0, 1.0, 4.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.4921875, -14.0443115234375, -13.596435546875, -13.1485595703125, -12.70068359375, -12.2528076171875, -11.804931640625, -11.3570556640625, -10.9091796875, -10.4613037109375, -10.013427734375, -9.5655517578125, -9.11767578125, -8.6697998046875, -8.221923828125, -7.7740478515625, -7.326171875, -6.8782958984375, -6.430419921875, -5.9825439453125, -5.53466796875, -5.0867919921875, -4.638916015625, -4.1910400390625, -3.7431640625, -3.2952880859375, -2.847412109375, -2.3995361328125, -1.95166015625, -1.5037841796875, -1.055908203125, -0.6080322265625, -0.16015625, 0.2877197265625, 0.735595703125, 1.1834716796875, 1.63134765625, 2.0792236328125, 2.527099609375, 2.9749755859375, 3.4228515625, 3.8707275390625, 4.318603515625, 4.7664794921875, 5.21435546875, 5.6622314453125, 6.110107421875, 6.5579833984375, 7.005859375, 7.4537353515625, 7.901611328125, 8.3494873046875, 8.79736328125, 9.2452392578125, 9.693115234375, 10.1409912109375, 10.5888671875, 11.0367431640625, 11.484619140625, 11.9324951171875, 12.38037109375, 12.8282470703125, 13.276123046875, 13.7239990234375, 14.171875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 6.0, 4.0, 8.0, 7.0, 11.0, 12.0, 17.0, 26.0, 32.0, 51.0, 63.0, 97.0, 144.0, 241.0, 342.0, 532.0, 1024.0, 2046.0, 4309.0, 11376.0, 44304.0, 280883.0, 1641934.0, 1809204.0, 328077.0, 48149.0, 12117.0, 4608.0, 2035.0, 997.0, 586.0, 342.0, 214.0, 143.0, 97.0, 65.0, 39.0, 51.0, 20.0, 18.0, 20.0, 8.0, 7.0, 7.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-22.09375, -21.463134765625, -20.83251953125, -20.201904296875, -19.5712890625, -18.940673828125, -18.31005859375, -17.679443359375, -17.048828125, -16.418212890625, -15.78759765625, -15.156982421875, -14.5263671875, -13.895751953125, -13.26513671875, -12.634521484375, -12.00390625, -11.373291015625, -10.74267578125, -10.112060546875, -9.4814453125, -8.850830078125, -8.22021484375, -7.589599609375, -6.958984375, -6.328369140625, -5.69775390625, -5.067138671875, -4.4365234375, -3.805908203125, -3.17529296875, -2.544677734375, -1.9140625, -1.283447265625, -0.65283203125, -0.022216796875, 0.6083984375, 1.239013671875, 1.86962890625, 2.500244140625, 3.130859375, 3.761474609375, 4.39208984375, 5.022705078125, 5.6533203125, 6.283935546875, 6.91455078125, 7.545166015625, 8.17578125, 8.806396484375, 9.43701171875, 10.067626953125, 10.6982421875, 11.328857421875, 11.95947265625, 12.590087890625, 13.220703125, 13.851318359375, 14.48193359375, 15.112548828125, 15.7431640625, 16.373779296875, 17.00439453125, 17.635009765625, 18.265625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 19.0, 100.0, 1099.0, 2500.0, 329.0, 26.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.375, -152.490234375, -147.60546875, -142.720703125, -137.8359375, -132.951171875, -128.06640625, -123.181640625, -118.296875, -113.412109375, -108.52734375, -103.642578125, -98.7578125, -93.873046875, -88.98828125, -84.103515625, -79.21875, -74.333984375, -69.44921875, -64.564453125, -59.6796875, -54.794921875, -49.91015625, -45.025390625, -40.140625, -35.255859375, -30.37109375, -25.486328125, -20.6015625, -15.716796875, -10.83203125, -5.947265625, -1.0625, 3.822265625, 8.70703125, 13.591796875, 18.4765625, 23.361328125, 28.24609375, 33.130859375, 38.015625, 42.900390625, 47.78515625, 52.669921875, 57.5546875, 62.439453125, 67.32421875, 72.208984375, 77.09375, 81.978515625, 86.86328125, 91.748046875, 96.6328125, 101.517578125, 106.40234375, 111.287109375, 116.171875, 121.056640625, 125.94140625, 130.826171875, 135.7109375, 140.595703125, 145.48046875, 150.365234375, 155.25]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 22.0, 44.0, 133.0, 577.0, 3372.0, 4184753.0, 4458.0, 670.0, 163.0, 41.0, 22.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-235.375, -227.912109375, -220.44921875, -212.986328125, -205.5234375, -198.060546875, -190.59765625, -183.134765625, -175.671875, -168.208984375, -160.74609375, -153.283203125, -145.8203125, -138.357421875, -130.89453125, -123.431640625, -115.96875, -108.505859375, -101.04296875, -93.580078125, -86.1171875, -78.654296875, -71.19140625, -63.728515625, -56.265625, -48.802734375, -41.33984375, -33.876953125, -26.4140625, -18.951171875, -11.48828125, -4.025390625, 3.4375, 10.900390625, 18.36328125, 25.826171875, 33.2890625, 40.751953125, 48.21484375, 55.677734375, 63.140625, 70.603515625, 78.06640625, 85.529296875, 92.9921875, 100.455078125, 107.91796875, 115.380859375, 122.84375, 130.306640625, 137.76953125, 145.232421875, 152.6953125, 160.158203125, 167.62109375, 175.083984375, 182.546875, 190.009765625, 197.47265625, 204.935546875, 212.3984375, 219.861328125, 227.32421875, 234.787109375, 242.25]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 16.0, 201.0, 654.0, 135.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-563.9052734375, -552.4888305664062, -541.0723266601562, -529.6558837890625, -518.2394409179688, -506.8229675292969, -495.406494140625, -483.99005126953125, -472.5736083984375, -461.1571350097656, -449.7406921386719, -438.32421875, -426.90777587890625, -415.4913024902344, -404.0748291015625, -392.65838623046875, -381.2419128417969, -369.825439453125, -358.40899658203125, -346.9925231933594, -335.5760803222656, -324.15960693359375, -312.7431640625, -301.3266906738281, -289.91021728515625, -278.4937438964844, -267.0773010253906, -255.66082763671875, -244.244384765625, -232.82791137695312, -221.4114532470703, -209.9949951171875, -198.57855224609375, -187.16209411621094, -175.74563598632812, -164.32916259765625, -152.9127197265625, -141.49624633789062, -130.0797882080078, -118.663330078125, -107.24687194824219, -95.83041381835938, -84.41395568847656, -72.99748992919922, -61.581031799316406, -50.164573669433594, -38.74810791015625, -27.331649780273438, -15.915191650390625, -4.49873161315918, 6.917728424072266, 18.334190368652344, 29.750648498535156, 41.16710662841797, 52.58357238769531, 64.00003051757812, 75.41648864746094, 86.83294677734375, 98.24940490722656, 109.6658706665039, 121.08232879638672, 132.498779296875, 143.91525268554688, 155.3317108154297, 166.7481689453125]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 3.0, 6.0, 6.0, 10.0, 8.0, 12.0, 19.0, 19.0, 16.0, 21.0, 28.0, 22.0, 33.0, 39.0, 38.0, 19.0, 31.0, 52.0, 48.0, 32.0, 43.0, 36.0, 48.0, 35.0, 46.0, 41.0, 36.0, 38.0, 32.0, 34.0, 23.0, 19.0, 15.0, 14.0, 17.0, 14.0, 9.0, 9.0, 11.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.65288543701172, -94.69966888427734, -91.74644470214844, -88.79322814941406, -85.84001159667969, -82.88679504394531, -79.93357849121094, -76.98035430908203, -74.02713775634766, -71.07392120361328, -68.12069702148438, -65.16748046875, -62.214263916015625, -59.26104736328125, -56.30782699584961, -53.35460662841797, -50.401390075683594, -47.44817352294922, -44.49495315551758, -41.54173278808594, -38.58851623535156, -35.63529968261719, -32.68207931518555, -29.72886085510254, -26.77564239501953, -23.822423934936523, -20.869205474853516, -17.915987014770508, -14.9627685546875, -12.009550094604492, -9.056331634521484, -6.103113174438477, -3.1498947143554688, -0.19667625427246094, 2.756542205810547, 5.709760665893555, 8.662979125976562, 11.61619758605957, 14.569416046142578, 17.522634506225586, 20.475852966308594, 23.4290714263916, 26.38228988647461, 29.335508346557617, 32.288726806640625, 35.241943359375, 38.19516372680664, 41.14838409423828, 44.101600646972656, 47.05481719970703, 50.00803756713867, 52.96125793457031, 55.91447448730469, 58.86769104003906, 61.8209114074707, 64.77413177490234, 67.72734832763672, 70.6805648803711, 73.6337890625, 76.58700561523438, 79.54022216796875, 82.49343872070312, 85.4466552734375, 88.3998794555664, 91.35309600830078]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 5.0, 10.0, 9.0, 17.0, 17.0, 14.0, 27.0, 27.0, 20.0, 30.0, 40.0, 42.0, 53.0, 36.0, 69.0, 50.0, 54.0, 41.0, 57.0, 40.0, 44.0, 43.0, 47.0, 33.0, 36.0, 32.0, 14.0, 20.0, 13.0, 9.0, 11.0, 4.0, 8.0, 6.0, 5.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-15.0234375, -14.613037109375, -14.20263671875, -13.792236328125, -13.3818359375, -12.971435546875, -12.56103515625, -12.150634765625, -11.740234375, -11.329833984375, -10.91943359375, -10.509033203125, -10.0986328125, -9.688232421875, -9.27783203125, -8.867431640625, -8.45703125, -8.046630859375, -7.63623046875, -7.225830078125, -6.8154296875, -6.405029296875, -5.99462890625, -5.584228515625, -5.173828125, -4.763427734375, -4.35302734375, -3.942626953125, -3.5322265625, -3.121826171875, -2.71142578125, -2.301025390625, -1.890625, -1.480224609375, -1.06982421875, -0.659423828125, -0.2490234375, 0.161376953125, 0.57177734375, 0.982177734375, 1.392578125, 1.802978515625, 2.21337890625, 2.623779296875, 3.0341796875, 3.444580078125, 3.85498046875, 4.265380859375, 4.67578125, 5.086181640625, 5.49658203125, 5.906982421875, 6.3173828125, 6.727783203125, 7.13818359375, 7.548583984375, 7.958984375, 8.369384765625, 8.77978515625, 9.190185546875, 9.6005859375, 10.010986328125, 10.42138671875, 10.831787109375, 11.2421875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 5.0, 11.0, 22.0, 27.0, 35.0, 60.0, 101.0, 144.0, 264.0, 337.0, 583.0, 839.0, 1415.0, 2162.0, 3492.0, 5685.0, 9726.0, 16448.0, 29034.0, 52710.0, 105408.0, 294536.0, 295838.0, 106076.0, 53253.0, 28679.0, 16369.0, 9734.0, 5918.0, 3619.0, 2225.0, 1364.0, 880.0, 523.0, 329.0, 229.0, 168.0, 89.0, 71.0, 46.0, 33.0, 19.0, 20.0, 9.0, 8.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.884765625, -2.7999267578125, -2.715087890625, -2.6302490234375, -2.54541015625, -2.4605712890625, -2.375732421875, -2.2908935546875, -2.2060546875, -2.1212158203125, -2.036376953125, -1.9515380859375, -1.86669921875, -1.7818603515625, -1.697021484375, -1.6121826171875, -1.52734375, -1.4425048828125, -1.357666015625, -1.2728271484375, -1.18798828125, -1.1031494140625, -1.018310546875, -0.9334716796875, -0.8486328125, -0.7637939453125, -0.678955078125, -0.5941162109375, -0.50927734375, -0.4244384765625, -0.339599609375, -0.2547607421875, -0.169921875, -0.0850830078125, -0.000244140625, 0.0845947265625, 0.16943359375, 0.2542724609375, 0.339111328125, 0.4239501953125, 0.5087890625, 0.5936279296875, 0.678466796875, 0.7633056640625, 0.84814453125, 0.9329833984375, 1.017822265625, 1.1026611328125, 1.1875, 1.2723388671875, 1.357177734375, 1.4420166015625, 1.52685546875, 1.6116943359375, 1.696533203125, 1.7813720703125, 1.8662109375, 1.9510498046875, 2.035888671875, 2.1207275390625, 2.20556640625, 2.2904052734375, 2.375244140625, 2.4600830078125, 2.544921875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 10.0, 9.0, 13.0, 14.0, 21.0, 20.0, 25.0, 29.0, 20.0, 31.0, 32.0, 43.0, 48.0, 52.0, 40.0, 38.0, 44.0, 1070.0, 38.0, 47.0, 33.0, 40.0, 37.0, 35.0, 37.0, 36.0, 26.0, 22.0, 20.0, 16.0, 20.0, 11.0, 7.0, 7.0, 3.0, 7.0, 6.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.6015625, -6.3673095703125, -6.133056640625, -5.8988037109375, -5.66455078125, -5.4302978515625, -5.196044921875, -4.9617919921875, -4.7275390625, -4.4932861328125, -4.259033203125, -4.0247802734375, -3.79052734375, -3.5562744140625, -3.322021484375, -3.0877685546875, -2.853515625, -2.6192626953125, -2.385009765625, -2.1507568359375, -1.91650390625, -1.6822509765625, -1.447998046875, -1.2137451171875, -0.9794921875, -0.7452392578125, -0.510986328125, -0.2767333984375, -0.04248046875, 0.1917724609375, 0.426025390625, 0.6602783203125, 0.89453125, 1.1287841796875, 1.363037109375, 1.5972900390625, 1.83154296875, 2.0657958984375, 2.300048828125, 2.5343017578125, 2.7685546875, 3.0028076171875, 3.237060546875, 3.4713134765625, 3.70556640625, 3.9398193359375, 4.174072265625, 4.4083251953125, 4.642578125, 4.8768310546875, 5.111083984375, 5.3453369140625, 5.57958984375, 5.8138427734375, 6.048095703125, 6.2823486328125, 6.5166015625, 6.7508544921875, 6.985107421875, 7.2193603515625, 7.45361328125, 7.6878662109375, 7.922119140625, 8.1563720703125, 8.390625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 9.0, 14.0, 21.0, 19.0, 30.0, 40.0, 64.0, 97.0, 156.0, 184.0, 305.0, 473.0, 734.0, 1070.0, 1656.0, 2645.0, 4258.0, 7127.0, 11700.0, 19798.0, 33381.0, 58458.0, 112982.0, 1355429.0, 252190.0, 102332.0, 54148.0, 30887.0, 18075.0, 11015.0, 6725.0, 4105.0, 2470.0, 1600.0, 1004.0, 656.0, 419.0, 294.0, 191.0, 127.0, 77.0, 48.0, 36.0, 24.0, 18.0, 14.0, 10.0, 9.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.525390625, -2.450958251953125, -2.37652587890625, -2.302093505859375, -2.2276611328125, -2.153228759765625, -2.07879638671875, -2.004364013671875, -1.929931640625, -1.855499267578125, -1.78106689453125, -1.706634521484375, -1.6322021484375, -1.557769775390625, -1.48333740234375, -1.408905029296875, -1.33447265625, -1.260040283203125, -1.18560791015625, -1.111175537109375, -1.0367431640625, -0.962310791015625, -0.88787841796875, -0.813446044921875, -0.739013671875, -0.664581298828125, -0.59014892578125, -0.515716552734375, -0.4412841796875, -0.366851806640625, -0.29241943359375, -0.217987060546875, -0.1435546875, -0.069122314453125, 0.00531005859375, 0.079742431640625, 0.1541748046875, 0.228607177734375, 0.30303955078125, 0.377471923828125, 0.451904296875, 0.526336669921875, 0.60076904296875, 0.675201416015625, 0.7496337890625, 0.824066162109375, 0.89849853515625, 0.972930908203125, 1.04736328125, 1.121795654296875, 1.19622802734375, 1.270660400390625, 1.3450927734375, 1.419525146484375, 1.49395751953125, 1.568389892578125, 1.642822265625, 1.717254638671875, 1.79168701171875, 1.866119384765625, 1.9405517578125, 2.014984130859375, 2.08941650390625, 2.163848876953125, 2.23828125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 9.0, 2.0, 14.0, 16.0, 22.0, 15.0, 23.0, 30.0, 39.0, 51.0, 70.0, 89.0, 121.0, 99.0, 103.0, 71.0, 44.0, 41.0, 30.0, 27.0, 16.0, 13.0, 15.0, 14.0, 11.0, 8.0, 8.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017290115356445312, -0.0016824603080749512, -0.001635909080505371, -0.001589357852935791, -0.001542806625366211, -0.0014962553977966309, -0.0014497041702270508, -0.0014031529426574707, -0.0013566017150878906, -0.0013100504875183105, -0.0012634992599487305, -0.0012169480323791504, -0.0011703968048095703, -0.0011238455772399902, -0.0010772943496704102, -0.00103074312210083, -0.00098419189453125, -0.0009376406669616699, -0.0008910894393920898, -0.0008445382118225098, -0.0007979869842529297, -0.0007514357566833496, -0.0007048845291137695, -0.0006583333015441895, -0.0006117820739746094, -0.0005652308464050293, -0.0005186796188354492, -0.00047212839126586914, -0.00042557716369628906, -0.000379025936126709, -0.0003324747085571289, -0.00028592348098754883, -0.00023937225341796875, -0.00019282102584838867, -0.0001462697982788086, -9.971857070922852e-05, -5.316734313964844e-05, -6.616115570068359e-06, 3.993511199951172e-05, 8.64863395690918e-05, 0.00013303756713867188, 0.00017958879470825195, 0.00022614002227783203, 0.0002726912498474121, 0.0003192424774169922, 0.00036579370498657227, 0.00041234493255615234, 0.0004588961601257324, 0.0005054473876953125, 0.0005519986152648926, 0.0005985498428344727, 0.0006451010704040527, 0.0006916522979736328, 0.0007382035255432129, 0.000784754753112793, 0.000831305980682373, 0.0008778572082519531, 0.0009244084358215332, 0.0009709596633911133, 0.0010175108909606934, 0.0010640621185302734, 0.0011106133460998535, 0.0011571645736694336, 0.0012037158012390137, 0.0012502670288085938]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 6.0, 5.0, 11.0, 19.0, 27.0, 29.0, 37.0, 55.0, 81.0, 101.0, 168.0, 245.0, 414.0, 758.0, 4905.0, 1038174.0, 1818.0, 671.0, 357.0, 222.0, 112.0, 91.0, 73.0, 44.0, 40.0, 20.0, 25.0, 12.0, 10.0, 6.0, 4.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.02886962890625, -0.027977466583251953, -0.027085304260253906, -0.02619314193725586, -0.025300979614257812, -0.024408817291259766, -0.02351665496826172, -0.022624492645263672, -0.021732330322265625, -0.020840167999267578, -0.01994800567626953, -0.019055843353271484, -0.018163681030273438, -0.01727151870727539, -0.016379356384277344, -0.015487194061279297, -0.01459503173828125, -0.013702869415283203, -0.012810707092285156, -0.01191854476928711, -0.011026382446289062, -0.010134220123291016, -0.009242057800292969, -0.008349895477294922, -0.007457733154296875, -0.006565570831298828, -0.005673408508300781, -0.004781246185302734, -0.0038890838623046875, -0.0029969215393066406, -0.0021047592163085938, -0.0012125968933105469, -0.0003204345703125, 0.0005717277526855469, 0.0014638900756835938, 0.0023560523986816406, 0.0032482147216796875, 0.004140377044677734, 0.005032539367675781, 0.005924701690673828, 0.006816864013671875, 0.007709026336669922, 0.008601188659667969, 0.009493350982666016, 0.010385513305664062, 0.01127767562866211, 0.012169837951660156, 0.013062000274658203, 0.01395416259765625, 0.014846324920654297, 0.015738487243652344, 0.01663064956665039, 0.017522811889648438, 0.018414974212646484, 0.01930713653564453, 0.020199298858642578, 0.021091461181640625, 0.021983623504638672, 0.02287578582763672, 0.023767948150634766, 0.024660110473632812, 0.02555227279663086, 0.026444435119628906, 0.027336597442626953, 0.028228759765625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 16.0, 867.0, 127.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016239110846072435, -0.0014713670825585723, -0.0013188229640945792, -0.001166278962045908, -0.001013734843581915, -0.0008611908415332437, -0.0007086468394845724, -0.0005561027210205793, -0.0004035587189719081, -0.00025101465871557593, -9.847062756307423e-05, 5.407340358942747e-05, 0.00020661746384575963, 0.0003591615241020918, 0.000511705526150763, 0.0006642496446147561, 0.0008167936466634274, 0.0009693377069197595, 0.0011218817671760917, 0.001274425769224763, 0.001426969887688756, 0.0015795138897374272, 0.0017320578917860985, 0.0018846020102500916, 0.0020371461287140846, 0.0021896902471780777, 0.002342234132811427, 0.00249477825127542, 0.0026473223697394133, 0.0027998662553727627, 0.0029524103738367558, 0.003104954492300749, 0.003257498610764742, 0.003410042729228735, 0.0035625866148620844, 0.0037151307333260775, 0.0038676748517900705, 0.00402021873742342, 0.004172762855887413, 0.004325306974351406, 0.004477851092815399, 0.004630395211279392, 0.004782939329743385, 0.004935483448207378, 0.005088027101010084, 0.005240571219474077, 0.00539311533793807, 0.005545659456402063, 0.005698203109204769, 0.005850747227668762, 0.006003291346132755, 0.006155835464596748, 0.006308379117399454, 0.006460923235863447, 0.00661346735432744, 0.006766011472791433, 0.006918555591255426, 0.0070710997097194195, 0.0072236438281834126, 0.007376187480986118, 0.007528731599450111, 0.0076812757179141045, 0.007833819836378098, 0.00798636395484209, 0.008138908073306084]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 0.0, 1.0, 9.0, 3.0, 6.0, 9.0, 14.0, 11.0, 24.0, 17.0, 17.0, 14.0, 14.0, 23.0, 20.0, 29.0, 27.0, 35.0, 38.0, 35.0, 33.0, 42.0, 31.0, 44.0, 42.0, 43.0, 45.0, 49.0, 34.0, 27.0, 33.0, 28.0, 32.0, 19.0, 22.0, 17.0, 14.0, 23.0, 16.0, 10.0, 10.0, 12.0, 6.0, 7.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.00047343969345092773, -0.0004579499363899231, -0.00044246017932891846, -0.0004269704222679138, -0.0004114806652069092, -0.00039599090814590454, -0.0003805011510848999, -0.00036501139402389526, -0.0003495216369628906, -0.000334031879901886, -0.00031854212284088135, -0.0003030523657798767, -0.00028756260871887207, -0.00027207285165786743, -0.0002565830945968628, -0.00024109333753585815, -0.00022560358047485352, -0.00021011382341384888, -0.00019462406635284424, -0.0001791343092918396, -0.00016364455223083496, -0.00014815479516983032, -0.00013266503810882568, -0.00011717528104782104, -0.0001016855239868164, -8.619576692581177e-05, -7.070600986480713e-05, -5.521625280380249e-05, -3.972649574279785e-05, -2.4236738681793213e-05, -8.746981620788574e-06, 6.7427754402160645e-06, 2.2232532501220703e-05, 3.772228956222534e-05, 5.321204662322998e-05, 6.870180368423462e-05, 8.419156074523926e-05, 9.96813178062439e-05, 0.00011517107486724854, 0.00013066083192825317, 0.0001461505889892578, 0.00016164034605026245, 0.0001771301031112671, 0.00019261986017227173, 0.00020810961723327637, 0.000223599374294281, 0.00023908913135528564, 0.0002545788884162903, 0.0002700686454772949, 0.00028555840253829956, 0.0003010481595993042, 0.00031653791666030884, 0.0003320276737213135, 0.0003475174307823181, 0.00036300718784332275, 0.0003784969449043274, 0.00039398670196533203, 0.00040947645902633667, 0.0004249662160873413, 0.00044045597314834595, 0.0004559457302093506, 0.0004714354872703552, 0.00048692524433135986, 0.0005024150013923645, 0.0005179047584533691]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 5.0, 10.0, 9.0, 17.0, 17.0, 14.0, 27.0, 27.0, 20.0, 30.0, 40.0, 42.0, 53.0, 36.0, 69.0, 50.0, 54.0, 41.0, 57.0, 40.0, 44.0, 43.0, 47.0, 33.0, 36.0, 32.0, 14.0, 20.0, 13.0, 9.0, 11.0, 4.0, 8.0, 6.0, 5.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-15.0234375, -14.613037109375, -14.20263671875, -13.792236328125, -13.3818359375, -12.971435546875, -12.56103515625, -12.150634765625, -11.740234375, -11.329833984375, -10.91943359375, -10.509033203125, -10.0986328125, -9.688232421875, -9.27783203125, -8.867431640625, -8.45703125, -8.046630859375, -7.63623046875, -7.225830078125, -6.8154296875, -6.405029296875, -5.99462890625, -5.584228515625, -5.173828125, -4.763427734375, -4.35302734375, -3.942626953125, -3.5322265625, -3.121826171875, -2.71142578125, -2.301025390625, -1.890625, -1.480224609375, -1.06982421875, -0.659423828125, -0.2490234375, 0.161376953125, 0.57177734375, 0.982177734375, 1.392578125, 1.802978515625, 2.21337890625, 2.623779296875, 3.0341796875, 3.444580078125, 3.85498046875, 4.265380859375, 4.67578125, 5.086181640625, 5.49658203125, 5.906982421875, 6.3173828125, 6.727783203125, 7.13818359375, 7.548583984375, 7.958984375, 8.369384765625, 8.77978515625, 9.190185546875, 9.6005859375, 10.010986328125, 10.42138671875, 10.831787109375, 11.2421875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 11.0, 16.0, 28.0, 33.0, 41.0, 54.0, 97.0, 130.0, 193.0, 261.0, 475.0, 782.0, 1480.0, 3265.0, 9356.0, 34469.0, 230826.0, 659684.0, 80030.0, 16932.0, 5396.0, 2198.0, 1093.0, 615.0, 375.0, 210.0, 162.0, 94.0, 67.0, 38.0, 36.0, 24.0, 16.0, 10.0, 10.0, 16.0, 8.0, 6.0, 0.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-27.59375, -26.83251953125, -26.0712890625, -25.31005859375, -24.548828125, -23.78759765625, -23.0263671875, -22.26513671875, -21.50390625, -20.74267578125, -19.9814453125, -19.22021484375, -18.458984375, -17.69775390625, -16.9365234375, -16.17529296875, -15.4140625, -14.65283203125, -13.8916015625, -13.13037109375, -12.369140625, -11.60791015625, -10.8466796875, -10.08544921875, -9.32421875, -8.56298828125, -7.8017578125, -7.04052734375, -6.279296875, -5.51806640625, -4.7568359375, -3.99560546875, -3.234375, -2.47314453125, -1.7119140625, -0.95068359375, -0.189453125, 0.57177734375, 1.3330078125, 2.09423828125, 2.85546875, 3.61669921875, 4.3779296875, 5.13916015625, 5.900390625, 6.66162109375, 7.4228515625, 8.18408203125, 8.9453125, 9.70654296875, 10.4677734375, 11.22900390625, 11.990234375, 12.75146484375, 13.5126953125, 14.27392578125, 15.03515625, 15.79638671875, 16.5576171875, 17.31884765625, 18.080078125, 18.84130859375, 19.6025390625, 20.36376953125, 21.125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 6.0, 12.0, 24.0, 23.0, 34.0, 41.0, 52.0, 54.0, 72.0, 93.0, 272.0, 1878.0, 111.0, 82.0, 66.0, 63.0, 46.0, 30.0, 17.0, 14.0, 15.0, 4.0, 11.0, 5.0, 2.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.46875, -48.7998046875, -47.130859375, -45.4619140625, -43.79296875, -42.1240234375, -40.455078125, -38.7861328125, -37.1171875, -35.4482421875, -33.779296875, -32.1103515625, -30.44140625, -28.7724609375, -27.103515625, -25.4345703125, -23.765625, -22.0966796875, -20.427734375, -18.7587890625, -17.08984375, -15.4208984375, -13.751953125, -12.0830078125, -10.4140625, -8.7451171875, -7.076171875, -5.4072265625, -3.73828125, -2.0693359375, -0.400390625, 1.2685546875, 2.9375, 4.6064453125, 6.275390625, 7.9443359375, 9.61328125, 11.2822265625, 12.951171875, 14.6201171875, 16.2890625, 17.9580078125, 19.626953125, 21.2958984375, 22.96484375, 24.6337890625, 26.302734375, 27.9716796875, 29.640625, 31.3095703125, 32.978515625, 34.6474609375, 36.31640625, 37.9853515625, 39.654296875, 41.3232421875, 42.9921875, 44.6611328125, 46.330078125, 47.9990234375, 49.66796875, 51.3369140625, 53.005859375, 54.6748046875, 56.34375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 5.0, 3.0, 10.0, 15.0, 13.0, 19.0, 40.0, 61.0, 71.0, 155.0, 317.0, 993.0, 75863.0, 3065961.0, 1294.0, 427.0, 169.0, 87.0, 64.0, 37.0, 32.0, 26.0, 16.0, 5.0, 6.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-165.375, -160.525390625, -155.67578125, -150.826171875, -145.9765625, -141.126953125, -136.27734375, -131.427734375, -126.578125, -121.728515625, -116.87890625, -112.029296875, -107.1796875, -102.330078125, -97.48046875, -92.630859375, -87.78125, -82.931640625, -78.08203125, -73.232421875, -68.3828125, -63.533203125, -58.68359375, -53.833984375, -48.984375, -44.134765625, -39.28515625, -34.435546875, -29.5859375, -24.736328125, -19.88671875, -15.037109375, -10.1875, -5.337890625, -0.48828125, 4.361328125, 9.2109375, 14.060546875, 18.91015625, 23.759765625, 28.609375, 33.458984375, 38.30859375, 43.158203125, 48.0078125, 52.857421875, 57.70703125, 62.556640625, 67.40625, 72.255859375, 77.10546875, 81.955078125, 86.8046875, 91.654296875, 96.50390625, 101.353515625, 106.203125, 111.052734375, 115.90234375, 120.751953125, 125.6015625, 130.451171875, 135.30078125, 140.150390625, 145.0]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 16.0, 154.0, 718.0, 115.0, 12.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-300.0871887207031, -293.89129638671875, -287.6954040527344, -281.4995422363281, -275.30364990234375, -269.1077575683594, -262.911865234375, -256.7159729003906, -250.5200958251953, -244.32420349121094, -238.12832641601562, -231.93243408203125, -225.73654174804688, -219.54066467285156, -213.3447723388672, -207.14889526367188, -200.9530029296875, -194.75711059570312, -188.5612335205078, -182.36534118652344, -176.16946411132812, -169.97357177734375, -163.77767944335938, -157.581787109375, -151.3859100341797, -145.1900177001953, -138.994140625, -132.79824829101562, -126.60236358642578, -120.40647888183594, -114.21058654785156, -108.01470184326172, -101.81880950927734, -95.6229248046875, -89.42703247070312, -83.23114776611328, -77.03526306152344, -70.8393783569336, -64.64349365234375, -58.447601318359375, -52.25171661376953, -46.05583190917969, -39.85994338989258, -33.66405487060547, -27.468170166015625, -21.27228355407715, -15.076396942138672, -8.880508422851562, -2.6846237182617188, 3.511262893676758, 9.707149505615234, 15.903036117553711, 22.098922729492188, 28.294809341430664, 34.49069595336914, 40.68658447265625, 46.882469177246094, 53.07835388183594, 59.27424240112305, 65.47013092041016, 71.666015625, 77.86190032958984, 84.05778503417969, 90.25367736816406, 96.4495620727539]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 1.0, 7.0, 4.0, 5.0, 4.0, 5.0, 7.0, 12.0, 11.0, 16.0, 12.0, 16.0, 19.0, 18.0, 22.0, 27.0, 22.0, 42.0, 33.0, 35.0, 33.0, 43.0, 37.0, 39.0, 33.0, 35.0, 42.0, 31.0, 39.0, 35.0, 24.0, 31.0, 31.0, 21.0, 22.0, 27.0, 36.0, 24.0, 19.0, 17.0, 15.0, 7.0, 9.0, 11.0, 5.0, 3.0, 8.0, 2.0, 6.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-88.22542572021484, -85.53599548339844, -82.8465576171875, -80.1571273803711, -77.46769714355469, -74.77825927734375, -72.08882904052734, -69.39939880371094, -66.7099609375, -64.0205307006836, -61.331092834472656, -58.64166259765625, -55.95222854614258, -53.262794494628906, -50.5733642578125, -47.88393020629883, -45.194496154785156, -42.505062103271484, -39.81562805175781, -37.126197814941406, -34.436763763427734, -31.747329711914062, -29.057897567749023, -26.368465423583984, -23.679031372070312, -20.98959732055664, -18.3001651763916, -15.610732078552246, -12.92129898071289, -10.231865882873535, -7.54243278503418, -4.853000640869141, -2.1635665893554688, 0.5258665084838867, 3.215299606323242, 5.904732704162598, 8.594165802001953, 11.283598899841309, 13.973031997680664, 16.662464141845703, 19.351898193359375, 22.041332244873047, 24.730764389038086, 27.420196533203125, 30.109630584716797, 32.79906463623047, 35.488494873046875, 38.17792892456055, 40.86736297607422, 43.55679702758789, 46.24623107910156, 48.93566131591797, 51.62509536743164, 54.31452941894531, 57.00395965576172, 59.69339370727539, 62.38282775878906, 65.07225799560547, 67.7616958618164, 70.45112609863281, 73.14056396484375, 75.82999420166016, 78.51942443847656, 81.2088623046875, 83.8982925415039]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 6.0, 9.0, 11.0, 21.0, 14.0, 24.0, 23.0, 38.0, 26.0, 43.0, 45.0, 48.0, 54.0, 50.0, 45.0, 59.0, 50.0, 40.0, 36.0, 40.0, 45.0, 41.0, 42.0, 38.0, 23.0, 16.0, 25.0, 16.0, 17.0, 16.0, 6.0, 10.0, 8.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.09375, -17.5595703125, -17.025390625, -16.4912109375, -15.95703125, -15.4228515625, -14.888671875, -14.3544921875, -13.8203125, -13.2861328125, -12.751953125, -12.2177734375, -11.68359375, -11.1494140625, -10.615234375, -10.0810546875, -9.546875, -9.0126953125, -8.478515625, -7.9443359375, -7.41015625, -6.8759765625, -6.341796875, -5.8076171875, -5.2734375, -4.7392578125, -4.205078125, -3.6708984375, -3.13671875, -2.6025390625, -2.068359375, -1.5341796875, -1.0, -0.4658203125, 0.068359375, 0.6025390625, 1.13671875, 1.6708984375, 2.205078125, 2.7392578125, 3.2734375, 3.8076171875, 4.341796875, 4.8759765625, 5.41015625, 5.9443359375, 6.478515625, 7.0126953125, 7.546875, 8.0810546875, 8.615234375, 9.1494140625, 9.68359375, 10.2177734375, 10.751953125, 11.2861328125, 11.8203125, 12.3544921875, 12.888671875, 13.4228515625, 13.95703125, 14.4912109375, 15.025390625, 15.5595703125, 16.09375]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 4.0, 4.0, 2.0, 4.0, 7.0, 11.0, 15.0, 18.0, 21.0, 31.0, 25.0, 40.0, 34.0, 41.0, 54.0, 86.0, 92.0, 127.0, 199.0, 230.0, 334.0, 446.0, 763.0, 1747.0, 7357.0, 2462960.0, 1709612.0, 5967.0, 1528.0, 745.0, 441.0, 309.0, 228.0, 171.0, 120.0, 108.0, 78.0, 59.0, 39.0, 52.0, 24.0, 29.0, 27.0, 30.0, 10.0, 12.0, 19.0, 6.0, 2.0, 7.0, 4.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0], "bins": [-89.8125, -87.0869140625, -84.361328125, -81.6357421875, -78.91015625, -76.1845703125, -73.458984375, -70.7333984375, -68.0078125, -65.2822265625, -62.556640625, -59.8310546875, -57.10546875, -54.3798828125, -51.654296875, -48.9287109375, -46.203125, -43.4775390625, -40.751953125, -38.0263671875, -35.30078125, -32.5751953125, -29.849609375, -27.1240234375, -24.3984375, -21.6728515625, -18.947265625, -16.2216796875, -13.49609375, -10.7705078125, -8.044921875, -5.3193359375, -2.59375, 0.1318359375, 2.857421875, 5.5830078125, 8.30859375, 11.0341796875, 13.759765625, 16.4853515625, 19.2109375, 21.9365234375, 24.662109375, 27.3876953125, 30.11328125, 32.8388671875, 35.564453125, 38.2900390625, 41.015625, 43.7412109375, 46.466796875, 49.1923828125, 51.91796875, 54.6435546875, 57.369140625, 60.0947265625, 62.8203125, 65.5458984375, 68.271484375, 70.9970703125, 73.72265625, 76.4482421875, 79.173828125, 81.8994140625, 84.625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 12.0, 16.0, 27.0, 65.0, 155.0, 456.0, 1062.0, 1302.0, 576.0, 232.0, 89.0, 41.0, 19.0, 12.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-68.9375, -67.442626953125, -65.94775390625, -64.452880859375, -62.9580078125, -61.463134765625, -59.96826171875, -58.473388671875, -56.978515625, -55.483642578125, -53.98876953125, -52.493896484375, -50.9990234375, -49.504150390625, -48.00927734375, -46.514404296875, -45.01953125, -43.524658203125, -42.02978515625, -40.534912109375, -39.0400390625, -37.545166015625, -36.05029296875, -34.555419921875, -33.060546875, -31.565673828125, -30.07080078125, -28.575927734375, -27.0810546875, -25.586181640625, -24.09130859375, -22.596435546875, -21.1015625, -19.606689453125, -18.11181640625, -16.616943359375, -15.1220703125, -13.627197265625, -12.13232421875, -10.637451171875, -9.142578125, -7.647705078125, -6.15283203125, -4.657958984375, -3.1630859375, -1.668212890625, -0.17333984375, 1.321533203125, 2.81640625, 4.311279296875, 5.80615234375, 7.301025390625, 8.7958984375, 10.290771484375, 11.78564453125, 13.280517578125, 14.775390625, 16.270263671875, 17.76513671875, 19.260009765625, 20.7548828125, 22.249755859375, 23.74462890625, 25.239501953125, 26.734375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 13.0, 29.0, 54.0, 109.0, 276.0, 1307.0, 25468.0, 4122565.0, 42314.0, 1610.0, 322.0, 116.0, 39.0, 27.0, 15.0, 5.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.6875, -90.080078125, -87.47265625, -84.865234375, -82.2578125, -79.650390625, -77.04296875, -74.435546875, -71.828125, -69.220703125, -66.61328125, -64.005859375, -61.3984375, -58.791015625, -56.18359375, -53.576171875, -50.96875, -48.361328125, -45.75390625, -43.146484375, -40.5390625, -37.931640625, -35.32421875, -32.716796875, -30.109375, -27.501953125, -24.89453125, -22.287109375, -19.6796875, -17.072265625, -14.46484375, -11.857421875, -9.25, -6.642578125, -4.03515625, -1.427734375, 1.1796875, 3.787109375, 6.39453125, 9.001953125, 11.609375, 14.216796875, 16.82421875, 19.431640625, 22.0390625, 24.646484375, 27.25390625, 29.861328125, 32.46875, 35.076171875, 37.68359375, 40.291015625, 42.8984375, 45.505859375, 48.11328125, 50.720703125, 53.328125, 55.935546875, 58.54296875, 61.150390625, 63.7578125, 66.365234375, 68.97265625, 71.580078125, 74.1875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 7.0, 13.0, 40.0, 80.0, 147.0, 261.0, 226.0, 127.0, 61.0, 28.0, 10.0, 8.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-424.3914794921875, -416.0339050292969, -407.6763610839844, -399.31878662109375, -390.96124267578125, -382.6036682128906, -374.24609375, -365.8885498046875, -357.5309753417969, -349.17340087890625, -340.81585693359375, -332.4582824707031, -324.1007080078125, -315.7431640625, -307.3855895996094, -299.0280456542969, -290.67047119140625, -282.3128967285156, -273.9553527832031, -265.5977783203125, -257.240234375, -248.88265991210938, -240.52508544921875, -232.1675262451172, -223.80996704101562, -215.45240783691406, -207.0948486328125, -198.73727416992188, -190.3797149658203, -182.02215576171875, -173.66458129882812, -165.30702209472656, -156.94949340820312, -148.59193420410156, -140.234375, -131.87680053710938, -123.51924133300781, -115.16168212890625, -106.80411529541016, -98.44654846191406, -90.08898162841797, -81.73141479492188, -73.37385559082031, -65.01629638671875, -56.658729553222656, -48.30116653442383, -39.943603515625, -31.586040496826172, -23.228477478027344, -14.870914459228516, -6.5133514404296875, 1.8442115783691406, 10.201774597167969, 18.559337615966797, 26.916900634765625, 35.27446365356445, 43.63202667236328, 51.98958969116211, 60.34715270996094, 68.7047119140625, 77.0622787475586, 85.41984558105469, 93.77740478515625, 102.13496398925781, 110.4925308227539]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 2.0, 4.0, 6.0, 5.0, 8.0, 11.0, 8.0, 10.0, 9.0, 14.0, 16.0, 24.0, 19.0, 26.0, 30.0, 40.0, 38.0, 29.0, 48.0, 32.0, 43.0, 38.0, 34.0, 37.0, 38.0, 45.0, 37.0, 31.0, 33.0, 32.0, 42.0, 32.0, 23.0, 30.0, 19.0, 23.0, 14.0, 13.0, 10.0, 12.0, 10.0, 11.0, 5.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.222496032714844, -57.05686569213867, -54.8912353515625, -52.725608825683594, -50.55997848510742, -48.39434814453125, -46.228721618652344, -44.06309127807617, -41.8974609375, -39.73183059692383, -37.566200256347656, -35.40057373046875, -33.23494338989258, -31.069313049316406, -28.903684616088867, -26.738056182861328, -24.572425842285156, -22.406795501708984, -20.241167068481445, -18.075538635253906, -15.909908294677734, -13.744278907775879, -11.578649520874023, -9.413020133972168, -7.2473907470703125, -5.081761360168457, -2.9161319732666016, -0.7505025863647461, 1.4151268005371094, 3.580756187438965, 5.74638557434082, 7.912014961242676, 10.07763671875, 12.243266105651855, 14.408895492553711, 16.57452392578125, 18.740154266357422, 20.905784606933594, 23.071413040161133, 25.237041473388672, 27.402671813964844, 29.568302154541016, 31.733930587768555, 33.899559020996094, 36.065189361572266, 38.23081970214844, 40.396446228027344, 42.562076568603516, 44.72770690917969, 46.89333724975586, 49.05896759033203, 51.22459411621094, 53.39022445678711, 55.55585479736328, 57.72148132324219, 59.88711166381836, 62.05274200439453, 64.21836853027344, 66.38400268554688, 68.54962921142578, 70.71525573730469, 72.88088989257812, 75.04651641845703, 77.21215057373047, 79.37777709960938]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 4.0, 5.0, 9.0, 4.0, 13.0, 11.0, 18.0, 17.0, 16.0, 27.0, 29.0, 23.0, 34.0, 29.0, 38.0, 46.0, 50.0, 45.0, 48.0, 35.0, 41.0, 47.0, 44.0, 41.0, 32.0, 44.0, 32.0, 37.0, 30.0, 28.0, 12.0, 15.0, 17.0, 15.0, 14.0, 10.0, 9.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.75, -97.125, -93.5, -89.875, -86.25, -82.625, -79.0, -75.375, -71.75, -68.125, -64.5, -60.875, -57.25, -53.625, -50.0, -46.375, -42.75, -39.125, -35.5, -31.875, -28.25, -24.625, -21.0, -17.375, -13.75, -10.125, -6.5, -2.875, 0.75, 4.375, 8.0, 11.625, 15.25, 18.875, 22.5, 26.125, 29.75, 33.375, 37.0, 40.625, 44.25, 47.875, 51.5, 55.125, 58.75, 62.375, 66.0, 69.625, 73.25, 76.875, 80.5, 84.125, 87.75, 91.375, 95.0, 98.625, 102.25, 105.875, 109.5, 113.125, 116.75, 120.375, 124.0, 127.625, 131.25]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 14.0, 9.0, 8.0, 22.0, 33.0, 59.0, 67.0, 127.0, 157.0, 275.0, 399.0, 586.0, 944.0, 1574.0, 2616.0, 4349.0, 7266.0, 12151.0, 21433.0, 39361.0, 75465.0, 169558.0, 395390.0, 157410.0, 71996.0, 37178.0, 20514.0, 11824.0, 6963.0, 4040.0, 2517.0, 1569.0, 964.0, 622.0, 386.0, 246.0, 137.0, 111.0, 74.0, 40.0, 32.0, 23.0, 21.0, 10.0, 3.0, 7.0, 5.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.640625, -25.844482421875, -25.04833984375, -24.252197265625, -23.4560546875, -22.659912109375, -21.86376953125, -21.067626953125, -20.271484375, -19.475341796875, -18.67919921875, -17.883056640625, -17.0869140625, -16.290771484375, -15.49462890625, -14.698486328125, -13.90234375, -13.106201171875, -12.31005859375, -11.513916015625, -10.7177734375, -9.921630859375, -9.12548828125, -8.329345703125, -7.533203125, -6.737060546875, -5.94091796875, -5.144775390625, -4.3486328125, -3.552490234375, -2.75634765625, -1.960205078125, -1.1640625, -0.367919921875, 0.42822265625, 1.224365234375, 2.0205078125, 2.816650390625, 3.61279296875, 4.408935546875, 5.205078125, 6.001220703125, 6.79736328125, 7.593505859375, 8.3896484375, 9.185791015625, 9.98193359375, 10.778076171875, 11.57421875, 12.370361328125, 13.16650390625, 13.962646484375, 14.7587890625, 15.554931640625, 16.35107421875, 17.147216796875, 17.943359375, 18.739501953125, 19.53564453125, 20.331787109375, 21.1279296875, 21.924072265625, 22.72021484375, 23.516357421875, 24.3125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 4.0, 8.0, 8.0, 4.0, 4.0, 10.0, 18.0, 9.0, 17.0, 20.0, 18.0, 24.0, 34.0, 33.0, 27.0, 24.0, 31.0, 32.0, 43.0, 38.0, 40.0, 50.0, 1066.0, 34.0, 40.0, 40.0, 38.0, 39.0, 37.0, 30.0, 23.0, 33.0, 37.0, 18.0, 16.0, 18.0, 13.0, 9.0, 10.0, 7.0, 7.0, 4.0, 7.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0], "bins": [-80.25, -78.0869140625, -75.923828125, -73.7607421875, -71.59765625, -69.4345703125, -67.271484375, -65.1083984375, -62.9453125, -60.7822265625, -58.619140625, -56.4560546875, -54.29296875, -52.1298828125, -49.966796875, -47.8037109375, -45.640625, -43.4775390625, -41.314453125, -39.1513671875, -36.98828125, -34.8251953125, -32.662109375, -30.4990234375, -28.3359375, -26.1728515625, -24.009765625, -21.8466796875, -19.68359375, -17.5205078125, -15.357421875, -13.1943359375, -11.03125, -8.8681640625, -6.705078125, -4.5419921875, -2.37890625, -0.2158203125, 1.947265625, 4.1103515625, 6.2734375, 8.4365234375, 10.599609375, 12.7626953125, 14.92578125, 17.0888671875, 19.251953125, 21.4150390625, 23.578125, 25.7412109375, 27.904296875, 30.0673828125, 32.23046875, 34.3935546875, 36.556640625, 38.7197265625, 40.8828125, 43.0458984375, 45.208984375, 47.3720703125, 49.53515625, 51.6982421875, 53.861328125, 56.0244140625, 58.1875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 11.0, 20.0, 26.0, 34.0, 48.0, 80.0, 111.0, 166.0, 256.0, 408.0, 650.0, 1104.0, 1690.0, 2756.0, 4362.0, 6897.0, 11354.0, 19010.0, 31018.0, 52097.0, 93557.0, 217019.0, 1379101.0, 118586.0, 62252.0, 36663.0, 22319.0, 13522.0, 8159.0, 5157.0, 3188.0, 2006.0, 1264.0, 767.0, 524.0, 329.0, 187.0, 124.0, 116.0, 68.0, 43.0, 28.0, 18.0, 15.0, 8.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.484375, -20.772216796875, -20.06005859375, -19.347900390625, -18.6357421875, -17.923583984375, -17.21142578125, -16.499267578125, -15.787109375, -15.074951171875, -14.36279296875, -13.650634765625, -12.9384765625, -12.226318359375, -11.51416015625, -10.802001953125, -10.08984375, -9.377685546875, -8.66552734375, -7.953369140625, -7.2412109375, -6.529052734375, -5.81689453125, -5.104736328125, -4.392578125, -3.680419921875, -2.96826171875, -2.256103515625, -1.5439453125, -0.831787109375, -0.11962890625, 0.592529296875, 1.3046875, 2.016845703125, 2.72900390625, 3.441162109375, 4.1533203125, 4.865478515625, 5.57763671875, 6.289794921875, 7.001953125, 7.714111328125, 8.42626953125, 9.138427734375, 9.8505859375, 10.562744140625, 11.27490234375, 11.987060546875, 12.69921875, 13.411376953125, 14.12353515625, 14.835693359375, 15.5478515625, 16.260009765625, 16.97216796875, 17.684326171875, 18.396484375, 19.108642578125, 19.82080078125, 20.532958984375, 21.2451171875, 21.957275390625, 22.66943359375, 23.381591796875, 24.09375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 0.0, 5.0, 6.0, 9.0, 6.0, 7.0, 13.0, 12.0, 14.0, 26.0, 22.0, 37.0, 48.0, 65.0, 74.0, 87.0, 100.0, 91.0, 85.0, 68.0, 55.0, 32.0, 28.0, 24.0, 16.0, 7.0, 17.0, 15.0, 6.0, 1.0, 5.0, 2.0, 1.0, 5.0, 1.0, 2.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.020294189453125, -0.019688129425048828, -0.019082069396972656, -0.018476009368896484, -0.017869949340820312, -0.01726388931274414, -0.01665782928466797, -0.016051769256591797, -0.015445709228515625, -0.014839649200439453, -0.014233589172363281, -0.01362752914428711, -0.013021469116210938, -0.012415409088134766, -0.011809349060058594, -0.011203289031982422, -0.01059722900390625, -0.009991168975830078, -0.009385108947753906, -0.008779048919677734, -0.008172988891601562, -0.007566928863525391, -0.006960868835449219, -0.006354808807373047, -0.005748748779296875, -0.005142688751220703, -0.004536628723144531, -0.003930568695068359, -0.0033245086669921875, -0.0027184486389160156, -0.0021123886108398438, -0.0015063285827636719, -0.0009002685546875, -0.0002942085266113281, 0.00031185150146484375, 0.0009179115295410156, 0.0015239715576171875, 0.0021300315856933594, 0.0027360916137695312, 0.003342151641845703, 0.003948211669921875, 0.004554271697998047, 0.005160331726074219, 0.005766391754150391, 0.0063724517822265625, 0.006978511810302734, 0.007584571838378906, 0.008190631866455078, 0.00879669189453125, 0.009402751922607422, 0.010008811950683594, 0.010614871978759766, 0.011220932006835938, 0.01182699203491211, 0.012433052062988281, 0.013039112091064453, 0.013645172119140625, 0.014251232147216797, 0.014857292175292969, 0.01546335220336914, 0.016069412231445312, 0.016675472259521484, 0.017281532287597656, 0.017887592315673828, 0.01849365234375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 7.0, 7.0, 7.0, 19.0, 19.0, 32.0, 21.0, 34.0, 47.0, 52.0, 75.0, 109.0, 174.0, 240.0, 412.0, 705.0, 1641.0, 4188.0, 16207.0, 99898.0, 672665.0, 213497.0, 27620.0, 6275.0, 2115.0, 950.0, 514.0, 327.0, 180.0, 134.0, 87.0, 59.0, 60.0, 47.0, 27.0, 24.0, 18.0, 9.0, 8.0, 8.0, 14.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.1268310546875, -0.12294864654541016, -0.11906623840332031, -0.11518383026123047, -0.11130142211914062, -0.10741901397705078, -0.10353660583496094, -0.0996541976928711, -0.09577178955078125, -0.0918893814086914, -0.08800697326660156, -0.08412456512451172, -0.08024215698242188, -0.07635974884033203, -0.07247734069824219, -0.06859493255615234, -0.0647125244140625, -0.060830116271972656, -0.05694770812988281, -0.05306529998779297, -0.049182891845703125, -0.04530048370361328, -0.04141807556152344, -0.037535667419433594, -0.03365325927734375, -0.029770851135253906, -0.025888442993164062, -0.02200603485107422, -0.018123626708984375, -0.014241218566894531, -0.010358810424804688, -0.006476402282714844, -0.002593994140625, 0.0012884140014648438, 0.0051708221435546875, 0.009053230285644531, 0.012935638427734375, 0.01681804656982422, 0.020700454711914062, 0.024582862854003906, 0.02846527099609375, 0.032347679138183594, 0.03623008728027344, 0.04011249542236328, 0.043994903564453125, 0.04787731170654297, 0.05175971984863281, 0.055642127990722656, 0.0595245361328125, 0.06340694427490234, 0.06728935241699219, 0.07117176055908203, 0.07505416870117188, 0.07893657684326172, 0.08281898498535156, 0.0867013931274414, 0.09058380126953125, 0.0944662094116211, 0.09834861755371094, 0.10223102569580078, 0.10611343383789062, 0.10999584197998047, 0.11387825012207031, 0.11776065826416016, 0.12164306640625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 26.0, 55.0, 122.0, 239.0, 267.0, 184.0, 75.0, 21.0, 11.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.016790717840194702, -0.01568986475467682, -0.01458901260048151, -0.013488160446286201, -0.012387307360768318, -0.011286454275250435, -0.010185602121055126, -0.009084749966859818, -0.007983896881341934, -0.006883044261485338, -0.005782191641628742, -0.004681339021772146, -0.0035804864019155502, -0.0024796337820589542, -0.0013787811622023582, -0.00027792854234576225, 0.0008229240775108337, 0.0019237766973674297, 0.0030246293172240257, 0.004125481937080622, 0.005226334556937218, 0.006327187176793814, 0.00742803979665041, 0.008528891950845718, 0.009629745036363602, 0.010730598121881485, 0.011831450276076794, 0.012932302430272102, 0.014033155515789986, 0.015134008601307869, 0.016234859824180603, 0.017335712909698486, 0.01843656226992607, 0.019537415355443954, 0.020638268440961838, 0.021739119663834572, 0.022839972749352455, 0.02394082583487034, 0.025041677057743073, 0.026142530143260956, 0.02724338322877884, 0.028344236314296722, 0.029445089399814606, 0.03054594062268734, 0.03164679557085037, 0.03274764493107796, 0.03384849801659584, 0.034949351102113724, 0.03605020418763161, 0.03715105727314949, 0.038251910358667374, 0.03935276344418526, 0.04045361280441284, 0.041554465889930725, 0.04265531897544861, 0.04375617206096649, 0.044857025146484375, 0.04595787823200226, 0.04705873131752014, 0.048159584403038025, 0.04926043748855591, 0.05036128684878349, 0.051462139934301376, 0.05256299301981926, 0.05366384610533714]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 7.0, 3.0, 9.0, 4.0, 10.0, 14.0, 17.0, 15.0, 9.0, 24.0, 25.0, 34.0, 24.0, 28.0, 33.0, 38.0, 38.0, 41.0, 41.0, 43.0, 47.0, 41.0, 62.0, 47.0, 38.0, 24.0, 39.0, 27.0, 30.0, 23.0, 24.0, 20.0, 18.0, 25.0, 14.0, 14.0, 20.0, 11.0, 4.0, 6.0, 6.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.008380234241485596, -0.008100881241261959, -0.007821528241038322, -0.007542175240814686, -0.007262822240591049, -0.006983469240367413, -0.006704116240143776, -0.006424763239920139, -0.006145410239696503, -0.005866057239472866, -0.005586704239249229, -0.005307351239025593, -0.005027998238801956, -0.0047486452385783195, -0.004469292238354683, -0.004189939238131046, -0.00391058623790741, -0.003631233237683773, -0.0033518802374601364, -0.0030725272372365, -0.002793174237012863, -0.0025138212367892265, -0.00223446823656559, -0.0019551152363419533, -0.0016757622361183167, -0.00139640923589468, -0.0011170562356710434, -0.0008377032354474068, -0.0005583502352237701, -0.0002789972350001335, 3.557652235031128e-07, 0.00027970876544713974, 0.0005590617656707764, 0.000838414765894413, 0.0011177677661180496, 0.0013971207663416862, 0.0016764737665653229, 0.0019558267667889595, 0.002235179767012596, 0.0025145327672362328, 0.0027938857674598694, 0.003073238767683506, 0.0033525917679071426, 0.0036319447681307793, 0.003911297768354416, 0.0041906507685780525, 0.004470003768801689, 0.004749356769025326, 0.005028709769248962, 0.005308062769472599, 0.005587415769696236, 0.005866768769919872, 0.006146121770143509, 0.0064254747703671455, 0.006704827770590782, 0.006984180770814419, 0.007263533771038055, 0.007542886771261692, 0.007822239771485329, 0.008101592771708965, 0.008380945771932602, 0.008660298772156239, 0.008939651772379875, 0.009219004772603512, 0.009498357772827148]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 4.0, 5.0, 9.0, 4.0, 13.0, 10.0, 19.0, 17.0, 17.0, 26.0, 29.0, 23.0, 33.0, 30.0, 38.0, 46.0, 50.0, 45.0, 49.0, 34.0, 41.0, 47.0, 44.0, 41.0, 32.0, 44.0, 32.0, 37.0, 30.0, 28.0, 12.0, 15.0, 17.0, 15.0, 14.0, 10.0, 9.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.75, -97.125, -93.5, -89.875, -86.25, -82.625, -79.0, -75.375, -71.75, -68.125, -64.5, -60.875, -57.25, -53.625, -50.0, -46.375, -42.75, -39.125, -35.5, -31.875, -28.25, -24.625, -21.0, -17.375, -13.75, -10.125, -6.5, -2.875, 0.75, 4.375, 8.0, 11.625, 15.25, 18.875, 22.5, 26.125, 29.75, 33.375, 37.0, 40.625, 44.25, 47.875, 51.5, 55.125, 58.75, 62.375, 66.0, 69.625, 73.25, 76.875, 80.5, 84.125, 87.75, 91.375, 95.0, 98.625, 102.25, 105.875, 109.5, 113.125, 116.75, 120.375, 124.0, 127.625, 131.25]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 6.0, 17.0, 15.0, 18.0, 17.0, 30.0, 44.0, 59.0, 101.0, 144.0, 226.0, 376.0, 610.0, 1115.0, 2082.0, 4272.0, 10346.0, 34536.0, 190027.0, 631234.0, 130109.0, 26356.0, 8805.0, 3714.0, 1803.0, 1003.0, 555.0, 301.0, 180.0, 115.0, 85.0, 69.0, 45.0, 35.0, 18.0, 24.0, 15.0, 10.0, 9.0, 4.0, 6.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.796875, -29.783935546875, -28.77099609375, -27.758056640625, -26.7451171875, -25.732177734375, -24.71923828125, -23.706298828125, -22.693359375, -21.680419921875, -20.66748046875, -19.654541015625, -18.6416015625, -17.628662109375, -16.61572265625, -15.602783203125, -14.58984375, -13.576904296875, -12.56396484375, -11.551025390625, -10.5380859375, -9.525146484375, -8.51220703125, -7.499267578125, -6.486328125, -5.473388671875, -4.46044921875, -3.447509765625, -2.4345703125, -1.421630859375, -0.40869140625, 0.604248046875, 1.6171875, 2.630126953125, 3.64306640625, 4.656005859375, 5.6689453125, 6.681884765625, 7.69482421875, 8.707763671875, 9.720703125, 10.733642578125, 11.74658203125, 12.759521484375, 13.7724609375, 14.785400390625, 15.79833984375, 16.811279296875, 17.82421875, 18.837158203125, 19.85009765625, 20.863037109375, 21.8759765625, 22.888916015625, 23.90185546875, 24.914794921875, 25.927734375, 26.940673828125, 27.95361328125, 28.966552734375, 29.9794921875, 30.992431640625, 32.00537109375, 33.018310546875, 34.03125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 10.0, 9.0, 20.0, 19.0, 15.0, 22.0, 47.0, 46.0, 63.0, 71.0, 87.0, 1949.0, 288.0, 73.0, 93.0, 56.0, 48.0, 36.0, 30.0, 20.0, 13.0, 7.0, 10.0, 3.0, 7.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-308.75, -299.0859375, -289.421875, -279.7578125, -270.09375, -260.4296875, -250.765625, -241.1015625, -231.4375, -221.7734375, -212.109375, -202.4453125, -192.78125, -183.1171875, -173.453125, -163.7890625, -154.125, -144.4609375, -134.796875, -125.1328125, -115.46875, -105.8046875, -96.140625, -86.4765625, -76.8125, -67.1484375, -57.484375, -47.8203125, -38.15625, -28.4921875, -18.828125, -9.1640625, 0.5, 10.1640625, 19.828125, 29.4921875, 39.15625, 48.8203125, 58.484375, 68.1484375, 77.8125, 87.4765625, 97.140625, 106.8046875, 116.46875, 126.1328125, 135.796875, 145.4609375, 155.125, 164.7890625, 174.453125, 184.1171875, 193.78125, 203.4453125, 213.109375, 222.7734375, 232.4375, 242.1015625, 251.765625, 261.4296875, 271.09375, 280.7578125, 290.421875, 300.0859375, 309.75]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 10.0, 24.0, 28.0, 54.0, 80.0, 143.0, 278.0, 589.0, 1489.0, 6931.0, 377698.0, 2746131.0, 9218.0, 1666.0, 641.0, 319.0, 157.0, 92.0, 57.0, 37.0, 15.0, 15.0, 2.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.25, -79.513671875, -76.77734375, -74.041015625, -71.3046875, -68.568359375, -65.83203125, -63.095703125, -60.359375, -57.623046875, -54.88671875, -52.150390625, -49.4140625, -46.677734375, -43.94140625, -41.205078125, -38.46875, -35.732421875, -32.99609375, -30.259765625, -27.5234375, -24.787109375, -22.05078125, -19.314453125, -16.578125, -13.841796875, -11.10546875, -8.369140625, -5.6328125, -2.896484375, -0.16015625, 2.576171875, 5.3125, 8.048828125, 10.78515625, 13.521484375, 16.2578125, 18.994140625, 21.73046875, 24.466796875, 27.203125, 29.939453125, 32.67578125, 35.412109375, 38.1484375, 40.884765625, 43.62109375, 46.357421875, 49.09375, 51.830078125, 54.56640625, 57.302734375, 60.0390625, 62.775390625, 65.51171875, 68.248046875, 70.984375, 73.720703125, 76.45703125, 79.193359375, 81.9296875, 84.666015625, 87.40234375, 90.138671875, 92.875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 7.0, 8.0, 9.0, 18.0, 46.0, 127.0, 306.0, 321.0, 113.0, 30.0, 12.0, 10.0, 4.0, 3.0, 0.0, 1.0], "bins": [-1013.841796875, -995.455322265625, -977.0689086914062, -958.6824951171875, -940.2960205078125, -921.9095458984375, -903.5231323242188, -885.13671875, -866.750244140625, -848.36376953125, -829.9773559570312, -811.5909423828125, -793.2044677734375, -774.8179931640625, -756.4315795898438, -738.045166015625, -719.65869140625, -701.272216796875, -682.8858032226562, -664.4993896484375, -646.1129150390625, -627.7264404296875, -609.3400268554688, -590.95361328125, -572.567138671875, -554.1806640625, -535.7942504882812, -517.4078369140625, -499.0213623046875, -480.6349182128906, -462.24847412109375, -443.8620300292969, -425.47552490234375, -407.0890808105469, -388.70263671875, -370.3161926269531, -351.92974853515625, -333.5433044433594, -315.1568603515625, -296.7704162597656, -278.38397216796875, -259.9975280761719, -241.611083984375, -223.22463989257812, -204.83819580078125, -186.45175170898438, -168.0653076171875, -149.67886352539062, -131.29241943359375, -112.90597534179688, -94.51953125, -76.13308715820312, -57.74664306640625, -39.360198974609375, -20.9737548828125, -2.587310791015625, 15.79913330078125, 34.185577392578125, 52.572021484375, 70.95846557617188, 89.34490966796875, 107.73135375976562, 126.1177978515625, 144.50424194335938, 162.89068603515625]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 7.0, 6.0, 7.0, 6.0, 16.0, 19.0, 12.0, 16.0, 27.0, 31.0, 31.0, 43.0, 36.0, 38.0, 58.0, 59.0, 56.0, 53.0, 51.0, 49.0, 58.0, 48.0, 47.0, 44.0, 36.0, 32.0, 25.0, 19.0, 17.0, 17.0, 9.0, 5.0, 3.0, 9.0, 6.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-298.53338623046875, -289.53375244140625, -280.53411865234375, -271.5345153808594, -262.5348815917969, -253.53524780273438, -244.53562927246094, -235.5360107421875, -226.536376953125, -217.5367431640625, -208.53712463378906, -199.53750610351562, -190.53787231445312, -181.53823852539062, -172.5386199951172, -163.53900146484375, -154.53936767578125, -145.53973388671875, -136.5401153564453, -127.54048919677734, -118.54086303710938, -109.5412368774414, -100.54161071777344, -91.54198455810547, -82.5423583984375, -73.54273223876953, -64.54310607910156, -55.543479919433594, -46.543853759765625, -37.544227600097656, -28.544601440429688, -19.54497528076172, -10.54534912109375, -1.5457229614257812, 7.4539031982421875, 16.453529357910156, 25.453155517578125, 34.452781677246094, 43.45240783691406, 52.45203399658203, 61.45166015625, 70.45128631591797, 79.45091247558594, 88.4505386352539, 97.45016479492188, 106.44979095458984, 115.44941711425781, 124.44904327392578, 133.44866943359375, 142.44830322265625, 151.4479217529297, 160.44754028320312, 169.44717407226562, 178.44680786132812, 187.44642639160156, 196.446044921875, 205.4456787109375, 214.4453125, 223.44493103027344, 232.44454956054688, 241.44418334960938, 250.44381713867188, 259.44342041015625, 268.44305419921875, 277.44268798828125]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 8.0, 5.0, 13.0, 14.0, 15.0, 23.0, 18.0, 25.0, 34.0, 50.0, 57.0, 77.0, 98.0, 125.0, 198.0, 236.0, 315.0, 401.0, 586.0, 785.0, 1380.0, 1040866.0, 803.0, 597.0, 439.0, 337.0, 238.0, 200.0, 121.0, 119.0, 81.0, 71.0, 45.0, 35.0, 33.0, 24.0, 16.0, 12.0, 13.0, 11.0, 9.0, 9.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.40814971923828, -65.09004211425781, -62.771942138671875, -60.453834533691406, -58.1357307434082, -55.817626953125, -53.49951934814453, -51.18141555786133, -48.863311767578125, -46.54520797729492, -44.22710418701172, -41.90899658203125, -39.59089279174805, -37.272789001464844, -34.954681396484375, -32.63657760620117, -30.31847381591797, -28.000370025634766, -25.68226432800293, -23.364158630371094, -21.04605484008789, -18.727951049804688, -16.40984535217285, -14.091739654541016, -11.773635864257812, -9.455531120300293, -7.137426376342773, -4.819321632385254, -2.5012168884277344, -0.18311214447021484, 2.1349925994873047, 4.453098297119141, 6.771209716796875, 9.089314460754395, 11.407419204711914, 13.725523948669434, 16.043628692626953, 18.361732482910156, 20.679838180541992, 22.997943878173828, 25.31604766845703, 27.634151458740234, 29.95225715637207, 32.270362854003906, 34.58846664428711, 36.90657043457031, 39.22467803955078, 41.542781829833984, 43.86088562011719, 46.17898941040039, 48.497093200683594, 50.81520080566406, 53.133304595947266, 55.45140838623047, 57.76951599121094, 60.08761978149414, 62.405723571777344, 64.72383117675781, 67.04193115234375, 69.36003875732422, 71.67814636230469, 73.99624633789062, 76.3143539428711, 78.63246154785156, 80.9505615234375]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 8.0, 8.0, 3.0, 8.0, 11.0, 19.0, 44.0, 166.0, 51462608.0, 153.0, 42.0, 17.0, 16.0, 10.0, 5.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 7.0, 5.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8952.0, -8471.625, -7991.25, -7510.875, -7030.5, -6550.125, -6069.75, -5589.375, -5109.0, -4628.625, -4148.25, -3667.875, -3187.5, -2707.125, -2226.75, -1746.375, -1266.0, -785.625, -305.25, 175.125, 655.5, 1135.875, 1616.25, 2096.625, 2577.0, 3057.375, 3537.75, 4018.125, 4498.5, 4978.875, 5459.25, 5939.625, 6420.0, 6900.375, 7380.75, 7861.125, 8341.5, 8821.875, 9302.25, 9782.625, 10263.0, 10743.375, 11223.75, 11704.125, 12184.5, 12664.875, 13145.25, 13625.625, 14106.0, 14586.375, 15066.75, 15547.125, 16027.5, 16507.875, 16988.25, 17468.625, 17949.0, 18429.375, 18909.75, 19390.125, 19870.5, 20350.875, 20831.25, 21311.625, 21792.0]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 10.0, 11.0, 15.0, 37.0, 34.0, 53.0, 95.0, 109.0, 170.0, 273.0, 394.0, 485.0, 635.0, 900.0, 1391.0, 1971.0, 2718.0, 3655.0, 5374.0, 7637.0, 10253.0, 15038.0, 21520.0, 31603.0, 46989.0, 70647.0, 107675.0, 170125.0, 295742.0, 1078032.0, 3499804.0, 356905.0, 195192.0, 120321.0, 78792.0, 52073.0, 34985.0, 24122.0, 16753.0, 11462.0, 7986.0, 5681.0, 3894.0, 2807.0, 2131.0, 1477.0, 1022.0, 741.0, 526.0, 358.0, 280.0, 186.0, 100.0, 86.0, 57.0, 35.0, 31.0, 22.0, 15.0, 8.0, 5.0, 3.0, 3.0], "bins": [-8.640625, -8.363037109375, -8.08544921875, -7.807861328125, -7.5302734375, -7.252685546875, -6.97509765625, -6.697509765625, -6.419921875, -6.142333984375, -5.86474609375, -5.587158203125, -5.3095703125, -5.031982421875, -4.75439453125, -4.476806640625, -4.19921875, -3.921630859375, -3.64404296875, -3.366455078125, -3.0888671875, -2.811279296875, -2.53369140625, -2.256103515625, -1.978515625, -1.700927734375, -1.42333984375, -1.145751953125, -0.8681640625, -0.590576171875, -0.31298828125, -0.035400390625, 0.2421875, 0.519775390625, 0.79736328125, 1.074951171875, 1.3525390625, 1.630126953125, 1.90771484375, 2.185302734375, 2.462890625, 2.740478515625, 3.01806640625, 3.295654296875, 3.5732421875, 3.850830078125, 4.12841796875, 4.406005859375, 4.68359375, 4.961181640625, 5.23876953125, 5.516357421875, 5.7939453125, 6.071533203125, 6.34912109375, 6.626708984375, 6.904296875, 7.181884765625, 7.45947265625, 7.737060546875, 8.0146484375, 8.292236328125, 8.56982421875, 8.847412109375, 9.125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 8.0, 7.0, 8.0, 4.0, 1.0, 12.0, 11.0, 9.0, 8.0, 13.0, 15.0, 20.0, 24.0, 17.0, 33.0, 31.0, 31.0, 35.0, 24.0, 26.0, 36.0, 49.0, 111.0, 548.0, 383.0, 111.0, 56.0, 42.0, 47.0, 26.0, 33.0, 30.0, 30.0, 29.0, 18.0, 30.0, 16.0, 26.0, 12.0, 12.0, 14.0, 5.0, 9.0, 4.0, 4.0, 6.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.53125, -21.802734375, -21.07421875, -20.345703125, -19.6171875, -18.888671875, -18.16015625, -17.431640625, -16.703125, -15.974609375, -15.24609375, -14.517578125, -13.7890625, -13.060546875, -12.33203125, -11.603515625, -10.875, -10.146484375, -9.41796875, -8.689453125, -7.9609375, -7.232421875, -6.50390625, -5.775390625, -5.046875, -4.318359375, -3.58984375, -2.861328125, -2.1328125, -1.404296875, -0.67578125, 0.052734375, 0.78125, 1.509765625, 2.23828125, 2.966796875, 3.6953125, 4.423828125, 5.15234375, 5.880859375, 6.609375, 7.337890625, 8.06640625, 8.794921875, 9.5234375, 10.251953125, 10.98046875, 11.708984375, 12.4375, 13.166015625, 13.89453125, 14.623046875, 15.3515625, 16.080078125, 16.80859375, 17.537109375, 18.265625, 18.994140625, 19.72265625, 20.451171875, 21.1796875, 21.908203125, 22.63671875, 23.365234375, 24.09375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [6.0, 5.0, 1.0, 1.0, 8.0, 11.0, 19.0, 14.0, 26.0, 34.0, 51.0, 66.0, 86.0, 152.0, 187.0, 311.0, 401.0, 615.0, 921.0, 1304.0, 2103.0, 3152.0, 4902.0, 7676.0, 12374.0, 20184.0, 33796.0, 56552.0, 100078.0, 183828.0, 368932.0, 3281751.0, 1484884.0, 330557.0, 168263.0, 92350.0, 52866.0, 31476.0, 18776.0, 11648.0, 7235.0, 4782.0, 3007.0, 1998.0, 1291.0, 867.0, 613.0, 388.0, 269.0, 202.0, 134.0, 83.0, 69.0, 54.0, 37.0, 17.0, 14.0, 10.0, 8.0, 2.0, 2.0, 4.0, 0.0, 3.0], "bins": [-13.2578125, -12.8426513671875, -12.427490234375, -12.0123291015625, -11.59716796875, -11.1820068359375, -10.766845703125, -10.3516845703125, -9.9365234375, -9.5213623046875, -9.106201171875, -8.6910400390625, -8.27587890625, -7.8607177734375, -7.445556640625, -7.0303955078125, -6.615234375, -6.2000732421875, -5.784912109375, -5.3697509765625, -4.95458984375, -4.5394287109375, -4.124267578125, -3.7091064453125, -3.2939453125, -2.8787841796875, -2.463623046875, -2.0484619140625, -1.63330078125, -1.2181396484375, -0.802978515625, -0.3878173828125, 0.02734375, 0.4425048828125, 0.857666015625, 1.2728271484375, 1.68798828125, 2.1031494140625, 2.518310546875, 2.9334716796875, 3.3486328125, 3.7637939453125, 4.178955078125, 4.5941162109375, 5.00927734375, 5.4244384765625, 5.839599609375, 6.2547607421875, 6.669921875, 7.0850830078125, 7.500244140625, 7.9154052734375, 8.33056640625, 8.7457275390625, 9.160888671875, 9.5760498046875, 9.9912109375, 10.4063720703125, 10.821533203125, 11.2366943359375, 11.65185546875, 12.0670166015625, 12.482177734375, 12.8973388671875, 13.3125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 7.0, 6.0, 10.0, 11.0, 13.0, 15.0, 17.0, 16.0, 27.0, 17.0, 25.0, 35.0, 34.0, 37.0, 25.0, 29.0, 49.0, 63.0, 134.0, 452.0, 380.0, 128.0, 79.0, 53.0, 37.0, 49.0, 31.0, 30.0, 35.0, 20.0, 31.0, 20.0, 14.0, 22.0, 14.0, 12.0, 10.0, 9.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-17.609375, -17.05810546875, -16.5068359375, -15.95556640625, -15.404296875, -14.85302734375, -14.3017578125, -13.75048828125, -13.19921875, -12.64794921875, -12.0966796875, -11.54541015625, -10.994140625, -10.44287109375, -9.8916015625, -9.34033203125, -8.7890625, -8.23779296875, -7.6865234375, -7.13525390625, -6.583984375, -6.03271484375, -5.4814453125, -4.93017578125, -4.37890625, -3.82763671875, -3.2763671875, -2.72509765625, -2.173828125, -1.62255859375, -1.0712890625, -0.52001953125, 0.03125, 0.58251953125, 1.1337890625, 1.68505859375, 2.236328125, 2.78759765625, 3.3388671875, 3.89013671875, 4.44140625, 4.99267578125, 5.5439453125, 6.09521484375, 6.646484375, 7.19775390625, 7.7490234375, 8.30029296875, 8.8515625, 9.40283203125, 9.9541015625, 10.50537109375, 11.056640625, 11.60791015625, 12.1591796875, 12.71044921875, 13.26171875, 13.81298828125, 14.3642578125, 14.91552734375, 15.466796875, 16.01806640625, 16.5693359375, 17.12060546875, 17.671875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 6.0, 0.0, 0.0, 3.0, 16.0, 8.0, 10.0, 33.0, 22.0, 32.0, 57.0, 52.0, 70.0, 94.0, 125.0, 126.0, 201.0, 231.0, 324.0, 500.0, 633.0, 880.0, 1304.0, 1974.0, 3274.0, 5749.0, 11084.0, 26250.0, 86892.0, 5916174.0, 163718.0, 38125.0, 14580.0, 7245.0, 3787.0, 2417.0, 1597.0, 984.0, 722.0, 521.0, 426.0, 305.0, 213.0, 169.0, 129.0, 68.0, 70.0, 54.0, 59.0, 29.0, 26.0, 30.0, 18.0, 4.0, 15.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-36.53125, -35.34033203125, -34.1494140625, -32.95849609375, -31.767578125, -30.57666015625, -29.3857421875, -28.19482421875, -27.00390625, -25.81298828125, -24.6220703125, -23.43115234375, -22.240234375, -21.04931640625, -19.8583984375, -18.66748046875, -17.4765625, -16.28564453125, -15.0947265625, -13.90380859375, -12.712890625, -11.52197265625, -10.3310546875, -9.14013671875, -7.94921875, -6.75830078125, -5.5673828125, -4.37646484375, -3.185546875, -1.99462890625, -0.8037109375, 0.38720703125, 1.578125, 2.76904296875, 3.9599609375, 5.15087890625, 6.341796875, 7.53271484375, 8.7236328125, 9.91455078125, 11.10546875, 12.29638671875, 13.4873046875, 14.67822265625, 15.869140625, 17.06005859375, 18.2509765625, 19.44189453125, 20.6328125, 21.82373046875, 23.0146484375, 24.20556640625, 25.396484375, 26.58740234375, 27.7783203125, 28.96923828125, 30.16015625, 31.35107421875, 32.5419921875, 33.73291015625, 34.923828125, 36.11474609375, 37.3056640625, 38.49658203125, 39.6875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 3.0, 6.0, 5.0, 10.0, 13.0, 10.0, 15.0, 17.0, 14.0, 18.0, 36.0, 21.0, 48.0, 32.0, 42.0, 47.0, 47.0, 93.0, 161.0, 425.0, 323.0, 132.0, 99.0, 51.0, 53.0, 41.0, 39.0, 30.0, 27.0, 22.0, 26.0, 19.0, 22.0, 6.0, 16.0, 3.0, 9.0, 10.0, 5.0, 8.0, 5.0, 6.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8125, -12.3973388671875, -11.982177734375, -11.5670166015625, -11.15185546875, -10.7366943359375, -10.321533203125, -9.9063720703125, -9.4912109375, -9.0760498046875, -8.660888671875, -8.2457275390625, -7.83056640625, -7.4154052734375, -7.000244140625, -6.5850830078125, -6.169921875, -5.7547607421875, -5.339599609375, -4.9244384765625, -4.50927734375, -4.0941162109375, -3.678955078125, -3.2637939453125, -2.8486328125, -2.4334716796875, -2.018310546875, -1.6031494140625, -1.18798828125, -0.7728271484375, -0.357666015625, 0.0574951171875, 0.47265625, 0.8878173828125, 1.302978515625, 1.7181396484375, 2.13330078125, 2.5484619140625, 2.963623046875, 3.3787841796875, 3.7939453125, 4.2091064453125, 4.624267578125, 5.0394287109375, 5.45458984375, 5.8697509765625, 6.284912109375, 6.7000732421875, 7.115234375, 7.5303955078125, 7.945556640625, 8.3607177734375, 8.77587890625, 9.1910400390625, 9.606201171875, 10.0213623046875, 10.4365234375, 10.8516845703125, 11.266845703125, 11.6820068359375, 12.09716796875, 12.5123291015625, 12.927490234375, 13.3426513671875, 13.7578125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 9.0, 9.0, 13.0, 30.0, 55.0, 125.0, 435.0, 190.0, 58.0, 39.0, 14.0, 9.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.762855529785156, -22.805233001708984, -20.847612380981445, -18.889989852905273, -16.9323673248291, -14.974745750427246, -13.01712417602539, -11.059501647949219, -9.101880073547363, -7.14425802230835, -5.186635971069336, -3.2290143966674805, -1.2713923454284668, 0.6862297058105469, 2.6438512802124023, 4.601473808288574, 6.55909538269043, 8.516716957092285, 10.474339485168457, 12.431961059570312, 14.389583587646484, 16.347206115722656, 18.304826736450195, 20.262449264526367, 22.220069885253906, 24.177692413330078, 26.135313034057617, 28.09293556213379, 30.05055809020996, 32.0081787109375, 33.96580123901367, 35.923423767089844, 37.881046295166016, 39.83866882324219, 41.79629135131836, 43.75391387939453, 45.71153259277344, 47.66915512084961, 49.62677764892578, 51.58440017700195, 53.542022705078125, 55.4996452331543, 57.45726776123047, 59.414886474609375, 61.37250900268555, 63.33013153076172, 65.28775024414062, 67.24537658691406, 69.20299530029297, 71.16061401367188, 73.11824035644531, 75.07585906982422, 77.03348541259766, 78.99110412597656, 80.94873046875, 82.9063491821289, 84.86397552490234, 86.82159423828125, 88.77922058105469, 90.7368392944336, 92.69446563720703, 94.65208435058594, 96.60971069335938, 98.56732940673828, 100.52494812011719]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 2.0, 6.0, 7.0, 6.0, 9.0, 5.0, 14.0, 11.0, 9.0, 14.0, 15.0, 10.0, 12.0, 24.0, 24.0, 22.0, 21.0, 31.0, 36.0, 46.0, 34.0, 35.0, 33.0, 40.0, 37.0, 47.0, 44.0, 44.0, 32.0, 32.0, 33.0, 32.0, 22.0, 29.0, 21.0, 23.0, 15.0, 19.0, 19.0, 15.0, 12.0, 13.0, 7.0, 10.0, 11.0, 10.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-17.156578063964844, -16.627605438232422, -16.098630905151367, -15.569657325744629, -15.04068374633789, -14.511711120605469, -13.98273754119873, -13.453763961791992, -12.924790382385254, -12.395816802978516, -11.866843223571777, -11.337869644165039, -10.808897018432617, -10.279922485351562, -9.75094985961914, -9.221976280212402, -8.693002700805664, -8.164029121398926, -7.6350555419921875, -7.106082439422607, -6.577108860015869, -6.048135280609131, -5.519162178039551, -4.9901885986328125, -4.461215019226074, -3.932241439819336, -3.4032680988311768, -2.8742947578430176, -2.3453211784362793, -1.816347599029541, -1.2873742580413818, -0.7584009170532227, -0.2294292449951172, 0.29954421520233154, 0.8285176753997803, 1.357491135597229, 1.8864645957946777, 2.415438175201416, 2.944411516189575, 3.4733848571777344, 4.002358436584473, 4.531332015991211, 5.060305595397949, 5.589278697967529, 6.118252277374268, 6.647225856781006, 7.176198959350586, 7.705172538757324, 8.234146118164062, 8.7631196975708, 9.292093276977539, 9.821066856384277, 10.350040435791016, 10.879013061523438, 11.407986640930176, 11.936960220336914, 12.465933799743652, 12.99490737915039, 13.523880958557129, 14.052854537963867, 14.581827163696289, 15.110801696777344, 15.639774322509766, 16.168746948242188, 16.697721481323242]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 6.0, 6.0, 5.0, 5.0, 10.0, 12.0, 14.0, 16.0, 24.0, 35.0, 46.0, 49.0, 70.0, 106.0, 139.0, 175.0, 246.0, 373.0, 503.0, 725.0, 1098.0, 1705.0, 2889.0, 4884.0, 9743.0, 23589.0, 114503.0, 3953316.0, 46831.0, 15541.0, 7290.0, 3850.0, 2123.0, 1420.0, 906.0, 606.0, 436.0, 274.0, 208.0, 128.0, 106.0, 73.0, 57.0, 39.0, 33.0, 11.0, 19.0, 13.0, 8.0, 7.0, 4.0, 4.0, 4.0, 6.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.04913330078125, -0.047655582427978516, -0.04617786407470703, -0.04470014572143555, -0.04322242736816406, -0.04174470901489258, -0.040266990661621094, -0.03878927230834961, -0.037311553955078125, -0.03583383560180664, -0.034356117248535156, -0.03287839889526367, -0.03140068054199219, -0.029922962188720703, -0.02844524383544922, -0.026967525482177734, -0.02548980712890625, -0.024012088775634766, -0.02253437042236328, -0.021056652069091797, -0.019578933715820312, -0.018101215362548828, -0.016623497009277344, -0.01514577865600586, -0.013668060302734375, -0.01219034194946289, -0.010712623596191406, -0.009234905242919922, -0.0077571868896484375, -0.006279468536376953, -0.004801750183105469, -0.0033240318298339844, -0.0018463134765625, -0.0003685951232910156, 0.0011091232299804688, 0.002586841583251953, 0.0040645599365234375, 0.005542278289794922, 0.007019996643066406, 0.00849771499633789, 0.009975433349609375, 0.01145315170288086, 0.012930870056152344, 0.014408588409423828, 0.015886306762695312, 0.017364025115966797, 0.01884174346923828, 0.020319461822509766, 0.02179718017578125, 0.023274898529052734, 0.02475261688232422, 0.026230335235595703, 0.027708053588867188, 0.029185771942138672, 0.030663490295410156, 0.03214120864868164, 0.033618927001953125, 0.03509664535522461, 0.036574363708496094, 0.03805208206176758, 0.03952980041503906, 0.04100751876831055, 0.04248523712158203, 0.043962955474853516, 0.045440673828125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 9.0, 4.0, 8.0, 6.0, 8.0, 6.0, 5.0, 8.0, 13.0, 17.0, 24.0, 777.0, 18.0, 11.0, 13.0, 11.0, 8.0, 8.0, 3.0, 8.0, 9.0, 7.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006343841552734375, -0.0061419010162353516, -0.005939960479736328, -0.005738019943237305, -0.005536079406738281, -0.005334138870239258, -0.005132198333740234, -0.004930257797241211, -0.0047283172607421875, -0.004526376724243164, -0.004324436187744141, -0.004122495651245117, -0.003920555114746094, -0.0037186145782470703, -0.003516674041748047, -0.0033147335052490234, -0.00311279296875, -0.0029108524322509766, -0.002708911895751953, -0.0025069713592529297, -0.0023050308227539062, -0.002103090286254883, -0.0019011497497558594, -0.001699209213256836, -0.0014972686767578125, -0.001295328140258789, -0.0010933876037597656, -0.0008914470672607422, -0.0006895065307617188, -0.0004875659942626953, -0.0002856254577636719, -8.368492126464844e-05, 0.000118255615234375, 0.00032019615173339844, 0.0005221366882324219, 0.0007240772247314453, 0.0009260177612304688, 0.0011279582977294922, 0.0013298988342285156, 0.001531839370727539, 0.0017337799072265625, 0.001935720443725586, 0.0021376609802246094, 0.002339601516723633, 0.0025415420532226562, 0.0027434825897216797, 0.002945423126220703, 0.0031473636627197266, 0.00334930419921875, 0.0035512447357177734, 0.003753185272216797, 0.00395512580871582, 0.004157066345214844, 0.004359006881713867, 0.004560947418212891, 0.004762887954711914, 0.0049648284912109375, 0.005166769027709961, 0.005368709564208984, 0.005570650100708008, 0.005772590637207031, 0.005974531173706055, 0.006176471710205078, 0.0063784122467041016, 0.006580352783203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 9.0, 6.0, 13.0, 13.0, 21.0, 21.0, 43.0, 64.0, 83.0, 111.0, 149.0, 257.0, 389.0, 629.0, 1174.0, 2631.0, 8485.0, 47466.0, 788289.0, 3247372.0, 78512.0, 11734.0, 3394.0, 1367.0, 757.0, 433.0, 256.0, 190.0, 108.0, 91.0, 60.0, 43.0, 30.0, 20.0, 20.0, 15.0, 9.0, 5.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0667724609375, -0.06455516815185547, -0.06233787536621094, -0.060120582580566406, -0.057903289794921875, -0.055685997009277344, -0.05346870422363281, -0.05125141143798828, -0.04903411865234375, -0.04681682586669922, -0.04459953308105469, -0.042382240295410156, -0.040164947509765625, -0.037947654724121094, -0.03573036193847656, -0.03351306915283203, -0.0312957763671875, -0.02907848358154297, -0.026861190795898438, -0.024643898010253906, -0.022426605224609375, -0.020209312438964844, -0.017992019653320312, -0.01577472686767578, -0.01355743408203125, -0.011340141296386719, -0.009122848510742188, -0.006905555725097656, -0.004688262939453125, -0.0024709701538085938, -0.0002536773681640625, 0.0019636154174804688, 0.004180908203125, 0.006398200988769531, 0.008615493774414062, 0.010832786560058594, 0.013050079345703125, 0.015267372131347656, 0.017484664916992188, 0.01970195770263672, 0.02191925048828125, 0.02413654327392578, 0.026353836059570312, 0.028571128845214844, 0.030788421630859375, 0.033005714416503906, 0.03522300720214844, 0.03744029998779297, 0.0396575927734375, 0.04187488555908203, 0.04409217834472656, 0.046309471130371094, 0.048526763916015625, 0.050744056701660156, 0.05296134948730469, 0.05517864227294922, 0.05739593505859375, 0.05961322784423828, 0.06183052062988281, 0.06404781341552734, 0.06626510620117188, 0.0684823989868164, 0.07069969177246094, 0.07291698455810547, 0.07513427734375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 2.0, 6.0, 10.0, 10.0, 13.0, 12.0, 12.0, 19.0, 18.0, 21.0, 39.0, 49.0, 59.0, 69.0, 95.0, 136.0, 150.0, 165.0, 337.0, 1063.0, 668.0, 264.0, 181.0, 141.0, 93.0, 99.0, 68.0, 67.0, 38.0, 43.0, 19.0, 18.0, 22.0, 11.0, 10.0, 12.0, 11.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00740814208984375, -0.007132172584533691, -0.006856203079223633, -0.006580233573913574, -0.006304264068603516, -0.006028294563293457, -0.0057523250579833984, -0.00547635555267334, -0.005200386047363281, -0.004924416542053223, -0.004648447036743164, -0.0043724775314331055, -0.004096508026123047, -0.0038205385208129883, -0.0035445690155029297, -0.003268599510192871, -0.0029926300048828125, -0.002716660499572754, -0.0024406909942626953, -0.0021647214889526367, -0.0018887519836425781, -0.0016127824783325195, -0.001336812973022461, -0.0010608434677124023, -0.0007848739624023438, -0.0005089044570922852, -0.00023293495178222656, 4.303455352783203e-05, 0.0003190040588378906, 0.0005949735641479492, 0.0008709430694580078, 0.0011469125747680664, 0.001422882080078125, 0.0016988515853881836, 0.001974821090698242, 0.0022507905960083008, 0.0025267601013183594, 0.002802729606628418, 0.0030786991119384766, 0.003354668617248535, 0.0036306381225585938, 0.003906607627868652, 0.004182577133178711, 0.0044585466384887695, 0.004734516143798828, 0.005010485649108887, 0.005286455154418945, 0.005562424659729004, 0.0058383941650390625, 0.006114363670349121, 0.00639033317565918, 0.006666302680969238, 0.006942272186279297, 0.0072182416915893555, 0.007494211196899414, 0.007770180702209473, 0.008046150207519531, 0.00832211971282959, 0.008598089218139648, 0.008874058723449707, 0.009150028228759766, 0.009425997734069824, 0.009701967239379883, 0.009977936744689941, 0.01025390625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 17.0, 33.0, 89.0, 214.0, 353.0, 174.0, 73.0, 20.0, 10.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07552838325500488, -0.07091432809829712, -0.06630027294158936, -0.06168622151017189, -0.057072170078754425, -0.05245811492204666, -0.0478440597653389, -0.04323000833392143, -0.03861595317721367, -0.034001898020505905, -0.02938784658908844, -0.024773791432380676, -0.020159738138318062, -0.015545684844255447, -0.010931629687547684, -0.0063175782561302185, -0.0017035230994224548, 0.002910530660301447, 0.007524584420025349, 0.012138638645410538, 0.016752691939473152, 0.021366745233535767, 0.02598080039024353, 0.030594851821660995, 0.03520890697836876, 0.03982296213507652, 0.04443701356649399, 0.04905106872320175, 0.053665123879909515, 0.05827917531132698, 0.06289322674274445, 0.06750728189945221, 0.07212133705615997, 0.07673539221286774, 0.0813494473695755, 0.08596350252628326, 0.09057755023241043, 0.0951916053891182, 0.09980566054582596, 0.10441970825195312, 0.10903376340866089, 0.11364781856536865, 0.11826187372207642, 0.12287592887878418, 0.12748998403549194, 0.1321040391921997, 0.13671809434890747, 0.14133213460445404, 0.145946204662323, 0.15056025981903076, 0.15517431497573853, 0.1597883701324463, 0.16440242528915405, 0.16901648044586182, 0.17363053560256958, 0.17824457585811615, 0.1828586310148239, 0.18747268617153168, 0.19208674132823944, 0.1967007964849472, 0.20131485164165497, 0.20592889189720154, 0.2105429470539093, 0.21515700221061707, 0.21977105736732483]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 3.0, 11.0, 5.0, 11.0, 12.0, 21.0, 21.0, 21.0, 29.0, 30.0, 42.0, 40.0, 40.0, 47.0, 66.0, 57.0, 64.0, 58.0, 41.0, 48.0, 48.0, 41.0, 36.0, 39.0, 25.0, 30.0, 28.0, 15.0, 14.0, 11.0, 14.0, 9.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038662850856781006, -0.03730905055999756, -0.03595525026321411, -0.034601449966430664, -0.03324764966964722, -0.03189384937286377, -0.030540049076080322, -0.029186248779296875, -0.027832448482513428, -0.02647864818572998, -0.025124847888946533, -0.023771047592163086, -0.02241724729537964, -0.02106344699859619, -0.019709646701812744, -0.018355846405029297, -0.01700204610824585, -0.015648245811462402, -0.014294445514678955, -0.012940645217895508, -0.01158684492111206, -0.010233044624328613, -0.008879244327545166, -0.007525444030761719, -0.0061716437339782715, -0.004817843437194824, -0.003464043140411377, -0.0021102428436279297, -0.0007564425468444824, 0.0005973577499389648, 0.0019511580467224121, 0.0033049583435058594, 0.004658758640289307, 0.006012558937072754, 0.007366359233856201, 0.008720159530639648, 0.010073959827423096, 0.011427760124206543, 0.01278156042098999, 0.014135360717773438, 0.015489161014556885, 0.016842961311340332, 0.01819676160812378, 0.019550561904907227, 0.020904362201690674, 0.02225816249847412, 0.02361196279525757, 0.024965763092041016, 0.026319563388824463, 0.02767336368560791, 0.029027163982391357, 0.030380964279174805, 0.03173476457595825, 0.0330885648727417, 0.034442365169525146, 0.035796165466308594, 0.03714996576309204, 0.03850376605987549, 0.039857566356658936, 0.04121136665344238, 0.04256516695022583, 0.04391896724700928, 0.045272767543792725, 0.04662656784057617, 0.04798036813735962]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 7.0, 15.0, 7.0, 22.0, 31.0, 42.0, 42.0, 60.0, 84.0, 118.0, 158.0, 191.0, 248.0, 368.0, 519.0, 729.0, 977.0, 1423.0, 2212.0, 3449.0, 5493.0, 10155.0, 21172.0, 183726.0, 761162.0, 26370.0, 11645.0, 6416.0, 3797.0, 2381.0, 1660.0, 1088.0, 762.0, 507.0, 403.0, 304.0, 196.0, 153.0, 126.0, 102.0, 47.0, 41.0, 32.0, 42.0, 30.0, 9.0, 11.0, 7.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.05352783203125, -0.051860809326171875, -0.05019378662109375, -0.048526763916015625, -0.0468597412109375, -0.045192718505859375, -0.04352569580078125, -0.041858673095703125, -0.040191650390625, -0.038524627685546875, -0.03685760498046875, -0.035190582275390625, -0.0335235595703125, -0.031856536865234375, -0.03018951416015625, -0.028522491455078125, -0.02685546875, -0.025188446044921875, -0.02352142333984375, -0.021854400634765625, -0.0201873779296875, -0.018520355224609375, -0.01685333251953125, -0.015186309814453125, -0.013519287109375, -0.011852264404296875, -0.01018524169921875, -0.008518218994140625, -0.0068511962890625, -0.005184173583984375, -0.00351715087890625, -0.001850128173828125, -0.00018310546875, 0.001483917236328125, 0.00315093994140625, 0.004817962646484375, 0.0064849853515625, 0.008152008056640625, 0.00981903076171875, 0.011486053466796875, 0.013153076171875, 0.014820098876953125, 0.01648712158203125, 0.018154144287109375, 0.0198211669921875, 0.021488189697265625, 0.02315521240234375, 0.024822235107421875, 0.0264892578125, 0.028156280517578125, 0.02982330322265625, 0.031490325927734375, 0.0331573486328125, 0.034824371337890625, 0.03649139404296875, 0.038158416748046875, 0.039825439453125, 0.041492462158203125, 0.04315948486328125, 0.044826507568359375, 0.0464935302734375, 0.048160552978515625, 0.04982757568359375, 0.051494598388671875, 0.05316162109375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 4.0, 5.0, 8.0, 8.0, 8.0, 7.0, 20.0, 90.0, 335.0, 315.0, 85.0, 16.0, 11.0, 14.0, 9.0, 4.0, 5.0, 7.0, 7.0, 8.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0061492919921875, -0.005951344966888428, -0.0057533979415893555, -0.005555450916290283, -0.005357503890991211, -0.005159556865692139, -0.004961609840393066, -0.004763662815093994, -0.004565715789794922, -0.00436776876449585, -0.004169821739196777, -0.003971874713897705, -0.003773927688598633, -0.0035759806632995605, -0.0033780336380004883, -0.003180086612701416, -0.0029821395874023438, -0.0027841925621032715, -0.0025862455368041992, -0.002388298511505127, -0.0021903514862060547, -0.0019924044609069824, -0.0017944574356079102, -0.0015965104103088379, -0.0013985633850097656, -0.0012006163597106934, -0.001002669334411621, -0.0008047223091125488, -0.0006067752838134766, -0.0004088282585144043, -0.00021088123321533203, -1.2934207916259766e-05, 0.0001850128173828125, 0.00038295984268188477, 0.000580906867980957, 0.0007788538932800293, 0.0009768009185791016, 0.0011747479438781738, 0.001372694969177246, 0.0015706419944763184, 0.0017685890197753906, 0.001966536045074463, 0.002164483070373535, 0.0023624300956726074, 0.0025603771209716797, 0.002758324146270752, 0.0029562711715698242, 0.0031542181968688965, 0.0033521652221679688, 0.003550112247467041, 0.0037480592727661133, 0.0039460062980651855, 0.004143953323364258, 0.00434190034866333, 0.004539847373962402, 0.004737794399261475, 0.004935741424560547, 0.005133688449859619, 0.005331635475158691, 0.005529582500457764, 0.005727529525756836, 0.005925476551055908, 0.0061234235763549805, 0.006321370601654053, 0.006519317626953125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 5.0, 11.0, 18.0, 22.0, 19.0, 25.0, 42.0, 64.0, 93.0, 115.0, 159.0, 236.0, 346.0, 564.0, 870.0, 1415.0, 2688.0, 5817.0, 17034.0, 151925.0, 806225.0, 42175.0, 9442.0, 4019.0, 1968.0, 1089.0, 737.0, 419.0, 274.0, 198.0, 146.0, 118.0, 81.0, 46.0, 40.0, 23.0, 20.0, 22.0, 10.0, 11.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08587646484375, -0.08283805847167969, -0.07979965209960938, -0.07676124572753906, -0.07372283935546875, -0.07068443298339844, -0.06764602661132812, -0.06460762023925781, -0.0615692138671875, -0.05853080749511719, -0.055492401123046875, -0.05245399475097656, -0.04941558837890625, -0.04637718200683594, -0.043338775634765625, -0.04030036926269531, -0.037261962890625, -0.03422355651855469, -0.031185150146484375, -0.028146743774414062, -0.02510833740234375, -0.022069931030273438, -0.019031524658203125, -0.015993118286132812, -0.0129547119140625, -0.009916305541992188, -0.006877899169921875, -0.0038394927978515625, -0.00080108642578125, 0.0022373199462890625, 0.005275726318359375, 0.008314132690429688, 0.0113525390625, 0.014390945434570312, 0.017429351806640625, 0.020467758178710938, 0.02350616455078125, 0.026544570922851562, 0.029582977294921875, 0.03262138366699219, 0.0356597900390625, 0.03869819641113281, 0.041736602783203125, 0.04477500915527344, 0.04781341552734375, 0.05085182189941406, 0.053890228271484375, 0.05692863464355469, 0.059967041015625, 0.06300544738769531, 0.06604385375976562, 0.06908226013183594, 0.07212066650390625, 0.07515907287597656, 0.07819747924804688, 0.08123588562011719, 0.0842742919921875, 0.08731269836425781, 0.09035110473632812, 0.09338951110839844, 0.09642791748046875, 0.09946632385253906, 0.10250473022460938, 0.10554313659667969, 0.10858154296875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 4.0, 3.0, 12.0, 8.0, 11.0, 9.0, 9.0, 14.0, 15.0, 19.0, 21.0, 22.0, 26.0, 29.0, 39.0, 36.0, 39.0, 38.0, 35.0, 34.0, 33.0, 43.0, 39.0, 31.0, 39.0, 38.0, 38.0, 25.0, 33.0, 43.0, 38.0, 21.0, 21.0, 15.0, 17.0, 12.0, 19.0, 12.0, 16.0, 9.0, 8.0, 5.0, 4.0, 6.0, 6.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0231475830078125, -0.022372007369995117, -0.021596431732177734, -0.02082085609436035, -0.02004528045654297, -0.019269704818725586, -0.018494129180908203, -0.01771855354309082, -0.016942977905273438, -0.016167402267456055, -0.015391826629638672, -0.014616250991821289, -0.013840675354003906, -0.013065099716186523, -0.01228952407836914, -0.011513948440551758, -0.010738372802734375, -0.009962797164916992, -0.00918722152709961, -0.008411645889282227, -0.007636070251464844, -0.006860494613647461, -0.006084918975830078, -0.005309343338012695, -0.0045337677001953125, -0.0037581920623779297, -0.002982616424560547, -0.002207040786743164, -0.0014314651489257812, -0.0006558895111083984, 0.00011968612670898438, 0.0008952617645263672, 0.00167083740234375, 0.002446413040161133, 0.0032219886779785156, 0.0039975643157958984, 0.004773139953613281, 0.005548715591430664, 0.006324291229248047, 0.00709986686706543, 0.007875442504882812, 0.008651018142700195, 0.009426593780517578, 0.010202169418334961, 0.010977745056152344, 0.011753320693969727, 0.01252889633178711, 0.013304471969604492, 0.014080047607421875, 0.014855623245239258, 0.01563119888305664, 0.016406774520874023, 0.017182350158691406, 0.01795792579650879, 0.018733501434326172, 0.019509077072143555, 0.020284652709960938, 0.02106022834777832, 0.021835803985595703, 0.022611379623413086, 0.02338695526123047, 0.02416253089904785, 0.024938106536865234, 0.025713682174682617, 0.0264892578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 7.0, 10.0, 8.0, 8.0, 27.0, 34.0, 51.0, 65.0, 101.0, 181.0, 281.0, 593.0, 1306.0, 3519.0, 17059.0, 947592.0, 67436.0, 6433.0, 1999.0, 835.0, 401.0, 220.0, 129.0, 86.0, 48.0, 47.0, 26.0, 16.0, 9.0, 10.0, 5.0, 1.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1224365234375, -0.11900997161865234, -0.11558341979980469, -0.11215686798095703, -0.10873031616210938, -0.10530376434326172, -0.10187721252441406, -0.0984506607055664, -0.09502410888671875, -0.0915975570678711, -0.08817100524902344, -0.08474445343017578, -0.08131790161132812, -0.07789134979248047, -0.07446479797363281, -0.07103824615478516, -0.0676116943359375, -0.06418514251708984, -0.06075859069824219, -0.05733203887939453, -0.053905487060546875, -0.05047893524169922, -0.04705238342285156, -0.043625831604003906, -0.04019927978515625, -0.036772727966308594, -0.03334617614746094, -0.02991962432861328, -0.026493072509765625, -0.02306652069091797, -0.019639968872070312, -0.016213417053222656, -0.012786865234375, -0.009360313415527344, -0.0059337615966796875, -0.0025072097778320312, 0.000919342041015625, 0.004345893859863281, 0.0077724456787109375, 0.011198997497558594, 0.01462554931640625, 0.018052101135253906, 0.021478652954101562, 0.02490520477294922, 0.028331756591796875, 0.03175830841064453, 0.03518486022949219, 0.038611412048339844, 0.0420379638671875, 0.045464515686035156, 0.04889106750488281, 0.05231761932373047, 0.055744171142578125, 0.05917072296142578, 0.06259727478027344, 0.0660238265991211, 0.06945037841796875, 0.0728769302368164, 0.07630348205566406, 0.07973003387451172, 0.08315658569335938, 0.08658313751220703, 0.09000968933105469, 0.09343624114990234, 0.09686279296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 7.0, 8.0, 9.0, 11.0, 13.0, 14.0, 21.0, 45.0, 41.0, 61.0, 54.0, 72.0, 116.0, 93.0, 62.0, 81.0, 60.0, 46.0, 42.0, 31.0, 28.0, 15.0, 14.0, 12.0, 11.0, 2.0, 4.0, 7.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-9.834766387939453e-06, -9.57585871219635e-06, -9.316951036453247e-06, -9.058043360710144e-06, -8.799135684967041e-06, -8.540228009223938e-06, -8.281320333480835e-06, -8.022412657737732e-06, -7.763504981994629e-06, -7.504597306251526e-06, -7.245689630508423e-06, -6.98678195476532e-06, -6.727874279022217e-06, -6.468966603279114e-06, -6.210058927536011e-06, -5.951151251792908e-06, -5.692243576049805e-06, -5.433335900306702e-06, -5.174428224563599e-06, -4.915520548820496e-06, -4.656612873077393e-06, -4.3977051973342896e-06, -4.1387975215911865e-06, -3.8798898458480835e-06, -3.6209821701049805e-06, -3.3620744943618774e-06, -3.1031668186187744e-06, -2.8442591428756714e-06, -2.5853514671325684e-06, -2.3264437913894653e-06, -2.0675361156463623e-06, -1.8086284399032593e-06, -1.5497207641601562e-06, -1.2908130884170532e-06, -1.0319054126739502e-06, -7.729977369308472e-07, -5.140900611877441e-07, -2.551823854446411e-07, 3.725290298461914e-09, 2.6263296604156494e-07, 5.21540641784668e-07, 7.80448317527771e-07, 1.039355993270874e-06, 1.298263669013977e-06, 1.55717134475708e-06, 1.816079020500183e-06, 2.074986696243286e-06, 2.333894371986389e-06, 2.592802047729492e-06, 2.8517097234725952e-06, 3.1106173992156982e-06, 3.3695250749588013e-06, 3.6284327507019043e-06, 3.887340426445007e-06, 4.14624810218811e-06, 4.405155777931213e-06, 4.664063453674316e-06, 4.9229711294174194e-06, 5.1818788051605225e-06, 5.4407864809036255e-06, 5.6996941566467285e-06, 5.9586018323898315e-06, 6.2175095081329346e-06, 6.476417183876038e-06, 6.735324859619141e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 3.0, 3.0, 3.0, 8.0, 16.0, 30.0, 28.0, 32.0, 50.0, 79.0, 147.0, 246.0, 415.0, 878.0, 1830.0, 5526.0, 28361.0, 947938.0, 50779.0, 7694.0, 2305.0, 1001.0, 461.0, 283.0, 128.0, 109.0, 81.0, 39.0, 20.0, 20.0, 12.0, 11.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2144775390625, -0.20845603942871094, -0.20243453979492188, -0.1964130401611328, -0.19039154052734375, -0.1843700408935547, -0.17834854125976562, -0.17232704162597656, -0.1663055419921875, -0.16028404235839844, -0.15426254272460938, -0.1482410430908203, -0.14221954345703125, -0.1361980438232422, -0.13017654418945312, -0.12415504455566406, -0.118133544921875, -0.11211204528808594, -0.10609054565429688, -0.10006904602050781, -0.09404754638671875, -0.08802604675292969, -0.08200454711914062, -0.07598304748535156, -0.0699615478515625, -0.06394004821777344, -0.057918548583984375, -0.05189704895019531, -0.04587554931640625, -0.03985404968261719, -0.033832550048828125, -0.027811050415039062, -0.02178955078125, -0.015768051147460938, -0.009746551513671875, -0.0037250518798828125, 0.00229644775390625, 0.008317947387695312, 0.014339447021484375, 0.020360946655273438, 0.0263824462890625, 0.03240394592285156, 0.038425445556640625, 0.04444694519042969, 0.05046844482421875, 0.05648994445800781, 0.06251144409179688, 0.06853294372558594, 0.074554443359375, 0.08057594299316406, 0.08659744262695312, 0.09261894226074219, 0.09864044189453125, 0.10466194152832031, 0.11068344116210938, 0.11670494079589844, 0.1227264404296875, 0.12874794006347656, 0.13476943969726562, 0.1407909393310547, 0.14681243896484375, 0.1528339385986328, 0.15885543823242188, 0.16487693786621094, 0.1708984375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 4.0, 6.0, 5.0, 11.0, 10.0, 2.0, 9.0, 17.0, 12.0, 7.0, 20.0, 26.0, 65.0, 116.0, 441.0, 90.0, 41.0, 34.0, 23.0, 14.0, 7.0, 7.0, 6.0, 4.0, 3.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10614013671875, -0.10286331176757812, -0.09958648681640625, -0.09630966186523438, -0.0930328369140625, -0.08975601196289062, -0.08647918701171875, -0.08320236206054688, -0.079925537109375, -0.07664871215820312, -0.07337188720703125, -0.07009506225585938, -0.0668182373046875, -0.06354141235351562, -0.06026458740234375, -0.056987762451171875, -0.0537109375, -0.050434112548828125, -0.04715728759765625, -0.043880462646484375, -0.0406036376953125, -0.037326812744140625, -0.03404998779296875, -0.030773162841796875, -0.027496337890625, -0.024219512939453125, -0.02094268798828125, -0.017665863037109375, -0.0143890380859375, -0.011112213134765625, -0.00783538818359375, -0.004558563232421875, -0.00128173828125, 0.001995086669921875, 0.00527191162109375, 0.008548736572265625, 0.0118255615234375, 0.015102386474609375, 0.01837921142578125, 0.021656036376953125, 0.024932861328125, 0.028209686279296875, 0.03148651123046875, 0.034763336181640625, 0.0380401611328125, 0.041316986083984375, 0.04459381103515625, 0.047870635986328125, 0.0511474609375, 0.054424285888671875, 0.05770111083984375, 0.060977935791015625, 0.0642547607421875, 0.06753158569335938, 0.07080841064453125, 0.07408523559570312, 0.077362060546875, 0.08063888549804688, 0.08391571044921875, 0.08719253540039062, 0.0904693603515625, 0.09374618530273438, 0.09702301025390625, 0.10029983520507812, 0.10357666015625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 9.0, 6.0, 19.0, 30.0, 171.0, 565.0, 129.0, 28.0, 18.0, 12.0, 3.0, 3.0, 3.0, 5.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5227593183517456, -1.4849562644958496, -1.4471532106399536, -1.4093501567840576, -1.3715471029281616, -1.3337440490722656, -1.2959409952163696, -1.2581379413604736, -1.220334768295288, -1.182531714439392, -1.144728660583496, -1.1069256067276, -1.069122552871704, -1.031319499015808, -0.9935163855552673, -0.9557133316993713, -0.9179103374481201, -0.8801072835922241, -0.8423042297363281, -0.8045011758804321, -0.7666981220245361, -0.7288950681686401, -0.6910919547080994, -0.6532889008522034, -0.6154858469963074, -0.5776827931404114, -0.5398797392845154, -0.5020766854286194, -0.464273601770401, -0.426470547914505, -0.3886674642562866, -0.3508644104003906, -0.31306129693984985, -0.27525824308395386, -0.23745517432689667, -0.19965210556983948, -0.16184905171394348, -0.12404599785804749, -0.0862429291009903, -0.048439860343933105, -0.01063680648803711, 0.027166254818439484, 0.06496931612491608, 0.10277237743139267, 0.14057543873786926, 0.17837849259376526, 0.21618156135082245, 0.25398463010787964, 0.29178768396377563, 0.32959073781967163, 0.3673937916755676, 0.405196875333786, 0.442999929189682, 0.480802983045578, 0.5186060667037964, 0.5564091205596924, 0.5942121744155884, 0.6320152282714844, 0.6698182821273804, 0.7076213359832764, 0.7454243898391724, 0.7832274436950684, 0.8210305571556091, 0.8588336110115051, 0.8966366648674011]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 2.0, 0.0, 0.0, 4.0, 3.0, 5.0, 3.0, 5.0, 9.0, 6.0, 21.0, 22.0, 33.0, 58.0, 71.0, 137.0, 137.0, 124.0, 122.0, 88.0, 50.0, 38.0, 25.0, 8.0, 11.0, 3.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6240644454956055, -0.6043663024902344, -0.5846681594848633, -0.5649700164794922, -0.5452718734741211, -0.52557373046875, -0.5058755874633789, -0.4861774444580078, -0.4664793014526367, -0.4467811584472656, -0.42708301544189453, -0.40738487243652344, -0.38768672943115234, -0.36798858642578125, -0.34829044342041016, -0.32859230041503906, -0.30889415740966797, -0.2891960144042969, -0.2694978713989258, -0.2497997283935547, -0.2301015853881836, -0.2104034423828125, -0.1907052993774414, -0.1710071563720703, -0.15130901336669922, -0.13161087036132812, -0.11191272735595703, -0.09221458435058594, -0.07251644134521484, -0.05281829833984375, -0.033120155334472656, -0.013422012329101562, 0.006276071071624756, 0.02597421407699585, 0.04567235708236694, 0.06537050008773804, 0.08506864309310913, 0.10476678609848022, 0.12446492910385132, 0.1441630721092224, 0.1638612151145935, 0.1835593581199646, 0.2032575011253357, 0.2229556441307068, 0.24265378713607788, 0.262351930141449, 0.28205007314682007, 0.30174821615219116, 0.32144635915756226, 0.34114450216293335, 0.36084264516830444, 0.38054078817367554, 0.40023893117904663, 0.4199370741844177, 0.4396352171897888, 0.4593333601951599, 0.479031503200531, 0.4987296462059021, 0.5184277892112732, 0.5381259322166443, 0.5578240752220154, 0.5775222182273865, 0.5972203612327576, 0.6169185042381287, 0.6366166472434998]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 10.0, 9.0, 12.0, 13.0, 11.0, 17.0, 35.0, 40.0, 125.0, 1086.0, 42800.0, 4146638.0, 3044.0, 189.0, 74.0, 36.0, 22.0, 22.0, 21.0, 13.0, 8.0, 5.0, 5.0, 4.0, 7.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.390625, -5.2232666015625, -5.055908203125, -4.8885498046875, -4.72119140625, -4.5538330078125, -4.386474609375, -4.2191162109375, -4.0517578125, -3.8843994140625, -3.717041015625, -3.5496826171875, -3.38232421875, -3.2149658203125, -3.047607421875, -2.8802490234375, -2.712890625, -2.5455322265625, -2.378173828125, -2.2108154296875, -2.04345703125, -1.8760986328125, -1.708740234375, -1.5413818359375, -1.3740234375, -1.2066650390625, -1.039306640625, -0.8719482421875, -0.70458984375, -0.5372314453125, -0.369873046875, -0.2025146484375, -0.03515625, 0.1322021484375, 0.299560546875, 0.4669189453125, 0.63427734375, 0.8016357421875, 0.968994140625, 1.1363525390625, 1.3037109375, 1.4710693359375, 1.638427734375, 1.8057861328125, 1.97314453125, 2.1405029296875, 2.307861328125, 2.4752197265625, 2.642578125, 2.8099365234375, 2.977294921875, 3.1446533203125, 3.31201171875, 3.4793701171875, 3.646728515625, 3.8140869140625, 3.9814453125, 4.1488037109375, 4.316162109375, 4.4835205078125, 4.65087890625, 4.8182373046875, 4.985595703125, 5.1529541015625, 5.3203125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 4.0, 5.0, 4.0, 6.0, 5.0, 6.0, 13.0, 21.0, 42.0, 80.0, 139.0, 194.0, 171.0, 113.0, 62.0, 24.0, 22.0, 11.0, 6.0, 6.0, 8.0, 8.0, 5.0, 4.0, 6.0, 3.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004169464111328125, -0.004033923149108887, -0.0038983821868896484, -0.00376284122467041, -0.003627300262451172, -0.0034917593002319336, -0.0033562183380126953, -0.003220677375793457, -0.0030851364135742188, -0.0029495954513549805, -0.002814054489135742, -0.002678513526916504, -0.0025429725646972656, -0.0024074316024780273, -0.002271890640258789, -0.0021363496780395508, -0.0020008087158203125, -0.0018652677536010742, -0.001729726791381836, -0.0015941858291625977, -0.0014586448669433594, -0.001323103904724121, -0.0011875629425048828, -0.0010520219802856445, -0.0009164810180664062, -0.000780940055847168, -0.0006453990936279297, -0.0005098581314086914, -0.0003743171691894531, -0.00023877620697021484, -0.00010323524475097656, 3.230571746826172e-05, 0.0001678466796875, 0.0003033876419067383, 0.00043892860412597656, 0.0005744695663452148, 0.0007100105285644531, 0.0008455514907836914, 0.0009810924530029297, 0.001116633415222168, 0.0012521743774414062, 0.0013877153396606445, 0.0015232563018798828, 0.001658797264099121, 0.0017943382263183594, 0.0019298791885375977, 0.002065420150756836, 0.0022009611129760742, 0.0023365020751953125, 0.0024720430374145508, 0.002607583999633789, 0.0027431249618530273, 0.0028786659240722656, 0.003014206886291504, 0.003149747848510742, 0.0032852888107299805, 0.0034208297729492188, 0.003556370735168457, 0.0036919116973876953, 0.0038274526596069336, 0.003962993621826172, 0.00409853458404541, 0.0042340755462646484, 0.004369616508483887, 0.004505157470703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 11.0, 7.0, 6.0, 10.0, 9.0, 14.0, 23.0, 25.0, 32.0, 40.0, 50.0, 67.0, 89.0, 87.0, 141.0, 125.0, 199.0, 527.0, 15317.0, 4174204.0, 2606.0, 209.0, 119.0, 105.0, 78.0, 53.0, 36.0, 36.0, 18.0, 16.0, 8.0, 1.0, 2.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.447265625, -1.4104843139648438, -1.3737030029296875, -1.3369216918945312, -1.300140380859375, -1.2633590698242188, -1.2265777587890625, -1.1897964477539062, -1.15301513671875, -1.1162338256835938, -1.0794525146484375, -1.0426712036132812, -1.005889892578125, -0.9691085815429688, -0.9323272705078125, -0.8955459594726562, -0.8587646484375, -0.8219833374023438, -0.7852020263671875, -0.7484207153320312, -0.711639404296875, -0.6748580932617188, -0.6380767822265625, -0.6012954711914062, -0.56451416015625, -0.5277328491210938, -0.4909515380859375, -0.45417022705078125, -0.417388916015625, -0.38060760498046875, -0.3438262939453125, -0.30704498291015625, -0.270263671875, -0.23348236083984375, -0.1967010498046875, -0.15991973876953125, -0.123138427734375, -0.08635711669921875, -0.0495758056640625, -0.01279449462890625, 0.02398681640625, 0.06076812744140625, 0.0975494384765625, 0.13433074951171875, 0.171112060546875, 0.20789337158203125, 0.2446746826171875, 0.28145599365234375, 0.3182373046875, 0.35501861572265625, 0.3917999267578125, 0.42858123779296875, 0.465362548828125, 0.5021438598632812, 0.5389251708984375, 0.5757064819335938, 0.61248779296875, 0.6492691040039062, 0.6860504150390625, 0.7228317260742188, 0.759613037109375, 0.7963943481445312, 0.8331756591796875, 0.8699569702148438, 0.90673828125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 6.0, 3.0, 3.0, 6.0, 5.0, 10.0, 12.0, 12.0, 13.0, 11.0, 13.0, 29.0, 27.0, 34.0, 52.0, 62.0, 80.0, 105.0, 118.0, 149.0, 157.0, 185.0, 266.0, 350.0, 1104.0, 327.0, 216.0, 153.0, 139.0, 120.0, 86.0, 62.0, 51.0, 31.0, 30.0, 14.0, 7.0, 4.0, 13.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.011260986328125, -0.01097559928894043, -0.01069021224975586, -0.010404825210571289, -0.010119438171386719, -0.009834051132202148, -0.009548664093017578, -0.009263277053833008, -0.008977890014648438, -0.008692502975463867, -0.008407115936279297, -0.008121728897094727, -0.007836341857910156, -0.007550954818725586, -0.007265567779541016, -0.006980180740356445, -0.006694793701171875, -0.006409406661987305, -0.006124019622802734, -0.005838632583618164, -0.005553245544433594, -0.0052678585052490234, -0.004982471466064453, -0.004697084426879883, -0.0044116973876953125, -0.004126310348510742, -0.003840923309326172, -0.0035555362701416016, -0.0032701492309570312, -0.002984762191772461, -0.0026993751525878906, -0.0024139881134033203, -0.00212860107421875, -0.0018432140350341797, -0.0015578269958496094, -0.001272439956665039, -0.0009870529174804688, -0.0007016658782958984, -0.0004162788391113281, -0.0001308917999267578, 0.0001544952392578125, 0.0004398822784423828, 0.0007252693176269531, 0.0010106563568115234, 0.0012960433959960938, 0.001581430435180664, 0.0018668174743652344, 0.0021522045135498047, 0.002437591552734375, 0.0027229785919189453, 0.0030083656311035156, 0.003293752670288086, 0.0035791397094726562, 0.0038645267486572266, 0.004149913787841797, 0.004435300827026367, 0.0047206878662109375, 0.005006074905395508, 0.005291461944580078, 0.0055768489837646484, 0.005862236022949219, 0.006147623062133789, 0.006433010101318359, 0.00671839714050293, 0.0070037841796875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 13.0, 106.0, 894.0, 5.0, 2.0], "bins": [-6.651535511016846, -6.543209552764893, -6.4348835945129395, -6.326557159423828, -6.218231201171875, -6.109905242919922, -6.001579284667969, -5.893253326416016, -5.784926891326904, -5.676600933074951, -5.568274974822998, -5.459948539733887, -5.351622581481934, -5.2432966232299805, -5.134970664978027, -5.026644706726074, -4.918318748474121, -4.809992790222168, -4.701666831970215, -4.5933403968811035, -4.48501443862915, -4.376688480377197, -4.268362522125244, -4.160036563873291, -4.05171012878418, -3.9433841705322266, -3.8350579738616943, -3.726732015609741, -3.618405818939209, -3.510079860687256, -3.4017539024353027, -3.2934277057647705, -3.1851015090942383, -3.076775550842285, -2.968449354171753, -2.8601233959198, -2.7517971992492676, -2.6434712409973145, -2.5351452827453613, -2.426819086074829, -2.318493127822876, -2.210167169570923, -2.1018409729003906, -1.9935150146484375, -1.8851889371871948, -1.7768628597259521, -1.6685367822647095, -1.5602107048034668, -1.4518847465515137, -1.343558669090271, -1.2352325916290283, -1.1269066333770752, -1.0185805559158325, -0.9102544784545898, -0.8019284009933472, -0.6936023831367493, -0.5852762460708618, -0.47695019841194153, -0.36862415075302124, -0.26029807329177856, -0.15197202563285828, -0.04364597797393799, 0.06468009948730469, 0.1730061173439026, 0.28133219480514526]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 9.0, 6.0, 14.0, 18.0, 31.0, 60.0, 78.0, 88.0, 93.0, 108.0, 115.0, 111.0, 66.0, 67.0, 44.0, 32.0, 19.0, 18.0, 11.0, 8.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4141967296600342, -0.4048404395580292, -0.39548414945602417, -0.3861278295516968, -0.3767715394496918, -0.36741524934768677, -0.35805895924568176, -0.34870266914367676, -0.33934634923934937, -0.32999005913734436, -0.32063376903533936, -0.31127744913101196, -0.30192115902900696, -0.29256486892700195, -0.28320857882499695, -0.27385228872299194, -0.26449596881866455, -0.25513967871665955, -0.24578337371349335, -0.23642708361148834, -0.22707077860832214, -0.21771448850631714, -0.20835819840431213, -0.19900189340114594, -0.18964561820030212, -0.18028932809829712, -0.17093302309513092, -0.16157673299312592, -0.15222042798995972, -0.1428641378879547, -0.1335078477859497, -0.12415154278278351, -0.11479523777961731, -0.10543894022703171, -0.0960826426744461, -0.0867263525724411, -0.0773700475692749, -0.0680137574672699, -0.058657459914684296, -0.049301162362098694, -0.03994486480951309, -0.03058856725692749, -0.021232271566987038, -0.011875975877046585, -0.0025196783244609833, 0.0068366192281246185, 0.016192913055419922, 0.025549210608005524, 0.034905508160591125, 0.04426180571317673, 0.05361810326576233, 0.06297439336776733, 0.07233069837093353, 0.08168698847293854, 0.09104328602552414, 0.10039958357810974, 0.10975588113069534, 0.11911217868328094, 0.12846846878528595, 0.13782477378845215, 0.14718106389045715, 0.15653736889362335, 0.16589365899562836, 0.17524996399879456, 0.18460625410079956]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 0.0, 14.0, 18.0, 16.0, 19.0, 21.0, 33.0, 54.0, 85.0, 95.0, 122.0, 178.0, 247.0, 284.0, 399.0, 502.0, 667.0, 902.0, 1194.0, 1662.0, 2390.0, 3443.0, 5186.0, 8465.0, 15311.0, 38231.0, 333120.0, 542105.0, 48661.0, 17290.0, 9126.0, 5578.0, 3665.0, 2486.0, 1711.0, 1323.0, 979.0, 709.0, 546.0, 388.0, 321.0, 252.0, 203.0, 155.0, 101.0, 78.0, 55.0, 49.0, 39.0, 27.0, 15.0, 6.0, 11.0, 13.0, 4.0, 4.0, 3.0, 5.0], "bins": [-0.045074462890625, -0.04371213912963867, -0.042349815368652344, -0.040987491607666016, -0.03962516784667969, -0.03826284408569336, -0.03690052032470703, -0.0355381965637207, -0.034175872802734375, -0.03281354904174805, -0.03145122528076172, -0.03008890151977539, -0.028726577758789062, -0.027364253997802734, -0.026001930236816406, -0.024639606475830078, -0.02327728271484375, -0.021914958953857422, -0.020552635192871094, -0.019190311431884766, -0.017827987670898438, -0.01646566390991211, -0.015103340148925781, -0.013741016387939453, -0.012378692626953125, -0.011016368865966797, -0.009654045104980469, -0.00829172134399414, -0.0069293975830078125, -0.005567073822021484, -0.004204750061035156, -0.002842426300048828, -0.0014801025390625, -0.00011777877807617188, 0.0012445449829101562, 0.0026068687438964844, 0.0039691925048828125, 0.005331516265869141, 0.006693840026855469, 0.008056163787841797, 0.009418487548828125, 0.010780811309814453, 0.012143135070800781, 0.01350545883178711, 0.014867782592773438, 0.016230106353759766, 0.017592430114746094, 0.018954753875732422, 0.02031707763671875, 0.021679401397705078, 0.023041725158691406, 0.024404048919677734, 0.025766372680664062, 0.02712869644165039, 0.02849102020263672, 0.029853343963623047, 0.031215667724609375, 0.0325779914855957, 0.03394031524658203, 0.03530263900756836, 0.03666496276855469, 0.038027286529541016, 0.039389610290527344, 0.04075193405151367, 0.0421142578125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 2.0, 4.0, 2.0, 5.0, 5.0, 4.0, 7.0, 8.0, 10.0, 15.0, 23.0, 41.0, 55.0, 101.0, 137.0, 159.0, 139.0, 97.0, 63.0, 30.0, 21.0, 12.0, 10.0, 6.0, 6.0, 5.0, 6.0, 6.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004032135009765625, -0.003899216651916504, -0.003766298294067383, -0.0036333799362182617, -0.0035004615783691406, -0.0033675432205200195, -0.0032346248626708984, -0.0031017065048217773, -0.0029687881469726562, -0.002835869789123535, -0.002702951431274414, -0.002570033073425293, -0.002437114715576172, -0.0023041963577270508, -0.0021712779998779297, -0.0020383596420288086, -0.0019054412841796875, -0.0017725229263305664, -0.0016396045684814453, -0.0015066862106323242, -0.0013737678527832031, -0.001240849494934082, -0.001107931137084961, -0.0009750127792358398, -0.0008420944213867188, -0.0007091760635375977, -0.0005762577056884766, -0.00044333934783935547, -0.0003104209899902344, -0.00017750263214111328, -4.458427429199219e-05, 8.83340835571289e-05, 0.00022125244140625, 0.0003541707992553711, 0.0004870891571044922, 0.0006200075149536133, 0.0007529258728027344, 0.0008858442306518555, 0.0010187625885009766, 0.0011516809463500977, 0.0012845993041992188, 0.0014175176620483398, 0.001550436019897461, 0.001683354377746582, 0.0018162727355957031, 0.0019491910934448242, 0.0020821094512939453, 0.0022150278091430664, 0.0023479461669921875, 0.0024808645248413086, 0.0026137828826904297, 0.0027467012405395508, 0.002879619598388672, 0.003012537956237793, 0.003145456314086914, 0.003278374671936035, 0.0034112930297851562, 0.0035442113876342773, 0.0036771297454833984, 0.0038100481033325195, 0.003942966461181641, 0.004075884819030762, 0.004208803176879883, 0.004341721534729004, 0.004474639892578125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 7.0, 5.0, 4.0, 8.0, 12.0, 17.0, 21.0, 19.0, 12.0, 29.0, 24.0, 39.0, 42.0, 65.0, 174.0, 618.0, 5640.0, 836429.0, 201485.0, 3037.0, 395.0, 125.0, 74.0, 56.0, 38.0, 26.0, 35.0, 22.0, 17.0, 10.0, 14.0, 9.0, 8.0, 9.0, 9.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.204345703125, -0.19865036010742188, -0.19295501708984375, -0.18725967407226562, -0.1815643310546875, -0.17586898803710938, -0.17017364501953125, -0.16447830200195312, -0.158782958984375, -0.15308761596679688, -0.14739227294921875, -0.14169692993164062, -0.1360015869140625, -0.13030624389648438, -0.12461090087890625, -0.11891555786132812, -0.11322021484375, -0.10752487182617188, -0.10182952880859375, -0.09613418579101562, -0.0904388427734375, -0.08474349975585938, -0.07904815673828125, -0.07335281372070312, -0.067657470703125, -0.061962127685546875, -0.05626678466796875, -0.050571441650390625, -0.0448760986328125, -0.039180755615234375, -0.03348541259765625, -0.027790069580078125, -0.0220947265625, -0.016399383544921875, -0.01070404052734375, -0.005008697509765625, 0.0006866455078125, 0.006381988525390625, 0.01207733154296875, 0.017772674560546875, 0.023468017578125, 0.029163360595703125, 0.03485870361328125, 0.040554046630859375, 0.0462493896484375, 0.051944732666015625, 0.05764007568359375, 0.06333541870117188, 0.06903076171875, 0.07472610473632812, 0.08042144775390625, 0.08611679077148438, 0.0918121337890625, 0.09750747680664062, 0.10320281982421875, 0.10889816284179688, 0.114593505859375, 0.12028884887695312, 0.12598419189453125, 0.13167953491210938, 0.1373748779296875, 0.14307022094726562, 0.14876556396484375, 0.15446090698242188, 0.16015625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 9.0, 5.0, 11.0, 12.0, 20.0, 21.0, 37.0, 18.0, 30.0, 18.0, 40.0, 27.0, 43.0, 45.0, 34.0, 23.0, 43.0, 46.0, 43.0, 45.0, 45.0, 43.0, 33.0, 49.0, 32.0, 29.0, 30.0, 21.0, 27.0, 22.0, 10.0, 14.0, 8.0, 14.0, 12.0, 13.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.019287109375, -0.01876676082611084, -0.01824641227722168, -0.01772606372833252, -0.01720571517944336, -0.0166853666305542, -0.01616501808166504, -0.01564466953277588, -0.015124320983886719, -0.014603972434997559, -0.014083623886108398, -0.013563275337219238, -0.013042926788330078, -0.012522578239440918, -0.012002229690551758, -0.011481881141662598, -0.010961532592773438, -0.010441184043884277, -0.009920835494995117, -0.009400486946105957, -0.008880138397216797, -0.008359789848327637, -0.007839441299438477, -0.007319092750549316, -0.006798744201660156, -0.006278395652770996, -0.005758047103881836, -0.005237698554992676, -0.004717350006103516, -0.0041970014572143555, -0.0036766529083251953, -0.003156304359436035, -0.002635955810546875, -0.002115607261657715, -0.0015952587127685547, -0.0010749101638793945, -0.0005545616149902344, -3.421306610107422e-05, 0.00048613548278808594, 0.001006484031677246, 0.0015268325805664062, 0.0020471811294555664, 0.0025675296783447266, 0.0030878782272338867, 0.003608226776123047, 0.004128575325012207, 0.004648923873901367, 0.005169272422790527, 0.0056896209716796875, 0.006209969520568848, 0.006730318069458008, 0.007250666618347168, 0.007771015167236328, 0.008291363716125488, 0.008811712265014648, 0.009332060813903809, 0.009852409362792969, 0.010372757911682129, 0.010893106460571289, 0.01141345500946045, 0.01193380355834961, 0.01245415210723877, 0.01297450065612793, 0.01349484920501709, 0.01401519775390625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 10.0, 33.0, 105.0, 1003.0, 1046138.0, 1105.0, 105.0, 25.0, 12.0, 6.0, 7.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.36328125, -1.32489013671875, -1.2864990234375, -1.24810791015625, -1.209716796875, -1.17132568359375, -1.1329345703125, -1.09454345703125, -1.05615234375, -1.01776123046875, -0.9793701171875, -0.94097900390625, -0.902587890625, -0.86419677734375, -0.8258056640625, -0.78741455078125, -0.7490234375, -0.71063232421875, -0.6722412109375, -0.63385009765625, -0.595458984375, -0.55706787109375, -0.5186767578125, -0.48028564453125, -0.44189453125, -0.40350341796875, -0.3651123046875, -0.32672119140625, -0.288330078125, -0.24993896484375, -0.2115478515625, -0.17315673828125, -0.134765625, -0.09637451171875, -0.0579833984375, -0.01959228515625, 0.018798828125, 0.05718994140625, 0.0955810546875, 0.13397216796875, 0.17236328125, 0.21075439453125, 0.2491455078125, 0.28753662109375, 0.325927734375, 0.36431884765625, 0.4027099609375, 0.44110107421875, 0.4794921875, 0.51788330078125, 0.5562744140625, 0.59466552734375, 0.633056640625, 0.67144775390625, 0.7098388671875, 0.74822998046875, 0.78662109375, 0.82501220703125, 0.8634033203125, 0.90179443359375, 0.940185546875, 0.97857666015625, 1.0169677734375, 1.05535888671875, 1.09375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 7.0, 8.0, 9.0, 12.0, 32.0, 106.0, 474.0, 219.0, 39.0, 20.0, 18.0, 15.0, 10.0, 5.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00021576881408691406, -0.0002103373408317566, -0.00020490586757659912, -0.00019947439432144165, -0.00019404292106628418, -0.0001886114478111267, -0.00018317997455596924, -0.00017774850130081177, -0.0001723170280456543, -0.00016688555479049683, -0.00016145408153533936, -0.00015602260828018188, -0.00015059113502502441, -0.00014515966176986694, -0.00013972818851470947, -0.000134296715259552, -0.00012886524200439453, -0.00012343376874923706, -0.00011800229549407959, -0.00011257082223892212, -0.00010713934898376465, -0.00010170787572860718, -9.627640247344971e-05, -9.084492921829224e-05, -8.541345596313477e-05, -7.99819827079773e-05, -7.455050945281982e-05, -6.911903619766235e-05, -6.368756294250488e-05, -5.825608968734741e-05, -5.282461643218994e-05, -4.739314317703247e-05, -4.1961669921875e-05, -3.653019666671753e-05, -3.109872341156006e-05, -2.5667250156402588e-05, -2.0235776901245117e-05, -1.4804303646087646e-05, -9.372830390930176e-06, -3.941357135772705e-06, 1.4901161193847656e-06, 6.921589374542236e-06, 1.2353062629699707e-05, 1.7784535884857178e-05, 2.321600914001465e-05, 2.864748239517212e-05, 3.407895565032959e-05, 3.951042890548706e-05, 4.494190216064453e-05, 5.0373375415802e-05, 5.580484867095947e-05, 6.123632192611694e-05, 6.666779518127441e-05, 7.209926843643188e-05, 7.753074169158936e-05, 8.296221494674683e-05, 8.83936882019043e-05, 9.382516145706177e-05, 9.925663471221924e-05, 0.00010468810796737671, 0.00011011958122253418, 0.00011555105447769165, 0.00012098252773284912, 0.0001264140009880066, 0.00013184547424316406]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 5.0, 26.0, 55.0, 124.0, 858.0, 22344.0, 1022825.0, 1933.0, 249.0, 67.0, 27.0, 12.0, 6.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7568359375, -0.7317581176757812, -0.7066802978515625, -0.6816024780273438, -0.656524658203125, -0.6314468383789062, -0.6063690185546875, -0.5812911987304688, -0.55621337890625, -0.5311355590820312, -0.5060577392578125, -0.48097991943359375, -0.455902099609375, -0.43082427978515625, -0.4057464599609375, -0.38066864013671875, -0.3555908203125, -0.33051300048828125, -0.3054351806640625, -0.28035736083984375, -0.255279541015625, -0.23020172119140625, -0.2051239013671875, -0.18004608154296875, -0.15496826171875, -0.12989044189453125, -0.1048126220703125, -0.07973480224609375, -0.054656982421875, -0.02957916259765625, -0.0045013427734375, 0.02057647705078125, 0.045654296875, 0.07073211669921875, 0.0958099365234375, 0.12088775634765625, 0.145965576171875, 0.17104339599609375, 0.1961212158203125, 0.22119903564453125, 0.24627685546875, 0.27135467529296875, 0.2964324951171875, 0.32151031494140625, 0.346588134765625, 0.37166595458984375, 0.3967437744140625, 0.42182159423828125, 0.4468994140625, 0.47197723388671875, 0.4970550537109375, 0.5221328735351562, 0.547210693359375, 0.5722885131835938, 0.5973663330078125, 0.6224441528320312, 0.64752197265625, 0.6725997924804688, 0.6976776123046875, 0.7227554321289062, 0.747833251953125, 0.7729110717773438, 0.7979888916015625, 0.8230667114257812, 0.84814453125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 4.0, 7.0, 18.0, 56.0, 596.0, 237.0, 39.0, 14.0, 4.0, 6.0, 2.0, 4.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1358642578125, -0.1313037872314453, -0.12674331665039062, -0.12218284606933594, -0.11762237548828125, -0.11306190490722656, -0.10850143432617188, -0.10394096374511719, -0.0993804931640625, -0.09482002258300781, -0.09025955200195312, -0.08569908142089844, -0.08113861083984375, -0.07657814025878906, -0.07201766967773438, -0.06745719909667969, -0.062896728515625, -0.05833625793457031, -0.053775787353515625, -0.04921531677246094, -0.04465484619140625, -0.04009437561035156, -0.035533905029296875, -0.030973434448242188, -0.0264129638671875, -0.021852493286132812, -0.017292022705078125, -0.012731552124023438, -0.00817108154296875, -0.0036106109619140625, 0.000949859619140625, 0.0055103302001953125, 0.01007080078125, 0.014631271362304688, 0.019191741943359375, 0.023752212524414062, 0.02831268310546875, 0.03287315368652344, 0.037433624267578125, 0.04199409484863281, 0.0465545654296875, 0.05111503601074219, 0.055675506591796875, 0.06023597717285156, 0.06479644775390625, 0.06935691833496094, 0.07391738891601562, 0.07847785949707031, 0.083038330078125, 0.08759880065917969, 0.09215927124023438, 0.09671974182128906, 0.10128021240234375, 0.10584068298339844, 0.11040115356445312, 0.11496162414550781, 0.1195220947265625, 0.12408256530761719, 0.12864303588867188, 0.13320350646972656, 0.13776397705078125, 0.14232444763183594, 0.14688491821289062, 0.1514453887939453, 0.156005859375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 13.0, 14.0, 60.0, 208.0, 474.0, 176.0, 42.0, 12.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43253469467163086, -0.4124159812927246, -0.39229729771614075, -0.3721785843372345, -0.35205990076065063, -0.3319411873817444, -0.31182247400283813, -0.2917037606239319, -0.271585077047348, -0.2514663636684418, -0.2313476800918579, -0.21122896671295166, -0.1911102682352066, -0.17099156975746155, -0.1508728563785553, -0.13075415790081024, -0.11063545942306519, -0.09051676094532013, -0.07039805501699448, -0.05027935281395912, -0.030160650610923767, -0.010041952133178711, 0.010076753795146942, 0.030195459723472595, 0.05031415820121765, 0.07043285667896271, 0.09055156260728836, 0.11067026853561401, 0.13078896701335907, 0.15090766549110413, 0.17102637887001038, 0.19114507734775543, 0.2112637758255005, 0.23138247430324554, 0.2515011727809906, 0.27161988615989685, 0.2917385697364807, 0.31185728311538696, 0.3319759964942932, 0.35209470987319946, 0.3722133934497833, 0.3923321068286896, 0.41245079040527344, 0.4325695037841797, 0.45268821716308594, 0.4728069007396698, 0.49292561411857605, 0.5130442976951599, 0.5331630110740662, 0.5532817244529724, 0.5734004378318787, 0.5935190916061401, 0.6136378049850464, 0.6337565183639526, 0.6538752317428589, 0.6739939451217651, 0.6941126585006714, 0.7142313718795776, 0.7343500852584839, 0.7544687390327454, 0.7745874524116516, 0.7947061657905579, 0.8148248791694641, 0.8349435925483704, 0.8550622463226318]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 9.0, 18.0, 10.0, 16.0, 24.0, 27.0, 29.0, 39.0, 69.0, 63.0, 84.0, 93.0, 96.0, 77.0, 81.0, 68.0, 49.0, 42.0, 30.0, 14.0, 16.0, 7.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20982682704925537, -0.20254981517791748, -0.1952728033065796, -0.1879957914352417, -0.1807187795639038, -0.17344176769256592, -0.16616475582122803, -0.15888774394989014, -0.15161073207855225, -0.14433372020721436, -0.13705670833587646, -0.12977969646453857, -0.12250268459320068, -0.11522567272186279, -0.1079486608505249, -0.10067164897918701, -0.09339463710784912, -0.08611762523651123, -0.07884061336517334, -0.07156360149383545, -0.06428658962249756, -0.05700957775115967, -0.04973256587982178, -0.04245555400848389, -0.035178542137145996, -0.027901530265808105, -0.020624518394470215, -0.013347506523132324, -0.006070494651794434, 0.001206517219543457, 0.008483529090881348, 0.01576054096221924, 0.02303755283355713, 0.03031456470489502, 0.03759157657623291, 0.0448685884475708, 0.05214560031890869, 0.05942261219024658, 0.06669962406158447, 0.07397663593292236, 0.08125364780426025, 0.08853065967559814, 0.09580767154693604, 0.10308468341827393, 0.11036169528961182, 0.11763870716094971, 0.1249157190322876, 0.1321927309036255, 0.13946974277496338, 0.14674675464630127, 0.15402376651763916, 0.16130077838897705, 0.16857779026031494, 0.17585480213165283, 0.18313181400299072, 0.1904088258743286, 0.1976858377456665, 0.2049628496170044, 0.21223986148834229, 0.21951687335968018, 0.22679388523101807, 0.23407089710235596, 0.24134790897369385, 0.24862492084503174, 0.25590193271636963]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 8.0, 4.0, 10.0, 4.0, 8.0, 6.0, 4.0, 12.0, 8.0, 8.0, 6.0, 18.0, 16.0, 26.0, 22.0, 86.0, 2524.0, 4191077.0, 193.0, 30.0, 18.0, 32.0, 20.0, 12.0, 20.0, 12.0, 16.0, 16.0, 0.0, 6.0, 8.0, 4.0, 6.0, 4.0, 6.0, 0.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0], "bins": [-3.44140625, -3.343597412109375, -3.24578857421875, -3.147979736328125, -3.0501708984375, -2.952362060546875, -2.85455322265625, -2.756744384765625, -2.658935546875, -2.561126708984375, -2.46331787109375, -2.365509033203125, -2.2677001953125, -2.169891357421875, -2.07208251953125, -1.974273681640625, -1.87646484375, -1.778656005859375, -1.68084716796875, -1.583038330078125, -1.4852294921875, -1.387420654296875, -1.28961181640625, -1.191802978515625, -1.093994140625, -0.996185302734375, -0.89837646484375, -0.800567626953125, -0.7027587890625, -0.604949951171875, -0.50714111328125, -0.409332275390625, -0.3115234375, -0.213714599609375, -0.11590576171875, -0.018096923828125, 0.0797119140625, 0.177520751953125, 0.27532958984375, 0.373138427734375, 0.470947265625, 0.568756103515625, 0.66656494140625, 0.764373779296875, 0.8621826171875, 0.959991455078125, 1.05780029296875, 1.155609130859375, 1.25341796875, 1.351226806640625, 1.44903564453125, 1.546844482421875, 1.6446533203125, 1.742462158203125, 1.84027099609375, 1.938079833984375, 2.035888671875, 2.133697509765625, 2.23150634765625, 2.329315185546875, 2.4271240234375, 2.524932861328125, 2.62274169921875, 2.720550537109375, 2.818359375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 5.0, 6.0, 9.0, 2.0, 10.0, 12.0, 14.0, 34.0, 38.0, 36.0, 68.0, 95.0, 118.0, 110.0, 110.0, 89.0, 62.0, 46.0, 44.0, 18.0, 13.0, 9.0, 11.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031795501708984375, -0.003062635660171509, -0.00294572114944458, -0.0028288066387176514, -0.0027118921279907227, -0.002594977617263794, -0.0024780631065368652, -0.0023611485958099365, -0.002244234085083008, -0.002127319574356079, -0.0020104050636291504, -0.0018934905529022217, -0.001776576042175293, -0.0016596615314483643, -0.0015427470207214355, -0.0014258325099945068, -0.0013089179992675781, -0.0011920034885406494, -0.0010750889778137207, -0.000958174467086792, -0.0008412599563598633, -0.0007243454456329346, -0.0006074309349060059, -0.0004905164241790771, -0.00037360191345214844, -0.0002566874027252197, -0.00013977289199829102, -2.2858381271362305e-05, 9.40561294555664e-05, 0.00021097064018249512, 0.00032788515090942383, 0.00044479966163635254, 0.0005617141723632812, 0.00067862868309021, 0.0007955431938171387, 0.0009124577045440674, 0.001029372215270996, 0.0011462867259979248, 0.0012632012367248535, 0.0013801157474517822, 0.001497030258178711, 0.0016139447689056396, 0.0017308592796325684, 0.001847773790359497, 0.0019646883010864258, 0.0020816028118133545, 0.002198517322540283, 0.002315431833267212, 0.0024323463439941406, 0.0025492608547210693, 0.002666175365447998, 0.0027830898761749268, 0.0029000043869018555, 0.003016918897628784, 0.003133833408355713, 0.0032507479190826416, 0.0033676624298095703, 0.003484576940536499, 0.0036014914512634277, 0.0037184059619903564, 0.003835320472717285, 0.003952234983444214, 0.004069149494171143, 0.004186064004898071, 0.004302978515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 11.0, 30.0, 51.0, 185.0, 2760.0, 4190839.0, 265.0, 82.0, 28.0, 14.0, 10.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.87353515625, -0.8017501831054688, -0.7299652099609375, -0.6581802368164062, -0.586395263671875, -0.5146102905273438, -0.4428253173828125, -0.37104034423828125, -0.29925537109375, -0.22747039794921875, -0.1556854248046875, -0.08390045166015625, -0.012115478515625, 0.05966949462890625, 0.1314544677734375, 0.20323944091796875, 0.2750244140625, 0.34680938720703125, 0.4185943603515625, 0.49037933349609375, 0.562164306640625, 0.6339492797851562, 0.7057342529296875, 0.7775192260742188, 0.84930419921875, 0.9210891723632812, 0.9928741455078125, 1.0646591186523438, 1.136444091796875, 1.2082290649414062, 1.2800140380859375, 1.3517990112304688, 1.423583984375, 1.4953689575195312, 1.5671539306640625, 1.6389389038085938, 1.710723876953125, 1.7825088500976562, 1.8542938232421875, 1.9260787963867188, 1.99786376953125, 2.0696487426757812, 2.1414337158203125, 2.2132186889648438, 2.285003662109375, 2.3567886352539062, 2.4285736083984375, 2.5003585815429688, 2.5721435546875, 2.6439285278320312, 2.7157135009765625, 2.7874984741210938, 2.859283447265625, 2.9310684204101562, 3.0028533935546875, 3.0746383666992188, 3.14642333984375, 3.2182083129882812, 3.2899932861328125, 3.3617782592773438, 3.433563232421875, 3.5053482055664062, 3.5771331787109375, 3.6489181518554688, 3.720703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0, 5.0, 10.0, 7.0, 11.0, 10.0, 20.0, 34.0, 43.0, 55.0, 82.0, 121.0, 212.0, 335.0, 1063.0, 1059.0, 346.0, 182.0, 132.0, 79.0, 76.0, 49.0, 35.0, 28.0, 20.0, 15.0, 8.0, 4.0, 13.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.007320404052734375, -0.007015407085418701, -0.006710410118103027, -0.0064054131507873535, -0.00610041618347168, -0.005795419216156006, -0.005490422248840332, -0.005185425281524658, -0.004880428314208984, -0.0045754313468933105, -0.004270434379577637, -0.003965437412261963, -0.003660440444946289, -0.0033554434776306152, -0.0030504465103149414, -0.0027454495429992676, -0.0024404525756835938, -0.00213545560836792, -0.001830458641052246, -0.0015254616737365723, -0.0012204647064208984, -0.0009154677391052246, -0.0006104707717895508, -0.00030547380447387695, -4.76837158203125e-07, 0.0003045201301574707, 0.0006095170974731445, 0.0009145140647888184, 0.0012195110321044922, 0.001524507999420166, 0.0018295049667358398, 0.0021345019340515137, 0.0024394989013671875, 0.0027444958686828613, 0.003049492835998535, 0.003354489803314209, 0.003659486770629883, 0.003964483737945557, 0.0042694807052612305, 0.004574477672576904, 0.004879474639892578, 0.005184471607208252, 0.005489468574523926, 0.0057944655418396, 0.0060994625091552734, 0.006404459476470947, 0.006709456443786621, 0.007014453411102295, 0.007319450378417969, 0.007624447345733643, 0.007929444313049316, 0.00823444128036499, 0.008539438247680664, 0.008844435214996338, 0.009149432182312012, 0.009454429149627686, 0.00975942611694336, 0.010064423084259033, 0.010369420051574707, 0.01067441701889038, 0.010979413986206055, 0.011284410953521729, 0.011589407920837402, 0.011894404888153076, 0.01219940185546875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 1014.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5046516060829163, -0.3558255434036255, -0.20699948072433472, -0.058173418045043945, 0.09065264463424683, 0.2394787073135376, 0.38830476999282837, 0.5371307730674744, 0.6859568953514099, 0.8347829580307007, 0.9836090207099915, 1.1324350833892822, 1.2812612056732178, 1.4300872087478638, 1.5789132118225098, 1.7277393341064453, 1.8765654563903809, 2.0253915786743164, 2.174217700958252, 2.3230435848236084, 2.471869707107544, 2.6206958293914795, 2.769521713256836, 2.9183478355407715, 3.067173957824707, 3.2160000801086426, 3.364826202392578, 3.5136520862579346, 3.66247820854187, 3.8113043308258057, 3.960130214691162, 4.108956336975098, 4.257781982421875, 4.4066081047058105, 4.555434226989746, 4.704260349273682, 4.853086471557617, 5.0019121170043945, 5.15073823928833, 5.299564361572266, 5.448390483856201, 5.597216606140137, 5.746042728424072, 5.894868850708008, 6.043694496154785, 6.192520618438721, 6.341346740722656, 6.490172863006592, 6.638998985290527, 6.787825107574463, 6.936651229858398, 7.085477352142334, 7.2343034744262695, 7.383129119873047, 7.531955242156982, 7.680781364440918, 7.8296074867248535, 7.978433609008789, 8.127259254455566, 8.27608585357666, 8.424911499023438, 8.573738098144531, 8.722563743591309, 8.871389389038086, 9.02021598815918]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 9.0, 16.0, 38.0, 69.0, 116.0, 169.0, 192.0, 174.0, 105.0, 66.0, 34.0, 14.0, 5.0, 6.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08072179555892944, -0.0755595788359642, -0.07039736211299896, -0.06523513793945312, -0.060072921216487885, -0.054910704493522644, -0.049748484045267105, -0.044586263597011566, -0.039424046874046326, -0.034261830151081085, -0.029099609702825546, -0.023937391117215157, -0.018775172531604767, -0.013612953945994377, -0.008450735360383987, -0.0032885149121284485, 0.001873701810836792, 0.007035920396447182, 0.012198138982057571, 0.01736035756766796, 0.02252257615327835, 0.02768479473888874, 0.03284701332449913, 0.03800923377275467, 0.04317145049571991, 0.04833366721868515, 0.05349588766694069, 0.05865810811519623, 0.06382032483816147, 0.06898254156112671, 0.07414476573467255, 0.07930698245763779, 0.08446919918060303, 0.08963141590356827, 0.09479363262653351, 0.09995585680007935, 0.10511807352304459, 0.11028029024600983, 0.11544251441955566, 0.1206047311425209, 0.12576694786548615, 0.13092917203903198, 0.13609138131141663, 0.14125360548496246, 0.1464158296585083, 0.15157803893089294, 0.15674026310443878, 0.16190248727798462, 0.16706469655036926, 0.1722269207239151, 0.17738912999629974, 0.18255135416984558, 0.18771356344223022, 0.19287578761577606, 0.1980380117893219, 0.20320022106170654, 0.20836244523525238, 0.21352466940879822, 0.21868687868118286, 0.2238491028547287, 0.22901132702827454, 0.23417353630065918, 0.23933576047420502, 0.24449798464775085, 0.2496601939201355]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 10.0, 14.0, 8.0, 17.0, 17.0, 19.0, 22.0, 29.0, 38.0, 37.0, 59.0, 44.0, 60.0, 182.0, 958337.0, 89129.0, 126.0, 56.0, 53.0, 63.0, 29.0, 36.0, 29.0, 18.0, 15.0, 19.0, 9.0, 12.0, 8.0, 9.0, 5.0, 7.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.6328125, -0.610137939453125, -0.58746337890625, -0.564788818359375, -0.5421142578125, -0.519439697265625, -0.49676513671875, -0.474090576171875, -0.451416015625, -0.428741455078125, -0.40606689453125, -0.383392333984375, -0.3607177734375, -0.338043212890625, -0.31536865234375, -0.292694091796875, -0.27001953125, -0.247344970703125, -0.22467041015625, -0.201995849609375, -0.1793212890625, -0.156646728515625, -0.13397216796875, -0.111297607421875, -0.088623046875, -0.065948486328125, -0.04327392578125, -0.020599365234375, 0.0020751953125, 0.024749755859375, 0.04742431640625, 0.070098876953125, 0.0927734375, 0.115447998046875, 0.13812255859375, 0.160797119140625, 0.1834716796875, 0.206146240234375, 0.22882080078125, 0.251495361328125, 0.274169921875, 0.296844482421875, 0.31951904296875, 0.342193603515625, 0.3648681640625, 0.387542724609375, 0.41021728515625, 0.432891845703125, 0.45556640625, 0.478240966796875, 0.50091552734375, 0.523590087890625, 0.5462646484375, 0.568939208984375, 0.59161376953125, 0.614288330078125, 0.636962890625, 0.659637451171875, 0.68231201171875, 0.704986572265625, 0.7276611328125, 0.750335693359375, 0.77301025390625, 0.795684814453125, 0.818359375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 15.0, 51.0, 154.0, 267.0, 264.0, 171.0, 71.0, 15.0, 10.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0204620361328125, -0.019614458084106445, -0.01876688003540039, -0.017919301986694336, -0.01707172393798828, -0.016224145889282227, -0.015376567840576172, -0.014528989791870117, -0.013681411743164062, -0.012833833694458008, -0.011986255645751953, -0.011138677597045898, -0.010291099548339844, -0.009443521499633789, -0.008595943450927734, -0.00774836540222168, -0.006900787353515625, -0.00605320930480957, -0.005205631256103516, -0.004358053207397461, -0.0035104751586914062, -0.0026628971099853516, -0.0018153190612792969, -0.0009677410125732422, -0.0001201629638671875, 0.0007274150848388672, 0.0015749931335449219, 0.0024225711822509766, 0.0032701492309570312, 0.004117727279663086, 0.004965305328369141, 0.005812883377075195, 0.00666046142578125, 0.007508039474487305, 0.00835561752319336, 0.009203195571899414, 0.010050773620605469, 0.010898351669311523, 0.011745929718017578, 0.012593507766723633, 0.013441085815429688, 0.014288663864135742, 0.015136241912841797, 0.01598381996154785, 0.016831398010253906, 0.01767897605895996, 0.018526554107666016, 0.01937413215637207, 0.020221710205078125, 0.02106928825378418, 0.021916866302490234, 0.02276444435119629, 0.023612022399902344, 0.0244596004486084, 0.025307178497314453, 0.026154756546020508, 0.027002334594726562, 0.027849912643432617, 0.028697490692138672, 0.029545068740844727, 0.03039264678955078, 0.031240224838256836, 0.03208780288696289, 0.032935380935668945, 0.033782958984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 10.0, 13.0, 7.0, 9.0, 16.0, 26.0, 22.0, 34.0, 55.0, 80.0, 140.0, 182.0, 320.0, 704.0, 1813.0, 7097.0, 63665.0, 840180.0, 119461.0, 10590.0, 2301.0, 761.0, 377.0, 237.0, 139.0, 75.0, 56.0, 52.0, 47.0, 24.0, 9.0, 10.0, 6.0, 7.0, 7.0, 5.0, 3.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2342529296875, -0.22659873962402344, -0.21894454956054688, -0.2112903594970703, -0.20363616943359375, -0.1959819793701172, -0.18832778930664062, -0.18067359924316406, -0.1730194091796875, -0.16536521911621094, -0.15771102905273438, -0.1500568389892578, -0.14240264892578125, -0.1347484588623047, -0.12709426879882812, -0.11944007873535156, -0.111785888671875, -0.10413169860839844, -0.09647750854492188, -0.08882331848144531, -0.08116912841796875, -0.07351493835449219, -0.06586074829101562, -0.05820655822753906, -0.0505523681640625, -0.04289817810058594, -0.035243988037109375, -0.027589797973632812, -0.01993560791015625, -0.012281417846679688, -0.004627227783203125, 0.0030269622802734375, 0.01068115234375, 0.018335342407226562, 0.025989532470703125, 0.03364372253417969, 0.04129791259765625, 0.04895210266113281, 0.056606292724609375, 0.06426048278808594, 0.0719146728515625, 0.07956886291503906, 0.08722305297851562, 0.09487724304199219, 0.10253143310546875, 0.11018562316894531, 0.11783981323242188, 0.12549400329589844, 0.133148193359375, 0.14080238342285156, 0.14845657348632812, 0.1561107635498047, 0.16376495361328125, 0.1714191436767578, 0.17907333374023438, 0.18672752380371094, 0.1943817138671875, 0.20203590393066406, 0.20969009399414062, 0.2173442840576172, 0.22499847412109375, 0.2326526641845703, 0.24030685424804688, 0.24796104431152344, 0.255615234375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 11.0, 10.0, 17.0, 19.0, 22.0, 39.0, 44.0, 42.0, 42.0, 49.0, 63.0, 65.0, 59.0, 64.0, 76.0, 58.0, 56.0, 45.0, 27.0, 25.0, 30.0, 24.0, 28.0, 10.0, 19.0, 12.0, 7.0, 3.0, 9.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.060516357421875, -0.058802127838134766, -0.05708789825439453, -0.0553736686706543, -0.05365943908691406, -0.05194520950317383, -0.050230979919433594, -0.04851675033569336, -0.046802520751953125, -0.04508829116821289, -0.043374061584472656, -0.04165983200073242, -0.03994560241699219, -0.03823137283325195, -0.03651714324951172, -0.034802913665771484, -0.03308868408203125, -0.031374454498291016, -0.02966022491455078, -0.027945995330810547, -0.026231765747070312, -0.024517536163330078, -0.022803306579589844, -0.02108907699584961, -0.019374847412109375, -0.01766061782836914, -0.015946388244628906, -0.014232158660888672, -0.012517929077148438, -0.010803699493408203, -0.009089469909667969, -0.007375240325927734, -0.0056610107421875, -0.003946781158447266, -0.0022325515747070312, -0.0005183219909667969, 0.0011959075927734375, 0.002910137176513672, 0.004624366760253906, 0.006338596343994141, 0.008052825927734375, 0.00976705551147461, 0.011481285095214844, 0.013195514678955078, 0.014909744262695312, 0.016623973846435547, 0.01833820343017578, 0.020052433013916016, 0.02176666259765625, 0.023480892181396484, 0.02519512176513672, 0.026909351348876953, 0.028623580932617188, 0.030337810516357422, 0.032052040100097656, 0.03376626968383789, 0.035480499267578125, 0.03719472885131836, 0.038908958435058594, 0.04062318801879883, 0.04233741760253906, 0.0440516471862793, 0.04576587677001953, 0.047480106353759766, 0.0491943359375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 7.0, 3.0, 9.0, 7.0, 8.0, 7.0, 11.0, 19.0, 27.0, 34.0, 62.0, 172.0, 648.0, 3626.0, 134186.0, 901492.0, 6802.0, 922.0, 255.0, 92.0, 29.0, 30.0, 21.0, 22.0, 9.0, 9.0, 7.0, 6.0, 9.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52294921875, -0.5066757202148438, -0.4904022216796875, -0.47412872314453125, -0.457855224609375, -0.44158172607421875, -0.4253082275390625, -0.40903472900390625, -0.39276123046875, -0.37648773193359375, -0.3602142333984375, -0.34394073486328125, -0.327667236328125, -0.31139373779296875, -0.2951202392578125, -0.27884674072265625, -0.2625732421875, -0.24629974365234375, -0.2300262451171875, -0.21375274658203125, -0.197479248046875, -0.18120574951171875, -0.1649322509765625, -0.14865875244140625, -0.13238525390625, -0.11611175537109375, -0.0998382568359375, -0.08356475830078125, -0.067291259765625, -0.05101776123046875, -0.0347442626953125, -0.01847076416015625, -0.002197265625, 0.01407623291015625, 0.0303497314453125, 0.04662322998046875, 0.062896728515625, 0.07917022705078125, 0.0954437255859375, 0.11171722412109375, 0.12799072265625, 0.14426422119140625, 0.1605377197265625, 0.17681121826171875, 0.193084716796875, 0.20935821533203125, 0.2256317138671875, 0.24190521240234375, 0.2581787109375, 0.27445220947265625, 0.2907257080078125, 0.30699920654296875, 0.323272705078125, 0.33954620361328125, 0.3558197021484375, 0.37209320068359375, 0.38836669921875, 0.40464019775390625, 0.4209136962890625, 0.43718719482421875, 0.453460693359375, 0.46973419189453125, 0.4860076904296875, 0.5022811889648438, 0.5185546875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 1.0, 3.0, 5.0, 8.0, 5.0, 4.0, 6.0, 17.0, 22.0, 42.0, 50.0, 122.0, 213.0, 199.0, 100.0, 59.0, 40.0, 37.0, 19.0, 13.0, 12.0, 6.0, 12.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5643577575683594e-05, -3.4594908356666565e-05, -3.3546239137649536e-05, -3.249756991863251e-05, -3.144890069961548e-05, -3.040023148059845e-05, -2.935156226158142e-05, -2.8302893042564392e-05, -2.7254223823547363e-05, -2.6205554604530334e-05, -2.5156885385513306e-05, -2.4108216166496277e-05, -2.3059546947479248e-05, -2.201087772846222e-05, -2.096220850944519e-05, -1.991353929042816e-05, -1.8864870071411133e-05, -1.7816200852394104e-05, -1.6767531633377075e-05, -1.5718862414360046e-05, -1.4670193195343018e-05, -1.3621523976325989e-05, -1.257285475730896e-05, -1.1524185538291931e-05, -1.0475516319274902e-05, -9.426847100257874e-06, -8.378177881240845e-06, -7.329508662223816e-06, -6.280839443206787e-06, -5.232170224189758e-06, -4.1835010051727295e-06, -3.1348317861557007e-06, -2.086162567138672e-06, -1.037493348121643e-06, 1.1175870895385742e-08, 1.0598450899124146e-06, 2.1085143089294434e-06, 3.157183527946472e-06, 4.205852746963501e-06, 5.25452196598053e-06, 6.303191184997559e-06, 7.351860404014587e-06, 8.400529623031616e-06, 9.449198842048645e-06, 1.0497868061065674e-05, 1.1546537280082703e-05, 1.2595206499099731e-05, 1.364387571811676e-05, 1.4692544937133789e-05, 1.5741214156150818e-05, 1.6789883375167847e-05, 1.7838552594184875e-05, 1.8887221813201904e-05, 1.9935891032218933e-05, 2.0984560251235962e-05, 2.203322947025299e-05, 2.308189868927002e-05, 2.413056790828705e-05, 2.5179237127304077e-05, 2.6227906346321106e-05, 2.7276575565338135e-05, 2.8325244784355164e-05, 2.9373914003372192e-05, 3.042258322238922e-05, 3.147125244140625e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 10.0, 23.0, 38.0, 84.0, 269.0, 1156.0, 12707.0, 945622.0, 84122.0, 3717.0, 523.0, 146.0, 51.0, 27.0, 12.0, 10.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5205078125, -0.504119873046875, -0.48773193359375, -0.471343994140625, -0.4549560546875, -0.438568115234375, -0.42218017578125, -0.405792236328125, -0.389404296875, -0.373016357421875, -0.35662841796875, -0.340240478515625, -0.3238525390625, -0.307464599609375, -0.29107666015625, -0.274688720703125, -0.25830078125, -0.241912841796875, -0.22552490234375, -0.209136962890625, -0.1927490234375, -0.176361083984375, -0.15997314453125, -0.143585205078125, -0.127197265625, -0.110809326171875, -0.09442138671875, -0.078033447265625, -0.0616455078125, -0.045257568359375, -0.02886962890625, -0.012481689453125, 0.00390625, 0.020294189453125, 0.03668212890625, 0.053070068359375, 0.0694580078125, 0.085845947265625, 0.10223388671875, 0.118621826171875, 0.135009765625, 0.151397705078125, 0.16778564453125, 0.184173583984375, 0.2005615234375, 0.216949462890625, 0.23333740234375, 0.249725341796875, 0.26611328125, 0.282501220703125, 0.29888916015625, 0.315277099609375, 0.3316650390625, 0.348052978515625, 0.36444091796875, 0.380828857421875, 0.397216796875, 0.413604736328125, 0.42999267578125, 0.446380615234375, 0.4627685546875, 0.479156494140625, 0.49554443359375, 0.511932373046875, 0.5283203125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 6.0, 3.0, 11.0, 10.0, 20.0, 37.0, 47.0, 102.0, 264.0, 230.0, 109.0, 47.0, 36.0, 25.0, 16.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.170654296875, -0.1651325225830078, -0.15961074829101562, -0.15408897399902344, -0.14856719970703125, -0.14304542541503906, -0.13752365112304688, -0.1320018768310547, -0.1264801025390625, -0.12095832824707031, -0.11543655395507812, -0.10991477966308594, -0.10439300537109375, -0.09887123107910156, -0.09334945678710938, -0.08782768249511719, -0.082305908203125, -0.07678413391113281, -0.07126235961914062, -0.06574058532714844, -0.06021881103515625, -0.05469703674316406, -0.049175262451171875, -0.04365348815917969, -0.0381317138671875, -0.03260993957519531, -0.027088165283203125, -0.021566390991210938, -0.01604461669921875, -0.010522842407226562, -0.005001068115234375, 0.0005207061767578125, 0.00604248046875, 0.011564254760742188, 0.017086029052734375, 0.022607803344726562, 0.02812957763671875, 0.03365135192871094, 0.039173126220703125, 0.04469490051269531, 0.0502166748046875, 0.05573844909667969, 0.061260223388671875, 0.06678199768066406, 0.07230377197265625, 0.07782554626464844, 0.08334732055664062, 0.08886909484863281, 0.094390869140625, 0.09991264343261719, 0.10543441772460938, 0.11095619201660156, 0.11647796630859375, 0.12199974060058594, 0.12752151489257812, 0.1330432891845703, 0.1385650634765625, 0.1440868377685547, 0.14960861206054688, 0.15513038635253906, 0.16065216064453125, 0.16617393493652344, 0.17169570922851562, 0.1772174835205078, 0.1827392578125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 960.0, 51.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2916741371154785, -1.698075532913208, -1.104476809501648, -0.5108780860900879, 0.08272051811218262, 0.6763191223144531, 1.2699179649353027, 1.8635163307189941, 2.4571151733398438, 3.0507137775421143, 3.6443123817443848, 4.237911224365234, 4.831509590148926, 5.425108432769775, 6.018707275390625, 6.612305641174316, 7.205904483795166, 7.799503326416016, 8.393101692199707, 8.986700057983398, 9.580299377441406, 10.173897743225098, 10.767496109008789, 11.361095428466797, 11.954693794250488, 12.54829216003418, 13.141891479492188, 13.735489845275879, 14.32908821105957, 14.922687530517578, 15.51628589630127, 16.10988426208496, 16.703481674194336, 17.297080993652344, 17.89067840576172, 18.484277725219727, 19.077877044677734, 19.67147445678711, 20.265073776245117, 20.858673095703125, 21.4522705078125, 22.045869827270508, 22.639467239379883, 23.23306655883789, 23.8266658782959, 24.420263290405273, 25.01386260986328, 25.607460021972656, 26.201061248779297, 26.794660568237305, 27.38825798034668, 27.981857299804688, 28.575456619262695, 29.16905403137207, 29.762653350830078, 30.356250762939453, 30.94985008239746, 31.54344940185547, 32.137046813964844, 32.73064422607422, 33.32424545288086, 33.917842864990234, 34.511444091796875, 35.10504150390625, 35.698638916015625]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 10.0, 17.0, 34.0, 67.0, 140.0, 158.0, 178.0, 175.0, 116.0, 64.0, 43.0, 9.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8802896738052368, -0.8288059234619141, -0.7773221135139465, -0.7258383631706238, -0.6743545532226562, -0.6228708028793335, -0.5713870525360107, -0.519903302192688, -0.46841949224472046, -0.4169357120990753, -0.3654519319534302, -0.3139681816101074, -0.2624844014644623, -0.21100062131881714, -0.15951687097549438, -0.10803309082984924, -0.0565493106842041, -0.005065537989139557, 0.04641823470592499, 0.09790199995040894, 0.14938578009605408, 0.20086956024169922, 0.252353310585022, 0.3038370907306671, 0.35532087087631226, 0.4068046510219574, 0.45828843116760254, 0.5097721815109253, 0.561255931854248, 0.6127397418022156, 0.6642234921455383, 0.7157073020935059, 0.7671909332275391, 0.8186746835708618, 0.8701584935188293, 0.9216422438621521, 0.9731260538101196, 1.0246098041534424, 1.0760935544967651, 1.127577304840088, 1.1790611743927002, 1.230544924736023, 1.2820286750793457, 1.333512544631958, 1.3849962949752808, 1.4364800453186035, 1.4879637956619263, 1.539447546005249, 1.5909312963485718, 1.6424150466918945, 1.6938987970352173, 1.74538254737854, 1.7968664169311523, 1.848350167274475, 1.8998339176177979, 1.9513176679611206, 2.0028014183044434, 2.0542852878570557, 2.105768918991089, 2.157252788543701, 2.2087364196777344, 2.2602202892303467, 2.311704158782959, 2.363187789916992, 2.4146716594696045]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 13.0, 7.0, 10.0, 13.0, 19.0, 21.0, 33.0, 30.0, 39.0, 48.0, 82.0, 258.0, 38990.0, 4153547.0, 836.0, 210.0, 74.0, 21.0, 13.0, 12.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6943359375, -1.6240692138671875, -1.553802490234375, -1.4835357666015625, -1.41326904296875, -1.3430023193359375, -1.272735595703125, -1.2024688720703125, -1.1322021484375, -1.0619354248046875, -0.991668701171875, -0.9214019775390625, -0.85113525390625, -0.7808685302734375, -0.710601806640625, -0.6403350830078125, -0.570068359375, -0.4998016357421875, -0.429534912109375, -0.3592681884765625, -0.28900146484375, -0.2187347412109375, -0.148468017578125, -0.0782012939453125, -0.0079345703125, 0.0623321533203125, 0.132598876953125, 0.2028656005859375, 0.27313232421875, 0.3433990478515625, 0.413665771484375, 0.4839324951171875, 0.55419921875, 0.6244659423828125, 0.694732666015625, 0.7649993896484375, 0.83526611328125, 0.9055328369140625, 0.975799560546875, 1.0460662841796875, 1.1163330078125, 1.1865997314453125, 1.256866455078125, 1.3271331787109375, 1.39739990234375, 1.4676666259765625, 1.537933349609375, 1.6082000732421875, 1.678466796875, 1.7487335205078125, 1.819000244140625, 1.8892669677734375, 1.95953369140625, 2.0298004150390625, 2.100067138671875, 2.1703338623046875, 2.2406005859375, 2.3108673095703125, 2.381134033203125, 2.4514007568359375, 2.52166748046875, 2.5919342041015625, 2.662200927734375, 2.7324676513671875, 2.802734375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 24.0, 42.0, 141.0, 214.0, 263.0, 182.0, 99.0, 31.0, 9.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0265350341796875, -0.025227785110473633, -0.023920536041259766, -0.0226132869720459, -0.02130603790283203, -0.019998788833618164, -0.018691539764404297, -0.01738429069519043, -0.016077041625976562, -0.014769792556762695, -0.013462543487548828, -0.012155294418334961, -0.010848045349121094, -0.009540796279907227, -0.00823354721069336, -0.006926298141479492, -0.005619049072265625, -0.004311800003051758, -0.0030045509338378906, -0.0016973018646240234, -0.00039005279541015625, 0.0009171962738037109, 0.002224445343017578, 0.0035316944122314453, 0.0048389434814453125, 0.00614619255065918, 0.007453441619873047, 0.008760690689086914, 0.010067939758300781, 0.011375188827514648, 0.012682437896728516, 0.013989686965942383, 0.01529693603515625, 0.016604185104370117, 0.017911434173583984, 0.01921868324279785, 0.02052593231201172, 0.021833181381225586, 0.023140430450439453, 0.02444767951965332, 0.025754928588867188, 0.027062177658081055, 0.028369426727294922, 0.02967667579650879, 0.030983924865722656, 0.03229117393493652, 0.03359842300415039, 0.03490567207336426, 0.036212921142578125, 0.03752017021179199, 0.03882741928100586, 0.04013466835021973, 0.041441917419433594, 0.04274916648864746, 0.04405641555786133, 0.045363664627075195, 0.04667091369628906, 0.04797816276550293, 0.0492854118347168, 0.050592660903930664, 0.05189990997314453, 0.0532071590423584, 0.054514408111572266, 0.05582165718078613, 0.05712890625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 9.0, 40.0, 35.0, 51.0, 72.0, 73.0, 121.0, 174.0, 226.0, 2806.0, 4188492.0, 1382.0, 184.0, 175.0, 112.0, 89.0, 82.0, 53.0, 36.0, 33.0, 15.0, 9.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.1328125, -3.96368408203125, -3.7945556640625, -3.62542724609375, -3.456298828125, -3.28717041015625, -3.1180419921875, -2.94891357421875, -2.77978515625, -2.61065673828125, -2.4415283203125, -2.27239990234375, -2.103271484375, -1.93414306640625, -1.7650146484375, -1.59588623046875, -1.4267578125, -1.25762939453125, -1.0885009765625, -0.91937255859375, -0.750244140625, -0.58111572265625, -0.4119873046875, -0.24285888671875, -0.07373046875, 0.09539794921875, 0.2645263671875, 0.43365478515625, 0.602783203125, 0.77191162109375, 0.9410400390625, 1.11016845703125, 1.279296875, 1.44842529296875, 1.6175537109375, 1.78668212890625, 1.955810546875, 2.12493896484375, 2.2940673828125, 2.46319580078125, 2.63232421875, 2.80145263671875, 2.9705810546875, 3.13970947265625, 3.308837890625, 3.47796630859375, 3.6470947265625, 3.81622314453125, 3.9853515625, 4.15447998046875, 4.3236083984375, 4.49273681640625, 4.661865234375, 4.83099365234375, 5.0001220703125, 5.16925048828125, 5.33837890625, 5.50750732421875, 5.6766357421875, 5.84576416015625, 6.014892578125, 6.18402099609375, 6.3531494140625, 6.52227783203125, 6.69140625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 13.0, 25.0, 73.0, 172.0, 1171.0, 2341.0, 173.0, 60.0, 19.0, 10.0, 11.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13671875, -0.13184547424316406, -0.12697219848632812, -0.12209892272949219, -0.11722564697265625, -0.11235237121582031, -0.10747909545898438, -0.10260581970214844, -0.0977325439453125, -0.09285926818847656, -0.08798599243164062, -0.08311271667480469, -0.07823944091796875, -0.07336616516113281, -0.06849288940429688, -0.06361961364746094, -0.058746337890625, -0.05387306213378906, -0.048999786376953125, -0.04412651062011719, -0.03925323486328125, -0.03437995910644531, -0.029506683349609375, -0.024633407592773438, -0.0197601318359375, -0.014886856079101562, -0.010013580322265625, -0.0051403045654296875, -0.00026702880859375, 0.0046062469482421875, 0.009479522705078125, 0.014352798461914062, 0.01922607421875, 0.024099349975585938, 0.028972625732421875, 0.03384590148925781, 0.03871917724609375, 0.04359245300292969, 0.048465728759765625, 0.05333900451660156, 0.0582122802734375, 0.06308555603027344, 0.06795883178710938, 0.07283210754394531, 0.07770538330078125, 0.08257865905761719, 0.08745193481445312, 0.09232521057128906, 0.097198486328125, 0.10207176208496094, 0.10694503784179688, 0.11181831359863281, 0.11669158935546875, 0.12156486511230469, 0.12643814086914062, 0.13131141662597656, 0.1361846923828125, 0.14105796813964844, 0.14593124389648438, 0.1508045196533203, 0.15567779541015625, 0.1605510711669922, 0.16542434692382812, 0.17029762268066406, 0.1751708984375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 34.0, 257.0, 635.0, 57.0, 14.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6357803344726562, -2.3764028549194336, -2.11702561378479, -1.857648253440857, -1.5982708930969238, -1.3388935327529907, -1.0795161724090576, -0.8201388120651245, -0.5607614517211914, -0.3013840913772583, -0.042006731033325195, 0.2173706293106079, 0.476747989654541, 0.7361253499984741, 0.9955027103424072, 1.2548800706863403, 1.5142574310302734, 1.7736347913742065, 2.0330121517181396, 2.292389392852783, 2.551766872406006, 2.8111443519592285, 3.070521593093872, 3.3298988342285156, 3.5892763137817383, 3.848653793334961, 4.108031272888184, 4.367408275604248, 4.626785755157471, 4.886163234710693, 5.145540237426758, 5.4049177169799805, 5.6642961502075195, 5.923673629760742, 6.183051109313965, 6.442428112030029, 6.701805591583252, 6.961183071136475, 7.220560073852539, 7.479937553405762, 7.739315032958984, 7.998692512512207, 8.25806999206543, 8.517447471618652, 8.776824951171875, 9.036201477050781, 9.295578956604004, 9.554956436157227, 9.81433391571045, 10.073711395263672, 10.333088874816895, 10.592466354370117, 10.851842880249023, 11.111220359802246, 11.370597839355469, 11.629975318908691, 11.889352798461914, 12.148730278015137, 12.40810775756836, 12.667485237121582, 12.926862716674805, 13.186239242553711, 13.445616722106934, 13.704994201660156, 13.964371681213379]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 5.0, 9.0, 23.0, 23.0, 51.0, 95.0, 120.0, 139.0, 132.0, 112.0, 93.0, 81.0, 53.0, 27.0, 11.0, 8.0, 6.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7741677761077881, -0.7501190304756165, -0.7260702848434448, -0.7020215392112732, -0.6779727935791016, -0.6539240479469299, -0.6298753023147583, -0.6058265566825867, -0.581777811050415, -0.5577290654182434, -0.5336803197860718, -0.5096315741539001, -0.4855828285217285, -0.4615340828895569, -0.43748533725738525, -0.4134365916252136, -0.389387845993042, -0.36533910036087036, -0.34129035472869873, -0.3172416090965271, -0.29319286346435547, -0.26914411783218384, -0.2450953722000122, -0.22104662656784058, -0.19699788093566895, -0.17294913530349731, -0.14890038967132568, -0.12485164403915405, -0.10080289840698242, -0.07675415277481079, -0.05270540714263916, -0.02865666151046753, -0.0046079158782958984, 0.019440829753875732, 0.04348957538604736, 0.067538321018219, 0.09158706665039062, 0.11563581228256226, 0.1396845579147339, 0.16373330354690552, 0.18778204917907715, 0.21183079481124878, 0.2358795404434204, 0.25992828607559204, 0.28397703170776367, 0.3080257773399353, 0.33207452297210693, 0.35612326860427856, 0.3801720142364502, 0.4042207598686218, 0.42826950550079346, 0.4523182511329651, 0.4763669967651367, 0.5004157423973083, 0.52446448802948, 0.5485132336616516, 0.5725619792938232, 0.5966107249259949, 0.6206594705581665, 0.6447082161903381, 0.6687569618225098, 0.6928057074546814, 0.716854453086853, 0.7409031987190247, 0.7649519443511963]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 7.0, 5.0, 8.0, 14.0, 10.0, 23.0, 36.0, 50.0, 88.0, 125.0, 215.0, 395.0, 846.0, 2584.0, 13266.0, 203358.0, 789076.0, 31498.0, 4486.0, 1256.0, 499.0, 281.0, 146.0, 94.0, 53.0, 51.0, 15.0, 17.0, 10.0, 8.0, 4.0, 7.0, 8.0, 3.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84765625, -0.8164825439453125, -0.785308837890625, -0.7541351318359375, -0.72296142578125, -0.6917877197265625, -0.660614013671875, -0.6294403076171875, -0.5982666015625, -0.5670928955078125, -0.535919189453125, -0.5047454833984375, -0.47357177734375, -0.4423980712890625, -0.411224365234375, -0.3800506591796875, -0.348876953125, -0.3177032470703125, -0.286529541015625, -0.2553558349609375, -0.22418212890625, -0.1930084228515625, -0.161834716796875, -0.1306610107421875, -0.0994873046875, -0.0683135986328125, -0.037139892578125, -0.0059661865234375, 0.02520751953125, 0.0563812255859375, 0.087554931640625, 0.1187286376953125, 0.14990234375, 0.1810760498046875, 0.212249755859375, 0.2434234619140625, 0.27459716796875, 0.3057708740234375, 0.336944580078125, 0.3681182861328125, 0.3992919921875, 0.4304656982421875, 0.461639404296875, 0.4928131103515625, 0.52398681640625, 0.5551605224609375, 0.586334228515625, 0.6175079345703125, 0.648681640625, 0.6798553466796875, 0.711029052734375, 0.7422027587890625, 0.77337646484375, 0.8045501708984375, 0.835723876953125, 0.8668975830078125, 0.8980712890625, 0.9292449951171875, 0.960418701171875, 0.9915924072265625, 1.02276611328125, 1.0539398193359375, 1.085113525390625, 1.1162872314453125, 1.1474609375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 13.0, 30.0, 60.0, 118.0, 137.0, 204.0, 164.0, 123.0, 87.0, 38.0, 15.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045013427734375, -0.043263912200927734, -0.04151439666748047, -0.0397648811340332, -0.03801536560058594, -0.03626585006713867, -0.034516334533691406, -0.03276681900024414, -0.031017303466796875, -0.02926778793334961, -0.027518272399902344, -0.025768756866455078, -0.024019241333007812, -0.022269725799560547, -0.02052021026611328, -0.018770694732666016, -0.01702117919921875, -0.015271663665771484, -0.013522148132324219, -0.011772632598876953, -0.010023117065429688, -0.008273601531982422, -0.006524085998535156, -0.004774570465087891, -0.003025054931640625, -0.0012755393981933594, 0.00047397613525390625, 0.002223491668701172, 0.0039730072021484375, 0.005722522735595703, 0.007472038269042969, 0.009221553802490234, 0.0109710693359375, 0.012720584869384766, 0.014470100402832031, 0.016219615936279297, 0.017969131469726562, 0.019718647003173828, 0.021468162536621094, 0.02321767807006836, 0.024967193603515625, 0.02671670913696289, 0.028466224670410156, 0.030215740203857422, 0.03196525573730469, 0.03371477127075195, 0.03546428680419922, 0.037213802337646484, 0.03896331787109375, 0.040712833404541016, 0.04246234893798828, 0.04421186447143555, 0.04596138000488281, 0.04771089553833008, 0.049460411071777344, 0.05120992660522461, 0.052959442138671875, 0.05470895767211914, 0.056458473205566406, 0.05820798873901367, 0.05995750427246094, 0.0617070198059082, 0.06345653533935547, 0.06520605087280273, 0.06695556640625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 7.0, 4.0, 6.0, 4.0, 11.0, 14.0, 21.0, 46.0, 75.0, 84.0, 127.0, 206.0, 425.0, 790.0, 1892.0, 6354.0, 32250.0, 321924.0, 613742.0, 56300.0, 9443.0, 2667.0, 1013.0, 465.0, 236.0, 153.0, 106.0, 59.0, 43.0, 29.0, 18.0, 12.0, 10.0, 9.0, 4.0, 3.0, 0.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.432861328125, -0.4205436706542969, -0.40822601318359375, -0.3959083557128906, -0.3835906982421875, -0.3712730407714844, -0.35895538330078125, -0.3466377258300781, -0.334320068359375, -0.3220024108886719, -0.30968475341796875, -0.2973670959472656, -0.2850494384765625, -0.2727317810058594, -0.26041412353515625, -0.24809646606445312, -0.23577880859375, -0.22346115112304688, -0.21114349365234375, -0.19882583618164062, -0.1865081787109375, -0.17419052124023438, -0.16187286376953125, -0.14955520629882812, -0.137237548828125, -0.12491989135742188, -0.11260223388671875, -0.10028457641601562, -0.0879669189453125, -0.07564926147460938, -0.06333160400390625, -0.051013946533203125, -0.0386962890625, -0.026378631591796875, -0.01406097412109375, -0.001743316650390625, 0.0105743408203125, 0.022891998291015625, 0.03520965576171875, 0.047527313232421875, 0.059844970703125, 0.07216262817382812, 0.08448028564453125, 0.09679794311523438, 0.1091156005859375, 0.12143325805664062, 0.13375091552734375, 0.14606857299804688, 0.15838623046875, 0.17070388793945312, 0.18302154541015625, 0.19533920288085938, 0.2076568603515625, 0.21997451782226562, 0.23229217529296875, 0.24460983276367188, 0.256927490234375, 0.2692451477050781, 0.28156280517578125, 0.2938804626464844, 0.3061981201171875, 0.3185157775878906, 0.33083343505859375, 0.3431510925292969, 0.35546875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 3.0, 1.0, 2.0, 4.0, 11.0, 10.0, 13.0, 25.0, 21.0, 31.0, 30.0, 52.0, 56.0, 38.0, 50.0, 53.0, 57.0, 48.0, 46.0, 50.0, 57.0, 56.0, 39.0, 44.0, 41.0, 37.0, 25.0, 28.0, 22.0, 12.0, 8.0, 8.0, 6.0, 9.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1385498046875, -0.13428306579589844, -0.13001632690429688, -0.1257495880126953, -0.12148284912109375, -0.11721611022949219, -0.11294937133789062, -0.10868263244628906, -0.1044158935546875, -0.10014915466308594, -0.09588241577148438, -0.09161567687988281, -0.08734893798828125, -0.08308219909667969, -0.07881546020507812, -0.07454872131347656, -0.070281982421875, -0.06601524353027344, -0.061748504638671875, -0.05748176574707031, -0.05321502685546875, -0.04894828796386719, -0.044681549072265625, -0.04041481018066406, -0.0361480712890625, -0.03188133239746094, -0.027614593505859375, -0.023347854614257812, -0.01908111572265625, -0.014814376831054688, -0.010547637939453125, -0.0062808990478515625, -0.00201416015625, 0.0022525787353515625, 0.006519317626953125, 0.010786056518554688, 0.01505279541015625, 0.019319534301757812, 0.023586273193359375, 0.027853012084960938, 0.0321197509765625, 0.03638648986816406, 0.040653228759765625, 0.04491996765136719, 0.04918670654296875, 0.05345344543457031, 0.057720184326171875, 0.06198692321777344, 0.066253662109375, 0.07052040100097656, 0.07478713989257812, 0.07905387878417969, 0.08332061767578125, 0.08758735656738281, 0.09185409545898438, 0.09612083435058594, 0.1003875732421875, 0.10465431213378906, 0.10892105102539062, 0.11318778991699219, 0.11745452880859375, 0.12172126770019531, 0.12598800659179688, 0.13025474548339844, 0.134521484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 8.0, 4.0, 2.0, 10.0, 9.0, 11.0, 23.0, 28.0, 46.0, 60.0, 86.0, 108.0, 216.0, 414.0, 925.0, 2677.0, 9986.0, 65724.0, 853162.0, 97217.0, 12481.0, 3209.0, 1094.0, 447.0, 214.0, 115.0, 76.0, 56.0, 38.0, 26.0, 25.0, 13.0, 12.0, 7.0, 8.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.416259765625, -0.40348052978515625, -0.3907012939453125, -0.37792205810546875, -0.365142822265625, -0.35236358642578125, -0.3395843505859375, -0.32680511474609375, -0.31402587890625, -0.30124664306640625, -0.2884674072265625, -0.27568817138671875, -0.262908935546875, -0.25012969970703125, -0.2373504638671875, -0.22457122802734375, -0.2117919921875, -0.19901275634765625, -0.1862335205078125, -0.17345428466796875, -0.160675048828125, -0.14789581298828125, -0.1351165771484375, -0.12233734130859375, -0.10955810546875, -0.09677886962890625, -0.0839996337890625, -0.07122039794921875, -0.058441162109375, -0.04566192626953125, -0.0328826904296875, -0.02010345458984375, -0.00732421875, 0.00545501708984375, 0.0182342529296875, 0.03101348876953125, 0.043792724609375, 0.05657196044921875, 0.0693511962890625, 0.08213043212890625, 0.09490966796875, 0.10768890380859375, 0.1204681396484375, 0.13324737548828125, 0.146026611328125, 0.15880584716796875, 0.1715850830078125, 0.18436431884765625, 0.1971435546875, 0.20992279052734375, 0.2227020263671875, 0.23548126220703125, 0.248260498046875, 0.26103973388671875, 0.2738189697265625, 0.28659820556640625, 0.29937744140625, 0.31215667724609375, 0.3249359130859375, 0.33771514892578125, 0.350494384765625, 0.36327362060546875, 0.3760528564453125, 0.38883209228515625, 0.401611328125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 7.0, 4.0, 4.0, 5.0, 10.0, 13.0, 23.0, 39.0, 43.0, 63.0, 126.0, 179.0, 190.0, 111.0, 67.0, 28.0, 18.0, 27.0, 13.0, 5.0, 8.0, 9.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.073713302612305e-05, -5.9001147747039795e-05, -5.726516246795654e-05, -5.552917718887329e-05, -5.379319190979004e-05, -5.205720663070679e-05, -5.0321221351623535e-05, -4.858523607254028e-05, -4.684925079345703e-05, -4.511326551437378e-05, -4.337728023529053e-05, -4.1641294956207275e-05, -3.9905309677124023e-05, -3.816932439804077e-05, -3.643333911895752e-05, -3.469735383987427e-05, -3.2961368560791016e-05, -3.1225383281707764e-05, -2.9489398002624512e-05, -2.775341272354126e-05, -2.6017427444458008e-05, -2.4281442165374756e-05, -2.2545456886291504e-05, -2.0809471607208252e-05, -1.9073486328125e-05, -1.7337501049041748e-05, -1.5601515769958496e-05, -1.3865530490875244e-05, -1.2129545211791992e-05, -1.039355993270874e-05, -8.657574653625488e-06, -6.921589374542236e-06, -5.185604095458984e-06, -3.4496188163757324e-06, -1.7136335372924805e-06, 2.2351741790771484e-08, 1.7583370208740234e-06, 3.4943222999572754e-06, 5.230307579040527e-06, 6.966292858123779e-06, 8.702278137207031e-06, 1.0438263416290283e-05, 1.2174248695373535e-05, 1.3910233974456787e-05, 1.564621925354004e-05, 1.738220453262329e-05, 1.9118189811706543e-05, 2.0854175090789795e-05, 2.2590160369873047e-05, 2.43261456489563e-05, 2.606213092803955e-05, 2.7798116207122803e-05, 2.9534101486206055e-05, 3.127008676528931e-05, 3.300607204437256e-05, 3.474205732345581e-05, 3.647804260253906e-05, 3.8214027881622314e-05, 3.9950013160705566e-05, 4.168599843978882e-05, 4.342198371887207e-05, 4.515796899795532e-05, 4.6893954277038574e-05, 4.8629939556121826e-05, 5.036592483520508e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 3.0, 2.0, 10.0, 32.0, 56.0, 95.0, 158.0, 344.0, 769.0, 2595.0, 17406.0, 766726.0, 246799.0, 10265.0, 2005.0, 666.0, 288.0, 163.0, 71.0, 44.0, 18.0, 20.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6162109375, -0.5955886840820312, -0.5749664306640625, -0.5543441772460938, -0.533721923828125, -0.5130996704101562, -0.4924774169921875, -0.47185516357421875, -0.45123291015625, -0.43061065673828125, -0.4099884033203125, -0.38936614990234375, -0.368743896484375, -0.34812164306640625, -0.3274993896484375, -0.30687713623046875, -0.2862548828125, -0.26563262939453125, -0.2450103759765625, -0.22438812255859375, -0.203765869140625, -0.18314361572265625, -0.1625213623046875, -0.14189910888671875, -0.12127685546875, -0.10065460205078125, -0.0800323486328125, -0.05941009521484375, -0.038787841796875, -0.01816558837890625, 0.0024566650390625, 0.02307891845703125, 0.043701171875, 0.06432342529296875, 0.0849456787109375, 0.10556793212890625, 0.126190185546875, 0.14681243896484375, 0.1674346923828125, 0.18805694580078125, 0.20867919921875, 0.22930145263671875, 0.2499237060546875, 0.27054595947265625, 0.291168212890625, 0.31179046630859375, 0.3324127197265625, 0.35303497314453125, 0.3736572265625, 0.39427947998046875, 0.4149017333984375, 0.43552398681640625, 0.456146240234375, 0.47676849365234375, 0.4973907470703125, 0.5180130004882812, 0.53863525390625, 0.5592575073242188, 0.5798797607421875, 0.6005020141601562, 0.621124267578125, 0.6417465209960938, 0.6623687744140625, 0.6829910278320312, 0.70361328125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 8.0, 4.0, 24.0, 23.0, 39.0, 76.0, 140.0, 141.0, 166.0, 147.0, 81.0, 46.0, 40.0, 18.0, 12.0, 10.0, 8.0, 9.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1651611328125, -0.1583271026611328, -0.15149307250976562, -0.14465904235839844, -0.13782501220703125, -0.13099098205566406, -0.12415695190429688, -0.11732292175292969, -0.1104888916015625, -0.10365486145019531, -0.09682083129882812, -0.08998680114746094, -0.08315277099609375, -0.07631874084472656, -0.06948471069335938, -0.06265068054199219, -0.055816650390625, -0.04898262023925781, -0.042148590087890625, -0.03531455993652344, -0.02848052978515625, -0.021646499633789062, -0.014812469482421875, -0.007978439331054688, -0.0011444091796875, 0.0056896209716796875, 0.012523651123046875, 0.019357681274414062, 0.02619171142578125, 0.03302574157714844, 0.039859771728515625, 0.04669380187988281, 0.05352783203125, 0.06036186218261719, 0.06719589233398438, 0.07402992248535156, 0.08086395263671875, 0.08769798278808594, 0.09453201293945312, 0.10136604309082031, 0.1082000732421875, 0.11503410339355469, 0.12186813354492188, 0.12870216369628906, 0.13553619384765625, 0.14237022399902344, 0.14920425415039062, 0.1560382843017578, 0.162872314453125, 0.1697063446044922, 0.17654037475585938, 0.18337440490722656, 0.19020843505859375, 0.19704246520996094, 0.20387649536132812, 0.2107105255126953, 0.2175445556640625, 0.2243785858154297, 0.23121261596679688, 0.23804664611816406, 0.24488067626953125, 0.25171470642089844, 0.2585487365722656, 0.2653827667236328, 0.272216796875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 72.0, 613.0, 309.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0145845413208, -10.752126693725586, -10.489669799804688, -10.227212905883789, -9.964755058288574, -9.70229721069336, -9.439840316772461, -9.177383422851562, -8.914925575256348, -8.652467727661133, -8.390010833740234, -8.127553939819336, -7.865096092224121, -7.6026387214660645, -7.340181350708008, -7.077723979949951, -6.8152666091918945, -6.552809238433838, -6.290351867675781, -6.027894496917725, -5.765437126159668, -5.502979755401611, -5.240522384643555, -4.978065013885498, -4.715607643127441, -4.453150272369385, -4.190692901611328, -3.9282355308532715, -3.665778160095215, -3.403320789337158, -3.1408634185791016, -2.878406047821045, -2.6159486770629883, -2.3534913063049316, -2.091033935546875, -1.8285765647888184, -1.5661191940307617, -1.303661823272705, -1.0412044525146484, -0.7787470817565918, -0.5162897109985352, -0.2538323402404785, 0.008625030517578125, 0.27108240127563477, 0.5335397720336914, 0.795997142791748, 1.0584545135498047, 1.3209118843078613, 1.583369255065918, 1.8458266258239746, 2.1082839965820312, 2.370741367340088, 2.6331987380981445, 2.895656108856201, 3.158113479614258, 3.4205708503723145, 3.683028221130371, 3.9454855918884277, 4.207942962646484, 4.470400333404541, 4.732857704162598, 4.995315074920654, 5.257772445678711, 5.520229816436768, 5.782687187194824]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 6.0, 4.0, 10.0, 3.0, 14.0, 6.0, 15.0, 22.0, 16.0, 19.0, 32.0, 39.0, 44.0, 49.0, 57.0, 55.0, 56.0, 61.0, 60.0, 51.0, 46.0, 58.0, 47.0, 38.0, 44.0, 28.0, 27.0, 26.0, 24.0, 13.0, 9.0, 8.0, 7.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.860492467880249, -0.8258423209190369, -0.7911921739578247, -0.7565420269966125, -0.7218918800354004, -0.687241792678833, -0.6525916457176208, -0.6179414987564087, -0.5832913517951965, -0.5486412048339844, -0.5139910578727722, -0.47934094071388245, -0.4446907937526703, -0.41004064679145813, -0.37539052963256836, -0.3407403826713562, -0.30609023571014404, -0.2714400887489319, -0.23678995668888092, -0.20213982462882996, -0.1674896776676178, -0.13283953070640564, -0.09818939864635468, -0.06353926658630371, -0.028889119625091553, 0.0057610198855400085, 0.04041115939617157, 0.07506129890680313, 0.10971143841743469, 0.14436158537864685, 0.17901171743869781, 0.21366184949874878, 0.24831199645996094, 0.2829621434211731, 0.31761229038238525, 0.352262407541275, 0.3869125545024872, 0.42156270146369934, 0.4562128186225891, 0.49086296558380127, 0.5255131125450134, 0.5601632595062256, 0.5948134064674377, 0.6294635534286499, 0.6641136407852173, 0.6987638473510742, 0.7334139347076416, 0.7680640816688538, 0.8027142286300659, 0.8373643755912781, 0.8720145225524902, 0.9066646695137024, 0.9413148164749146, 0.9759649038314819, 1.0106151103973389, 1.0452651977539062, 1.0799152851104736, 1.114565372467041, 1.149215579032898, 1.1838656663894653, 1.2185158729553223, 1.2531659603118896, 1.2878161668777466, 1.322466254234314, 1.357116460800171]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 1.0, 1.0, 5.0, 9.0, 11.0, 8.0, 9.0, 36.0, 42.0, 44.0, 109.0, 113.0, 275.0, 591.0, 2180.0, 15450.0, 4037533.0, 128686.0, 6916.0, 1449.0, 406.0, 189.0, 104.0, 59.0, 24.0, 17.0, 4.0, 8.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.576171875, -2.502105712890625, -2.42803955078125, -2.353973388671875, -2.2799072265625, -2.205841064453125, -2.13177490234375, -2.057708740234375, -1.983642578125, -1.909576416015625, -1.83551025390625, -1.761444091796875, -1.6873779296875, -1.613311767578125, -1.53924560546875, -1.465179443359375, -1.39111328125, -1.317047119140625, -1.24298095703125, -1.168914794921875, -1.0948486328125, -1.020782470703125, -0.94671630859375, -0.872650146484375, -0.798583984375, -0.724517822265625, -0.65045166015625, -0.576385498046875, -0.5023193359375, -0.428253173828125, -0.35418701171875, -0.280120849609375, -0.2060546875, -0.131988525390625, -0.05792236328125, 0.016143798828125, 0.0902099609375, 0.164276123046875, 0.23834228515625, 0.312408447265625, 0.386474609375, 0.460540771484375, 0.53460693359375, 0.608673095703125, 0.6827392578125, 0.756805419921875, 0.83087158203125, 0.904937744140625, 0.97900390625, 1.053070068359375, 1.12713623046875, 1.201202392578125, 1.2752685546875, 1.349334716796875, 1.42340087890625, 1.497467041015625, 1.571533203125, 1.645599365234375, 1.71966552734375, 1.793731689453125, 1.8677978515625, 1.941864013671875, 2.01593017578125, 2.089996337890625, 2.1640625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 7.0, 10.0, 15.0, 24.0, 46.0, 83.0, 103.0, 108.0, 139.0, 143.0, 91.0, 100.0, 63.0, 37.0, 17.0, 9.0, 6.0, 5.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0251007080078125, -0.023402929306030273, -0.021705150604248047, -0.02000737190246582, -0.018309593200683594, -0.016611814498901367, -0.01491403579711914, -0.013216257095336914, -0.011518478393554688, -0.009820699691772461, -0.008122920989990234, -0.006425142288208008, -0.004727363586425781, -0.0030295848846435547, -0.0013318061828613281, 0.00036597251892089844, 0.002063751220703125, 0.0037615299224853516, 0.005459308624267578, 0.007157087326049805, 0.008854866027832031, 0.010552644729614258, 0.012250423431396484, 0.013948202133178711, 0.015645980834960938, 0.017343759536743164, 0.01904153823852539, 0.020739316940307617, 0.022437095642089844, 0.02413487434387207, 0.025832653045654297, 0.027530431747436523, 0.02922821044921875, 0.030925989151000977, 0.0326237678527832, 0.03432154655456543, 0.036019325256347656, 0.03771710395812988, 0.03941488265991211, 0.041112661361694336, 0.04281044006347656, 0.04450821876525879, 0.046205997467041016, 0.04790377616882324, 0.04960155487060547, 0.051299333572387695, 0.05299711227416992, 0.05469489097595215, 0.056392669677734375, 0.0580904483795166, 0.05978822708129883, 0.061486005783081055, 0.06318378448486328, 0.06488156318664551, 0.06657934188842773, 0.06827712059020996, 0.06997489929199219, 0.07167267799377441, 0.07337045669555664, 0.07506823539733887, 0.0767660140991211, 0.07846379280090332, 0.08016157150268555, 0.08185935020446777, 0.08355712890625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 13.0, 35.0, 136.0, 552.0, 10451.0, 4175157.0, 7169.0, 553.0, 150.0, 33.0, 17.0, 10.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.69921875, -2.49835205078125, -2.2974853515625, -2.09661865234375, -1.895751953125, -1.69488525390625, -1.4940185546875, -1.29315185546875, -1.09228515625, -0.89141845703125, -0.6905517578125, -0.48968505859375, -0.288818359375, -0.08795166015625, 0.1129150390625, 0.31378173828125, 0.5146484375, 0.71551513671875, 0.9163818359375, 1.11724853515625, 1.318115234375, 1.51898193359375, 1.7198486328125, 1.92071533203125, 2.12158203125, 2.32244873046875, 2.5233154296875, 2.72418212890625, 2.925048828125, 3.12591552734375, 3.3267822265625, 3.52764892578125, 3.728515625, 3.92938232421875, 4.1302490234375, 4.33111572265625, 4.531982421875, 4.73284912109375, 4.9337158203125, 5.13458251953125, 5.33544921875, 5.53631591796875, 5.7371826171875, 5.93804931640625, 6.138916015625, 6.33978271484375, 6.5406494140625, 6.74151611328125, 6.9423828125, 7.14324951171875, 7.3441162109375, 7.54498291015625, 7.745849609375, 7.94671630859375, 8.1475830078125, 8.34844970703125, 8.54931640625, 8.75018310546875, 8.9510498046875, 9.15191650390625, 9.352783203125, 9.55364990234375, 9.7545166015625, 9.95538330078125, 10.15625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 6.0, 5.0, 10.0, 28.0, 69.0, 181.0, 2766.0, 837.0, 109.0, 34.0, 12.0, 5.0, 6.0, 7.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1463623046875, -0.13147926330566406, -0.11659622192382812, -0.10171318054199219, -0.08683013916015625, -0.07194709777832031, -0.057064056396484375, -0.04218101501464844, -0.0272979736328125, -0.012414932250976562, 0.002468109130859375, 0.017351150512695312, 0.03223419189453125, 0.04711723327636719, 0.062000274658203125, 0.07688331604003906, 0.091766357421875, 0.10664939880371094, 0.12153244018554688, 0.1364154815673828, 0.15129852294921875, 0.1661815643310547, 0.18106460571289062, 0.19594764709472656, 0.2108306884765625, 0.22571372985839844, 0.24059677124023438, 0.2554798126220703, 0.27036285400390625, 0.2852458953857422, 0.3001289367675781, 0.31501197814941406, 0.32989501953125, 0.34477806091308594, 0.3596611022949219, 0.3745441436767578, 0.38942718505859375, 0.4043102264404297, 0.4191932678222656, 0.43407630920410156, 0.4489593505859375, 0.46384239196777344, 0.4787254333496094, 0.4936084747314453, 0.5084915161132812, 0.5233745574951172, 0.5382575988769531, 0.5531406402587891, 0.568023681640625, 0.5829067230224609, 0.5977897644042969, 0.6126728057861328, 0.6275558471679688, 0.6424388885498047, 0.6573219299316406, 0.6722049713134766, 0.6870880126953125, 0.7019710540771484, 0.7168540954589844, 0.7317371368408203, 0.7466201782226562, 0.7615032196044922, 0.7763862609863281, 0.7912693023681641, 0.80615234375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 84.0, 712.0, 177.0, 25.0, 10.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.265885353088379, -11.024155616760254, -10.782425880432129, -10.540696144104004, -10.298966407775879, -10.057236671447754, -9.815506935119629, -9.573777198791504, -9.332047462463379, -9.090317726135254, -8.848587989807129, -8.606858253479004, -8.365128517150879, -8.123398780822754, -7.881669044494629, -7.639939308166504, -7.398210048675537, -7.156480312347412, -6.914750576019287, -6.673020839691162, -6.431291103363037, -6.189561367034912, -5.947832107543945, -5.70610237121582, -5.464372634887695, -5.22264289855957, -4.980913162231445, -4.73918342590332, -4.497453689575195, -4.25572395324707, -4.013994216918945, -3.7722647190093994, -3.5305352210998535, -3.2888054847717285, -3.0470757484436035, -2.8053460121154785, -2.5636162757873535, -2.3218865394592285, -2.0801570415496826, -1.8384273052215576, -1.5966975688934326, -1.3549678325653076, -1.1132380962371826, -0.8715084791183472, -0.6297787427902222, -0.38804900646209717, -0.14631938934326172, 0.09541034698486328, 0.3371400833129883, 0.5788698196411133, 0.8205994963645935, 1.0623291730880737, 1.3040589094161987, 1.5457886457443237, 1.7875182628631592, 2.029247999191284, 2.270977735519409, 2.512707471847534, 2.754437208175659, 2.996166706085205, 3.23789644241333, 3.479626178741455, 3.72135591506958, 3.963085651397705, 4.20481538772583]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 10.0, 10.0, 20.0, 36.0, 44.0, 47.0, 73.0, 88.0, 87.0, 101.0, 97.0, 99.0, 64.0, 54.0, 40.0, 50.0, 32.0, 20.0, 17.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4191651344299316, -1.3642014265060425, -1.3092378377914429, -1.2542741298675537, -1.199310541152954, -1.144346833229065, -1.0893831253051758, -1.0344195365905762, -0.979455828666687, -0.9244921803474426, -0.8695285320281982, -0.8145648241043091, -0.7596011757850647, -0.7046375274658203, -0.6496738195419312, -0.5947101712226868, -0.5397465229034424, -0.484782874584198, -0.4298191964626312, -0.37485551834106445, -0.31989187002182007, -0.2649282217025757, -0.2099645435810089, -0.15500086545944214, -0.10003721714019775, -0.045073553919792175, 0.009890109300613403, 0.06485377252101898, 0.11981743574142456, 0.17478108406066895, 0.22974476218223572, 0.2847084403038025, 0.3396720886230469, 0.39463573694229126, 0.44959941506385803, 0.5045630931854248, 0.5595267415046692, 0.6144903898239136, 0.6694540977478027, 0.7244177460670471, 0.7793813943862915, 0.8343450427055359, 0.8893086910247803, 0.9442723989486694, 0.9992360472679138, 1.0541996955871582, 1.1091634035110474, 1.1641271114349365, 1.2190907001495361, 1.2740544080734253, 1.329017996788025, 1.383981704711914, 1.4389452934265137, 1.4939090013504028, 1.548872709274292, 1.6038362979888916, 1.6588000059127808, 1.71376371383667, 1.7687273025512695, 1.8236910104751587, 1.8786547183990479, 1.9336183071136475, 1.9885820150375366, 2.043545722961426, 2.0985093116760254]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 4.0, 8.0, 3.0, 9.0, 17.0, 14.0, 31.0, 41.0, 40.0, 76.0, 109.0, 158.0, 263.0, 475.0, 843.0, 1975.0, 5832.0, 25956.0, 174307.0, 689127.0, 121359.0, 19674.0, 4770.0, 1609.0, 716.0, 414.0, 249.0, 136.0, 102.0, 66.0, 43.0, 49.0, 16.0, 16.0, 12.0, 12.0, 7.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.57275390625, -0.5525970458984375, -0.532440185546875, -0.5122833251953125, -0.49212646484375, -0.4719696044921875, -0.451812744140625, -0.4316558837890625, -0.4114990234375, -0.3913421630859375, -0.371185302734375, -0.3510284423828125, -0.33087158203125, -0.3107147216796875, -0.290557861328125, -0.2704010009765625, -0.250244140625, -0.2300872802734375, -0.209930419921875, -0.1897735595703125, -0.16961669921875, -0.1494598388671875, -0.129302978515625, -0.1091461181640625, -0.0889892578125, -0.0688323974609375, -0.048675537109375, -0.0285186767578125, -0.00836181640625, 0.0117950439453125, 0.031951904296875, 0.0521087646484375, 0.072265625, 0.0924224853515625, 0.112579345703125, 0.1327362060546875, 0.15289306640625, 0.1730499267578125, 0.193206787109375, 0.2133636474609375, 0.2335205078125, 0.2536773681640625, 0.273834228515625, 0.2939910888671875, 0.31414794921875, 0.3343048095703125, 0.354461669921875, 0.3746185302734375, 0.394775390625, 0.4149322509765625, 0.435089111328125, 0.4552459716796875, 0.47540283203125, 0.4955596923828125, 0.515716552734375, 0.5358734130859375, 0.5560302734375, 0.5761871337890625, 0.596343994140625, 0.6165008544921875, 0.63665771484375, 0.6568145751953125, 0.676971435546875, 0.6971282958984375, 0.71728515625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 6.0, 16.0, 7.0, 12.0, 25.0, 24.0, 38.0, 50.0, 55.0, 56.0, 72.0, 76.0, 89.0, 88.0, 73.0, 70.0, 51.0, 46.0, 31.0, 38.0, 30.0, 14.0, 18.0, 11.0, 2.0, 6.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0667724609375, -0.06397819519042969, -0.061183929443359375, -0.05838966369628906, -0.05559539794921875, -0.05280113220214844, -0.050006866455078125, -0.04721260070800781, -0.0444183349609375, -0.04162406921386719, -0.038829803466796875, -0.03603553771972656, -0.03324127197265625, -0.030447006225585938, -0.027652740478515625, -0.024858474731445312, -0.022064208984375, -0.019269943237304688, -0.016475677490234375, -0.013681411743164062, -0.01088714599609375, -0.008092880249023438, -0.005298614501953125, -0.0025043487548828125, 0.0002899169921875, 0.0030841827392578125, 0.005878448486328125, 0.008672714233398438, 0.01146697998046875, 0.014261245727539062, 0.017055511474609375, 0.019849777221679688, 0.02264404296875, 0.025438308715820312, 0.028232574462890625, 0.031026840209960938, 0.03382110595703125, 0.03661537170410156, 0.039409637451171875, 0.04220390319824219, 0.0449981689453125, 0.04779243469238281, 0.050586700439453125, 0.05338096618652344, 0.05617523193359375, 0.05896949768066406, 0.061763763427734375, 0.06455802917480469, 0.067352294921875, 0.07014656066894531, 0.07294082641601562, 0.07573509216308594, 0.07852935791015625, 0.08132362365722656, 0.08411788940429688, 0.08691215515136719, 0.0897064208984375, 0.09250068664550781, 0.09529495239257812, 0.09808921813964844, 0.10088348388671875, 0.10367774963378906, 0.10647201538085938, 0.10926628112792969, 0.112060546875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 6.0, 16.0, 16.0, 24.0, 44.0, 62.0, 78.0, 171.0, 359.0, 950.0, 3213.0, 18640.0, 370516.0, 620325.0, 28041.0, 4129.0, 1091.0, 385.0, 173.0, 119.0, 54.0, 45.0, 30.0, 25.0, 14.0, 13.0, 0.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.89990234375, -0.8762741088867188, -0.8526458740234375, -0.8290176391601562, -0.805389404296875, -0.7817611694335938, -0.7581329345703125, -0.7345046997070312, -0.71087646484375, -0.6872482299804688, -0.6636199951171875, -0.6399917602539062, -0.616363525390625, -0.5927352905273438, -0.5691070556640625, -0.5454788208007812, -0.5218505859375, -0.49822235107421875, -0.4745941162109375, -0.45096588134765625, -0.427337646484375, -0.40370941162109375, -0.3800811767578125, -0.35645294189453125, -0.33282470703125, -0.30919647216796875, -0.2855682373046875, -0.26194000244140625, -0.238311767578125, -0.21468353271484375, -0.1910552978515625, -0.16742706298828125, -0.143798828125, -0.12017059326171875, -0.0965423583984375, -0.07291412353515625, -0.049285888671875, -0.02565765380859375, -0.0020294189453125, 0.02159881591796875, 0.04522705078125, 0.06885528564453125, 0.0924835205078125, 0.11611175537109375, 0.139739990234375, 0.16336822509765625, 0.1869964599609375, 0.21062469482421875, 0.2342529296875, 0.25788116455078125, 0.2815093994140625, 0.30513763427734375, 0.328765869140625, 0.35239410400390625, 0.3760223388671875, 0.39965057373046875, 0.42327880859375, 0.44690704345703125, 0.4705352783203125, 0.49416351318359375, 0.517791748046875, 0.5414199829101562, 0.5650482177734375, 0.5886764526367188, 0.6123046875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 10.0, 11.0, 11.0, 12.0, 22.0, 23.0, 25.0, 31.0, 54.0, 58.0, 74.0, 60.0, 83.0, 70.0, 75.0, 72.0, 72.0, 63.0, 40.0, 30.0, 24.0, 14.0, 23.0, 10.0, 6.0, 7.0, 11.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.5615234375, -0.5478935241699219, -0.5342636108398438, -0.5206336975097656, -0.5070037841796875, -0.4933738708496094, -0.47974395751953125, -0.4661140441894531, -0.452484130859375, -0.4388542175292969, -0.42522430419921875, -0.4115943908691406, -0.3979644775390625, -0.3843345642089844, -0.37070465087890625, -0.3570747375488281, -0.34344482421875, -0.3298149108886719, -0.31618499755859375, -0.3025550842285156, -0.2889251708984375, -0.2752952575683594, -0.26166534423828125, -0.24803543090820312, -0.234405517578125, -0.22077560424804688, -0.20714569091796875, -0.19351577758789062, -0.1798858642578125, -0.16625595092773438, -0.15262603759765625, -0.13899612426757812, -0.1253662109375, -0.11173629760742188, -0.09810638427734375, -0.08447647094726562, -0.0708465576171875, -0.057216644287109375, -0.04358673095703125, -0.029956817626953125, -0.016326904296875, -0.002696990966796875, 0.01093292236328125, 0.024562835693359375, 0.0381927490234375, 0.051822662353515625, 0.06545257568359375, 0.07908248901367188, 0.09271240234375, 0.10634231567382812, 0.11997222900390625, 0.13360214233398438, 0.1472320556640625, 0.16086196899414062, 0.17449188232421875, 0.18812179565429688, 0.201751708984375, 0.21538162231445312, 0.22901153564453125, 0.24264144897460938, 0.2562713623046875, 0.2699012756347656, 0.28353118896484375, 0.2971611022949219, 0.310791015625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 5.0, 16.0, 6.0, 20.0, 24.0, 52.0, 76.0, 152.0, 298.0, 652.0, 1517.0, 4253.0, 16111.0, 200558.0, 777018.0, 36786.0, 6938.0, 2305.0, 880.0, 400.0, 196.0, 91.0, 75.0, 37.0, 21.0, 19.0, 13.0, 7.0, 4.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.44580078125, -0.4319610595703125, -0.418121337890625, -0.4042816162109375, -0.39044189453125, -0.3766021728515625, -0.362762451171875, -0.3489227294921875, -0.3350830078125, -0.3212432861328125, -0.307403564453125, -0.2935638427734375, -0.27972412109375, -0.2658843994140625, -0.252044677734375, -0.2382049560546875, -0.224365234375, -0.2105255126953125, -0.196685791015625, -0.1828460693359375, -0.16900634765625, -0.1551666259765625, -0.141326904296875, -0.1274871826171875, -0.1136474609375, -0.0998077392578125, -0.085968017578125, -0.0721282958984375, -0.05828857421875, -0.0444488525390625, -0.030609130859375, -0.0167694091796875, -0.0029296875, 0.0109100341796875, 0.024749755859375, 0.0385894775390625, 0.05242919921875, 0.0662689208984375, 0.080108642578125, 0.0939483642578125, 0.1077880859375, 0.1216278076171875, 0.135467529296875, 0.1493072509765625, 0.16314697265625, 0.1769866943359375, 0.190826416015625, 0.2046661376953125, 0.218505859375, 0.2323455810546875, 0.246185302734375, 0.2600250244140625, 0.27386474609375, 0.2877044677734375, 0.301544189453125, 0.3153839111328125, 0.3292236328125, 0.3430633544921875, 0.356903076171875, 0.3707427978515625, 0.38458251953125, 0.3984222412109375, 0.412261962890625, 0.4261016845703125, 0.43994140625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 10.0, 6.0, 5.0, 6.0, 8.0, 20.0, 27.0, 53.0, 68.0, 119.0, 224.0, 163.0, 109.0, 52.0, 35.0, 19.0, 12.0, 13.0, 7.0, 8.0, 7.0, 5.0, 5.0, 5.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.979703903198242e-05, -6.760004907846451e-05, -6.54030591249466e-05, -6.320606917142868e-05, -6.1009079217910767e-05, -5.881208926439285e-05, -5.661509931087494e-05, -5.4418109357357025e-05, -5.222111940383911e-05, -5.00241294503212e-05, -4.7827139496803284e-05, -4.563014954328537e-05, -4.3433159589767456e-05, -4.123616963624954e-05, -3.903917968273163e-05, -3.6842189729213715e-05, -3.46451997756958e-05, -3.244820982217789e-05, -3.0251219868659973e-05, -2.805422991514206e-05, -2.5857239961624146e-05, -2.366025000810623e-05, -2.1463260054588318e-05, -1.9266270101070404e-05, -1.706928014755249e-05, -1.4872290194034576e-05, -1.2675300240516663e-05, -1.0478310286998749e-05, -8.281320333480835e-06, -6.084330379962921e-06, -3.887340426445007e-06, -1.6903504729270935e-06, 5.066394805908203e-07, 2.703629434108734e-06, 4.900619387626648e-06, 7.097609341144562e-06, 9.294599294662476e-06, 1.149158924818039e-05, 1.3688579201698303e-05, 1.5885569155216217e-05, 1.808255910873413e-05, 2.0279549062252045e-05, 2.247653901576996e-05, 2.4673528969287872e-05, 2.6870518922805786e-05, 2.90675088763237e-05, 3.1264498829841614e-05, 3.346148878335953e-05, 3.565847873687744e-05, 3.7855468690395355e-05, 4.005245864391327e-05, 4.224944859743118e-05, 4.44464385509491e-05, 4.664342850446701e-05, 4.8840418457984924e-05, 5.103740841150284e-05, 5.323439836502075e-05, 5.5431388318538666e-05, 5.762837827205658e-05, 5.9825368225574493e-05, 6.202235817909241e-05, 6.421934813261032e-05, 6.641633808612823e-05, 6.861332803964615e-05, 7.081031799316406e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 5.0, 6.0, 11.0, 22.0, 30.0, 62.0, 89.0, 174.0, 298.0, 602.0, 1322.0, 3023.0, 8837.0, 40019.0, 549565.0, 398511.0, 33020.0, 7851.0, 2688.0, 1192.0, 548.0, 301.0, 158.0, 85.0, 45.0, 28.0, 16.0, 11.0, 6.0, 3.0, 5.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33447265625, -0.3229179382324219, -0.31136322021484375, -0.2998085021972656, -0.2882537841796875, -0.2766990661621094, -0.26514434814453125, -0.2535896301269531, -0.242034912109375, -0.23048019409179688, -0.21892547607421875, -0.20737075805664062, -0.1958160400390625, -0.18426132202148438, -0.17270660400390625, -0.16115188598632812, -0.14959716796875, -0.13804244995117188, -0.12648773193359375, -0.11493301391601562, -0.1033782958984375, -0.09182357788085938, -0.08026885986328125, -0.06871414184570312, -0.057159423828125, -0.045604705810546875, -0.03404998779296875, -0.022495269775390625, -0.0109405517578125, 0.000614166259765625, 0.01216888427734375, 0.023723602294921875, 0.0352783203125, 0.046833038330078125, 0.05838775634765625, 0.06994247436523438, 0.0814971923828125, 0.09305191040039062, 0.10460662841796875, 0.11616134643554688, 0.127716064453125, 0.13927078247070312, 0.15082550048828125, 0.16238021850585938, 0.1739349365234375, 0.18548965454101562, 0.19704437255859375, 0.20859909057617188, 0.22015380859375, 0.23170852661132812, 0.24326324462890625, 0.2548179626464844, 0.2663726806640625, 0.2779273986816406, 0.28948211669921875, 0.3010368347167969, 0.312591552734375, 0.3241462707519531, 0.33570098876953125, 0.3472557067871094, 0.3588104248046875, 0.3703651428222656, 0.38191986083984375, 0.3934745788574219, 0.405029296875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 8.0, 10.0, 11.0, 13.0, 8.0, 16.0, 18.0, 33.0, 23.0, 38.0, 45.0, 48.0, 70.0, 65.0, 69.0, 74.0, 65.0, 54.0, 61.0, 40.0, 37.0, 28.0, 29.0, 34.0, 22.0, 16.0, 8.0, 12.0, 4.0, 7.0, 0.0, 9.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.11669921875, -0.11297798156738281, -0.10925674438476562, -0.10553550720214844, -0.10181427001953125, -0.09809303283691406, -0.09437179565429688, -0.09065055847167969, -0.0869293212890625, -0.08320808410644531, -0.07948684692382812, -0.07576560974121094, -0.07204437255859375, -0.06832313537597656, -0.06460189819335938, -0.06088066101074219, -0.057159423828125, -0.05343818664550781, -0.049716949462890625, -0.04599571228027344, -0.04227447509765625, -0.03855323791503906, -0.034832000732421875, -0.031110763549804688, -0.0273895263671875, -0.023668289184570312, -0.019947052001953125, -0.016225814819335938, -0.01250457763671875, -0.008783340454101562, -0.005062103271484375, -0.0013408660888671875, 0.00238037109375, 0.0061016082763671875, 0.009822845458984375, 0.013544082641601562, 0.01726531982421875, 0.020986557006835938, 0.024707794189453125, 0.028429031372070312, 0.0321502685546875, 0.03587150573730469, 0.039592742919921875, 0.04331398010253906, 0.04703521728515625, 0.05075645446777344, 0.054477691650390625, 0.05819892883300781, 0.061920166015625, 0.06564140319824219, 0.06936264038085938, 0.07308387756347656, 0.07680511474609375, 0.08052635192871094, 0.08424758911132812, 0.08796882629394531, 0.0916900634765625, 0.09541130065917969, 0.09913253784179688, 0.10285377502441406, 0.10657501220703125, 0.11029624938964844, 0.11401748657226562, 0.11773872375488281, 0.1214599609375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 10.0, 35.0, 120.0, 410.0, 301.0, 97.0, 23.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-10.70315933227539, -10.504842758178711, -10.306526184082031, -10.108210563659668, -9.909893989562988, -9.711577415466309, -9.513260841369629, -9.31494426727295, -9.116628646850586, -8.918312072753906, -8.719995498657227, -8.521679878234863, -8.323363304138184, -8.125046730041504, -7.926730155944824, -7.728414058685303, -7.530097007751465, -7.331780433654785, -7.133464336395264, -6.935147762298584, -6.7368316650390625, -6.538515090942383, -6.340198516845703, -6.141882419586182, -5.94356632232666, -5.7452497482299805, -5.546933650970459, -5.348617076873779, -5.150300979614258, -4.951984405517578, -4.753667831420898, -4.555351734161377, -4.357034683227539, -4.158718109130859, -3.960402011871338, -3.762085437774658, -3.5637691020965576, -3.365452766418457, -3.1671364307403564, -2.968820095062256, -2.7705037593841553, -2.5721874237060547, -2.373871088027954, -2.1755547523498535, -1.9772381782531738, -1.7789218425750732, -1.5806055068969727, -1.3822890520095825, -1.183972716331482, -0.9856563210487366, -0.7873399257659912, -0.5890235900878906, -0.39070719480514526, -0.1923907995223999, 0.005925536155700684, 0.20424199104309082, 0.4025583267211914, 0.6008747220039368, 0.7991911172866821, 0.9975074529647827, 1.1958239078521729, 1.3941402435302734, 1.592456579208374, 1.7907730340957642, 1.9890893697738647]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 9.0, 9.0, 12.0, 19.0, 17.0, 46.0, 42.0, 46.0, 69.0, 60.0, 77.0, 57.0, 65.0, 71.0, 66.0, 59.0, 55.0, 47.0, 42.0, 34.0, 25.0, 21.0, 17.0, 15.0, 4.0, 6.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9832431077957153, -1.9075418710708618, -1.8318407535552979, -1.7561395168304443, -1.6804382801055908, -1.6047370433807373, -1.5290359258651733, -1.4533346891403198, -1.3776335716247559, -1.3019323348999023, -1.2262312173843384, -1.1505299806594849, -1.0748287439346313, -0.9991275668144226, -0.9234263896942139, -0.8477251529693604, -0.7720239162445068, -0.6963227391242981, -0.6206215023994446, -0.5449203252792358, -0.4692191183567047, -0.3935179114341736, -0.31781673431396484, -0.24211549758911133, -0.1664143204689026, -0.09071312099695206, -0.015011921525001526, 0.06068927049636841, 0.13639047741889954, 0.21209168434143066, 0.2877928614616394, 0.3634940981864929, 0.4391953945159912, 0.5148965716362, 0.5905978083610535, 0.6662989854812622, 0.7420002222061157, 0.8177013993263245, 0.8934025764465332, 0.9691038131713867, 1.0448050498962402, 1.1205062866210938, 1.1962074041366577, 1.2719086408615112, 1.3476098775863647, 1.4233109951019287, 1.4990122318267822, 1.5747134685516357, 1.6504145860671997, 1.7261158227920532, 1.8018169403076172, 1.8775181770324707, 1.9532194137573242, 2.0289206504821777, 2.1046218872070312, 2.1803231239318848, 2.256024122238159, 2.3317253589630127, 2.407426595687866, 2.4831275939941406, 2.558828830718994, 2.6345300674438477, 2.710231304168701, 2.7859325408935547, 2.861633777618408]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 5.0, 6.0, 14.0, 19.0, 10.0, 13.0, 29.0, 43.0, 50.0, 87.0, 159.0, 234.0, 569.0, 1412.0, 4421.0, 27290.0, 4066457.0, 81711.0, 7900.0, 2244.0, 828.0, 356.0, 181.0, 74.0, 59.0, 30.0, 27.0, 9.0, 10.0, 10.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.279296875, -2.221832275390625, -2.16436767578125, -2.106903076171875, -2.0494384765625, -1.991973876953125, -1.93450927734375, -1.877044677734375, -1.819580078125, -1.762115478515625, -1.70465087890625, -1.647186279296875, -1.5897216796875, -1.532257080078125, -1.47479248046875, -1.417327880859375, -1.35986328125, -1.302398681640625, -1.24493408203125, -1.187469482421875, -1.1300048828125, -1.072540283203125, -1.01507568359375, -0.957611083984375, -0.900146484375, -0.842681884765625, -0.78521728515625, -0.727752685546875, -0.6702880859375, -0.612823486328125, -0.55535888671875, -0.497894287109375, -0.4404296875, -0.382965087890625, -0.32550048828125, -0.268035888671875, -0.2105712890625, -0.153106689453125, -0.09564208984375, -0.038177490234375, 0.019287109375, 0.076751708984375, 0.13421630859375, 0.191680908203125, 0.2491455078125, 0.306610107421875, 0.36407470703125, 0.421539306640625, 0.47900390625, 0.536468505859375, 0.59393310546875, 0.651397705078125, 0.7088623046875, 0.766326904296875, 0.82379150390625, 0.881256103515625, 0.938720703125, 0.996185302734375, 1.05364990234375, 1.111114501953125, 1.1685791015625, 1.226043701171875, 1.28350830078125, 1.340972900390625, 1.3984375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 1.0, 10.0, 8.0, 10.0, 21.0, 35.0, 35.0, 60.0, 63.0, 69.0, 83.0, 107.0, 100.0, 90.0, 79.0, 64.0, 51.0, 40.0, 31.0, 18.0, 8.0, 10.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08355712890625, -0.08021259307861328, -0.07686805725097656, -0.07352352142333984, -0.07017898559570312, -0.0668344497680664, -0.06348991394042969, -0.06014537811279297, -0.05680084228515625, -0.05345630645751953, -0.05011177062988281, -0.046767234802246094, -0.043422698974609375, -0.040078163146972656, -0.03673362731933594, -0.03338909149169922, -0.0300445556640625, -0.02670001983642578, -0.023355484008789062, -0.020010948181152344, -0.016666412353515625, -0.013321876525878906, -0.009977340698242188, -0.006632804870605469, -0.00328826904296875, 5.626678466796875e-05, 0.0034008026123046875, 0.006745338439941406, 0.010089874267578125, 0.013434410095214844, 0.016778945922851562, 0.02012348175048828, 0.023468017578125, 0.02681255340576172, 0.030157089233398438, 0.033501625061035156, 0.036846160888671875, 0.040190696716308594, 0.04353523254394531, 0.04687976837158203, 0.05022430419921875, 0.05356884002685547, 0.05691337585449219, 0.060257911682128906, 0.06360244750976562, 0.06694698333740234, 0.07029151916503906, 0.07363605499267578, 0.0769805908203125, 0.08032512664794922, 0.08366966247558594, 0.08701419830322266, 0.09035873413085938, 0.0937032699584961, 0.09704780578613281, 0.10039234161376953, 0.10373687744140625, 0.10708141326904297, 0.11042594909667969, 0.1137704849243164, 0.11711502075195312, 0.12045955657958984, 0.12380409240722656, 0.12714862823486328, 0.1304931640625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 11.0, 28.0, 64.0, 202.0, 581.0, 2259.0, 4098789.0, 89888.0, 1739.0, 487.0, 153.0, 51.0, 15.0, 8.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.90625, -8.7122802734375, -8.518310546875, -8.3243408203125, -8.13037109375, -7.9364013671875, -7.742431640625, -7.5484619140625, -7.3544921875, -7.1605224609375, -6.966552734375, -6.7725830078125, -6.57861328125, -6.3846435546875, -6.190673828125, -5.9967041015625, -5.802734375, -5.6087646484375, -5.414794921875, -5.2208251953125, -5.02685546875, -4.8328857421875, -4.638916015625, -4.4449462890625, -4.2509765625, -4.0570068359375, -3.863037109375, -3.6690673828125, -3.47509765625, -3.2811279296875, -3.087158203125, -2.8931884765625, -2.69921875, -2.5052490234375, -2.311279296875, -2.1173095703125, -1.92333984375, -1.7293701171875, -1.535400390625, -1.3414306640625, -1.1474609375, -0.9534912109375, -0.759521484375, -0.5655517578125, -0.37158203125, -0.1776123046875, 0.016357421875, 0.2103271484375, 0.404296875, 0.5982666015625, 0.792236328125, 0.9862060546875, 1.18017578125, 1.3741455078125, 1.568115234375, 1.7620849609375, 1.9560546875, 2.1500244140625, 2.343994140625, 2.5379638671875, 2.73193359375, 2.9259033203125, 3.119873046875, 3.3138427734375, 3.5078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 51.0, 421.0, 3474.0, 98.0, 18.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.404296875, -1.3745613098144531, -1.3448257446289062, -1.3150901794433594, -1.2853546142578125, -1.2556190490722656, -1.2258834838867188, -1.1961479187011719, -1.166412353515625, -1.1366767883300781, -1.1069412231445312, -1.0772056579589844, -1.0474700927734375, -1.0177345275878906, -0.9879989624023438, -0.9582633972167969, -0.92852783203125, -0.8987922668457031, -0.8690567016601562, -0.8393211364746094, -0.8095855712890625, -0.7798500061035156, -0.7501144409179688, -0.7203788757324219, -0.690643310546875, -0.6609077453613281, -0.6311721801757812, -0.6014366149902344, -0.5717010498046875, -0.5419654846191406, -0.5122299194335938, -0.4824943542480469, -0.4527587890625, -0.4230232238769531, -0.39328765869140625, -0.3635520935058594, -0.3338165283203125, -0.3040809631347656, -0.27434539794921875, -0.24460983276367188, -0.214874267578125, -0.18513870239257812, -0.15540313720703125, -0.12566757202148438, -0.0959320068359375, -0.06619644165039062, -0.03646087646484375, -0.006725311279296875, 0.02301025390625, 0.052745819091796875, 0.08248138427734375, 0.11221694946289062, 0.1419525146484375, 0.17168807983398438, 0.20142364501953125, 0.23115921020507812, 0.260894775390625, 0.2906303405761719, 0.32036590576171875, 0.3501014709472656, 0.3798370361328125, 0.4095726013183594, 0.43930816650390625, 0.4690437316894531, 0.498779296875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 149.0, 837.0, 19.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.259843826293945, -10.728723526000977, -10.197602272033691, -9.666481018066406, -9.135360717773438, -8.604240417480469, -8.073119163513184, -7.541998386383057, -7.01087760925293, -6.479756832122803, -5.948636054992676, -5.417515277862549, -4.886394500732422, -4.355273723602295, -3.824152946472168, -3.293032169342041, -2.761911392211914, -2.230790615081787, -1.6996698379516602, -1.1685490608215332, -0.6374282836914062, -0.1063075065612793, 0.42481327056884766, 0.9559340476989746, 1.4870548248291016, 2.0181756019592285, 2.5492963790893555, 3.0804171562194824, 3.6115379333496094, 4.142658710479736, 4.673779487609863, 5.20490026473999, 5.73602294921875, 6.267143726348877, 6.798264503479004, 7.329385280609131, 7.860506057739258, 8.391626358032227, 8.922747611999512, 9.453868865966797, 9.984989166259766, 10.516109466552734, 11.04723072052002, 11.578351974487305, 12.109472274780273, 12.640592575073242, 13.171713829040527, 13.702835083007812, 14.233955383300781, 14.76507568359375, 15.296196937561035, 15.82731819152832, 16.35843849182129, 16.889558792114258, 17.42068099975586, 17.951801300048828, 18.482921600341797, 19.014041900634766, 19.545162200927734, 20.076284408569336, 20.607404708862305, 21.138525009155273, 21.669647216796875, 22.200767517089844, 22.731887817382812]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 14.0, 19.0, 41.0, 85.0, 114.0, 166.0, 170.0, 151.0, 112.0, 59.0, 38.0, 17.0, 11.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1737537384033203, -2.0916032791137695, -2.0094528198242188, -1.927302360534668, -1.8451519012451172, -1.7630014419555664, -1.6808509826660156, -1.5987005233764648, -1.516550064086914, -1.4343996047973633, -1.3522491455078125, -1.2700986862182617, -1.187948226928711, -1.1057977676391602, -1.0236473083496094, -0.9414967894554138, -0.8593462705612183, -0.7771958112716675, -0.6950453519821167, -0.6128948926925659, -0.5307444334030151, -0.44859394431114197, -0.3664434552192688, -0.284292995929718, -0.20214253664016724, -0.11999206990003586, -0.03784160315990448, 0.044308871030807495, 0.12645933032035828, 0.20860978960990906, 0.2907602787017822, 0.372910737991333, 0.4550611972808838, 0.5372116565704346, 0.6193621158599854, 0.7015125751495361, 0.7836630344390869, 0.8658134937286377, 0.9479640126228333, 1.0301144123077393, 1.11226487159729, 1.1944153308868408, 1.2765657901763916, 1.3587162494659424, 1.4408667087554932, 1.523017168045044, 1.6051676273345947, 1.6873180866241455, 1.7694686651229858, 1.8516191244125366, 1.9337695837020874, 2.0159201622009277, 2.0980706214904785, 2.1802210807800293, 2.26237154006958, 2.344521999359131, 2.4266724586486816, 2.5088229179382324, 2.590973377227783, 2.673123836517334, 2.7552742958068848, 2.8374247550964355, 2.9195752143859863, 3.001725673675537, 3.083876132965088]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 9.0, 6.0, 12.0, 11.0, 21.0, 33.0, 41.0, 75.0, 123.0, 178.0, 329.0, 670.0, 1606.0, 4312.0, 19014.0, 180778.0, 744886.0, 79471.0, 11341.0, 3113.0, 1225.0, 571.0, 307.0, 158.0, 90.0, 66.0, 38.0, 20.0, 18.0, 8.0, 11.0, 5.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.90283203125, -0.87799072265625, -0.8531494140625, -0.82830810546875, -0.803466796875, -0.77862548828125, -0.7537841796875, -0.72894287109375, -0.7041015625, -0.67926025390625, -0.6544189453125, -0.62957763671875, -0.604736328125, -0.57989501953125, -0.5550537109375, -0.53021240234375, -0.50537109375, -0.48052978515625, -0.4556884765625, -0.43084716796875, -0.406005859375, -0.38116455078125, -0.3563232421875, -0.33148193359375, -0.306640625, -0.28179931640625, -0.2569580078125, -0.23211669921875, -0.207275390625, -0.18243408203125, -0.1575927734375, -0.13275146484375, -0.10791015625, -0.08306884765625, -0.0582275390625, -0.03338623046875, -0.008544921875, 0.01629638671875, 0.0411376953125, 0.06597900390625, 0.0908203125, 0.11566162109375, 0.1405029296875, 0.16534423828125, 0.190185546875, 0.21502685546875, 0.2398681640625, 0.26470947265625, 0.28955078125, 0.31439208984375, 0.3392333984375, 0.36407470703125, 0.388916015625, 0.41375732421875, 0.4385986328125, 0.46343994140625, 0.48828125, 0.51312255859375, 0.5379638671875, 0.56280517578125, 0.587646484375, 0.61248779296875, 0.6373291015625, 0.66217041015625, 0.68701171875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 7.0, 15.0, 15.0, 27.0, 19.0, 33.0, 44.0, 62.0, 56.0, 59.0, 61.0, 64.0, 77.0, 93.0, 70.0, 64.0, 45.0, 47.0, 31.0, 23.0, 31.0, 19.0, 13.0, 5.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08294677734375, -0.08010578155517578, -0.07726478576660156, -0.07442378997802734, -0.07158279418945312, -0.0687417984008789, -0.06590080261230469, -0.06305980682373047, -0.06021881103515625, -0.05737781524658203, -0.05453681945800781, -0.051695823669433594, -0.048854827880859375, -0.046013832092285156, -0.04317283630371094, -0.04033184051513672, -0.0374908447265625, -0.03464984893798828, -0.03180885314941406, -0.028967857360839844, -0.026126861572265625, -0.023285865783691406, -0.020444869995117188, -0.01760387420654297, -0.01476287841796875, -0.011921882629394531, -0.009080886840820312, -0.006239891052246094, -0.003398895263671875, -0.0005578994750976562, 0.0022830963134765625, 0.005124092102050781, 0.007965087890625, 0.010806083679199219, 0.013647079467773438, 0.016488075256347656, 0.019329071044921875, 0.022170066833496094, 0.025011062622070312, 0.02785205841064453, 0.03069305419921875, 0.03353404998779297, 0.03637504577636719, 0.039216041564941406, 0.042057037353515625, 0.044898033142089844, 0.04773902893066406, 0.05058002471923828, 0.0534210205078125, 0.05626201629638672, 0.05910301208496094, 0.061944007873535156, 0.06478500366210938, 0.0676259994506836, 0.07046699523925781, 0.07330799102783203, 0.07614898681640625, 0.07898998260498047, 0.08183097839355469, 0.0846719741821289, 0.08751296997070312, 0.09035396575927734, 0.09319496154785156, 0.09603595733642578, 0.098876953125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 13.0, 8.0, 16.0, 28.0, 28.0, 40.0, 75.0, 88.0, 172.0, 293.0, 536.0, 1112.0, 2982.0, 10614.0, 63208.0, 585161.0, 337194.0, 35841.0, 6924.0, 2162.0, 905.0, 497.0, 223.0, 144.0, 89.0, 58.0, 43.0, 29.0, 14.0, 13.0, 11.0, 7.0, 3.0, 4.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.398193359375, -0.3815040588378906, -0.36481475830078125, -0.3481254577636719, -0.3314361572265625, -0.3147468566894531, -0.29805755615234375, -0.2813682556152344, -0.264678955078125, -0.24798965454101562, -0.23130035400390625, -0.21461105346679688, -0.1979217529296875, -0.18123245239257812, -0.16454315185546875, -0.14785385131835938, -0.13116455078125, -0.11447525024414062, -0.09778594970703125, -0.08109664916992188, -0.0644073486328125, -0.047718048095703125, -0.03102874755859375, -0.014339447021484375, 0.002349853515625, 0.019039154052734375, 0.03572845458984375, 0.052417755126953125, 0.0691070556640625, 0.08579635620117188, 0.10248565673828125, 0.11917495727539062, 0.1358642578125, 0.15255355834960938, 0.16924285888671875, 0.18593215942382812, 0.2026214599609375, 0.21931076049804688, 0.23600006103515625, 0.2526893615722656, 0.269378662109375, 0.2860679626464844, 0.30275726318359375, 0.3194465637207031, 0.3361358642578125, 0.3528251647949219, 0.36951446533203125, 0.3862037658691406, 0.40289306640625, 0.4195823669433594, 0.43627166748046875, 0.4529609680175781, 0.4696502685546875, 0.4863395690917969, 0.5030288696289062, 0.5197181701660156, 0.536407470703125, 0.5530967712402344, 0.5697860717773438, 0.5864753723144531, 0.6031646728515625, 0.6198539733886719, 0.6365432739257812, 0.6532325744628906, 0.669921875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 2.0, 5.0, 1.0, 5.0, 8.0, 12.0, 9.0, 12.0, 21.0, 13.0, 19.0, 24.0, 34.0, 41.0, 41.0, 45.0, 53.0, 51.0, 61.0, 55.0, 46.0, 64.0, 39.0, 43.0, 39.0, 36.0, 40.0, 41.0, 25.0, 20.0, 24.0, 18.0, 19.0, 7.0, 10.0, 13.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2274169921875, -0.21751976013183594, -0.20762252807617188, -0.1977252960205078, -0.18782806396484375, -0.1779308319091797, -0.16803359985351562, -0.15813636779785156, -0.1482391357421875, -0.13834190368652344, -0.12844467163085938, -0.11854743957519531, -0.10865020751953125, -0.09875297546386719, -0.08885574340820312, -0.07895851135253906, -0.069061279296875, -0.05916404724121094, -0.049266815185546875, -0.03936958312988281, -0.02947235107421875, -0.019575119018554688, -0.009677886962890625, 0.0002193450927734375, 0.0101165771484375, 0.020013809204101562, 0.029911041259765625, 0.03980827331542969, 0.04970550537109375, 0.05960273742675781, 0.06949996948242188, 0.07939720153808594, 0.08929443359375, 0.09919166564941406, 0.10908889770507812, 0.11898612976074219, 0.12888336181640625, 0.1387805938720703, 0.14867782592773438, 0.15857505798339844, 0.1684722900390625, 0.17836952209472656, 0.18826675415039062, 0.1981639862060547, 0.20806121826171875, 0.2179584503173828, 0.22785568237304688, 0.23775291442871094, 0.247650146484375, 0.25754737854003906, 0.2674446105957031, 0.2773418426513672, 0.28723907470703125, 0.2971363067626953, 0.3070335388183594, 0.31693077087402344, 0.3268280029296875, 0.33672523498535156, 0.3466224670410156, 0.3565196990966797, 0.36641693115234375, 0.3763141632080078, 0.3862113952636719, 0.39610862731933594, 0.406005859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 4.0, 5.0, 7.0, 11.0, 19.0, 22.0, 33.0, 56.0, 116.0, 199.0, 485.0, 1235.0, 3776.0, 16793.0, 220592.0, 759400.0, 36372.0, 6171.0, 1878.0, 693.0, 286.0, 153.0, 82.0, 67.0, 24.0, 13.0, 16.0, 13.0, 7.0, 4.0, 2.0, 4.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3544921875, -0.3419189453125, -0.329345703125, -0.3167724609375, -0.30419921875, -0.2916259765625, -0.279052734375, -0.2664794921875, -0.25390625, -0.2413330078125, -0.228759765625, -0.2161865234375, -0.20361328125, -0.1910400390625, -0.178466796875, -0.1658935546875, -0.1533203125, -0.1407470703125, -0.128173828125, -0.1156005859375, -0.10302734375, -0.0904541015625, -0.077880859375, -0.0653076171875, -0.052734375, -0.0401611328125, -0.027587890625, -0.0150146484375, -0.00244140625, 0.0101318359375, 0.022705078125, 0.0352783203125, 0.0478515625, 0.0604248046875, 0.072998046875, 0.0855712890625, 0.09814453125, 0.1107177734375, 0.123291015625, 0.1358642578125, 0.1484375, 0.1610107421875, 0.173583984375, 0.1861572265625, 0.19873046875, 0.2113037109375, 0.223876953125, 0.2364501953125, 0.2490234375, 0.2615966796875, 0.274169921875, 0.2867431640625, 0.29931640625, 0.3118896484375, 0.324462890625, 0.3370361328125, 0.349609375, 0.3621826171875, 0.374755859375, 0.3873291015625, 0.39990234375, 0.4124755859375, 0.425048828125, 0.4376220703125, 0.4501953125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 5.0, 5.0, 5.0, 11.0, 8.0, 17.0, 25.0, 30.0, 39.0, 58.0, 79.0, 102.0, 126.0, 133.0, 91.0, 63.0, 64.0, 34.0, 23.0, 17.0, 10.0, 9.0, 10.0, 9.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.4286251068115234e-05, -4.311557859182358e-05, -4.194490611553192e-05, -4.0774233639240265e-05, -3.960356116294861e-05, -3.843288868665695e-05, -3.7262216210365295e-05, -3.609154373407364e-05, -3.492087125778198e-05, -3.3750198781490326e-05, -3.257952630519867e-05, -3.140885382890701e-05, -3.0238181352615356e-05, -2.90675088763237e-05, -2.7896836400032043e-05, -2.6726163923740387e-05, -2.555549144744873e-05, -2.4384818971157074e-05, -2.3214146494865417e-05, -2.204347401857376e-05, -2.0872801542282104e-05, -1.9702129065990448e-05, -1.853145658969879e-05, -1.7360784113407135e-05, -1.619011163711548e-05, -1.5019439160823822e-05, -1.3848766684532166e-05, -1.2678094208240509e-05, -1.1507421731948853e-05, -1.0336749255657196e-05, -9.16607677936554e-06, -7.995404303073883e-06, -6.8247318267822266e-06, -5.65405935049057e-06, -4.4833868741989136e-06, -3.312714397907257e-06, -2.1420419216156006e-06, -9.71369445323944e-07, 1.993030309677124e-07, 1.369975507259369e-06, 2.5406479835510254e-06, 3.711320459842682e-06, 4.881992936134338e-06, 6.052665412425995e-06, 7.223337888717651e-06, 8.394010365009308e-06, 9.564682841300964e-06, 1.0735355317592621e-05, 1.1906027793884277e-05, 1.3076700270175934e-05, 1.424737274646759e-05, 1.5418045222759247e-05, 1.6588717699050903e-05, 1.775939017534256e-05, 1.8930062651634216e-05, 2.0100735127925873e-05, 2.127140760421753e-05, 2.2442080080509186e-05, 2.3612752556800842e-05, 2.47834250330925e-05, 2.5954097509384155e-05, 2.7124769985675812e-05, 2.8295442461967468e-05, 2.9466114938259125e-05, 3.063678741455078e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 9.0, 7.0, 11.0, 13.0, 23.0, 26.0, 45.0, 73.0, 120.0, 227.0, 440.0, 976.0, 2706.0, 10761.0, 121170.0, 865714.0, 37037.0, 5914.0, 1756.0, 701.0, 349.0, 172.0, 114.0, 76.0, 40.0, 19.0, 19.0, 12.0, 8.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4287109375, -0.41241455078125, -0.3961181640625, -0.37982177734375, -0.363525390625, -0.34722900390625, -0.3309326171875, -0.31463623046875, -0.29833984375, -0.28204345703125, -0.2657470703125, -0.24945068359375, -0.233154296875, -0.21685791015625, -0.2005615234375, -0.18426513671875, -0.16796875, -0.15167236328125, -0.1353759765625, -0.11907958984375, -0.102783203125, -0.08648681640625, -0.0701904296875, -0.05389404296875, -0.03759765625, -0.02130126953125, -0.0050048828125, 0.01129150390625, 0.027587890625, 0.04388427734375, 0.0601806640625, 0.07647705078125, 0.0927734375, 0.10906982421875, 0.1253662109375, 0.14166259765625, 0.157958984375, 0.17425537109375, 0.1905517578125, 0.20684814453125, 0.22314453125, 0.23944091796875, 0.2557373046875, 0.27203369140625, 0.288330078125, 0.30462646484375, 0.3209228515625, 0.33721923828125, 0.353515625, 0.36981201171875, 0.3861083984375, 0.40240478515625, 0.418701171875, 0.43499755859375, 0.4512939453125, 0.46759033203125, 0.48388671875, 0.50018310546875, 0.5164794921875, 0.53277587890625, 0.549072265625, 0.56536865234375, 0.5816650390625, 0.59796142578125, 0.6142578125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 13.0, 13.0, 8.0, 19.0, 34.0, 38.0, 72.0, 88.0, 123.0, 134.0, 120.0, 94.0, 70.0, 68.0, 26.0, 16.0, 19.0, 6.0, 6.0, 11.0, 5.0, 1.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.150634765625, -0.14421463012695312, -0.13779449462890625, -0.13137435913085938, -0.1249542236328125, -0.11853408813476562, -0.11211395263671875, -0.10569381713867188, -0.099273681640625, -0.09285354614257812, -0.08643341064453125, -0.08001327514648438, -0.0735931396484375, -0.06717300415039062, -0.06075286865234375, -0.054332733154296875, -0.04791259765625, -0.041492462158203125, -0.03507232666015625, -0.028652191162109375, -0.0222320556640625, -0.015811920166015625, -0.00939178466796875, -0.002971649169921875, 0.003448486328125, 0.009868621826171875, 0.01628875732421875, 0.022708892822265625, 0.0291290283203125, 0.035549163818359375, 0.04196929931640625, 0.048389434814453125, 0.0548095703125, 0.061229705810546875, 0.06764984130859375, 0.07406997680664062, 0.0804901123046875, 0.08691024780273438, 0.09333038330078125, 0.09975051879882812, 0.106170654296875, 0.11259078979492188, 0.11901092529296875, 0.12543106079101562, 0.1318511962890625, 0.13827133178710938, 0.14469146728515625, 0.15111160278320312, 0.15753173828125, 0.16395187377929688, 0.17037200927734375, 0.17679214477539062, 0.1832122802734375, 0.18963241577148438, 0.19605255126953125, 0.20247268676757812, 0.208892822265625, 0.21531295776367188, 0.22173309326171875, 0.22815322875976562, 0.2345733642578125, 0.24099349975585938, 0.24741363525390625, 0.2538337707519531, 0.26025390625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 5.0, 15.0, 18.0, 32.0, 83.0, 161.0, 192.0, 197.0, 138.0, 76.0, 38.0, 18.0, 13.0, 10.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.616629123687744, -3.518491506576538, -3.420354127883911, -3.322216510772705, -3.224079132080078, -3.125941514968872, -3.027804136276245, -2.929666519165039, -2.831529140472412, -2.733391523361206, -2.635254144668579, -2.537116527557373, -2.438979148864746, -2.34084153175354, -2.242704153060913, -2.144566535949707, -2.04642915725708, -1.9482916593551636, -1.850154161453247, -1.7520166635513306, -1.653879165649414, -1.5557416677474976, -1.457604169845581, -1.359466552734375, -1.261328935623169, -1.1631914377212524, -1.065053939819336, -0.9669164419174194, -0.8687789440155029, -0.7706414461135864, -0.6725038886070251, -0.5743663907051086, -0.4762289524078369, -0.3780914545059204, -0.2799539566040039, -0.18181642889976501, -0.08367893099784851, 0.014458566904067993, 0.11259609460830688, 0.2107335925102234, 0.3088710904121399, 0.4070085883140564, 0.5051460862159729, 0.6032836437225342, 0.7014211416244507, 0.7995586395263672, 0.8976961374282837, 0.9958336353302002, 1.0939711332321167, 1.1921086311340332, 1.2902461290359497, 1.3883836269378662, 1.4865211248397827, 1.5846586227416992, 1.6827962398529053, 1.7809336185455322, 1.8790712356567383, 1.9772087335586548, 2.0753462314605713, 2.1734838485717773, 2.2716212272644043, 2.3697588443756104, 2.4678962230682373, 2.5660338401794434, 2.6641712188720703]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 9.0, 4.0, 5.0, 8.0, 7.0, 13.0, 10.0, 22.0, 17.0, 15.0, 25.0, 30.0, 47.0, 28.0, 38.0, 49.0, 47.0, 54.0, 43.0, 48.0, 55.0, 42.0, 43.0, 46.0, 38.0, 44.0, 35.0, 27.0, 25.0, 28.0, 20.0, 16.0, 9.0, 12.0, 12.0, 5.0, 11.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0], "bins": [-1.9739840030670166, -1.9223936796188354, -1.8708032369613647, -1.8192129135131836, -1.767622470855713, -1.7160321474075317, -1.664441704750061, -1.6128513813018799, -1.5612609386444092, -1.509670615196228, -1.4580801725387573, -1.4064898490905762, -1.3548994064331055, -1.3033090829849243, -1.2517186403274536, -1.2001283168792725, -1.1485378742218018, -1.0969475507736206, -1.04535710811615, -0.993766725063324, -0.942176342010498, -0.8905860185623169, -0.8389955759048462, -0.787405252456665, -0.7358149290084839, -0.684224545955658, -0.632634162902832, -0.5810437798500061, -0.5294533967971802, -0.47786304354667664, -0.4262726604938507, -0.3746822774410248, -0.32309186458587646, -0.27150148153305054, -0.2199110984802246, -0.16832073032855988, -0.11673034727573395, -0.06513997912406921, -0.013549596071243286, 0.03804078698158264, 0.08963117003440857, 0.1412215530872345, 0.19281193614006042, 0.24440230429172516, 0.2959926724433899, 0.3475830554962158, 0.39917343854904175, 0.4507638216018677, 0.5023542046546936, 0.5539445877075195, 0.6055349707603455, 0.6571253538131714, 0.7087157368659973, 0.7603061199188232, 0.8118964433670044, 0.8634868860244751, 0.9150772094726562, 0.9666675925254822, 1.018257975578308, 1.0698482990264893, 1.12143874168396, 1.1730290651321411, 1.2246195077896118, 1.276209831237793, 1.3278002738952637]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 5.0, 4.0, 3.0, 10.0, 5.0, 12.0, 18.0, 30.0, 34.0, 49.0, 57.0, 68.0, 115.0, 192.0, 324.0, 582.0, 1234.0, 2980.0, 10494.0, 59118.0, 3926299.0, 164523.0, 19108.0, 5294.0, 1919.0, 847.0, 417.0, 211.0, 120.0, 76.0, 45.0, 39.0, 15.0, 14.0, 9.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.7197265625, -1.6794281005859375, -1.639129638671875, -1.5988311767578125, -1.55853271484375, -1.5182342529296875, -1.477935791015625, -1.4376373291015625, -1.3973388671875, -1.3570404052734375, -1.316741943359375, -1.2764434814453125, -1.23614501953125, -1.1958465576171875, -1.155548095703125, -1.1152496337890625, -1.074951171875, -1.0346527099609375, -0.994354248046875, -0.9540557861328125, -0.91375732421875, -0.8734588623046875, -0.833160400390625, -0.7928619384765625, -0.7525634765625, -0.7122650146484375, -0.671966552734375, -0.6316680908203125, -0.59136962890625, -0.5510711669921875, -0.510772705078125, -0.4704742431640625, -0.43017578125, -0.3898773193359375, -0.349578857421875, -0.3092803955078125, -0.26898193359375, -0.2286834716796875, -0.188385009765625, -0.1480865478515625, -0.1077880859375, -0.0674896240234375, -0.027191162109375, 0.0131072998046875, 0.05340576171875, 0.0937042236328125, 0.134002685546875, 0.1743011474609375, 0.214599609375, 0.2548980712890625, 0.295196533203125, 0.3354949951171875, 0.37579345703125, 0.4160919189453125, 0.456390380859375, 0.4966888427734375, 0.5369873046875, 0.5772857666015625, 0.617584228515625, 0.6578826904296875, 0.69818115234375, 0.7384796142578125, 0.778778076171875, 0.8190765380859375, 0.859375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 15.0, 6.0, 6.0, 22.0, 23.0, 17.0, 37.0, 41.0, 35.0, 42.0, 45.0, 55.0, 45.0, 59.0, 85.0, 67.0, 66.0, 57.0, 61.0, 44.0, 41.0, 28.0, 33.0, 14.0, 16.0, 10.0, 7.0, 10.0, 10.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0675048828125, -0.06503582000732422, -0.06256675720214844, -0.060097694396972656, -0.057628631591796875, -0.055159568786621094, -0.05269050598144531, -0.05022144317626953, -0.04775238037109375, -0.04528331756591797, -0.04281425476074219, -0.040345191955566406, -0.037876129150390625, -0.035407066345214844, -0.03293800354003906, -0.03046894073486328, -0.0279998779296875, -0.02553081512451172, -0.023061752319335938, -0.020592689514160156, -0.018123626708984375, -0.015654563903808594, -0.013185501098632812, -0.010716438293457031, -0.00824737548828125, -0.005778312683105469, -0.0033092498779296875, -0.0008401870727539062, 0.001628875732421875, 0.004097938537597656, 0.0065670013427734375, 0.009036064147949219, 0.011505126953125, 0.013974189758300781, 0.016443252563476562, 0.018912315368652344, 0.021381378173828125, 0.023850440979003906, 0.026319503784179688, 0.02878856658935547, 0.03125762939453125, 0.03372669219970703, 0.03619575500488281, 0.038664817810058594, 0.041133880615234375, 0.043602943420410156, 0.04607200622558594, 0.04854106903076172, 0.0510101318359375, 0.05347919464111328, 0.05594825744628906, 0.058417320251464844, 0.060886383056640625, 0.0633554458618164, 0.06582450866699219, 0.06829357147216797, 0.07076263427734375, 0.07323169708251953, 0.07570075988769531, 0.0781698226928711, 0.08063888549804688, 0.08310794830322266, 0.08557701110839844, 0.08804607391357422, 0.09051513671875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 13.0, 23.0, 20.0, 51.0, 101.0, 192.0, 763.0, 7729.0, 4177451.0, 6677.0, 744.0, 236.0, 113.0, 75.0, 39.0, 20.0, 15.0, 13.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.60546875, -3.37274169921875, -3.1400146484375, -2.90728759765625, -2.674560546875, -2.44183349609375, -2.2091064453125, -1.97637939453125, -1.74365234375, -1.51092529296875, -1.2781982421875, -1.04547119140625, -0.812744140625, -0.58001708984375, -0.3472900390625, -0.11456298828125, 0.1181640625, 0.35089111328125, 0.5836181640625, 0.81634521484375, 1.049072265625, 1.28179931640625, 1.5145263671875, 1.74725341796875, 1.97998046875, 2.21270751953125, 2.4454345703125, 2.67816162109375, 2.910888671875, 3.14361572265625, 3.3763427734375, 3.60906982421875, 3.841796875, 4.07452392578125, 4.3072509765625, 4.53997802734375, 4.772705078125, 5.00543212890625, 5.2381591796875, 5.47088623046875, 5.70361328125, 5.93634033203125, 6.1690673828125, 6.40179443359375, 6.634521484375, 6.86724853515625, 7.0999755859375, 7.33270263671875, 7.5654296875, 7.79815673828125, 8.0308837890625, 8.26361083984375, 8.496337890625, 8.72906494140625, 8.9617919921875, 9.19451904296875, 9.42724609375, 9.65997314453125, 9.8927001953125, 10.12542724609375, 10.358154296875, 10.59088134765625, 10.8236083984375, 11.05633544921875, 11.2890625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 6.0, 3.0, 9.0, 17.0, 40.0, 99.0, 925.0, 2762.0, 157.0, 40.0, 11.0, 8.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.391357421875, -0.3562049865722656, -0.32105255126953125, -0.2859001159667969, -0.2507476806640625, -0.21559524536132812, -0.18044281005859375, -0.14529037475585938, -0.110137939453125, -0.07498550415039062, -0.03983306884765625, -0.004680633544921875, 0.0304718017578125, 0.06562423706054688, 0.10077667236328125, 0.13592910766601562, 0.17108154296875, 0.20623397827148438, 0.24138641357421875, 0.2765388488769531, 0.3116912841796875, 0.3468437194824219, 0.38199615478515625, 0.4171485900878906, 0.452301025390625, 0.4874534606933594, 0.5226058959960938, 0.5577583312988281, 0.5929107666015625, 0.6280632019042969, 0.6632156372070312, 0.6983680725097656, 0.7335205078125, 0.7686729431152344, 0.8038253784179688, 0.8389778137207031, 0.8741302490234375, 0.9092826843261719, 0.9444351196289062, 0.9795875549316406, 1.014739990234375, 1.0498924255371094, 1.0850448608398438, 1.1201972961425781, 1.1553497314453125, 1.1905021667480469, 1.2256546020507812, 1.2608070373535156, 1.29595947265625, 1.3311119079589844, 1.3662643432617188, 1.4014167785644531, 1.4365692138671875, 1.4717216491699219, 1.5068740844726562, 1.5420265197753906, 1.577178955078125, 1.6123313903808594, 1.6474838256835938, 1.6826362609863281, 1.7177886962890625, 1.7529411315917969, 1.7880935668945312, 1.8232460021972656, 1.8583984375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 12.0, 125.0, 784.0, 72.0, 11.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.818769454956055, -22.293041229248047, -21.76731300354004, -21.24158477783203, -20.715858459472656, -20.19013023376465, -19.66440200805664, -19.138673782348633, -18.612945556640625, -18.087217330932617, -17.56148910522461, -17.0357608795166, -16.510032653808594, -15.984305381774902, -15.458578109741211, -14.932849884033203, -14.407121658325195, -13.881393432617188, -13.35566520690918, -12.829937934875488, -12.30420970916748, -11.778481483459473, -11.252754211425781, -10.727025985717773, -10.201297760009766, -9.675569534301758, -9.14984130859375, -8.624114036560059, -8.09838581085205, -7.572657585144043, -7.046929836273193, -6.521202087402344, -5.9954729080200195, -5.469744682312012, -4.944016933441162, -4.4182891845703125, -3.8925609588623047, -3.366832971572876, -2.8411049842834473, -2.3153769969940186, -1.7896490097045898, -1.2639210224151611, -0.7381930351257324, -0.2124650478363037, 0.313262939453125, 0.8389909267425537, 1.3647189140319824, 1.8904469013214111, 2.41617488861084, 2.9419028759002686, 3.4676308631896973, 3.993358850479126, 4.519086837768555, 5.0448150634765625, 5.570542812347412, 6.096270561218262, 6.6219987869262695, 7.147727012634277, 7.673454761505127, 8.199182510375977, 8.724910736083984, 9.250638961791992, 9.7763671875, 10.302094459533691, 10.8278226852417]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 1.0, 0.0, 8.0, 19.0, 17.0, 42.0, 49.0, 52.0, 94.0, 107.0, 114.0, 109.0, 87.0, 83.0, 71.0, 48.0, 37.0, 19.0, 20.0, 7.0, 8.0, 4.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7925572395324707, -3.6911697387695312, -3.589782238006592, -3.4883947372436523, -3.387007474899292, -3.2856199741363525, -3.184232473373413, -3.0828449726104736, -2.981457471847534, -2.8800699710845947, -2.7786824703216553, -2.677295207977295, -2.5759077072143555, -2.474520206451416, -2.3731327056884766, -2.271745204925537, -2.1703577041625977, -2.068970203399658, -1.9675828218460083, -1.8661953210830688, -1.7648078203201294, -1.6634204387664795, -1.56203293800354, -1.4606454372406006, -1.3592581748962402, -1.2578706741333008, -1.1564832925796509, -1.0550957918167114, -0.953708291053772, -0.8523208498954773, -0.7509334087371826, -0.6495459079742432, -0.5481584072113037, -0.44677093625068665, -0.3453834652900696, -0.2439960241317749, -0.14260855317115784, -0.04122108221054077, 0.060166358947753906, 0.16155385971069336, 0.26294130086898804, 0.3643287718296051, 0.46571624279022217, 0.5671036839485168, 0.6684911251068115, 0.769878625869751, 0.8712660670280457, 0.9726535677909851, 1.0740410089492798, 1.1754285097122192, 1.2768158912658691, 1.3782033920288086, 1.479590892791748, 1.5809783935546875, 1.6823657751083374, 1.7837532758712769, 1.8851406574249268, 1.9865281581878662, 2.0879156589508057, 2.189302921295166, 2.2906904220581055, 2.392077922821045, 2.4934654235839844, 2.594852924346924, 2.6962404251098633]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 10.0, 14.0, 23.0, 26.0, 35.0, 63.0, 91.0, 122.0, 201.0, 309.0, 514.0, 836.0, 1654.0, 4183.0, 15312.0, 100504.0, 711979.0, 180031.0, 22427.0, 5466.0, 2207.0, 1014.0, 580.0, 350.0, 203.0, 141.0, 90.0, 48.0, 31.0, 31.0, 19.0, 10.0, 8.0, 7.0, 3.0, 6.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80810546875, -0.7817153930664062, -0.7553253173828125, -0.7289352416992188, -0.702545166015625, -0.6761550903320312, -0.6497650146484375, -0.6233749389648438, -0.59698486328125, -0.5705947875976562, -0.5442047119140625, -0.5178146362304688, -0.491424560546875, -0.46503448486328125, -0.4386444091796875, -0.41225433349609375, -0.3858642578125, -0.35947418212890625, -0.3330841064453125, -0.30669403076171875, -0.280303955078125, -0.25391387939453125, -0.2275238037109375, -0.20113372802734375, -0.17474365234375, -0.14835357666015625, -0.1219635009765625, -0.09557342529296875, -0.069183349609375, -0.04279327392578125, -0.0164031982421875, 0.00998687744140625, 0.036376953125, 0.06276702880859375, 0.0891571044921875, 0.11554718017578125, 0.141937255859375, 0.16832733154296875, 0.1947174072265625, 0.22110748291015625, 0.24749755859375, 0.27388763427734375, 0.3002777099609375, 0.32666778564453125, 0.353057861328125, 0.37944793701171875, 0.4058380126953125, 0.43222808837890625, 0.4586181640625, 0.48500823974609375, 0.5113983154296875, 0.5377883911132812, 0.564178466796875, 0.5905685424804688, 0.6169586181640625, 0.6433486938476562, 0.66973876953125, 0.6961288452148438, 0.7225189208984375, 0.7489089965820312, 0.775299072265625, 0.8016891479492188, 0.8280792236328125, 0.8544692993164062, 0.880859375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 3.0, 4.0, 13.0, 16.0, 27.0, 36.0, 40.0, 52.0, 55.0, 67.0, 81.0, 72.0, 71.0, 93.0, 68.0, 58.0, 42.0, 58.0, 46.0, 24.0, 21.0, 13.0, 15.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.154052734375, -0.1501312255859375, -0.146209716796875, -0.1422882080078125, -0.13836669921875, -0.1344451904296875, -0.130523681640625, -0.1266021728515625, -0.1226806640625, -0.1187591552734375, -0.114837646484375, -0.1109161376953125, -0.10699462890625, -0.1030731201171875, -0.099151611328125, -0.0952301025390625, -0.09130859375, -0.0873870849609375, -0.083465576171875, -0.0795440673828125, -0.07562255859375, -0.0717010498046875, -0.067779541015625, -0.0638580322265625, -0.0599365234375, -0.0560150146484375, -0.052093505859375, -0.0481719970703125, -0.04425048828125, -0.0403289794921875, -0.036407470703125, -0.0324859619140625, -0.028564453125, -0.0246429443359375, -0.020721435546875, -0.0167999267578125, -0.01287841796875, -0.0089569091796875, -0.005035400390625, -0.0011138916015625, 0.0028076171875, 0.0067291259765625, 0.010650634765625, 0.0145721435546875, 0.01849365234375, 0.0224151611328125, 0.026336669921875, 0.0302581787109375, 0.0341796875, 0.0381011962890625, 0.042022705078125, 0.0459442138671875, 0.04986572265625, 0.0537872314453125, 0.057708740234375, 0.0616302490234375, 0.0655517578125, 0.0694732666015625, 0.073394775390625, 0.0773162841796875, 0.08123779296875, 0.0851593017578125, 0.089080810546875, 0.0930023193359375, 0.096923828125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 4.0, 4.0, 3.0, 4.0, 9.0, 9.0, 16.0, 16.0, 28.0, 42.0, 62.0, 100.0, 185.0, 391.0, 924.0, 2826.0, 10762.0, 57871.0, 397164.0, 486332.0, 73604.0, 12921.0, 3345.0, 991.0, 405.0, 209.0, 97.0, 68.0, 31.0, 29.0, 31.0, 16.0, 13.0, 10.0, 8.0, 11.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.402587890625, -0.3887367248535156, -0.37488555908203125, -0.3610343933105469, -0.3471832275390625, -0.3333320617675781, -0.31948089599609375, -0.3056297302246094, -0.291778564453125, -0.2779273986816406, -0.26407623291015625, -0.2502250671386719, -0.2363739013671875, -0.22252273559570312, -0.20867156982421875, -0.19482040405273438, -0.18096923828125, -0.16711807250976562, -0.15326690673828125, -0.13941574096679688, -0.1255645751953125, -0.11171340942382812, -0.09786224365234375, -0.08401107788085938, -0.070159912109375, -0.056308746337890625, -0.04245758056640625, -0.028606414794921875, -0.0147552490234375, -0.000904083251953125, 0.01294708251953125, 0.026798248291015625, 0.0406494140625, 0.054500579833984375, 0.06835174560546875, 0.08220291137695312, 0.0960540771484375, 0.10990524291992188, 0.12375640869140625, 0.13760757446289062, 0.151458740234375, 0.16530990600585938, 0.17916107177734375, 0.19301223754882812, 0.2068634033203125, 0.22071456909179688, 0.23456573486328125, 0.24841690063476562, 0.26226806640625, 0.2761192321777344, 0.28997039794921875, 0.3038215637207031, 0.3176727294921875, 0.3315238952636719, 0.34537506103515625, 0.3592262268066406, 0.373077392578125, 0.3869285583496094, 0.40077972412109375, 0.4146308898925781, 0.4284820556640625, 0.4423332214355469, 0.45618438720703125, 0.4700355529785156, 0.48388671875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 2.0, 5.0, 3.0, 3.0, 8.0, 13.0, 9.0, 9.0, 17.0, 16.0, 22.0, 23.0, 20.0, 20.0, 30.0, 26.0, 25.0, 31.0, 35.0, 44.0, 48.0, 45.0, 43.0, 35.0, 37.0, 46.0, 40.0, 33.0, 34.0, 32.0, 29.0, 27.0, 30.0, 27.0, 20.0, 10.0, 13.0, 14.0, 17.0, 10.0, 13.0, 8.0, 7.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.2548828125, -0.24712562561035156, -0.23936843872070312, -0.2316112518310547, -0.22385406494140625, -0.2160968780517578, -0.20833969116210938, -0.20058250427246094, -0.1928253173828125, -0.18506813049316406, -0.17731094360351562, -0.1695537567138672, -0.16179656982421875, -0.1540393829345703, -0.14628219604492188, -0.13852500915527344, -0.130767822265625, -0.12301063537597656, -0.11525344848632812, -0.10749626159667969, -0.09973907470703125, -0.09198188781738281, -0.08422470092773438, -0.07646751403808594, -0.0687103271484375, -0.06095314025878906, -0.053195953369140625, -0.04543876647949219, -0.03768157958984375, -0.029924392700195312, -0.022167205810546875, -0.014410018920898438, -0.00665283203125, 0.0011043548583984375, 0.008861541748046875, 0.016618728637695312, 0.02437591552734375, 0.03213310241699219, 0.039890289306640625, 0.04764747619628906, 0.0554046630859375, 0.06316184997558594, 0.07091903686523438, 0.07867622375488281, 0.08643341064453125, 0.09419059753417969, 0.10194778442382812, 0.10970497131347656, 0.117462158203125, 0.12521934509277344, 0.13297653198242188, 0.1407337188720703, 0.14849090576171875, 0.1562480926513672, 0.16400527954101562, 0.17176246643066406, 0.1795196533203125, 0.18727684020996094, 0.19503402709960938, 0.2027912139892578, 0.21054840087890625, 0.2183055877685547, 0.22606277465820312, 0.23381996154785156, 0.2415771484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 7.0, 7.0, 16.0, 19.0, 37.0, 86.0, 143.0, 261.0, 496.0, 974.0, 1945.0, 4602.0, 14531.0, 81412.0, 760116.0, 152719.0, 20445.0, 5928.0, 2392.0, 1118.0, 600.0, 302.0, 192.0, 90.0, 50.0, 26.0, 17.0, 7.0, 8.0, 6.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.30615234375, -0.2975578308105469, -0.28896331787109375, -0.2803688049316406, -0.2717742919921875, -0.2631797790527344, -0.25458526611328125, -0.24599075317382812, -0.237396240234375, -0.22880172729492188, -0.22020721435546875, -0.21161270141601562, -0.2030181884765625, -0.19442367553710938, -0.18582916259765625, -0.17723464965820312, -0.16864013671875, -0.16004562377929688, -0.15145111083984375, -0.14285659790039062, -0.1342620849609375, -0.12566757202148438, -0.11707305908203125, -0.10847854614257812, -0.099884033203125, -0.09128952026367188, -0.08269500732421875, -0.07410049438476562, -0.0655059814453125, -0.056911468505859375, -0.04831695556640625, -0.039722442626953125, -0.0311279296875, -0.022533416748046875, -0.01393890380859375, -0.005344390869140625, 0.0032501220703125, 0.011844635009765625, 0.02043914794921875, 0.029033660888671875, 0.037628173828125, 0.046222686767578125, 0.05481719970703125, 0.06341171264648438, 0.0720062255859375, 0.08060073852539062, 0.08919525146484375, 0.09778976440429688, 0.10638427734375, 0.11497879028320312, 0.12357330322265625, 0.13216781616210938, 0.1407623291015625, 0.14935684204101562, 0.15795135498046875, 0.16654586791992188, 0.175140380859375, 0.18373489379882812, 0.19232940673828125, 0.20092391967773438, 0.2095184326171875, 0.21811294555664062, 0.22670745849609375, 0.23530197143554688, 0.243896484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 10.0, 15.0, 25.0, 28.0, 37.0, 90.0, 169.0, 219.0, 154.0, 103.0, 43.0, 29.0, 19.0, 19.0, 10.0, 9.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4776668548583984e-05, -5.263276398181915e-05, -5.048885941505432e-05, -4.834495484828949e-05, -4.620105028152466e-05, -4.405714571475983e-05, -4.1913241147994995e-05, -3.9769336581230164e-05, -3.762543201446533e-05, -3.54815274477005e-05, -3.333762288093567e-05, -3.119371831417084e-05, -2.9049813747406006e-05, -2.6905909180641174e-05, -2.4762004613876343e-05, -2.261810004711151e-05, -2.047419548034668e-05, -1.8330290913581848e-05, -1.6186386346817017e-05, -1.4042481780052185e-05, -1.1898577213287354e-05, -9.754672646522522e-06, -7.6107680797576904e-06, -5.466863512992859e-06, -3.3229589462280273e-06, -1.1790543794631958e-06, 9.648501873016357e-07, 3.1087547540664673e-06, 5.252659320831299e-06, 7.39656388759613e-06, 9.540468454360962e-06, 1.1684373021125793e-05, 1.3828277587890625e-05, 1.5972182154655457e-05, 1.8116086721420288e-05, 2.025999128818512e-05, 2.240389585494995e-05, 2.4547800421714783e-05, 2.6691704988479614e-05, 2.8835609555244446e-05, 3.097951412200928e-05, 3.312341868877411e-05, 3.526732325553894e-05, 3.741122782230377e-05, 3.9555132389068604e-05, 4.1699036955833435e-05, 4.3842941522598267e-05, 4.59868460893631e-05, 4.813075065612793e-05, 5.027465522289276e-05, 5.241855978965759e-05, 5.4562464356422424e-05, 5.6706368923187256e-05, 5.885027348995209e-05, 6.099417805671692e-05, 6.313808262348175e-05, 6.528198719024658e-05, 6.742589175701141e-05, 6.956979632377625e-05, 7.171370089054108e-05, 7.385760545730591e-05, 7.600151002407074e-05, 7.814541459083557e-05, 8.02893191576004e-05, 8.243322372436523e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 8.0, 4.0, 12.0, 15.0, 29.0, 45.0, 105.0, 229.0, 464.0, 1066.0, 2613.0, 7386.0, 35376.0, 758713.0, 216877.0, 17233.0, 4962.0, 1922.0, 803.0, 369.0, 158.0, 77.0, 39.0, 15.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34521484375, -0.3327980041503906, -0.32038116455078125, -0.3079643249511719, -0.2955474853515625, -0.2831306457519531, -0.27071380615234375, -0.2582969665527344, -0.245880126953125, -0.23346328735351562, -0.22104644775390625, -0.20862960815429688, -0.1962127685546875, -0.18379592895507812, -0.17137908935546875, -0.15896224975585938, -0.14654541015625, -0.13412857055664062, -0.12171173095703125, -0.10929489135742188, -0.0968780517578125, -0.08446121215820312, -0.07204437255859375, -0.059627532958984375, -0.047210693359375, -0.034793853759765625, -0.02237701416015625, -0.009960174560546875, 0.0024566650390625, 0.014873504638671875, 0.02729034423828125, 0.039707183837890625, 0.0521240234375, 0.06454086303710938, 0.07695770263671875, 0.08937454223632812, 0.1017913818359375, 0.11420822143554688, 0.12662506103515625, 0.13904190063476562, 0.151458740234375, 0.16387557983398438, 0.17629241943359375, 0.18870925903320312, 0.2011260986328125, 0.21354293823242188, 0.22595977783203125, 0.23837661743164062, 0.25079345703125, 0.2632102966308594, 0.27562713623046875, 0.2880439758300781, 0.3004608154296875, 0.3128776550292969, 0.32529449462890625, 0.3377113342285156, 0.350128173828125, 0.3625450134277344, 0.37496185302734375, 0.3873786926269531, 0.3997955322265625, 0.4122123718261719, 0.42462921142578125, 0.4370460510253906, 0.449462890625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 5.0, 7.0, 7.0, 8.0, 6.0, 10.0, 17.0, 32.0, 30.0, 59.0, 88.0, 92.0, 128.0, 147.0, 103.0, 71.0, 59.0, 43.0, 25.0, 10.0, 10.0, 8.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.172119140625, -0.16617584228515625, -0.1602325439453125, -0.15428924560546875, -0.148345947265625, -0.14240264892578125, -0.1364593505859375, -0.13051605224609375, -0.12457275390625, -0.11862945556640625, -0.1126861572265625, -0.10674285888671875, -0.100799560546875, -0.09485626220703125, -0.0889129638671875, -0.08296966552734375, -0.0770263671875, -0.07108306884765625, -0.0651397705078125, -0.05919647216796875, -0.053253173828125, -0.04730987548828125, -0.0413665771484375, -0.03542327880859375, -0.02947998046875, -0.02353668212890625, -0.0175933837890625, -0.01165008544921875, -0.005706787109375, 0.00023651123046875, 0.0061798095703125, 0.01212310791015625, 0.01806640625, 0.02400970458984375, 0.0299530029296875, 0.03589630126953125, 0.041839599609375, 0.04778289794921875, 0.0537261962890625, 0.05966949462890625, 0.06561279296875, 0.07155609130859375, 0.0774993896484375, 0.08344268798828125, 0.089385986328125, 0.09532928466796875, 0.1012725830078125, 0.10721588134765625, 0.1131591796875, 0.11910247802734375, 0.1250457763671875, 0.13098907470703125, 0.136932373046875, 0.14287567138671875, 0.1488189697265625, 0.15476226806640625, 0.16070556640625, 0.16664886474609375, 0.1725921630859375, 0.17853546142578125, 0.184478759765625, 0.19042205810546875, 0.1963653564453125, 0.20230865478515625, 0.208251953125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 13.0, 34.0, 199.0, 498.0, 213.0, 43.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.953251838684082, -12.691709518432617, -12.430166244506836, -12.168623924255371, -11.90708065032959, -11.645538330078125, -11.383995056152344, -11.122452735900879, -10.860910415649414, -10.59936809539795, -10.337824821472168, -10.076282501220703, -9.814739227294922, -9.553196907043457, -9.291653633117676, -9.030111312866211, -8.76856803894043, -8.507025718688965, -8.245482444763184, -7.9839396476745605, -7.7223968505859375, -7.460854530334473, -7.19931173324585, -6.937768936157227, -6.6762261390686035, -6.4146833419799805, -6.153140544891357, -5.891597747802734, -5.6300554275512695, -5.368512153625488, -5.106969833374023, -4.8454270362854, -4.583883285522461, -4.322340488433838, -4.060797691345215, -3.799255132675171, -3.537712335586548, -3.276169538497925, -3.014626979827881, -2.753084182739258, -2.4915413856506348, -2.2299985885620117, -1.9684559106826782, -1.7069132328033447, -1.4453704357147217, -1.1838276386260986, -0.9222849607467651, -0.6607422828674316, -0.3991994857788086, -0.13765674829483032, 0.12388598918914795, 0.3854287266731262, 0.6469714641571045, 0.9085142612457275, 1.170056939125061, 1.4315996170043945, 1.6931424140930176, 1.9546852111816406, 2.2162280082702637, 2.4777705669403076, 2.7393133640289307, 3.0008561611175537, 3.2623987197875977, 3.5239415168762207, 3.7854843139648438]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 9.0, 7.0, 18.0, 11.0, 8.0, 18.0, 17.0, 20.0, 32.0, 38.0, 32.0, 45.0, 32.0, 33.0, 56.0, 46.0, 50.0, 39.0, 55.0, 52.0, 49.0, 46.0, 45.0, 43.0, 34.0, 39.0, 33.0, 16.0, 18.0, 13.0, 8.0, 5.0, 11.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.314886450767517, -1.2609148025512695, -1.2069432735443115, -1.152971625328064, -1.0989999771118164, -1.0450284481048584, -0.9910567998886108, -0.9370852112770081, -0.8831136226654053, -0.8291420340538025, -0.7751704454421997, -0.7211987972259521, -0.6672272086143494, -0.6132556200027466, -0.559283971786499, -0.5053123831748962, -0.45134079456329346, -0.3973692059516907, -0.3433975875377655, -0.28942596912384033, -0.23545438051223755, -0.18148279190063477, -0.1275111734867096, -0.07353955507278442, -0.01956796646118164, 0.034403637051582336, 0.08837524056434631, 0.1423468440771103, 0.19631844758987427, 0.25029003620147705, 0.3042616546154022, 0.3582332730293274, 0.4122049808502197, 0.4661765694618225, 0.5201481580734253, 0.5741198062896729, 0.6280913949012756, 0.6820629835128784, 0.736034631729126, 0.7900062203407288, 0.8439778089523315, 0.8979493975639343, 0.9519209861755371, 1.0058926343917847, 1.0598642826080322, 1.1138358116149902, 1.1678074598312378, 1.2217791080474854, 1.2757506370544434, 1.329722285270691, 1.383693814277649, 1.4376654624938965, 1.4916369915008545, 1.545608639717102, 1.5995802879333496, 1.6535518169403076, 1.7075234651565552, 1.7614951133728027, 1.8154666423797607, 1.8694382905960083, 1.9234099388122559, 1.9773814678192139, 2.031352996826172, 2.085324764251709, 2.139296293258667]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 2.0, 7.0, 17.0, 24.0, 24.0, 26.0, 31.0, 49.0, 63.0, 45.0, 82.0, 108.0, 152.0, 198.0, 289.0, 498.0, 1018.0, 2326.0, 6708.0, 29136.0, 4042306.0, 92702.0, 11167.0, 3820.0, 1609.0, 774.0, 390.0, 222.0, 129.0, 101.0, 51.0, 44.0, 35.0, 34.0, 14.0, 18.0, 17.0, 8.0, 10.0, 7.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.16796875, -1.128631591796875, -1.08929443359375, -1.049957275390625, -1.0106201171875, -0.971282958984375, -0.93194580078125, -0.892608642578125, -0.853271484375, -0.813934326171875, -0.77459716796875, -0.735260009765625, -0.6959228515625, -0.656585693359375, -0.61724853515625, -0.577911376953125, -0.53857421875, -0.499237060546875, -0.45989990234375, -0.420562744140625, -0.3812255859375, -0.341888427734375, -0.30255126953125, -0.263214111328125, -0.223876953125, -0.184539794921875, -0.14520263671875, -0.105865478515625, -0.0665283203125, -0.027191162109375, 0.01214599609375, 0.051483154296875, 0.0908203125, 0.130157470703125, 0.16949462890625, 0.208831787109375, 0.2481689453125, 0.287506103515625, 0.32684326171875, 0.366180419921875, 0.405517578125, 0.444854736328125, 0.48419189453125, 0.523529052734375, 0.5628662109375, 0.602203369140625, 0.64154052734375, 0.680877685546875, 0.72021484375, 0.759552001953125, 0.79888916015625, 0.838226318359375, 0.8775634765625, 0.916900634765625, 0.95623779296875, 0.995574951171875, 1.034912109375, 1.074249267578125, 1.11358642578125, 1.152923583984375, 1.1922607421875, 1.231597900390625, 1.27093505859375, 1.310272216796875, 1.349609375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 9.0, 6.0, 14.0, 17.0, 29.0, 35.0, 44.0, 56.0, 51.0, 58.0, 73.0, 73.0, 77.0, 59.0, 65.0, 75.0, 49.0, 41.0, 43.0, 38.0, 16.0, 11.0, 16.0, 13.0, 12.0, 3.0, 2.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1444091796875, -0.14074325561523438, -0.13707733154296875, -0.13341140747070312, -0.1297454833984375, -0.12607955932617188, -0.12241363525390625, -0.11874771118164062, -0.115081787109375, -0.11141586303710938, -0.10774993896484375, -0.10408401489257812, -0.1004180908203125, -0.09675216674804688, -0.09308624267578125, -0.08942031860351562, -0.08575439453125, -0.08208847045898438, -0.07842254638671875, -0.07475662231445312, -0.0710906982421875, -0.06742477416992188, -0.06375885009765625, -0.060092926025390625, -0.056427001953125, -0.052761077880859375, -0.04909515380859375, -0.045429229736328125, -0.0417633056640625, -0.038097381591796875, -0.03443145751953125, -0.030765533447265625, -0.027099609375, -0.023433685302734375, -0.01976776123046875, -0.016101837158203125, -0.0124359130859375, -0.008769989013671875, -0.00510406494140625, -0.001438140869140625, 0.002227783203125, 0.005893707275390625, 0.00955963134765625, 0.013225555419921875, 0.0168914794921875, 0.020557403564453125, 0.02422332763671875, 0.027889251708984375, 0.03155517578125, 0.035221099853515625, 0.03888702392578125, 0.042552947998046875, 0.0462188720703125, 0.049884796142578125, 0.05355072021484375, 0.057216644287109375, 0.060882568359375, 0.06454849243164062, 0.06821441650390625, 0.07188034057617188, 0.0755462646484375, 0.07921218872070312, 0.08287811279296875, 0.08654403686523438, 0.0902099609375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 11.0, 10.0, 24.0, 29.0, 66.0, 88.0, 154.0, 330.0, 1178.0, 16566.0, 4159722.0, 14200.0, 1124.0, 355.0, 151.0, 111.0, 63.0, 40.0, 22.0, 16.0, 14.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.048828125, -1.943634033203125, -1.83843994140625, -1.733245849609375, -1.6280517578125, -1.522857666015625, -1.41766357421875, -1.312469482421875, -1.207275390625, -1.102081298828125, -0.99688720703125, -0.891693115234375, -0.7864990234375, -0.681304931640625, -0.57611083984375, -0.470916748046875, -0.36572265625, -0.260528564453125, -0.15533447265625, -0.050140380859375, 0.0550537109375, 0.160247802734375, 0.26544189453125, 0.370635986328125, 0.475830078125, 0.581024169921875, 0.68621826171875, 0.791412353515625, 0.8966064453125, 1.001800537109375, 1.10699462890625, 1.212188720703125, 1.3173828125, 1.422576904296875, 1.52777099609375, 1.632965087890625, 1.7381591796875, 1.843353271484375, 1.94854736328125, 2.053741455078125, 2.158935546875, 2.264129638671875, 2.36932373046875, 2.474517822265625, 2.5797119140625, 2.684906005859375, 2.79010009765625, 2.895294189453125, 3.00048828125, 3.105682373046875, 3.21087646484375, 3.316070556640625, 3.4212646484375, 3.526458740234375, 3.63165283203125, 3.736846923828125, 3.842041015625, 3.947235107421875, 4.05242919921875, 4.157623291015625, 4.2628173828125, 4.368011474609375, 4.47320556640625, 4.578399658203125, 4.68359375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 4.0, 11.0, 24.0, 53.0, 119.0, 1270.0, 2355.0, 129.0, 47.0, 28.0, 14.0, 13.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40673828125, -0.38910675048828125, -0.3714752197265625, -0.35384368896484375, -0.336212158203125, -0.31858062744140625, -0.3009490966796875, -0.28331756591796875, -0.26568603515625, -0.24805450439453125, -0.2304229736328125, -0.21279144287109375, -0.195159912109375, -0.17752838134765625, -0.1598968505859375, -0.14226531982421875, -0.1246337890625, -0.10700225830078125, -0.0893707275390625, -0.07173919677734375, -0.054107666015625, -0.03647613525390625, -0.0188446044921875, -0.00121307373046875, 0.01641845703125, 0.03404998779296875, 0.0516815185546875, 0.06931304931640625, 0.086944580078125, 0.10457611083984375, 0.1222076416015625, 0.13983917236328125, 0.157470703125, 0.17510223388671875, 0.1927337646484375, 0.21036529541015625, 0.227996826171875, 0.24562835693359375, 0.2632598876953125, 0.28089141845703125, 0.29852294921875, 0.31615447998046875, 0.3337860107421875, 0.35141754150390625, 0.369049072265625, 0.38668060302734375, 0.4043121337890625, 0.42194366455078125, 0.4395751953125, 0.45720672607421875, 0.4748382568359375, 0.49246978759765625, 0.510101318359375, 0.5277328491210938, 0.5453643798828125, 0.5629959106445312, 0.58062744140625, 0.5982589721679688, 0.6158905029296875, 0.6335220336914062, 0.651153564453125, 0.6687850952148438, 0.6864166259765625, 0.7040481567382812, 0.7216796875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 13.0, 54.0, 432.0, 425.0, 64.0, 18.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.034736633300781, -8.842652320861816, -8.650568962097168, -8.458484649658203, -8.266400337219238, -8.07431697845459, -7.882232666015625, -7.69014835357666, -7.4980645179748535, -7.305980682373047, -7.113896369934082, -6.921812534332275, -6.729728698730469, -6.537644386291504, -6.345560550689697, -6.153476715087891, -5.961392402648926, -5.769308567047119, -5.577224254608154, -5.385140419006348, -5.193056583404541, -5.000972270965576, -4.8088884353637695, -4.616804122924805, -4.424720764160156, -4.23263692855835, -4.040552616119385, -3.848468780517578, -3.6563847064971924, -3.4643006324768066, -3.272216796875, -3.0801327228546143, -2.8880486488342285, -2.6959645748138428, -2.503880739212036, -2.3117966651916504, -2.1197125911712646, -1.9276286363601685, -1.7355446815490723, -1.5434606075286865, -1.3513766527175903, -1.1592926979064941, -0.9672086238861084, -0.7751246690750122, -0.5830406546592712, -0.3909566402435303, -0.19887268543243408, -0.00678861141204834, 0.18529534339904785, 0.3773793578147888, 0.5694633722305298, 0.761547327041626, 0.9536313414573669, 1.145715355873108, 1.337799310684204, 1.5298833847045898, 1.721967339515686, 1.9140512943267822, 2.106135368347168, 2.2982192039489746, 2.4903032779693604, 2.682387351989746, 2.8744711875915527, 3.0665555000305176, 3.258639335632324]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 10.0, 7.0, 5.0, 10.0, 9.0, 10.0, 17.0, 12.0, 27.0, 26.0, 34.0, 41.0, 45.0, 46.0, 45.0, 43.0, 41.0, 48.0, 60.0, 56.0, 49.0, 51.0, 47.0, 35.0, 40.0, 30.0, 31.0, 29.0, 21.0, 15.0, 15.0, 7.0, 11.0, 13.0, 3.0, 4.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8361718058586121, -0.8124577403068542, -0.7887436747550964, -0.7650296688079834, -0.7413156032562256, -0.7176015377044678, -0.69388747215271, -0.6701734066009521, -0.6464593410491943, -0.6227452754974365, -0.5990312099456787, -0.5753171443939209, -0.5516031384468079, -0.52788907289505, -0.5041750073432922, -0.4804609417915344, -0.456746906042099, -0.4330328404903412, -0.40931880474090576, -0.38560473918914795, -0.36189067363739014, -0.3381766080856323, -0.3144625723361969, -0.2907485067844391, -0.26703447103500366, -0.24332042038440704, -0.21960635483264923, -0.1958923041820526, -0.1721782386302948, -0.14846418797969818, -0.12475013732910156, -0.10103607177734375, -0.07732200622558594, -0.05360794812440872, -0.029893893748521805, -0.006179839372634888, 0.017534218728542328, 0.04124827682971954, 0.06496232748031616, 0.08867639303207397, 0.1123904436826706, 0.1361044943332672, 0.15981855988502502, 0.18353261053562164, 0.20724666118621826, 0.23096072673797607, 0.2546747922897339, 0.2783888578414917, 0.3021028935909271, 0.32581695914268494, 0.34953099489212036, 0.3732450604438782, 0.396959125995636, 0.4206731915473938, 0.4443872272968292, 0.46810129284858704, 0.49181532859802246, 0.5155293941497803, 0.5392434597015381, 0.5629575252532959, 0.5866715312004089, 0.6103855967521667, 0.6340996623039246, 0.6578137278556824, 0.6815277934074402]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 7.0, 8.0, 8.0, 12.0, 16.0, 23.0, 31.0, 36.0, 33.0, 48.0, 72.0, 120.0, 147.0, 186.0, 277.0, 493.0, 907.0, 1815.0, 4184.0, 11022.0, 40240.0, 285683.0, 594000.0, 80031.0, 17722.0, 5865.0, 2494.0, 1182.0, 697.0, 397.0, 229.0, 161.0, 125.0, 66.0, 65.0, 39.0, 28.0, 21.0, 22.0, 14.0, 14.0, 6.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64208984375, -0.6201019287109375, -0.598114013671875, -0.5761260986328125, -0.55413818359375, -0.5321502685546875, -0.510162353515625, -0.4881744384765625, -0.4661865234375, -0.4441986083984375, -0.422210693359375, -0.4002227783203125, -0.37823486328125, -0.3562469482421875, -0.334259033203125, -0.3122711181640625, -0.290283203125, -0.2682952880859375, -0.246307373046875, -0.2243194580078125, -0.20233154296875, -0.1803436279296875, -0.158355712890625, -0.1363677978515625, -0.1143798828125, -0.0923919677734375, -0.070404052734375, -0.0484161376953125, -0.02642822265625, -0.0044403076171875, 0.017547607421875, 0.0395355224609375, 0.0615234375, 0.0835113525390625, 0.105499267578125, 0.1274871826171875, 0.14947509765625, 0.1714630126953125, 0.193450927734375, 0.2154388427734375, 0.2374267578125, 0.2594146728515625, 0.281402587890625, 0.3033905029296875, 0.32537841796875, 0.3473663330078125, 0.369354248046875, 0.3913421630859375, 0.413330078125, 0.4353179931640625, 0.457305908203125, 0.4792938232421875, 0.50128173828125, 0.5232696533203125, 0.545257568359375, 0.5672454833984375, 0.5892333984375, 0.6112213134765625, 0.633209228515625, 0.6551971435546875, 0.67718505859375, 0.6991729736328125, 0.721160888671875, 0.7431488037109375, 0.76513671875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 8.0, 3.0, 9.0, 13.0, 26.0, 25.0, 38.0, 42.0, 57.0, 58.0, 69.0, 68.0, 75.0, 62.0, 78.0, 68.0, 61.0, 56.0, 44.0, 34.0, 27.0, 22.0, 12.0, 10.0, 7.0, 8.0, 6.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.139892578125, -0.1357889175415039, -0.1316852569580078, -0.12758159637451172, -0.12347793579101562, -0.11937427520751953, -0.11527061462402344, -0.11116695404052734, -0.10706329345703125, -0.10295963287353516, -0.09885597229003906, -0.09475231170654297, -0.09064865112304688, -0.08654499053955078, -0.08244132995605469, -0.0783376693725586, -0.0742340087890625, -0.0701303482055664, -0.06602668762207031, -0.06192302703857422, -0.057819366455078125, -0.05371570587158203, -0.04961204528808594, -0.045508384704589844, -0.04140472412109375, -0.037301063537597656, -0.03319740295410156, -0.02909374237060547, -0.024990081787109375, -0.02088642120361328, -0.016782760620117188, -0.012679100036621094, -0.008575439453125, -0.004471778869628906, -0.0003681182861328125, 0.0037355422973632812, 0.007839202880859375, 0.011942863464355469, 0.016046524047851562, 0.020150184631347656, 0.02425384521484375, 0.028357505798339844, 0.03246116638183594, 0.03656482696533203, 0.040668487548828125, 0.04477214813232422, 0.04887580871582031, 0.052979469299316406, 0.0570831298828125, 0.061186790466308594, 0.06529045104980469, 0.06939411163330078, 0.07349777221679688, 0.07760143280029297, 0.08170509338378906, 0.08580875396728516, 0.08991241455078125, 0.09401607513427734, 0.09811973571777344, 0.10222339630126953, 0.10632705688476562, 0.11043071746826172, 0.11453437805175781, 0.1186380386352539, 0.12274169921875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 3.0, 10.0, 13.0, 17.0, 23.0, 28.0, 54.0, 89.0, 143.0, 303.0, 567.0, 1224.0, 2864.0, 7981.0, 30044.0, 185754.0, 648301.0, 135860.0, 23909.0, 6661.0, 2497.0, 1013.0, 541.0, 281.0, 140.0, 82.0, 44.0, 35.0, 22.0, 17.0, 8.0, 6.0, 8.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.372314453125, -0.3576698303222656, -0.34302520751953125, -0.3283805847167969, -0.3137359619140625, -0.2990913391113281, -0.28444671630859375, -0.2698020935058594, -0.255157470703125, -0.24051284790039062, -0.22586822509765625, -0.21122360229492188, -0.1965789794921875, -0.18193435668945312, -0.16728973388671875, -0.15264511108398438, -0.13800048828125, -0.12335586547851562, -0.10871124267578125, -0.09406661987304688, -0.0794219970703125, -0.06477737426757812, -0.05013275146484375, -0.035488128662109375, -0.020843505859375, -0.006198883056640625, 0.00844573974609375, 0.023090362548828125, 0.0377349853515625, 0.052379608154296875, 0.06702423095703125, 0.08166885375976562, 0.0963134765625, 0.11095809936523438, 0.12560272216796875, 0.14024734497070312, 0.1548919677734375, 0.16953659057617188, 0.18418121337890625, 0.19882583618164062, 0.213470458984375, 0.22811508178710938, 0.24275970458984375, 0.2574043273925781, 0.2720489501953125, 0.2866935729980469, 0.30133819580078125, 0.3159828186035156, 0.33062744140625, 0.3452720642089844, 0.35991668701171875, 0.3745613098144531, 0.3892059326171875, 0.4038505554199219, 0.41849517822265625, 0.4331398010253906, 0.447784423828125, 0.4624290466308594, 0.47707366943359375, 0.4917182922363281, 0.5063629150390625, 0.5210075378417969, 0.5356521606445312, 0.5502967834472656, 0.56494140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 11.0, 11.0, 13.0, 6.0, 13.0, 21.0, 20.0, 22.0, 29.0, 29.0, 32.0, 50.0, 48.0, 56.0, 53.0, 51.0, 50.0, 59.0, 54.0, 48.0, 37.0, 32.0, 47.0, 33.0, 27.0, 25.0, 24.0, 18.0, 15.0, 21.0, 11.0, 7.0, 3.0, 6.0, 8.0, 4.0, 6.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.354248046875, -0.3427276611328125, -0.331207275390625, -0.3196868896484375, -0.30816650390625, -0.2966461181640625, -0.285125732421875, -0.2736053466796875, -0.2620849609375, -0.2505645751953125, -0.239044189453125, -0.2275238037109375, -0.21600341796875, -0.2044830322265625, -0.192962646484375, -0.1814422607421875, -0.169921875, -0.1584014892578125, -0.146881103515625, -0.1353607177734375, -0.12384033203125, -0.1123199462890625, -0.100799560546875, -0.0892791748046875, -0.0777587890625, -0.0662384033203125, -0.054718017578125, -0.0431976318359375, -0.03167724609375, -0.0201568603515625, -0.008636474609375, 0.0028839111328125, 0.014404296875, 0.0259246826171875, 0.037445068359375, 0.0489654541015625, 0.06048583984375, 0.0720062255859375, 0.083526611328125, 0.0950469970703125, 0.1065673828125, 0.1180877685546875, 0.129608154296875, 0.1411285400390625, 0.15264892578125, 0.1641693115234375, 0.175689697265625, 0.1872100830078125, 0.19873046875, 0.2102508544921875, 0.221771240234375, 0.2332916259765625, 0.24481201171875, 0.2563323974609375, 0.267852783203125, 0.2793731689453125, 0.2908935546875, 0.3024139404296875, 0.313934326171875, 0.3254547119140625, 0.33697509765625, 0.3484954833984375, 0.360015869140625, 0.3715362548828125, 0.383056640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 6.0, 7.0, 8.0, 6.0, 11.0, 24.0, 38.0, 51.0, 87.0, 139.0, 249.0, 449.0, 942.0, 1792.0, 3885.0, 10321.0, 34301.0, 199144.0, 637847.0, 120248.0, 24589.0, 7910.0, 3269.0, 1495.0, 739.0, 392.0, 251.0, 129.0, 83.0, 54.0, 28.0, 24.0, 18.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.21630859375, -0.21052169799804688, -0.20473480224609375, -0.19894790649414062, -0.1931610107421875, -0.18737411499023438, -0.18158721923828125, -0.17580032348632812, -0.170013427734375, -0.16422653198242188, -0.15843963623046875, -0.15265274047851562, -0.1468658447265625, -0.14107894897460938, -0.13529205322265625, -0.12950515747070312, -0.12371826171875, -0.11793136596679688, -0.11214447021484375, -0.10635757446289062, -0.1005706787109375, -0.09478378295898438, -0.08899688720703125, -0.08320999145507812, -0.077423095703125, -0.07163619995117188, -0.06584930419921875, -0.060062408447265625, -0.0542755126953125, -0.048488616943359375, -0.04270172119140625, -0.036914825439453125, -0.0311279296875, -0.025341033935546875, -0.01955413818359375, -0.013767242431640625, -0.0079803466796875, -0.002193450927734375, 0.00359344482421875, 0.009380340576171875, 0.015167236328125, 0.020954132080078125, 0.02674102783203125, 0.032527923583984375, 0.0383148193359375, 0.044101715087890625, 0.04988861083984375, 0.055675506591796875, 0.06146240234375, 0.06724929809570312, 0.07303619384765625, 0.07882308959960938, 0.0846099853515625, 0.09039688110351562, 0.09618377685546875, 0.10197067260742188, 0.107757568359375, 0.11354446411132812, 0.11933135986328125, 0.12511825561523438, 0.1309051513671875, 0.13669204711914062, 0.14247894287109375, 0.14826583862304688, 0.154052734375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 11.0, 5.0, 9.0, 16.0, 15.0, 32.0, 48.0, 60.0, 100.0, 118.0, 167.0, 142.0, 88.0, 51.0, 25.0, 30.0, 13.0, 18.0, 10.0, 5.0, 5.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.4226646423339844e-05, -4.282314330339432e-05, -4.141964018344879e-05, -4.0016137063503265e-05, -3.861263394355774e-05, -3.720913082361221e-05, -3.580562770366669e-05, -3.440212458372116e-05, -3.2998621463775635e-05, -3.159511834383011e-05, -3.0191615223884583e-05, -2.8788112103939056e-05, -2.738460898399353e-05, -2.5981105864048004e-05, -2.4577602744102478e-05, -2.3174099624156952e-05, -2.1770596504211426e-05, -2.03670933842659e-05, -1.8963590264320374e-05, -1.7560087144374847e-05, -1.615658402442932e-05, -1.4753080904483795e-05, -1.3349577784538269e-05, -1.1946074664592743e-05, -1.0542571544647217e-05, -9.13906842470169e-06, -7.735565304756165e-06, -6.3320621848106384e-06, -4.928559064865112e-06, -3.525055944919586e-06, -2.12155282497406e-06, -7.180497050285339e-07, 6.854534149169922e-07, 2.0889565348625183e-06, 3.4924596548080444e-06, 4.8959627747535706e-06, 6.299465894699097e-06, 7.702969014644623e-06, 9.106472134590149e-06, 1.0509975254535675e-05, 1.1913478374481201e-05, 1.3316981494426727e-05, 1.4720484614372253e-05, 1.612398773431778e-05, 1.7527490854263306e-05, 1.8930993974208832e-05, 2.0334497094154358e-05, 2.1738000214099884e-05, 2.314150333404541e-05, 2.4545006453990936e-05, 2.5948509573936462e-05, 2.735201269388199e-05, 2.8755515813827515e-05, 3.015901893377304e-05, 3.156252205371857e-05, 3.296602517366409e-05, 3.436952829360962e-05, 3.5773031413555145e-05, 3.717653453350067e-05, 3.85800376534462e-05, 3.9983540773391724e-05, 4.138704389333725e-05, 4.2790547013282776e-05, 4.41940501332283e-05, 4.559755325317383e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 9.0, 14.0, 16.0, 25.0, 48.0, 64.0, 125.0, 204.0, 439.0, 993.0, 2119.0, 6202.0, 29211.0, 452437.0, 513959.0, 31665.0, 6812.0, 2261.0, 930.0, 467.0, 248.0, 119.0, 71.0, 41.0, 31.0, 11.0, 15.0, 9.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.28173828125, -0.2723541259765625, -0.262969970703125, -0.2535858154296875, -0.24420166015625, -0.2348175048828125, -0.225433349609375, -0.2160491943359375, -0.2066650390625, -0.1972808837890625, -0.187896728515625, -0.1785125732421875, -0.16912841796875, -0.1597442626953125, -0.150360107421875, -0.1409759521484375, -0.131591796875, -0.1222076416015625, -0.112823486328125, -0.1034393310546875, -0.09405517578125, -0.0846710205078125, -0.075286865234375, -0.0659027099609375, -0.0565185546875, -0.0471343994140625, -0.037750244140625, -0.0283660888671875, -0.01898193359375, -0.0095977783203125, -0.000213623046875, 0.0091705322265625, 0.0185546875, 0.0279388427734375, 0.037322998046875, 0.0467071533203125, 0.05609130859375, 0.0654754638671875, 0.074859619140625, 0.0842437744140625, 0.0936279296875, 0.1030120849609375, 0.112396240234375, 0.1217803955078125, 0.13116455078125, 0.1405487060546875, 0.149932861328125, 0.1593170166015625, 0.168701171875, 0.1780853271484375, 0.187469482421875, 0.1968536376953125, 0.20623779296875, 0.2156219482421875, 0.225006103515625, 0.2343902587890625, 0.2437744140625, 0.2531585693359375, 0.262542724609375, 0.2719268798828125, 0.28131103515625, 0.2906951904296875, 0.300079345703125, 0.3094635009765625, 0.31884765625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 5.0, 8.0, 11.0, 14.0, 11.0, 24.0, 28.0, 37.0, 57.0, 56.0, 89.0, 138.0, 112.0, 88.0, 106.0, 54.0, 37.0, 20.0, 31.0, 19.0, 10.0, 10.0, 6.0, 3.0, 5.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.159912109375, -0.15479278564453125, -0.1496734619140625, -0.14455413818359375, -0.139434814453125, -0.13431549072265625, -0.1291961669921875, -0.12407684326171875, -0.11895751953125, -0.11383819580078125, -0.1087188720703125, -0.10359954833984375, -0.098480224609375, -0.09336090087890625, -0.0882415771484375, -0.08312225341796875, -0.0780029296875, -0.07288360595703125, -0.0677642822265625, -0.06264495849609375, -0.057525634765625, -0.05240631103515625, -0.0472869873046875, -0.04216766357421875, -0.03704833984375, -0.03192901611328125, -0.0268096923828125, -0.02169036865234375, -0.016571044921875, -0.01145172119140625, -0.0063323974609375, -0.00121307373046875, 0.00390625, 0.00902557373046875, 0.0141448974609375, 0.01926422119140625, 0.024383544921875, 0.02950286865234375, 0.0346221923828125, 0.03974151611328125, 0.04486083984375, 0.04998016357421875, 0.0550994873046875, 0.06021881103515625, 0.065338134765625, 0.07045745849609375, 0.0755767822265625, 0.08069610595703125, 0.0858154296875, 0.09093475341796875, 0.0960540771484375, 0.10117340087890625, 0.106292724609375, 0.11141204833984375, 0.1165313720703125, 0.12165069580078125, 0.12677001953125, 0.13188934326171875, 0.1370086669921875, 0.14212799072265625, 0.147247314453125, 0.15236663818359375, 0.1574859619140625, 0.16260528564453125, 0.167724609375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 16.0, 41.0, 137.0, 375.0, 307.0, 103.0, 18.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7570672035217285, -4.540345668792725, -4.3236236572265625, -4.106902122497559, -3.8901805877685547, -3.6734588146209717, -3.4567370414733887, -3.2400155067443848, -3.0232937335968018, -2.8065719604492188, -2.589850425720215, -2.373128652572632, -2.156406879425049, -1.939685344696045, -1.722963571548462, -1.5062419176101685, -1.289520263671875, -1.0727986097335815, -0.8560768961906433, -0.6393551826477051, -0.4226335287094116, -0.20591187477111816, 0.010809898376464844, 0.2275315523147583, 0.44425320625305176, 0.6609748601913452, 0.8776965737342834, 1.0944182872772217, 1.3111399412155151, 1.5278615951538086, 1.7445833683013916, 1.961305022239685, 2.1780261993408203, 2.3947479724884033, 2.6114695072174072, 2.8281912803649902, 3.044912815093994, 3.261634588241577, 3.47835636138916, 3.695077896118164, 3.911799669265747, 4.12852144241333, 4.345242977142334, 4.561964988708496, 4.7786865234375, 4.995408058166504, 5.212129592895508, 5.42885160446167, 5.645573139190674, 5.862294673919678, 6.07901668548584, 6.295738220214844, 6.512459754943848, 6.729181289672852, 6.945903301239014, 7.162624835968018, 7.37934684753418, 7.596068382263184, 7.812790393829346, 8.029512405395508, 8.246233940124512, 8.462955474853516, 8.67967700958252, 8.896398544311523, 9.113120079040527]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 10.0, 10.0, 14.0, 7.0, 7.0, 18.0, 21.0, 15.0, 20.0, 21.0, 27.0, 40.0, 36.0, 39.0, 41.0, 39.0, 44.0, 42.0, 45.0, 46.0, 31.0, 40.0, 36.0, 37.0, 27.0, 35.0, 29.0, 30.0, 29.0, 22.0, 18.0, 18.0, 11.0, 18.0, 12.0, 12.0, 11.0, 11.0, 7.0, 3.0, 1.0, 1.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7789396047592163, -1.7249284982681274, -1.6709175109863281, -1.6169064044952393, -1.56289541721344, -1.508884310722351, -1.4548733234405518, -1.400862216949463, -1.346851110458374, -1.2928400039672852, -1.2388290166854858, -1.184817910194397, -1.1308069229125977, -1.0767958164215088, -1.02278470993042, -0.9687737226486206, -0.9147627353668213, -0.8607516884803772, -0.8067406415939331, -0.7527295351028442, -0.6987185478210449, -0.644707441329956, -0.590696394443512, -0.5366853475570679, -0.4826743006706238, -0.4286632537841797, -0.3746522068977356, -0.3206411302089691, -0.266630083322525, -0.21261903643608093, -0.15860795974731445, -0.10459691286087036, -0.05058574676513672, 0.00342530757188797, 0.05743636190891266, 0.11144742369651794, 0.16545847058296204, 0.21946951746940613, 0.2734805941581726, 0.3274916410446167, 0.3815026879310608, 0.4355137348175049, 0.489524781703949, 0.5435358285903931, 0.5975469350814819, 0.6515579223632812, 0.7055690288543701, 0.7595800757408142, 0.8135911226272583, 0.8676021695137024, 0.9216132164001465, 0.9756243228912354, 1.0296353101730347, 1.0836464166641235, 1.1376574039459229, 1.1916685104370117, 1.2456796169281006, 1.2996907234191895, 1.3537017107009888, 1.4077128171920776, 1.461723804473877, 1.5157349109649658, 1.5697460174560547, 1.623757004737854, 1.6777679920196533]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 10.0, 8.0, 12.0, 15.0, 22.0, 27.0, 43.0, 66.0, 97.0, 150.0, 262.0, 465.0, 905.0, 2345.0, 8555.0, 126287.0, 4029817.0, 18685.0, 3931.0, 1322.0, 568.0, 277.0, 127.0, 106.0, 58.0, 29.0, 22.0, 22.0, 13.0, 7.0, 7.0, 3.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4267578125, -1.377899169921875, -1.32904052734375, -1.280181884765625, -1.2313232421875, -1.182464599609375, -1.13360595703125, -1.084747314453125, -1.035888671875, -0.987030029296875, -0.93817138671875, -0.889312744140625, -0.8404541015625, -0.791595458984375, -0.74273681640625, -0.693878173828125, -0.64501953125, -0.596160888671875, -0.54730224609375, -0.498443603515625, -0.4495849609375, -0.400726318359375, -0.35186767578125, -0.303009033203125, -0.254150390625, -0.205291748046875, -0.15643310546875, -0.107574462890625, -0.0587158203125, -0.009857177734375, 0.03900146484375, 0.087860107421875, 0.13671875, 0.185577392578125, 0.23443603515625, 0.283294677734375, 0.3321533203125, 0.381011962890625, 0.42987060546875, 0.478729248046875, 0.527587890625, 0.576446533203125, 0.62530517578125, 0.674163818359375, 0.7230224609375, 0.771881103515625, 0.82073974609375, 0.869598388671875, 0.91845703125, 0.967315673828125, 1.01617431640625, 1.065032958984375, 1.1138916015625, 1.162750244140625, 1.21160888671875, 1.260467529296875, 1.309326171875, 1.358184814453125, 1.40704345703125, 1.455902099609375, 1.5047607421875, 1.553619384765625, 1.60247802734375, 1.651336669921875, 1.7001953125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 5.0, 8.0, 9.0, 11.0, 13.0, 18.0, 32.0, 47.0, 47.0, 39.0, 51.0, 71.0, 62.0, 72.0, 71.0, 53.0, 59.0, 50.0, 52.0, 40.0, 45.0, 36.0, 25.0, 26.0, 6.0, 11.0, 10.0, 6.0, 6.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.13330078125, -0.12950611114501953, -0.12571144104003906, -0.1219167709350586, -0.11812210083007812, -0.11432743072509766, -0.11053276062011719, -0.10673809051513672, -0.10294342041015625, -0.09914875030517578, -0.09535408020019531, -0.09155941009521484, -0.08776473999023438, -0.0839700698852539, -0.08017539978027344, -0.07638072967529297, -0.0725860595703125, -0.06879138946533203, -0.06499671936035156, -0.061202049255371094, -0.057407379150390625, -0.053612709045410156, -0.04981803894042969, -0.04602336883544922, -0.04222869873046875, -0.03843402862548828, -0.03463935852050781, -0.030844688415527344, -0.027050018310546875, -0.023255348205566406, -0.019460678100585938, -0.01566600799560547, -0.011871337890625, -0.008076667785644531, -0.0042819976806640625, -0.00048732757568359375, 0.003307342529296875, 0.007102012634277344, 0.010896682739257812, 0.014691352844238281, 0.01848602294921875, 0.02228069305419922, 0.026075363159179688, 0.029870033264160156, 0.033664703369140625, 0.037459373474121094, 0.04125404357910156, 0.04504871368408203, 0.0488433837890625, 0.05263805389404297, 0.05643272399902344, 0.060227394104003906, 0.06402206420898438, 0.06781673431396484, 0.07161140441894531, 0.07540607452392578, 0.07920074462890625, 0.08299541473388672, 0.08679008483886719, 0.09058475494384766, 0.09437942504882812, 0.0981740951538086, 0.10196876525878906, 0.10576343536376953, 0.10955810546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 8.0, 8.0, 30.0, 44.0, 75.0, 130.0, 267.0, 728.0, 4631.0, 4083887.0, 101117.0, 2356.0, 506.0, 207.0, 123.0, 63.0, 50.0, 20.0, 13.0, 9.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.330078125, -2.223480224609375, -2.11688232421875, -2.010284423828125, -1.9036865234375, -1.797088623046875, -1.69049072265625, -1.583892822265625, -1.477294921875, -1.370697021484375, -1.26409912109375, -1.157501220703125, -1.0509033203125, -0.944305419921875, -0.83770751953125, -0.731109619140625, -0.62451171875, -0.517913818359375, -0.41131591796875, -0.304718017578125, -0.1981201171875, -0.091522216796875, 0.01507568359375, 0.121673583984375, 0.228271484375, 0.334869384765625, 0.44146728515625, 0.548065185546875, 0.6546630859375, 0.761260986328125, 0.86785888671875, 0.974456787109375, 1.0810546875, 1.187652587890625, 1.29425048828125, 1.400848388671875, 1.5074462890625, 1.614044189453125, 1.72064208984375, 1.827239990234375, 1.933837890625, 2.040435791015625, 2.14703369140625, 2.253631591796875, 2.3602294921875, 2.466827392578125, 2.57342529296875, 2.680023193359375, 2.78662109375, 2.893218994140625, 2.99981689453125, 3.106414794921875, 3.2130126953125, 3.319610595703125, 3.42620849609375, 3.532806396484375, 3.639404296875, 3.746002197265625, 3.85260009765625, 3.959197998046875, 4.0657958984375, 4.172393798828125, 4.27899169921875, 4.385589599609375, 4.4921875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 16.0, 25.0, 30.0, 99.0, 1660.0, 2048.0, 107.0, 53.0, 17.0, 9.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5224609375, -0.4976043701171875, -0.472747802734375, -0.4478912353515625, -0.42303466796875, -0.3981781005859375, -0.373321533203125, -0.3484649658203125, -0.3236083984375, -0.2987518310546875, -0.273895263671875, -0.2490386962890625, -0.22418212890625, -0.1993255615234375, -0.174468994140625, -0.1496124267578125, -0.124755859375, -0.0998992919921875, -0.075042724609375, -0.0501861572265625, -0.02532958984375, -0.0004730224609375, 0.024383544921875, 0.0492401123046875, 0.0740966796875, 0.0989532470703125, 0.123809814453125, 0.1486663818359375, 0.17352294921875, 0.1983795166015625, 0.223236083984375, 0.2480926513671875, 0.27294921875, 0.2978057861328125, 0.322662353515625, 0.3475189208984375, 0.37237548828125, 0.3972320556640625, 0.422088623046875, 0.4469451904296875, 0.4718017578125, 0.4966583251953125, 0.521514892578125, 0.5463714599609375, 0.57122802734375, 0.5960845947265625, 0.620941162109375, 0.6457977294921875, 0.670654296875, 0.6955108642578125, 0.720367431640625, 0.7452239990234375, 0.77008056640625, 0.7949371337890625, 0.819793701171875, 0.8446502685546875, 0.8695068359375, 0.8943634033203125, 0.919219970703125, 0.9440765380859375, 0.96893310546875, 0.9937896728515625, 1.018646240234375, 1.0435028076171875, 1.068359375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 19.0, 60.0, 235.0, 463.0, 145.0, 52.0, 8.0, 10.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.52065372467041, -6.373555660247803, -6.226457595825195, -6.079359531402588, -5.9322614669799805, -5.785163879394531, -5.638065814971924, -5.490967750549316, -5.343869686126709, -5.196771621704102, -5.049673557281494, -4.902575492858887, -4.7554779052734375, -4.60837984085083, -4.461281776428223, -4.314183712005615, -4.167085647583008, -4.0199875831604, -3.872889518737793, -3.7257916927337646, -3.5786936283111572, -3.43159556388855, -3.2844977378845215, -3.137399673461914, -2.9903016090393066, -2.843203544616699, -2.696105480194092, -2.5490076541900635, -2.401909589767456, -2.2548115253448486, -2.1077136993408203, -1.960615634918213, -1.8135180473327637, -1.6664199829101562, -1.5193220376968384, -1.3722240924835205, -1.225126028060913, -1.0780279636383057, -0.9309300184249878, -0.7838320732116699, -0.6367340087890625, -0.48963600397109985, -0.3425379991531372, -0.19543999433517456, -0.048341989517211914, 0.09875601530075073, 0.24585402011871338, 0.39295196533203125, 0.5400500297546387, 0.6871480345726013, 0.834246039390564, 0.9813440442085266, 1.1284420490264893, 1.2755401134490967, 1.4226380586624146, 1.5697360038757324, 1.7168340682983398, 1.8639321327209473, 2.0110301971435547, 2.158128023147583, 2.3052260875701904, 2.452324151992798, 2.599421977996826, 2.7465200424194336, 2.893618106842041]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 6.0, 11.0, 19.0, 26.0, 33.0, 50.0, 71.0, 96.0, 103.0, 113.0, 90.0, 92.0, 79.0, 76.0, 48.0, 28.0, 24.0, 14.0, 9.0, 9.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7571296691894531, -1.6938321590423584, -1.6305346488952637, -1.567237138748169, -1.5039396286010742, -1.4406421184539795, -1.3773447275161743, -1.3140472173690796, -1.2507497072219849, -1.1874521970748901, -1.1241546869277954, -1.0608571767807007, -0.9975597262382507, -0.934262216091156, -0.870964765548706, -0.8076672554016113, -0.7443697452545166, -0.6810722351074219, -0.6177747249603271, -0.5544772744178772, -0.49117976427078247, -0.42788225412368774, -0.3645847737789154, -0.30128729343414307, -0.23798978328704834, -0.1746922880411148, -0.11139479279518127, -0.04809729754924774, 0.015200197696685791, 0.07849770784378052, 0.14179518818855286, 0.2050926685333252, 0.2683901786804199, 0.33168768882751465, 0.394985169172287, 0.4582826495170593, 0.521580159664154, 0.5848776698112488, 0.6481751203536987, 0.7114726305007935, 0.7747701406478882, 0.8380676507949829, 0.9013651609420776, 0.9646626114845276, 1.0279600620269775, 1.0912575721740723, 1.154555082321167, 1.2178525924682617, 1.2811501026153564, 1.3444476127624512, 1.407745122909546, 1.4710426330566406, 1.5343401432037354, 1.59763765335083, 1.6609350442886353, 1.72423255443573, 1.7875300645828247, 1.8508275747299194, 1.9141250848770142, 1.9774225950241089, 2.040719985961914, 2.104017496109009, 2.1673150062561035, 2.2306125164031982, 2.293910026550293]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 8.0, 7.0, 10.0, 20.0, 23.0, 42.0, 59.0, 86.0, 182.0, 242.0, 435.0, 845.0, 1920.0, 5179.0, 19603.0, 150139.0, 743585.0, 102610.0, 15699.0, 4275.0, 1751.0, 746.0, 411.0, 258.0, 142.0, 113.0, 46.0, 25.0, 27.0, 18.0, 12.0, 11.0, 2.0, 2.0, 4.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.78369140625, -0.7570571899414062, -0.7304229736328125, -0.7037887573242188, -0.677154541015625, -0.6505203247070312, -0.6238861083984375, -0.5972518920898438, -0.57061767578125, -0.5439834594726562, -0.5173492431640625, -0.49071502685546875, -0.464080810546875, -0.43744659423828125, -0.4108123779296875, -0.38417816162109375, -0.3575439453125, -0.33090972900390625, -0.3042755126953125, -0.27764129638671875, -0.251007080078125, -0.22437286376953125, -0.1977386474609375, -0.17110443115234375, -0.14447021484375, -0.11783599853515625, -0.0912017822265625, -0.06456756591796875, -0.037933349609375, -0.01129913330078125, 0.0153350830078125, 0.04196929931640625, 0.068603515625, 0.09523773193359375, 0.1218719482421875, 0.14850616455078125, 0.175140380859375, 0.20177459716796875, 0.2284088134765625, 0.25504302978515625, 0.28167724609375, 0.30831146240234375, 0.3349456787109375, 0.36157989501953125, 0.388214111328125, 0.41484832763671875, 0.4414825439453125, 0.46811676025390625, 0.4947509765625, 0.5213851928710938, 0.5480194091796875, 0.5746536254882812, 0.601287841796875, 0.6279220581054688, 0.6545562744140625, 0.6811904907226562, 0.70782470703125, 0.7344589233398438, 0.7610931396484375, 0.7877273559570312, 0.814361572265625, 0.8409957885742188, 0.8676300048828125, 0.8942642211914062, 0.9208984375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 5.0, 10.0, 11.0, 17.0, 18.0, 18.0, 33.0, 42.0, 44.0, 58.0, 52.0, 61.0, 53.0, 57.0, 55.0, 68.0, 51.0, 42.0, 41.0, 50.0, 30.0, 43.0, 22.0, 19.0, 20.0, 12.0, 11.0, 10.0, 4.0, 5.0, 5.0, 3.0, 4.0, 6.0, 2.0, 0.0, 1.0, 5.0], "bins": [-0.1470947265625, -0.1434154510498047, -0.13973617553710938, -0.13605690002441406, -0.13237762451171875, -0.12869834899902344, -0.12501907348632812, -0.12133979797363281, -0.1176605224609375, -0.11398124694824219, -0.11030197143554688, -0.10662269592285156, -0.10294342041015625, -0.09926414489746094, -0.09558486938476562, -0.09190559387207031, -0.088226318359375, -0.08454704284667969, -0.08086776733398438, -0.07718849182128906, -0.07350921630859375, -0.06982994079589844, -0.06615066528320312, -0.06247138977050781, -0.0587921142578125, -0.05511283874511719, -0.051433563232421875, -0.04775428771972656, -0.04407501220703125, -0.04039573669433594, -0.036716461181640625, -0.03303718566894531, -0.02935791015625, -0.025678634643554688, -0.021999359130859375, -0.018320083618164062, -0.01464080810546875, -0.010961532592773438, -0.007282257080078125, -0.0036029815673828125, 7.62939453125e-05, 0.0037555694580078125, 0.007434844970703125, 0.011114120483398438, 0.01479339599609375, 0.018472671508789062, 0.022151947021484375, 0.025831222534179688, 0.029510498046875, 0.03318977355957031, 0.036869049072265625, 0.04054832458496094, 0.04422760009765625, 0.04790687561035156, 0.051586151123046875, 0.05526542663574219, 0.0589447021484375, 0.06262397766113281, 0.06630325317382812, 0.06998252868652344, 0.07366180419921875, 0.07734107971191406, 0.08102035522460938, 0.08469963073730469, 0.08837890625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 6.0, 6.0, 15.0, 21.0, 18.0, 43.0, 54.0, 97.0, 160.0, 293.0, 625.0, 1668.0, 5080.0, 20011.0, 139923.0, 710948.0, 141235.0, 20306.0, 5017.0, 1643.0, 628.0, 297.0, 170.0, 94.0, 69.0, 29.0, 13.0, 13.0, 20.0, 8.0, 8.0, 9.0, 5.0, 2.0, 8.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.525390625, -0.5087127685546875, -0.492034912109375, -0.4753570556640625, -0.45867919921875, -0.4420013427734375, -0.425323486328125, -0.4086456298828125, -0.3919677734375, -0.3752899169921875, -0.358612060546875, -0.3419342041015625, -0.32525634765625, -0.3085784912109375, -0.291900634765625, -0.2752227783203125, -0.258544921875, -0.2418670654296875, -0.225189208984375, -0.2085113525390625, -0.19183349609375, -0.1751556396484375, -0.158477783203125, -0.1417999267578125, -0.1251220703125, -0.1084442138671875, -0.091766357421875, -0.0750885009765625, -0.05841064453125, -0.0417327880859375, -0.025054931640625, -0.0083770751953125, 0.00830078125, 0.0249786376953125, 0.041656494140625, 0.0583343505859375, 0.07501220703125, 0.0916900634765625, 0.108367919921875, 0.1250457763671875, 0.1417236328125, 0.1584014892578125, 0.175079345703125, 0.1917572021484375, 0.20843505859375, 0.2251129150390625, 0.241790771484375, 0.2584686279296875, 0.275146484375, 0.2918243408203125, 0.308502197265625, 0.3251800537109375, 0.34185791015625, 0.3585357666015625, 0.375213623046875, 0.3918914794921875, 0.4085693359375, 0.4252471923828125, 0.441925048828125, 0.4586029052734375, 0.47528076171875, 0.4919586181640625, 0.508636474609375, 0.5253143310546875, 0.5419921875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 5.0, 8.0, 15.0, 16.0, 14.0, 14.0, 19.0, 20.0, 24.0, 27.0, 31.0, 38.0, 36.0, 40.0, 44.0, 51.0, 54.0, 61.0, 39.0, 49.0, 51.0, 36.0, 36.0, 39.0, 36.0, 28.0, 32.0, 16.0, 23.0, 23.0, 17.0, 10.0, 9.0, 9.0, 7.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3583984375, -0.34630584716796875, -0.3342132568359375, -0.32212066650390625, -0.310028076171875, -0.29793548583984375, -0.2858428955078125, -0.27375030517578125, -0.26165771484375, -0.24956512451171875, -0.2374725341796875, -0.22537994384765625, -0.213287353515625, -0.20119476318359375, -0.1891021728515625, -0.17700958251953125, -0.1649169921875, -0.15282440185546875, -0.1407318115234375, -0.12863922119140625, -0.116546630859375, -0.10445404052734375, -0.0923614501953125, -0.08026885986328125, -0.06817626953125, -0.05608367919921875, -0.0439910888671875, -0.03189849853515625, -0.019805908203125, -0.00771331787109375, 0.0043792724609375, 0.01647186279296875, 0.028564453125, 0.04065704345703125, 0.0527496337890625, 0.06484222412109375, 0.076934814453125, 0.08902740478515625, 0.1011199951171875, 0.11321258544921875, 0.12530517578125, 0.13739776611328125, 0.1494903564453125, 0.16158294677734375, 0.173675537109375, 0.18576812744140625, 0.1978607177734375, 0.20995330810546875, 0.2220458984375, 0.23413848876953125, 0.2462310791015625, 0.25832366943359375, 0.270416259765625, 0.28250885009765625, 0.2946014404296875, 0.30669403076171875, 0.31878662109375, 0.33087921142578125, 0.3429718017578125, 0.35506439208984375, 0.367156982421875, 0.37924957275390625, 0.3913421630859375, 0.40343475341796875, 0.41552734375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 7.0, 9.0, 5.0, 12.0, 19.0, 24.0, 29.0, 60.0, 83.0, 164.0, 254.0, 479.0, 1073.0, 2888.0, 10464.0, 61322.0, 593243.0, 333653.0, 33931.0, 6971.0, 2072.0, 843.0, 392.0, 203.0, 108.0, 83.0, 50.0, 37.0, 25.0, 13.0, 8.0, 7.0, 6.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1461181640625, -0.14067649841308594, -0.13523483276367188, -0.1297931671142578, -0.12435150146484375, -0.11890983581542969, -0.11346817016601562, -0.10802650451660156, -0.1025848388671875, -0.09714317321777344, -0.09170150756835938, -0.08625984191894531, -0.08081817626953125, -0.07537651062011719, -0.06993484497070312, -0.06449317932128906, -0.059051513671875, -0.05360984802246094, -0.048168182373046875, -0.04272651672363281, -0.03728485107421875, -0.03184318542480469, -0.026401519775390625, -0.020959854125976562, -0.0155181884765625, -0.010076522827148438, -0.004634857177734375, 0.0008068084716796875, 0.00624847412109375, 0.011690139770507812, 0.017131805419921875, 0.022573471069335938, 0.02801513671875, 0.03345680236816406, 0.038898468017578125, 0.04434013366699219, 0.04978179931640625, 0.05522346496582031, 0.060665130615234375, 0.06610679626464844, 0.0715484619140625, 0.07699012756347656, 0.08243179321289062, 0.08787345886230469, 0.09331512451171875, 0.09875679016113281, 0.10419845581054688, 0.10964012145996094, 0.115081787109375, 0.12052345275878906, 0.12596511840820312, 0.1314067840576172, 0.13684844970703125, 0.1422901153564453, 0.14773178100585938, 0.15317344665527344, 0.1586151123046875, 0.16405677795410156, 0.16949844360351562, 0.1749401092529297, 0.18038177490234375, 0.1858234405517578, 0.19126510620117188, 0.19670677185058594, 0.2021484375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 7.0, 3.0, 4.0, 10.0, 17.0, 15.0, 25.0, 25.0, 43.0, 70.0, 81.0, 138.0, 145.0, 111.0, 84.0, 57.0, 35.0, 25.0, 28.0, 20.0, 10.0, 7.0, 12.0, 6.0, 4.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.647804260253906e-05, -3.5313889384269714e-05, -3.4149736166000366e-05, -3.298558294773102e-05, -3.182142972946167e-05, -3.065727651119232e-05, -2.9493123292922974e-05, -2.8328970074653625e-05, -2.7164816856384277e-05, -2.600066363811493e-05, -2.483651041984558e-05, -2.3672357201576233e-05, -2.2508203983306885e-05, -2.1344050765037537e-05, -2.017989754676819e-05, -1.901574432849884e-05, -1.7851591110229492e-05, -1.6687437891960144e-05, -1.5523284673690796e-05, -1.4359131455421448e-05, -1.31949782371521e-05, -1.2030825018882751e-05, -1.0866671800613403e-05, -9.702518582344055e-06, -8.538365364074707e-06, -7.374212145805359e-06, -6.210058927536011e-06, -5.045905709266663e-06, -3.8817524909973145e-06, -2.7175992727279663e-06, -1.5534460544586182e-06, -3.8929283618927e-07, 7.748603820800781e-07, 1.9390136003494263e-06, 3.1031668186187744e-06, 4.2673200368881226e-06, 5.431473255157471e-06, 6.595626473426819e-06, 7.759779691696167e-06, 8.923932909965515e-06, 1.0088086128234863e-05, 1.1252239346504211e-05, 1.241639256477356e-05, 1.3580545783042908e-05, 1.4744699001312256e-05, 1.5908852219581604e-05, 1.7073005437850952e-05, 1.82371586561203e-05, 1.940131187438965e-05, 2.0565465092658997e-05, 2.1729618310928345e-05, 2.2893771529197693e-05, 2.405792474746704e-05, 2.522207796573639e-05, 2.6386231184005737e-05, 2.7550384402275085e-05, 2.8714537620544434e-05, 2.9878690838813782e-05, 3.104284405708313e-05, 3.220699727535248e-05, 3.3371150493621826e-05, 3.4535303711891174e-05, 3.569945693016052e-05, 3.686361014842987e-05, 3.802776336669922e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 15.0, 17.0, 23.0, 44.0, 94.0, 203.0, 398.0, 1141.0, 3965.0, 20100.0, 264550.0, 706593.0, 41988.0, 6629.0, 1714.0, 559.0, 265.0, 108.0, 49.0, 28.0, 21.0, 10.0, 13.0, 2.0, 2.0, 5.0, 8.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.32861328125, -0.3206329345703125, -0.312652587890625, -0.3046722412109375, -0.29669189453125, -0.2887115478515625, -0.280731201171875, -0.2727508544921875, -0.2647705078125, -0.2567901611328125, -0.248809814453125, -0.2408294677734375, -0.23284912109375, -0.2248687744140625, -0.216888427734375, -0.2089080810546875, -0.200927734375, -0.1929473876953125, -0.184967041015625, -0.1769866943359375, -0.16900634765625, -0.1610260009765625, -0.153045654296875, -0.1450653076171875, -0.1370849609375, -0.1291046142578125, -0.121124267578125, -0.1131439208984375, -0.10516357421875, -0.0971832275390625, -0.089202880859375, -0.0812225341796875, -0.0732421875, -0.0652618408203125, -0.057281494140625, -0.0493011474609375, -0.04132080078125, -0.0333404541015625, -0.025360107421875, -0.0173797607421875, -0.0093994140625, -0.0014190673828125, 0.006561279296875, 0.0145416259765625, 0.02252197265625, 0.0305023193359375, 0.038482666015625, 0.0464630126953125, 0.054443359375, 0.0624237060546875, 0.070404052734375, 0.0783843994140625, 0.08636474609375, 0.0943450927734375, 0.102325439453125, 0.1103057861328125, 0.1182861328125, 0.1262664794921875, 0.134246826171875, 0.1422271728515625, 0.15020751953125, 0.1581878662109375, 0.166168212890625, 0.1741485595703125, 0.18212890625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 6.0, 7.0, 15.0, 4.0, 22.0, 3.0, 23.0, 37.0, 58.0, 80.0, 97.0, 142.0, 107.0, 113.0, 75.0, 61.0, 49.0, 24.0, 19.0, 13.0, 10.0, 8.0, 9.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1724853515625, -0.1674365997314453, -0.16238784790039062, -0.15733909606933594, -0.15229034423828125, -0.14724159240722656, -0.14219284057617188, -0.1371440887451172, -0.1320953369140625, -0.1270465850830078, -0.12199783325195312, -0.11694908142089844, -0.11190032958984375, -0.10685157775878906, -0.10180282592773438, -0.09675407409667969, -0.091705322265625, -0.08665657043457031, -0.08160781860351562, -0.07655906677246094, -0.07151031494140625, -0.06646156311035156, -0.061412811279296875, -0.05636405944824219, -0.0513153076171875, -0.04626655578613281, -0.041217803955078125, -0.03616905212402344, -0.03112030029296875, -0.026071548461914062, -0.021022796630859375, -0.015974044799804688, -0.01092529296875, -0.0058765411376953125, -0.000827789306640625, 0.0042209625244140625, 0.00926971435546875, 0.014318466186523438, 0.019367218017578125, 0.024415969848632812, 0.0294647216796875, 0.03451347351074219, 0.039562225341796875, 0.04461097717285156, 0.04965972900390625, 0.05470848083496094, 0.059757232666015625, 0.06480598449707031, 0.069854736328125, 0.07490348815917969, 0.07995223999023438, 0.08500099182128906, 0.09004974365234375, 0.09509849548339844, 0.10014724731445312, 0.10519599914550781, 0.1102447509765625, 0.11529350280761719, 0.12034225463867188, 0.12539100646972656, 0.13043975830078125, 0.13548851013183594, 0.14053726196289062, 0.1455860137939453, 0.150634765625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 7.0, 24.0, 196.0, 561.0, 186.0, 38.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.596883773803711, -14.302331924438477, -14.007779121398926, -13.713227272033691, -13.41867446899414, -13.124122619628906, -12.829569816589355, -12.535017967224121, -12.24046516418457, -11.945913314819336, -11.651360511779785, -11.35680866241455, -11.062255859375, -10.767704010009766, -10.473151206970215, -10.17859935760498, -9.884047508239746, -9.589495658874512, -9.294942855834961, -9.000391006469727, -8.705838203430176, -8.411286354064941, -8.11673355102539, -7.822181701660156, -7.527629375457764, -7.233077049255371, -6.9385247230529785, -6.643972396850586, -6.349420547485352, -6.054867744445801, -5.760315895080566, -5.465763568878174, -5.171210289001465, -4.876657962799072, -4.58210563659668, -4.287553310394287, -3.9930012226104736, -3.698448896408081, -3.4038968086242676, -3.109344482421875, -2.8147921562194824, -2.52023983001709, -2.2256875038146973, -1.9311354160308838, -1.6365830898284912, -1.3420307636260986, -1.0474785566329956, -0.7529263496398926, -0.4583740234375, -0.1638217568397522, 0.1307305097579956, 0.4252827763557434, 0.7198350429534912, 1.0143873691558838, 1.3089395761489868, 1.6034917831420898, 1.8980441093444824, 2.192596435546875, 2.4871487617492676, 2.781700849533081, 3.0762531757354736, 3.370805501937866, 3.6653575897216797, 3.9599099159240723, 4.254462242126465]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 6.0, 5.0, 7.0, 9.0, 15.0, 12.0, 26.0, 21.0, 14.0, 23.0, 30.0, 32.0, 33.0, 44.0, 46.0, 33.0, 47.0, 36.0, 35.0, 49.0, 39.0, 49.0, 38.0, 53.0, 49.0, 30.0, 22.0, 32.0, 24.0, 24.0, 14.0, 10.0, 15.0, 14.0, 10.0, 20.0, 8.0, 8.0, 8.0, 4.0, 2.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7205265760421753, -1.66422438621521, -1.6079221963882446, -1.5516200065612793, -1.495317816734314, -1.4390156269073486, -1.3827133178710938, -1.326411247253418, -1.270108938217163, -1.2138067483901978, -1.1575045585632324, -1.101202368736267, -1.0449001789093018, -0.9885979890823364, -0.9322957396507263, -0.875993549823761, -0.8196914196014404, -0.7633892297744751, -0.7070870399475098, -0.6507848501205444, -0.5944826602935791, -0.5381804704666138, -0.48187822103500366, -0.42557603120803833, -0.369273841381073, -0.31297165155410767, -0.25666946172714233, -0.20036724209785461, -0.14406505227088928, -0.08776286244392395, -0.03146064281463623, 0.0248415470123291, 0.08114361763000488, 0.13744580745697021, 0.19374801218509674, 0.25005021691322327, 0.3063524067401886, 0.36265459656715393, 0.41895681619644165, 0.475259006023407, 0.5315611958503723, 0.5878633856773376, 0.644165575504303, 0.7004678249359131, 0.7567700147628784, 0.8130722045898438, 0.8693743944168091, 0.9256765842437744, 0.9819787740707397, 1.038280963897705, 1.0945831537246704, 1.1508853435516357, 1.207187533378601, 1.2634897232055664, 1.3197920322418213, 1.376094102859497, 1.432396411895752, 1.4886986017227173, 1.5450007915496826, 1.601302981376648, 1.6576051712036133, 1.7139073610305786, 1.770209550857544, 1.8265118598937988, 1.8828139305114746]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 6.0, 2.0, 7.0, 7.0, 8.0, 5.0, 5.0, 12.0, 17.0, 24.0, 28.0, 64.0, 106.0, 135.0, 268.0, 502.0, 876.0, 2649.0, 19050.0, 4152345.0, 14031.0, 2317.0, 836.0, 401.0, 224.0, 130.0, 84.0, 34.0, 31.0, 19.0, 12.0, 8.0, 8.0, 5.0, 10.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.5390625, -2.460784912109375, -2.38250732421875, -2.304229736328125, -2.2259521484375, -2.147674560546875, -2.06939697265625, -1.991119384765625, -1.912841796875, -1.834564208984375, -1.75628662109375, -1.678009033203125, -1.5997314453125, -1.521453857421875, -1.44317626953125, -1.364898681640625, -1.28662109375, -1.208343505859375, -1.13006591796875, -1.051788330078125, -0.9735107421875, -0.895233154296875, -0.81695556640625, -0.738677978515625, -0.660400390625, -0.582122802734375, -0.50384521484375, -0.425567626953125, -0.3472900390625, -0.269012451171875, -0.19073486328125, -0.112457275390625, -0.0341796875, 0.044097900390625, 0.12237548828125, 0.200653076171875, 0.2789306640625, 0.357208251953125, 0.43548583984375, 0.513763427734375, 0.592041015625, 0.670318603515625, 0.74859619140625, 0.826873779296875, 0.9051513671875, 0.983428955078125, 1.06170654296875, 1.139984130859375, 1.21826171875, 1.296539306640625, 1.37481689453125, 1.453094482421875, 1.5313720703125, 1.609649658203125, 1.68792724609375, 1.766204833984375, 1.844482421875, 1.922760009765625, 2.00103759765625, 2.079315185546875, 2.1575927734375, 2.235870361328125, 2.31414794921875, 2.392425537109375, 2.470703125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 7.0, 4.0, 10.0, 15.0, 14.0, 12.0, 26.0, 29.0, 33.0, 48.0, 51.0, 46.0, 68.0, 60.0, 53.0, 59.0, 60.0, 55.0, 50.0, 44.0, 44.0, 30.0, 31.0, 27.0, 25.0, 20.0, 15.0, 18.0, 9.0, 5.0, 8.0, 4.0, 1.0, 6.0, 3.0, 4.0, 6.0, 1.0, 1.0], "bins": [-0.150146484375, -0.14642906188964844, -0.14271163940429688, -0.1389942169189453, -0.13527679443359375, -0.1315593719482422, -0.12784194946289062, -0.12412452697753906, -0.1204071044921875, -0.11668968200683594, -0.11297225952148438, -0.10925483703613281, -0.10553741455078125, -0.10181999206542969, -0.09810256958007812, -0.09438514709472656, -0.090667724609375, -0.08695030212402344, -0.08323287963867188, -0.07951545715332031, -0.07579803466796875, -0.07208061218261719, -0.06836318969726562, -0.06464576721191406, -0.0609283447265625, -0.05721092224121094, -0.053493499755859375, -0.04977607727050781, -0.04605865478515625, -0.04234123229980469, -0.038623809814453125, -0.03490638732910156, -0.03118896484375, -0.027471542358398438, -0.023754119873046875, -0.020036697387695312, -0.01631927490234375, -0.012601852416992188, -0.008884429931640625, -0.0051670074462890625, -0.0014495849609375, 0.0022678375244140625, 0.005985260009765625, 0.009702682495117188, 0.01342010498046875, 0.017137527465820312, 0.020854949951171875, 0.024572372436523438, 0.028289794921875, 0.03200721740722656, 0.035724639892578125, 0.03944206237792969, 0.04315948486328125, 0.04687690734863281, 0.050594329833984375, 0.05431175231933594, 0.0580291748046875, 0.06174659729003906, 0.06546401977539062, 0.06918144226074219, 0.07289886474609375, 0.07661628723144531, 0.08033370971679688, 0.08405113220214844, 0.0877685546875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 9.0, 7.0, 5.0, 15.0, 13.0, 24.0, 33.0, 43.0, 58.0, 80.0, 163.0, 458.0, 3053.0, 4183549.0, 5697.0, 577.0, 170.0, 99.0, 61.0, 48.0, 40.0, 24.0, 22.0, 16.0, 9.0, 7.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.375, -4.1395263671875, -3.904052734375, -3.6685791015625, -3.43310546875, -3.1976318359375, -2.962158203125, -2.7266845703125, -2.4912109375, -2.2557373046875, -2.020263671875, -1.7847900390625, -1.54931640625, -1.3138427734375, -1.078369140625, -0.8428955078125, -0.607421875, -0.3719482421875, -0.136474609375, 0.0989990234375, 0.33447265625, 0.5699462890625, 0.805419921875, 1.0408935546875, 1.2763671875, 1.5118408203125, 1.747314453125, 1.9827880859375, 2.21826171875, 2.4537353515625, 2.689208984375, 2.9246826171875, 3.16015625, 3.3956298828125, 3.631103515625, 3.8665771484375, 4.10205078125, 4.3375244140625, 4.572998046875, 4.8084716796875, 5.0439453125, 5.2794189453125, 5.514892578125, 5.7503662109375, 5.98583984375, 6.2213134765625, 6.456787109375, 6.6922607421875, 6.927734375, 7.1632080078125, 7.398681640625, 7.6341552734375, 7.86962890625, 8.1051025390625, 8.340576171875, 8.5760498046875, 8.8115234375, 9.0469970703125, 9.282470703125, 9.5179443359375, 9.75341796875, 9.9888916015625, 10.224365234375, 10.4598388671875, 10.6953125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 9.0, 24.0, 127.0, 3803.0, 87.0, 25.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75634765625, -0.7039718627929688, -0.6515960693359375, -0.5992202758789062, -0.546844482421875, -0.49446868896484375, -0.4420928955078125, -0.38971710205078125, -0.33734130859375, -0.28496551513671875, -0.2325897216796875, -0.18021392822265625, -0.127838134765625, -0.07546234130859375, -0.0230865478515625, 0.02928924560546875, 0.0816650390625, 0.13404083251953125, 0.1864166259765625, 0.23879241943359375, 0.291168212890625, 0.34354400634765625, 0.3959197998046875, 0.44829559326171875, 0.50067138671875, 0.5530471801757812, 0.6054229736328125, 0.6577987670898438, 0.710174560546875, 0.7625503540039062, 0.8149261474609375, 0.8673019409179688, 0.919677734375, 0.9720535278320312, 1.0244293212890625, 1.0768051147460938, 1.129180908203125, 1.1815567016601562, 1.2339324951171875, 1.2863082885742188, 1.33868408203125, 1.3910598754882812, 1.4434356689453125, 1.4958114624023438, 1.548187255859375, 1.6005630493164062, 1.6529388427734375, 1.7053146362304688, 1.7576904296875, 1.8100662231445312, 1.8624420166015625, 1.9148178100585938, 1.967193603515625, 2.0195693969726562, 2.0719451904296875, 2.1243209838867188, 2.17669677734375, 2.2290725708007812, 2.2814483642578125, 2.3338241577148438, 2.386199951171875, 2.4385757446289062, 2.4909515380859375, 2.5433273315429688, 2.595703125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 8.0, 12.0, 24.0, 79.0, 446.0, 324.0, 68.0, 28.0, 15.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.499883651733398, -6.258271217346191, -6.016658782958984, -5.775046348571777, -5.53343391418457, -5.291821479797363, -5.050209045410156, -4.808596611022949, -4.566984176635742, -4.325371742248535, -4.083759307861328, -3.842146873474121, -3.600534439086914, -3.358922004699707, -3.117309808731079, -2.875697374343872, -2.634085178375244, -2.392472743988037, -2.15086030960083, -1.9092479944229126, -1.6676355600357056, -1.4260231256484985, -1.184410810470581, -0.942798376083374, -0.701185941696167, -0.45957353711128235, -0.2179611325263977, 0.02365124225616455, 0.2652636766433716, 0.5068761110305786, 0.7484884262084961, 0.9901008605957031, 1.2317132949829102, 1.4733257293701172, 1.7149381637573242, 1.9565504789352417, 2.1981630325317383, 2.4397754669189453, 2.6813876628875732, 2.9230000972747803, 3.1646125316619873, 3.4062249660491943, 3.6478374004364014, 3.8894495964050293, 4.131062030792236, 4.372674465179443, 4.61428689956665, 4.855899333953857, 5.0975117683410645, 5.3391242027282715, 5.5807366371154785, 5.8223490715026855, 6.063961505889893, 6.3055739402771, 6.547185897827148, 6.7887983322143555, 7.0304107666015625, 7.2720232009887695, 7.513635635375977, 7.755248069763184, 7.996860504150391, 8.238472938537598, 8.480085372924805, 8.721697807312012, 8.963310241699219]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 3.0, 11.0, 22.0, 35.0, 82.0, 122.0, 167.0, 148.0, 146.0, 126.0, 62.0, 35.0, 10.0, 16.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.834344863891602, -4.701873302459717, -4.569401741027832, -4.436930179595947, -4.3044586181640625, -4.171987056732178, -4.039515495300293, -3.907043933868408, -3.7745723724365234, -3.6421008110046387, -3.509629249572754, -3.377157688140869, -3.2446861267089844, -3.1122145652770996, -2.979743003845215, -2.84727144241333, -2.7148001194000244, -2.5823285579681396, -2.449856996536255, -2.31738543510437, -2.1849138736724854, -2.0524423122406006, -1.9199708700180054, -1.7874993085861206, -1.6550277471542358, -1.522556185722351, -1.3900846242904663, -1.257613182067871, -1.1251416206359863, -0.9926699995994568, -0.8601984977722168, -0.727726936340332, -0.5952553749084473, -0.4627838134765625, -0.3303122818470001, -0.19784075021743774, -0.06536918878555298, 0.06710237264633179, 0.19957387447357178, 0.33204543590545654, 0.4645169973373413, 0.5969885587692261, 0.7294601202011108, 0.8619316220283508, 0.9944031834602356, 1.1268746852874756, 1.2593462467193604, 1.3918178081512451, 1.5242893695831299, 1.6567609310150146, 1.7892324924468994, 1.9217040538787842, 2.054175615310669, 2.1866471767425537, 2.3191184997558594, 2.451590061187744, 2.584061622619629, 2.7165331840515137, 2.8490047454833984, 2.981476306915283, 3.113947868347168, 3.2464194297790527, 3.3788909912109375, 3.5113625526428223, 3.643834114074707]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 4.0, 10.0, 15.0, 21.0, 29.0, 34.0, 42.0, 70.0, 94.0, 136.0, 218.0, 313.0, 552.0, 985.0, 1825.0, 4039.0, 10507.0, 37414.0, 233058.0, 628491.0, 96637.0, 20911.0, 6906.0, 2843.0, 1386.0, 735.0, 453.0, 248.0, 179.0, 113.0, 81.0, 60.0, 38.0, 32.0, 16.0, 15.0, 11.0, 7.0, 6.0, 3.0, 5.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.71826171875, -0.6953048706054688, -0.6723480224609375, -0.6493911743164062, -0.626434326171875, -0.6034774780273438, -0.5805206298828125, -0.5575637817382812, -0.53460693359375, -0.5116500854492188, -0.4886932373046875, -0.46573638916015625, -0.442779541015625, -0.41982269287109375, -0.3968658447265625, -0.37390899658203125, -0.3509521484375, -0.32799530029296875, -0.3050384521484375, -0.28208160400390625, -0.259124755859375, -0.23616790771484375, -0.2132110595703125, -0.19025421142578125, -0.16729736328125, -0.14434051513671875, -0.1213836669921875, -0.09842681884765625, -0.075469970703125, -0.05251312255859375, -0.0295562744140625, -0.00659942626953125, 0.016357421875, 0.03931427001953125, 0.0622711181640625, 0.08522796630859375, 0.108184814453125, 0.13114166259765625, 0.1540985107421875, 0.17705535888671875, 0.20001220703125, 0.22296905517578125, 0.2459259033203125, 0.26888275146484375, 0.291839599609375, 0.31479644775390625, 0.3377532958984375, 0.36071014404296875, 0.3836669921875, 0.40662384033203125, 0.4295806884765625, 0.45253753662109375, 0.475494384765625, 0.49845123291015625, 0.5214080810546875, 0.5443649291992188, 0.56732177734375, 0.5902786254882812, 0.6132354736328125, 0.6361923217773438, 0.659149169921875, 0.6821060180664062, 0.7050628662109375, 0.7280197143554688, 0.7509765625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 3.0, 3.0, 7.0, 0.0, 7.0, 13.0, 13.0, 22.0, 38.0, 41.0, 60.0, 74.0, 72.0, 78.0, 98.0, 69.0, 84.0, 75.0, 63.0, 48.0, 41.0, 23.0, 27.0, 13.0, 8.0, 8.0, 6.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255126953125, -0.24779129028320312, -0.24045562744140625, -0.23311996459960938, -0.2257843017578125, -0.21844863891601562, -0.21111297607421875, -0.20377731323242188, -0.196441650390625, -0.18910598754882812, -0.18177032470703125, -0.17443466186523438, -0.1670989990234375, -0.15976333618164062, -0.15242767333984375, -0.14509201049804688, -0.13775634765625, -0.13042068481445312, -0.12308502197265625, -0.11574935913085938, -0.1084136962890625, -0.10107803344726562, -0.09374237060546875, -0.08640670776367188, -0.079071044921875, -0.07173538208007812, -0.06439971923828125, -0.057064056396484375, -0.0497283935546875, -0.042392730712890625, -0.03505706787109375, -0.027721405029296875, -0.0203857421875, -0.013050079345703125, -0.00571441650390625, 0.001621246337890625, 0.0089569091796875, 0.016292572021484375, 0.02362823486328125, 0.030963897705078125, 0.038299560546875, 0.045635223388671875, 0.05297088623046875, 0.060306549072265625, 0.0676422119140625, 0.07497787475585938, 0.08231353759765625, 0.08964920043945312, 0.09698486328125, 0.10432052612304688, 0.11165618896484375, 0.11899185180664062, 0.1263275146484375, 0.13366317749023438, 0.14099884033203125, 0.14833450317382812, 0.155670166015625, 0.16300582885742188, 0.17034149169921875, 0.17767715454101562, 0.1850128173828125, 0.19234848022460938, 0.19968414306640625, 0.20701980590820312, 0.21435546875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 0.0, 4.0, 6.0, 9.0, 11.0, 19.0, 23.0, 26.0, 36.0, 55.0, 112.0, 232.0, 477.0, 1105.0, 3053.0, 11389.0, 61851.0, 479376.0, 421674.0, 54080.0, 10238.0, 2782.0, 1057.0, 420.0, 214.0, 100.0, 67.0, 32.0, 29.0, 14.0, 13.0, 12.0, 9.0, 8.0, 3.0, 1.0, 3.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4775390625, -0.46105194091796875, -0.4445648193359375, -0.42807769775390625, -0.411590576171875, -0.39510345458984375, -0.3786163330078125, -0.36212921142578125, -0.34564208984375, -0.32915496826171875, -0.3126678466796875, -0.29618072509765625, -0.279693603515625, -0.26320648193359375, -0.2467193603515625, -0.23023223876953125, -0.2137451171875, -0.19725799560546875, -0.1807708740234375, -0.16428375244140625, -0.147796630859375, -0.13130950927734375, -0.1148223876953125, -0.09833526611328125, -0.08184814453125, -0.06536102294921875, -0.0488739013671875, -0.03238677978515625, -0.015899658203125, 0.00058746337890625, 0.0170745849609375, 0.03356170654296875, 0.050048828125, 0.06653594970703125, 0.0830230712890625, 0.09951019287109375, 0.115997314453125, 0.13248443603515625, 0.1489715576171875, 0.16545867919921875, 0.18194580078125, 0.19843292236328125, 0.2149200439453125, 0.23140716552734375, 0.247894287109375, 0.26438140869140625, 0.2808685302734375, 0.29735565185546875, 0.3138427734375, 0.33032989501953125, 0.3468170166015625, 0.36330413818359375, 0.379791259765625, 0.39627838134765625, 0.4127655029296875, 0.42925262451171875, 0.44573974609375, 0.46222686767578125, 0.4787139892578125, 0.49520111083984375, 0.511688232421875, 0.5281753540039062, 0.5446624755859375, 0.5611495971679688, 0.57763671875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 8.0, 7.0, 14.0, 10.0, 13.0, 19.0, 14.0, 18.0, 26.0, 27.0, 37.0, 45.0, 40.0, 42.0, 36.0, 36.0, 44.0, 54.0, 47.0, 28.0, 34.0, 41.0, 40.0, 38.0, 34.0, 33.0, 29.0, 29.0, 22.0, 16.0, 19.0, 16.0, 17.0, 19.0, 8.0, 7.0, 4.0, 3.0, 6.0, 8.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.389892578125, -0.3774566650390625, -0.365020751953125, -0.3525848388671875, -0.34014892578125, -0.3277130126953125, -0.315277099609375, -0.3028411865234375, -0.2904052734375, -0.2779693603515625, -0.265533447265625, -0.2530975341796875, -0.24066162109375, -0.2282257080078125, -0.215789794921875, -0.2033538818359375, -0.19091796875, -0.1784820556640625, -0.166046142578125, -0.1536102294921875, -0.14117431640625, -0.1287384033203125, -0.116302490234375, -0.1038665771484375, -0.0914306640625, -0.0789947509765625, -0.066558837890625, -0.0541229248046875, -0.04168701171875, -0.0292510986328125, -0.016815185546875, -0.0043792724609375, 0.008056640625, 0.0204925537109375, 0.032928466796875, 0.0453643798828125, 0.05780029296875, 0.0702362060546875, 0.082672119140625, 0.0951080322265625, 0.1075439453125, 0.1199798583984375, 0.132415771484375, 0.1448516845703125, 0.15728759765625, 0.1697235107421875, 0.182159423828125, 0.1945953369140625, 0.20703125, 0.2194671630859375, 0.231903076171875, 0.2443389892578125, 0.25677490234375, 0.2692108154296875, 0.281646728515625, 0.2940826416015625, 0.3065185546875, 0.3189544677734375, 0.331390380859375, 0.3438262939453125, 0.35626220703125, 0.3686981201171875, 0.381134033203125, 0.3935699462890625, 0.406005859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 18.0, 18.0, 38.0, 51.0, 83.0, 130.0, 252.0, 383.0, 668.0, 1316.0, 2941.0, 8656.0, 52742.0, 791991.0, 165794.0, 15466.0, 4220.0, 1741.0, 878.0, 472.0, 255.0, 178.0, 103.0, 56.0, 47.0, 27.0, 11.0, 9.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35205078125, -0.3416023254394531, -0.33115386962890625, -0.3207054138183594, -0.3102569580078125, -0.2998085021972656, -0.28936004638671875, -0.2789115905761719, -0.268463134765625, -0.2580146789550781, -0.24756622314453125, -0.23711776733398438, -0.2266693115234375, -0.21622085571289062, -0.20577239990234375, -0.19532394409179688, -0.18487548828125, -0.17442703247070312, -0.16397857666015625, -0.15353012084960938, -0.1430816650390625, -0.13263320922851562, -0.12218475341796875, -0.11173629760742188, -0.101287841796875, -0.09083938598632812, -0.08039093017578125, -0.06994247436523438, -0.0594940185546875, -0.049045562744140625, -0.03859710693359375, -0.028148651123046875, -0.0177001953125, -0.007251739501953125, 0.00319671630859375, 0.013645172119140625, 0.0240936279296875, 0.034542083740234375, 0.04499053955078125, 0.055438995361328125, 0.065887451171875, 0.07633590698242188, 0.08678436279296875, 0.09723281860351562, 0.1076812744140625, 0.11812973022460938, 0.12857818603515625, 0.13902664184570312, 0.14947509765625, 0.15992355346679688, 0.17037200927734375, 0.18082046508789062, 0.1912689208984375, 0.20171737670898438, 0.21216583251953125, 0.22261428833007812, 0.233062744140625, 0.24351119995117188, 0.25395965576171875, 0.2644081115722656, 0.2748565673828125, 0.2853050231933594, 0.29575347900390625, 0.3062019348144531, 0.316650390625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 7.0, 8.0, 12.0, 15.0, 36.0, 48.0, 96.0, 176.0, 232.0, 170.0, 81.0, 45.0, 26.0, 15.0, 7.0, 5.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.285045623779297e-05, -8.064322173595428e-05, -7.84359872341156e-05, -7.622875273227692e-05, -7.402151823043823e-05, -7.181428372859955e-05, -6.960704922676086e-05, -6.739981472492218e-05, -6.51925802230835e-05, -6.298534572124481e-05, -6.077811121940613e-05, -5.8570876717567444e-05, -5.636364221572876e-05, -5.4156407713890076e-05, -5.194917321205139e-05, -4.974193871021271e-05, -4.7534704208374023e-05, -4.532746970653534e-05, -4.3120235204696655e-05, -4.091300070285797e-05, -3.870576620101929e-05, -3.64985316991806e-05, -3.429129719734192e-05, -3.2084062695503235e-05, -2.987682819366455e-05, -2.7669593691825867e-05, -2.5462359189987183e-05, -2.32551246881485e-05, -2.1047890186309814e-05, -1.884065568447113e-05, -1.6633421182632446e-05, -1.4426186680793762e-05, -1.2218952178955078e-05, -1.0011717677116394e-05, -7.80448317527771e-06, -5.597248673439026e-06, -3.390014171600342e-06, -1.1827796697616577e-06, 1.0244548320770264e-06, 3.2316893339157104e-06, 5.4389238357543945e-06, 7.646158337593079e-06, 9.853392839431763e-06, 1.2060627341270447e-05, 1.4267861843109131e-05, 1.6475096344947815e-05, 1.86823308467865e-05, 2.0889565348625183e-05, 2.3096799850463867e-05, 2.530403435230255e-05, 2.7511268854141235e-05, 2.971850335597992e-05, 3.1925737857818604e-05, 3.413297235965729e-05, 3.634020686149597e-05, 3.8547441363334656e-05, 4.075467586517334e-05, 4.2961910367012024e-05, 4.516914486885071e-05, 4.737637937068939e-05, 4.9583613872528076e-05, 5.179084837436676e-05, 5.3998082876205444e-05, 5.620531737804413e-05, 5.841255187988281e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 8.0, 3.0, 6.0, 21.0, 29.0, 49.0, 89.0, 196.0, 496.0, 1551.0, 6150.0, 38308.0, 758732.0, 221433.0, 16595.0, 3367.0, 969.0, 302.0, 121.0, 52.0, 26.0, 16.0, 19.0, 10.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.232177734375, -0.22044754028320312, -0.20871734619140625, -0.19698715209960938, -0.1852569580078125, -0.17352676391601562, -0.16179656982421875, -0.15006637573242188, -0.138336181640625, -0.12660598754882812, -0.11487579345703125, -0.10314559936523438, -0.0914154052734375, -0.07968521118164062, -0.06795501708984375, -0.056224822998046875, -0.04449462890625, -0.032764434814453125, -0.02103424072265625, -0.009304046630859375, 0.0024261474609375, 0.014156341552734375, 0.02588653564453125, 0.037616729736328125, 0.049346923828125, 0.061077117919921875, 0.07280731201171875, 0.08453750610351562, 0.0962677001953125, 0.10799789428710938, 0.11972808837890625, 0.13145828247070312, 0.1431884765625, 0.15491867065429688, 0.16664886474609375, 0.17837905883789062, 0.1901092529296875, 0.20183944702148438, 0.21356964111328125, 0.22529983520507812, 0.237030029296875, 0.24876022338867188, 0.26049041748046875, 0.2722206115722656, 0.2839508056640625, 0.2956809997558594, 0.30741119384765625, 0.3191413879394531, 0.33087158203125, 0.3426017761230469, 0.35433197021484375, 0.3660621643066406, 0.3777923583984375, 0.3895225524902344, 0.40125274658203125, 0.4129829406738281, 0.424713134765625, 0.4364433288574219, 0.44817352294921875, 0.4599037170410156, 0.4716339111328125, 0.4833641052246094, 0.49509429931640625, 0.5068244934082031, 0.5185546875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 6.0, 12.0, 9.0, 9.0, 12.0, 22.0, 26.0, 40.0, 59.0, 101.0, 113.0, 131.0, 127.0, 106.0, 78.0, 48.0, 29.0, 15.0, 25.0, 10.0, 7.0, 5.0, 5.0, 5.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1019287109375, -0.09494972229003906, -0.08797073364257812, -0.08099174499511719, -0.07401275634765625, -0.06703376770019531, -0.060054779052734375, -0.05307579040527344, -0.0460968017578125, -0.03911781311035156, -0.032138824462890625, -0.025159835815429688, -0.01818084716796875, -0.011201858520507812, -0.004222869873046875, 0.0027561187744140625, 0.009735107421875, 0.016714096069335938, 0.023693084716796875, 0.030672073364257812, 0.03765106201171875, 0.04463005065917969, 0.051609039306640625, 0.05858802795410156, 0.0655670166015625, 0.07254600524902344, 0.07952499389648438, 0.08650398254394531, 0.09348297119140625, 0.10046195983886719, 0.10744094848632812, 0.11441993713378906, 0.12139892578125, 0.12837791442871094, 0.13535690307617188, 0.1423358917236328, 0.14931488037109375, 0.1562938690185547, 0.16327285766601562, 0.17025184631347656, 0.1772308349609375, 0.18420982360839844, 0.19118881225585938, 0.1981678009033203, 0.20514678955078125, 0.2121257781982422, 0.21910476684570312, 0.22608375549316406, 0.233062744140625, 0.24004173278808594, 0.24702072143554688, 0.2539997100830078, 0.26097869873046875, 0.2679576873779297, 0.2749366760253906, 0.28191566467285156, 0.2888946533203125, 0.29587364196777344, 0.3028526306152344, 0.3098316192626953, 0.31681060791015625, 0.3237895965576172, 0.3307685852050781, 0.33774757385253906, 0.3447265625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 16.0, 68.0, 343.0, 439.0, 120.0, 20.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.581859588623047, -17.262699127197266, -16.94353675842285, -16.62437629699707, -16.305213928222656, -15.986052513122559, -15.666891098022461, -15.347729682922363, -15.028568267822266, -14.709406852722168, -14.39024543762207, -14.071084022521973, -13.751922607421875, -13.432761192321777, -13.11359977722168, -12.794438362121582, -12.475276947021484, -12.156115531921387, -11.836954116821289, -11.517792701721191, -11.198631286621094, -10.879469871520996, -10.560308456420898, -10.2411470413208, -9.92198657989502, -9.602825164794922, -9.283663749694824, -8.964502334594727, -8.645340919494629, -8.326179504394531, -8.007018089294434, -7.687856674194336, -7.3686957359313965, -7.049534320831299, -6.730372905731201, -6.4112114906311035, -6.092050075531006, -5.772888660430908, -5.453727722167969, -5.134566307067871, -4.815404891967773, -4.496243476867676, -4.177082061767578, -3.8579206466674805, -3.538759231567383, -3.219597816467285, -2.9004366397857666, -2.581275224685669, -2.262113571166992, -1.9429521560668945, -1.6237907409667969, -1.3046294450759888, -0.9854680299758911, -0.6663066148757935, -0.34714531898498535, -0.027983903884887695, 0.29117751121520996, 0.6103389263153076, 0.9295002818107605, 1.2486616373062134, 1.567823052406311, 1.8869844675064087, 2.206145763397217, 2.5253071784973145, 2.844468593597412]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 9.0, 9.0, 13.0, 14.0, 9.0, 15.0, 28.0, 27.0, 18.0, 30.0, 25.0, 29.0, 39.0, 45.0, 40.0, 31.0, 35.0, 44.0, 37.0, 32.0, 43.0, 26.0, 32.0, 42.0, 32.0, 34.0, 33.0, 32.0, 33.0, 28.0, 21.0, 18.0, 13.0, 15.0, 12.0, 10.0, 11.0, 4.0, 4.0, 3.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.8922216892242432, -1.8328442573547363, -1.773466944694519, -1.7140895128250122, -1.654712200164795, -1.595334768295288, -1.5359573364257812, -1.476580023765564, -1.4172025918960571, -1.3578251600265503, -1.298447847366333, -1.2390704154968262, -1.1796931028366089, -1.120315670967102, -1.0609383583068848, -1.001560926437378, -0.9421835541725159, -0.8828061819076538, -0.8234288096427917, -0.7640514373779297, -0.7046740055084229, -0.6452966332435608, -0.5859192609786987, -0.5265418291091919, -0.4671644866466522, -0.40778711438179016, -0.3484097123146057, -0.28903234004974365, -0.2296549528837204, -0.17027756571769714, -0.11090019345283508, -0.051522791385650635, 0.007854580879211426, 0.06723196804523468, 0.12660935521125793, 0.18598672747612, 0.24536411464214325, 0.3047415018081665, 0.36411887407302856, 0.423496276140213, 0.4828736484050751, 0.5422510504722595, 0.6016284227371216, 0.6610057950019836, 0.7203831672668457, 0.7797605991363525, 0.8391379117965698, 0.8985153436660767, 0.9578927159309387, 1.0172700881958008, 1.0766475200653076, 1.136024832725525, 1.1954022645950317, 1.254779577255249, 1.3141570091247559, 1.3735344409942627, 1.43291175365448, 1.4922891855239868, 1.551666498184204, 1.611043930053711, 1.6704212427139282, 1.729798674583435, 1.7891759872436523, 1.8485534191131592, 1.907930850982666]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 2.0, 7.0, 7.0, 6.0, 8.0, 8.0, 14.0, 22.0, 18.0, 27.0, 52.0, 63.0, 92.0, 150.0, 235.0, 407.0, 752.0, 1700.0, 4654.0, 27813.0, 4121201.0, 28650.0, 5023.0, 1626.0, 753.0, 414.0, 212.0, 98.0, 98.0, 43.0, 29.0, 27.0, 17.0, 16.0, 7.0, 7.0, 4.0, 5.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.65625, -2.5814208984375, -2.506591796875, -2.4317626953125, -2.35693359375, -2.2821044921875, -2.207275390625, -2.1324462890625, -2.0576171875, -1.9827880859375, -1.907958984375, -1.8331298828125, -1.75830078125, -1.6834716796875, -1.608642578125, -1.5338134765625, -1.458984375, -1.3841552734375, -1.309326171875, -1.2344970703125, -1.15966796875, -1.0848388671875, -1.010009765625, -0.9351806640625, -0.8603515625, -0.7855224609375, -0.710693359375, -0.6358642578125, -0.56103515625, -0.4862060546875, -0.411376953125, -0.3365478515625, -0.26171875, -0.1868896484375, -0.112060546875, -0.0372314453125, 0.03759765625, 0.1124267578125, 0.187255859375, 0.2620849609375, 0.3369140625, 0.4117431640625, 0.486572265625, 0.5614013671875, 0.63623046875, 0.7110595703125, 0.785888671875, 0.8607177734375, 0.935546875, 1.0103759765625, 1.085205078125, 1.1600341796875, 1.23486328125, 1.3096923828125, 1.384521484375, 1.4593505859375, 1.5341796875, 1.6090087890625, 1.683837890625, 1.7586669921875, 1.83349609375, 1.9083251953125, 1.983154296875, 2.0579833984375, 2.1328125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 0.0, 3.0, 4.0, 1.0, 5.0, 15.0, 15.0, 21.0, 34.0, 30.0, 51.0, 54.0, 57.0, 73.0, 89.0, 94.0, 71.0, 64.0, 64.0, 77.0, 35.0, 42.0, 31.0, 17.0, 21.0, 11.0, 5.0, 3.0, 8.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24072265625, -0.23375511169433594, -0.22678756713867188, -0.2198200225830078, -0.21285247802734375, -0.2058849334716797, -0.19891738891601562, -0.19194984436035156, -0.1849822998046875, -0.17801475524902344, -0.17104721069335938, -0.1640796661376953, -0.15711212158203125, -0.1501445770263672, -0.14317703247070312, -0.13620948791503906, -0.129241943359375, -0.12227439880371094, -0.11530685424804688, -0.10833930969238281, -0.10137176513671875, -0.09440422058105469, -0.08743667602539062, -0.08046913146972656, -0.0735015869140625, -0.06653404235839844, -0.059566497802734375, -0.05259895324707031, -0.04563140869140625, -0.03866386413574219, -0.031696319580078125, -0.024728775024414062, -0.01776123046875, -0.010793685913085938, -0.003826141357421875, 0.0031414031982421875, 0.01010894775390625, 0.017076492309570312, 0.024044036865234375, 0.031011581420898438, 0.0379791259765625, 0.04494667053222656, 0.051914215087890625, 0.05888175964355469, 0.06584930419921875, 0.07281684875488281, 0.07978439331054688, 0.08675193786621094, 0.093719482421875, 0.10068702697753906, 0.10765457153320312, 0.11462211608886719, 0.12158966064453125, 0.1285572052001953, 0.13552474975585938, 0.14249229431152344, 0.1494598388671875, 0.15642738342285156, 0.16339492797851562, 0.1703624725341797, 0.17733001708984375, 0.1842975616455078, 0.19126510620117188, 0.19823265075683594, 0.2052001953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 7.0, 6.0, 9.0, 15.0, 19.0, 36.0, 53.0, 86.0, 145.0, 199.0, 394.0, 777.0, 2202.0, 8923.0, 180407.0, 3983389.0, 12739.0, 2856.0, 985.0, 411.0, 226.0, 126.0, 85.0, 69.0, 39.0, 18.0, 15.0, 13.0, 11.0, 8.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-3.595703125, -3.5102996826171875, -3.424896240234375, -3.3394927978515625, -3.25408935546875, -3.1686859130859375, -3.083282470703125, -2.9978790283203125, -2.9124755859375, -2.8270721435546875, -2.741668701171875, -2.6562652587890625, -2.57086181640625, -2.4854583740234375, -2.400054931640625, -2.3146514892578125, -2.229248046875, -2.1438446044921875, -2.058441162109375, -1.9730377197265625, -1.88763427734375, -1.8022308349609375, -1.716827392578125, -1.6314239501953125, -1.5460205078125, -1.4606170654296875, -1.375213623046875, -1.2898101806640625, -1.20440673828125, -1.1190032958984375, -1.033599853515625, -0.9481964111328125, -0.86279296875, -0.7773895263671875, -0.691986083984375, -0.6065826416015625, -0.52117919921875, -0.4357757568359375, -0.350372314453125, -0.2649688720703125, -0.1795654296875, -0.0941619873046875, -0.008758544921875, 0.0766448974609375, 0.16204833984375, 0.2474517822265625, 0.332855224609375, 0.4182586669921875, 0.503662109375, 0.5890655517578125, 0.674468994140625, 0.7598724365234375, 0.84527587890625, 0.9306793212890625, 1.016082763671875, 1.1014862060546875, 1.1868896484375, 1.2722930908203125, 1.357696533203125, 1.4430999755859375, 1.52850341796875, 1.6139068603515625, 1.699310302734375, 1.7847137451171875, 1.8701171875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 2.0, 2.0, 9.0, 8.0, 14.0, 22.0, 40.0, 126.0, 3244.0, 456.0, 67.0, 24.0, 22.0, 16.0, 9.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.86962890625, -0.8488235473632812, -0.8280181884765625, -0.8072128295898438, -0.786407470703125, -0.7656021118164062, -0.7447967529296875, -0.7239913940429688, -0.70318603515625, -0.6823806762695312, -0.6615753173828125, -0.6407699584960938, -0.619964599609375, -0.5991592407226562, -0.5783538818359375, -0.5575485229492188, -0.5367431640625, -0.5159378051757812, -0.4951324462890625, -0.47432708740234375, -0.453521728515625, -0.43271636962890625, -0.4119110107421875, -0.39110565185546875, -0.37030029296875, -0.34949493408203125, -0.3286895751953125, -0.30788421630859375, -0.287078857421875, -0.26627349853515625, -0.2454681396484375, -0.22466278076171875, -0.203857421875, -0.18305206298828125, -0.1622467041015625, -0.14144134521484375, -0.120635986328125, -0.09983062744140625, -0.0790252685546875, -0.05821990966796875, -0.03741455078125, -0.01660919189453125, 0.0041961669921875, 0.02500152587890625, 0.045806884765625, 0.06661224365234375, 0.0874176025390625, 0.10822296142578125, 0.1290283203125, 0.14983367919921875, 0.1706390380859375, 0.19144439697265625, 0.212249755859375, 0.23305511474609375, 0.2538604736328125, 0.27466583251953125, 0.29547119140625, 0.31627655029296875, 0.3370819091796875, 0.35788726806640625, 0.378692626953125, 0.39949798583984375, 0.4203033447265625, 0.44110870361328125, 0.4619140625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 10.0, 13.0, 18.0, 56.0, 147.0, 363.0, 234.0, 83.0, 38.0, 20.0, 9.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0790014266967773, -2.968052864074707, -2.8571040630340576, -2.746155261993408, -2.635206699371338, -2.5242581367492676, -2.413309335708618, -2.3023605346679688, -2.1914119720458984, -2.080463409423828, -1.9695146083831787, -1.8585659265518188, -1.747617244720459, -1.6366685628890991, -1.5257198810577393, -1.4147711992263794, -1.3038225173950195, -1.1928738355636597, -1.0819251537322998, -0.9709764719009399, -0.8600277900695801, -0.7490791082382202, -0.6381304264068604, -0.5271817445755005, -0.4162330627441406, -0.30528438091278076, -0.1943356990814209, -0.08338701725006104, 0.027561664581298828, 0.1385103464126587, 0.24945902824401855, 0.3604077100753784, 0.4713563919067383, 0.5823050737380981, 0.693253755569458, 0.8042024374008179, 0.9151511192321777, 1.0260998010635376, 1.1370484828948975, 1.2479971647262573, 1.3589458465576172, 1.469894528388977, 1.580843210220337, 1.6917918920516968, 1.8027405738830566, 1.9136892557144165, 2.0246379375457764, 2.135586738586426, 2.246535301208496, 2.3574838638305664, 2.468432664871216, 2.5793814659118652, 2.6903300285339355, 2.801278591156006, 2.9122273921966553, 3.0231761932373047, 3.134124755859375, 3.2450733184814453, 3.3560221195220947, 3.466970920562744, 3.5779194831848145, 3.6888680458068848, 3.799816846847534, 3.9107656478881836, 4.021714210510254]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 14.0, 20.0, 31.0, 46.0, 66.0, 77.0, 90.0, 116.0, 112.0, 105.0, 78.0, 73.0, 58.0, 33.0, 27.0, 20.0, 13.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9555420875549316, -1.8951339721679688, -1.8347258567810059, -1.774317741394043, -1.71390962600708, -1.6535015106201172, -1.5930933952331543, -1.5326852798461914, -1.4722771644592285, -1.4118690490722656, -1.3514609336853027, -1.2910528182983398, -1.230644702911377, -1.170236587524414, -1.1098284721374512, -1.0494203567504883, -0.9890123009681702, -0.9286041855812073, -0.8681960701942444, -0.8077879548072815, -0.7473798394203186, -0.6869717836380005, -0.6265636682510376, -0.5661555528640747, -0.5057474374771118, -0.4453393220901489, -0.38493120670318604, -0.32452309131622314, -0.26411497592926025, -0.20370689034461975, -0.14329877495765686, -0.08289065957069397, -0.02248251438140869, 0.0379255972802639, 0.09833370894193649, 0.1587418168783188, 0.21914993226528168, 0.2795580327510834, 0.33996614813804626, 0.40037426352500916, 0.46078237891197205, 0.5211904644966125, 0.5815985798835754, 0.6420066952705383, 0.7024148106575012, 0.7628229260444641, 0.823231041431427, 0.8836391568183899, 0.9440472722053528, 1.004455327987671, 1.0648634433746338, 1.1252715587615967, 1.1856796741485596, 1.2460877895355225, 1.3064959049224854, 1.3669040203094482, 1.4273121356964111, 1.487720251083374, 1.548128366470337, 1.6085364818572998, 1.6689445972442627, 1.7293527126312256, 1.7897608280181885, 1.8501689434051514, 1.9105770587921143]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 8.0, 8.0, 9.0, 14.0, 16.0, 18.0, 19.0, 30.0, 38.0, 74.0, 86.0, 125.0, 157.0, 275.0, 399.0, 709.0, 1206.0, 2303.0, 5093.0, 13277.0, 44668.0, 257357.0, 585929.0, 97785.0, 23399.0, 7991.0, 3401.0, 1673.0, 877.0, 510.0, 313.0, 228.0, 160.0, 99.0, 79.0, 44.0, 38.0, 36.0, 22.0, 19.0, 12.0, 13.0, 7.0, 4.0, 3.0, 5.0, 1.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.798828125, -0.7748031616210938, -0.7507781982421875, -0.7267532348632812, -0.702728271484375, -0.6787033081054688, -0.6546783447265625, -0.6306533813476562, -0.60662841796875, -0.5826034545898438, -0.5585784912109375, -0.5345535278320312, -0.510528564453125, -0.48650360107421875, -0.4624786376953125, -0.43845367431640625, -0.4144287109375, -0.39040374755859375, -0.3663787841796875, -0.34235382080078125, -0.318328857421875, -0.29430389404296875, -0.2702789306640625, -0.24625396728515625, -0.22222900390625, -0.19820404052734375, -0.1741790771484375, -0.15015411376953125, -0.126129150390625, -0.10210418701171875, -0.0780792236328125, -0.05405426025390625, -0.030029296875, -0.00600433349609375, 0.0180206298828125, 0.04204559326171875, 0.066070556640625, 0.09009552001953125, 0.1141204833984375, 0.13814544677734375, 0.16217041015625, 0.18619537353515625, 0.2102203369140625, 0.23424530029296875, 0.258270263671875, 0.28229522705078125, 0.3063201904296875, 0.33034515380859375, 0.3543701171875, 0.37839508056640625, 0.4024200439453125, 0.42644500732421875, 0.450469970703125, 0.47449493408203125, 0.4985198974609375, 0.5225448608398438, 0.54656982421875, 0.5705947875976562, 0.5946197509765625, 0.6186447143554688, 0.642669677734375, 0.6666946411132812, 0.6907196044921875, 0.7147445678710938, 0.73876953125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 2.0, 10.0, 17.0, 25.0, 29.0, 39.0, 48.0, 65.0, 67.0, 91.0, 80.0, 85.0, 69.0, 76.0, 66.0, 56.0, 41.0, 29.0, 32.0, 18.0, 17.0, 8.0, 9.0, 6.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.284423828125, -0.2765789031982422, -0.2687339782714844, -0.26088905334472656, -0.25304412841796875, -0.24519920349121094, -0.23735427856445312, -0.2295093536376953, -0.2216644287109375, -0.2138195037841797, -0.20597457885742188, -0.19812965393066406, -0.19028472900390625, -0.18243980407714844, -0.17459487915039062, -0.1667499542236328, -0.158905029296875, -0.1510601043701172, -0.14321517944335938, -0.13537025451660156, -0.12752532958984375, -0.11968040466308594, -0.11183547973632812, -0.10399055480957031, -0.0961456298828125, -0.08830070495605469, -0.08045578002929688, -0.07261085510253906, -0.06476593017578125, -0.05692100524902344, -0.049076080322265625, -0.04123115539550781, -0.03338623046875, -0.025541305541992188, -0.017696380615234375, -0.009851455688476562, -0.00200653076171875, 0.0058383941650390625, 0.013683319091796875, 0.021528244018554688, 0.0293731689453125, 0.03721809387207031, 0.045063018798828125, 0.05290794372558594, 0.06075286865234375, 0.06859779357910156, 0.07644271850585938, 0.08428764343261719, 0.092132568359375, 0.09997749328613281, 0.10782241821289062, 0.11566734313964844, 0.12351226806640625, 0.13135719299316406, 0.13920211791992188, 0.1470470428466797, 0.1548919677734375, 0.1627368927001953, 0.17058181762695312, 0.17842674255371094, 0.18627166748046875, 0.19411659240722656, 0.20196151733398438, 0.2098064422607422, 0.2176513671875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 7.0, 5.0, 1.0, 9.0, 14.0, 17.0, 27.0, 38.0, 58.0, 86.0, 170.0, 290.0, 639.0, 1452.0, 4381.0, 15688.0, 82079.0, 617582.0, 275672.0, 36922.0, 8630.0, 2739.0, 1006.0, 440.0, 238.0, 144.0, 81.0, 42.0, 28.0, 23.0, 10.0, 14.0, 7.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.59375, -0.5750656127929688, -0.5563812255859375, -0.5376968383789062, -0.519012451171875, -0.5003280639648438, -0.4816436767578125, -0.46295928955078125, -0.44427490234375, -0.42559051513671875, -0.4069061279296875, -0.38822174072265625, -0.369537353515625, -0.35085296630859375, -0.3321685791015625, -0.31348419189453125, -0.2947998046875, -0.27611541748046875, -0.2574310302734375, -0.23874664306640625, -0.220062255859375, -0.20137786865234375, -0.1826934814453125, -0.16400909423828125, -0.14532470703125, -0.12664031982421875, -0.1079559326171875, -0.08927154541015625, -0.070587158203125, -0.05190277099609375, -0.0332183837890625, -0.01453399658203125, 0.004150390625, 0.02283477783203125, 0.0415191650390625, 0.06020355224609375, 0.078887939453125, 0.09757232666015625, 0.1162567138671875, 0.13494110107421875, 0.15362548828125, 0.17230987548828125, 0.1909942626953125, 0.20967864990234375, 0.228363037109375, 0.24704742431640625, 0.2657318115234375, 0.28441619873046875, 0.3031005859375, 0.32178497314453125, 0.3404693603515625, 0.35915374755859375, 0.377838134765625, 0.39652252197265625, 0.4152069091796875, 0.43389129638671875, 0.45257568359375, 0.47126007080078125, 0.4899444580078125, 0.5086288452148438, 0.527313232421875, 0.5459976196289062, 0.5646820068359375, 0.5833663940429688, 0.60205078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 5.0, 5.0, 13.0, 10.0, 16.0, 16.0, 20.0, 20.0, 21.0, 21.0, 29.0, 31.0, 28.0, 31.0, 46.0, 32.0, 46.0, 49.0, 34.0, 39.0, 52.0, 41.0, 50.0, 28.0, 40.0, 23.0, 34.0, 36.0, 30.0, 31.0, 23.0, 15.0, 14.0, 7.0, 10.0, 10.0, 9.0, 7.0, 2.0, 6.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.493896484375, -0.4783287048339844, -0.46276092529296875, -0.4471931457519531, -0.4316253662109375, -0.4160575866699219, -0.40048980712890625, -0.3849220275878906, -0.369354248046875, -0.3537864685058594, -0.33821868896484375, -0.3226509094238281, -0.3070831298828125, -0.2915153503417969, -0.27594757080078125, -0.2603797912597656, -0.24481201171875, -0.22924423217773438, -0.21367645263671875, -0.19810867309570312, -0.1825408935546875, -0.16697311401367188, -0.15140533447265625, -0.13583755493164062, -0.120269775390625, -0.10470199584960938, -0.08913421630859375, -0.07356643676757812, -0.0579986572265625, -0.042430877685546875, -0.02686309814453125, -0.011295318603515625, 0.0042724609375, 0.019840240478515625, 0.03540802001953125, 0.050975799560546875, 0.0665435791015625, 0.08211135864257812, 0.09767913818359375, 0.11324691772460938, 0.128814697265625, 0.14438247680664062, 0.15995025634765625, 0.17551803588867188, 0.1910858154296875, 0.20665359497070312, 0.22222137451171875, 0.23778915405273438, 0.25335693359375, 0.2689247131347656, 0.28449249267578125, 0.3000602722167969, 0.3156280517578125, 0.3311958312988281, 0.34676361083984375, 0.3623313903808594, 0.377899169921875, 0.3934669494628906, 0.40903472900390625, 0.4246025085449219, 0.4401702880859375, 0.4557380676269531, 0.47130584716796875, 0.4868736267089844, 0.50244140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 4.0, 8.0, 5.0, 20.0, 26.0, 53.0, 96.0, 188.0, 353.0, 902.0, 3289.0, 21723.0, 298388.0, 669272.0, 46018.0, 5937.0, 1325.0, 437.0, 234.0, 109.0, 79.0, 38.0, 23.0, 11.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.275146484375, -0.26421356201171875, -0.2532806396484375, -0.24234771728515625, -0.231414794921875, -0.22048187255859375, -0.2095489501953125, -0.19861602783203125, -0.18768310546875, -0.17675018310546875, -0.1658172607421875, -0.15488433837890625, -0.143951416015625, -0.13301849365234375, -0.1220855712890625, -0.11115264892578125, -0.1002197265625, -0.08928680419921875, -0.0783538818359375, -0.06742095947265625, -0.056488037109375, -0.04555511474609375, -0.0346221923828125, -0.02368927001953125, -0.01275634765625, -0.00182342529296875, 0.0091094970703125, 0.02004241943359375, 0.030975341796875, 0.04190826416015625, 0.0528411865234375, 0.06377410888671875, 0.07470703125, 0.08563995361328125, 0.0965728759765625, 0.10750579833984375, 0.118438720703125, 0.12937164306640625, 0.1403045654296875, 0.15123748779296875, 0.16217041015625, 0.17310333251953125, 0.1840362548828125, 0.19496917724609375, 0.205902099609375, 0.21683502197265625, 0.2277679443359375, 0.23870086669921875, 0.2496337890625, 0.26056671142578125, 0.2714996337890625, 0.28243255615234375, 0.293365478515625, 0.30429840087890625, 0.3152313232421875, 0.32616424560546875, 0.33709716796875, 0.34803009033203125, 0.3589630126953125, 0.36989593505859375, 0.380828857421875, 0.39176177978515625, 0.4026947021484375, 0.41362762451171875, 0.424560546875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 12.0, 6.0, 7.0, 18.0, 24.0, 51.0, 77.0, 117.0, 170.0, 176.0, 128.0, 74.0, 46.0, 37.0, 25.0, 13.0, 5.0, 6.0, 8.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.470348358154297e-05, -4.233699291944504e-05, -3.997050225734711e-05, -3.7604011595249176e-05, -3.5237520933151245e-05, -3.2871030271053314e-05, -3.0504539608955383e-05, -2.8138048946857452e-05, -2.577155828475952e-05, -2.340506762266159e-05, -2.103857696056366e-05, -1.867208629846573e-05, -1.6305595636367798e-05, -1.3939104974269867e-05, -1.1572614312171936e-05, -9.206123650074005e-06, -6.839632987976074e-06, -4.473142325878143e-06, -2.1066516637802124e-06, 2.598389983177185e-07, 2.6263296604156494e-06, 4.99282032251358e-06, 7.359310984611511e-06, 9.725801646709442e-06, 1.2092292308807373e-05, 1.4458782970905304e-05, 1.6825273633003235e-05, 1.9191764295101166e-05, 2.1558254957199097e-05, 2.3924745619297028e-05, 2.629123628139496e-05, 2.865772694349289e-05, 3.102421760559082e-05, 3.339070826768875e-05, 3.575719892978668e-05, 3.812368959188461e-05, 4.0490180253982544e-05, 4.2856670916080475e-05, 4.5223161578178406e-05, 4.758965224027634e-05, 4.995614290237427e-05, 5.23226335644722e-05, 5.468912422657013e-05, 5.705561488866806e-05, 5.942210555076599e-05, 6.178859621286392e-05, 6.415508687496185e-05, 6.652157753705978e-05, 6.888806819915771e-05, 7.125455886125565e-05, 7.362104952335358e-05, 7.598754018545151e-05, 7.835403084754944e-05, 8.072052150964737e-05, 8.30870121717453e-05, 8.545350283384323e-05, 8.781999349594116e-05, 9.018648415803909e-05, 9.255297482013702e-05, 9.491946548223495e-05, 9.728595614433289e-05, 9.965244680643082e-05, 0.00010201893746852875, 0.00010438542813062668, 0.00010675191879272461]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 8.0, 15.0, 12.0, 17.0, 42.0, 56.0, 106.0, 229.0, 423.0, 1086.0, 2659.0, 7535.0, 23250.0, 91196.0, 430330.0, 380465.0, 79722.0, 20715.0, 6406.0, 2359.0, 954.0, 444.0, 222.0, 110.0, 68.0, 49.0, 26.0, 12.0, 10.0, 8.0, 3.0, 8.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.252197265625, -0.2449817657470703, -0.23776626586914062, -0.23055076599121094, -0.22333526611328125, -0.21611976623535156, -0.20890426635742188, -0.2016887664794922, -0.1944732666015625, -0.1872577667236328, -0.18004226684570312, -0.17282676696777344, -0.16561126708984375, -0.15839576721191406, -0.15118026733398438, -0.1439647674560547, -0.136749267578125, -0.1295337677001953, -0.12231826782226562, -0.11510276794433594, -0.10788726806640625, -0.10067176818847656, -0.09345626831054688, -0.08624076843261719, -0.0790252685546875, -0.07180976867675781, -0.06459426879882812, -0.05737876892089844, -0.05016326904296875, -0.04294776916503906, -0.035732269287109375, -0.028516769409179688, -0.02130126953125, -0.014085769653320312, -0.006870269775390625, 0.0003452301025390625, 0.00756072998046875, 0.014776229858398438, 0.021991729736328125, 0.029207229614257812, 0.0364227294921875, 0.04363822937011719, 0.050853729248046875, 0.05806922912597656, 0.06528472900390625, 0.07250022888183594, 0.07971572875976562, 0.08693122863769531, 0.094146728515625, 0.10136222839355469, 0.10857772827148438, 0.11579322814941406, 0.12300872802734375, 0.13022422790527344, 0.13743972778320312, 0.1446552276611328, 0.1518707275390625, 0.1590862274169922, 0.16630172729492188, 0.17351722717285156, 0.18073272705078125, 0.18794822692871094, 0.19516372680664062, 0.2023792266845703, 0.2095947265625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 3.0, 10.0, 7.0, 15.0, 15.0, 11.0, 25.0, 33.0, 30.0, 35.0, 56.0, 61.0, 47.0, 54.0, 53.0, 85.0, 77.0, 61.0, 41.0, 48.0, 41.0, 33.0, 30.0, 21.0, 30.0, 18.0, 11.0, 12.0, 10.0, 7.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1517333984375, -0.14715003967285156, -0.14256668090820312, -0.1379833221435547, -0.13339996337890625, -0.1288166046142578, -0.12423324584960938, -0.11964988708496094, -0.1150665283203125, -0.11048316955566406, -0.10589981079101562, -0.10131645202636719, -0.09673309326171875, -0.09214973449707031, -0.08756637573242188, -0.08298301696777344, -0.078399658203125, -0.07381629943847656, -0.06923294067382812, -0.06464958190917969, -0.06006622314453125, -0.05548286437988281, -0.050899505615234375, -0.04631614685058594, -0.0417327880859375, -0.03714942932128906, -0.032566070556640625, -0.027982711791992188, -0.02339935302734375, -0.018815994262695312, -0.014232635498046875, -0.009649276733398438, -0.00506591796875, -0.0004825592041015625, 0.004100799560546875, 0.008684158325195312, 0.01326751708984375, 0.017850875854492188, 0.022434234619140625, 0.027017593383789062, 0.0316009521484375, 0.03618431091308594, 0.040767669677734375, 0.04535102844238281, 0.04993438720703125, 0.05451774597167969, 0.059101104736328125, 0.06368446350097656, 0.068267822265625, 0.07285118103027344, 0.07743453979492188, 0.08201789855957031, 0.08660125732421875, 0.09118461608886719, 0.09576797485351562, 0.10035133361816406, 0.1049346923828125, 0.10951805114746094, 0.11410140991210938, 0.11868476867675781, 0.12326812744140625, 0.1278514862060547, 0.13243484497070312, 0.13701820373535156, 0.1416015625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 13.0, 16.0, 31.0, 79.0, 155.0, 207.0, 233.0, 137.0, 84.0, 28.0, 11.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.218921661376953, -9.038656234741211, -8.858390808105469, -8.678125381469727, -8.497859001159668, -8.317593574523926, -8.137328147888184, -7.957062721252441, -7.776797294616699, -7.596531867980957, -7.416265964508057, -7.2360005378723145, -7.055735111236572, -6.875469207763672, -6.69520378112793, -6.5149383544921875, -6.334672451019287, -6.154407024383545, -5.9741411209106445, -5.793875694274902, -5.61361026763916, -5.433344841003418, -5.253078937530518, -5.072813510894775, -4.892547607421875, -4.712282180786133, -4.532016277313232, -4.35175085067749, -4.171485424041748, -3.9912197589874268, -3.8109540939331055, -3.6306886672973633, -3.450423002243042, -3.2701573371887207, -3.0898919105529785, -2.9096262454986572, -2.729360580444336, -2.5490951538085938, -2.3688294887542725, -2.188563823699951, -2.008298397064209, -1.8280328512191772, -1.6477673053741455, -1.4675016403198242, -1.2872360944747925, -1.1069705486297607, -0.9267048835754395, -0.7464393377304077, -0.566173791885376, -0.38590821623802185, -0.20564264059066772, -0.02537703514099121, 0.15488851070404053, 0.33515405654907227, 0.5154197216033936, 0.6956852674484253, 0.875950813293457, 1.0562163591384888, 1.2364819049835205, 1.4167475700378418, 1.5970131158828735, 1.7772786617279053, 1.9575443267822266, 2.1378097534179688, 2.31807541847229]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 4.0, 3.0, 7.0, 13.0, 10.0, 8.0, 16.0, 21.0, 21.0, 13.0, 14.0, 31.0, 24.0, 34.0, 48.0, 44.0, 39.0, 36.0, 46.0, 41.0, 32.0, 43.0, 40.0, 41.0, 41.0, 40.0, 25.0, 34.0, 30.0, 31.0, 27.0, 24.0, 19.0, 19.0, 12.0, 11.0, 15.0, 12.0, 3.0, 5.0, 8.0, 9.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2936625480651855, -2.2171123027801514, -2.140562057495117, -2.064011573791504, -1.9874613285064697, -1.9109110832214355, -1.8343608379364014, -1.7578105926513672, -1.6812602281570435, -1.6047099828720093, -1.5281596183776855, -1.4516093730926514, -1.3750591278076172, -1.2985087633132935, -1.2219585180282593, -1.1454081535339355, -1.0688579082489014, -0.9923076033592224, -0.9157572984695435, -0.8392070531845093, -0.7626567482948303, -0.6861064434051514, -0.6095561981201172, -0.5330058932304382, -0.4564555883407593, -0.3799052834510803, -0.30335500836372375, -0.226804718375206, -0.15025442838668823, -0.07370412349700928, 0.00284615159034729, 0.07939642667770386, 0.1559467315673828, 0.23249702155590057, 0.30904731154441833, 0.3855975866317749, 0.46214789152145386, 0.5386981964111328, 0.615248441696167, 0.691798746585846, 0.7683490514755249, 0.8448993563652039, 0.9214496612548828, 0.997999906539917, 1.0745501518249512, 1.151100516319275, 1.227650761604309, 1.3042011260986328, 1.380751371383667, 1.4573016166687012, 1.533851981163025, 1.610402226448059, 1.6869525909423828, 1.763502836227417, 1.8400530815124512, 1.9166033267974854, 1.993153691291809, 2.069704055786133, 2.146254301071167, 2.222804546356201, 2.2993547916412354, 2.3759050369262695, 2.452455520629883, 2.529005765914917, 2.605556011199951]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 3.0, 9.0, 13.0, 9.0, 16.0, 25.0, 30.0, 49.0, 58.0, 107.0, 165.0, 220.0, 465.0, 893.0, 2296.0, 8157.0, 118049.0, 4043248.0, 14496.0, 3432.0, 1251.0, 577.0, 294.0, 151.0, 89.0, 60.0, 35.0, 23.0, 14.0, 14.0, 8.0, 4.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.5, -2.4308624267578125, -2.361724853515625, -2.2925872802734375, -2.22344970703125, -2.1543121337890625, -2.085174560546875, -2.0160369873046875, -1.9468994140625, -1.8777618408203125, -1.808624267578125, -1.7394866943359375, -1.67034912109375, -1.6012115478515625, -1.532073974609375, -1.4629364013671875, -1.393798828125, -1.3246612548828125, -1.255523681640625, -1.1863861083984375, -1.11724853515625, -1.0481109619140625, -0.978973388671875, -0.9098358154296875, -0.8406982421875, -0.7715606689453125, -0.702423095703125, -0.6332855224609375, -0.56414794921875, -0.4950103759765625, -0.425872802734375, -0.3567352294921875, -0.28759765625, -0.2184600830078125, -0.149322509765625, -0.0801849365234375, -0.01104736328125, 0.0580902099609375, 0.127227783203125, 0.1963653564453125, 0.2655029296875, 0.3346405029296875, 0.403778076171875, 0.4729156494140625, 0.54205322265625, 0.6111907958984375, 0.680328369140625, 0.7494659423828125, 0.818603515625, 0.8877410888671875, 0.956878662109375, 1.0260162353515625, 1.09515380859375, 1.1642913818359375, 1.233428955078125, 1.3025665283203125, 1.3717041015625, 1.4408416748046875, 1.509979248046875, 1.5791168212890625, 1.64825439453125, 1.7173919677734375, 1.786529541015625, 1.8556671142578125, 1.9248046875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 3.0, 7.0, 8.0, 18.0, 27.0, 31.0, 35.0, 63.0, 49.0, 63.0, 83.0, 108.0, 82.0, 83.0, 71.0, 57.0, 64.0, 34.0, 32.0, 26.0, 21.0, 9.0, 11.0, 12.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.283447265625, -0.2753753662109375, -0.267303466796875, -0.2592315673828125, -0.25115966796875, -0.2430877685546875, -0.235015869140625, -0.2269439697265625, -0.2188720703125, -0.2108001708984375, -0.202728271484375, -0.1946563720703125, -0.18658447265625, -0.1785125732421875, -0.170440673828125, -0.1623687744140625, -0.154296875, -0.1462249755859375, -0.138153076171875, -0.1300811767578125, -0.12200927734375, -0.1139373779296875, -0.105865478515625, -0.0977935791015625, -0.0897216796875, -0.0816497802734375, -0.073577880859375, -0.0655059814453125, -0.05743408203125, -0.0493621826171875, -0.041290283203125, -0.0332183837890625, -0.025146484375, -0.0170745849609375, -0.009002685546875, -0.0009307861328125, 0.00714111328125, 0.0152130126953125, 0.023284912109375, 0.0313568115234375, 0.0394287109375, 0.0475006103515625, 0.055572509765625, 0.0636444091796875, 0.07171630859375, 0.0797882080078125, 0.087860107421875, 0.0959320068359375, 0.10400390625, 0.1120758056640625, 0.120147705078125, 0.1282196044921875, 0.13629150390625, 0.1443634033203125, 0.152435302734375, 0.1605072021484375, 0.1685791015625, 0.1766510009765625, 0.184722900390625, 0.1927947998046875, 0.20086669921875, 0.2089385986328125, 0.217010498046875, 0.2250823974609375, 0.233154296875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 9.0, 13.0, 15.0, 26.0, 50.0, 46.0, 72.0, 143.0, 227.0, 337.0, 640.0, 1148.0, 2489.0, 6286.0, 22470.0, 3946624.0, 190844.0, 13975.0, 4655.0, 1922.0, 946.0, 505.0, 283.0, 189.0, 129.0, 81.0, 54.0, 32.0, 28.0, 11.0, 8.0, 8.0, 4.0, 8.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5947265625, -1.5353240966796875, -1.475921630859375, -1.4165191650390625, -1.35711669921875, -1.2977142333984375, -1.238311767578125, -1.1789093017578125, -1.1195068359375, -1.0601043701171875, -1.000701904296875, -0.9412994384765625, -0.88189697265625, -0.8224945068359375, -0.763092041015625, -0.7036895751953125, -0.644287109375, -0.5848846435546875, -0.525482177734375, -0.4660797119140625, -0.40667724609375, -0.3472747802734375, -0.287872314453125, -0.2284698486328125, -0.1690673828125, -0.1096649169921875, -0.050262451171875, 0.0091400146484375, 0.06854248046875, 0.1279449462890625, 0.187347412109375, 0.2467498779296875, 0.30615234375, 0.3655548095703125, 0.424957275390625, 0.4843597412109375, 0.54376220703125, 0.6031646728515625, 0.662567138671875, 0.7219696044921875, 0.7813720703125, 0.8407745361328125, 0.900177001953125, 0.9595794677734375, 1.01898193359375, 1.0783843994140625, 1.137786865234375, 1.1971893310546875, 1.256591796875, 1.3159942626953125, 1.375396728515625, 1.4347991943359375, 1.49420166015625, 1.5536041259765625, 1.613006591796875, 1.6724090576171875, 1.7318115234375, 1.7912139892578125, 1.850616455078125, 1.9100189208984375, 1.96942138671875, 2.0288238525390625, 2.088226318359375, 2.1476287841796875, 2.20703125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 5.0, 3.0, 2.0, 6.0, 7.0, 12.0, 7.0, 13.0, 19.0, 68.0, 176.0, 3184.0, 383.0, 91.0, 45.0, 18.0, 7.0, 9.0, 7.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60302734375, -0.5804290771484375, -0.557830810546875, -0.5352325439453125, -0.51263427734375, -0.4900360107421875, -0.467437744140625, -0.4448394775390625, -0.4222412109375, -0.3996429443359375, -0.377044677734375, -0.3544464111328125, -0.33184814453125, -0.3092498779296875, -0.286651611328125, -0.2640533447265625, -0.241455078125, -0.2188568115234375, -0.196258544921875, -0.1736602783203125, -0.15106201171875, -0.1284637451171875, -0.105865478515625, -0.0832672119140625, -0.0606689453125, -0.0380706787109375, -0.015472412109375, 0.0071258544921875, 0.02972412109375, 0.0523223876953125, 0.074920654296875, 0.0975189208984375, 0.1201171875, 0.1427154541015625, 0.165313720703125, 0.1879119873046875, 0.21051025390625, 0.2331085205078125, 0.255706787109375, 0.2783050537109375, 0.3009033203125, 0.3235015869140625, 0.346099853515625, 0.3686981201171875, 0.39129638671875, 0.4138946533203125, 0.436492919921875, 0.4590911865234375, 0.481689453125, 0.5042877197265625, 0.526885986328125, 0.5494842529296875, 0.57208251953125, 0.5946807861328125, 0.617279052734375, 0.6398773193359375, 0.6624755859375, 0.6850738525390625, 0.707672119140625, 0.7302703857421875, 0.75286865234375, 0.7754669189453125, 0.798065185546875, 0.8206634521484375, 0.84326171875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 9.0, 21.0, 77.0, 388.0, 414.0, 63.0, 25.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.38399887084961, -11.125666618347168, -10.86733341217041, -10.609001159667969, -10.350668907165527, -10.092336654663086, -9.834003448486328, -9.575671195983887, -9.317338943481445, -9.059006690979004, -8.800673484802246, -8.542341232299805, -8.284008979797363, -8.025676727294922, -7.767343521118164, -7.509011268615723, -7.250678062438965, -6.992345333099365, -6.734013080596924, -6.475680351257324, -6.217348098754883, -5.959015369415283, -5.700682640075684, -5.442350387573242, -5.184017658233643, -4.925684928894043, -4.667352676391602, -4.409019947052002, -4.150687217712402, -3.892354965209961, -3.6340222358703613, -3.375689744949341, -3.117356300354004, -2.8590238094329834, -2.600691318511963, -2.3423585891723633, -2.0840260982513428, -1.8256936073303223, -1.5673609972000122, -1.3090283870697021, -1.0506958961486816, -0.7923633456230164, -0.5340307950973511, -0.2756982445716858, -0.017365694046020508, 0.240966796875, 0.49929940700531006, 0.7576320171356201, 1.0159645080566406, 1.2742969989776611, 1.5326296091079712, 1.7909622192382812, 2.0492947101593018, 2.3076272010803223, 2.565959930419922, 2.8242924213409424, 3.082624912261963, 3.3409574031829834, 3.599289894104004, 3.8576226234436035, 4.115955352783203, 4.3742876052856445, 4.632620334625244, 4.890953063964844, 5.149285316467285]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 6.0, 9.0, 25.0, 29.0, 46.0, 54.0, 67.0, 101.0, 94.0, 112.0, 102.0, 102.0, 88.0, 69.0, 40.0, 21.0, 16.0, 9.0, 7.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1993274688720703, -3.115741491317749, -3.0321555137634277, -2.9485695362091064, -2.864983558654785, -2.781397819519043, -2.6978116035461426, -2.6142258644104004, -2.530639886856079, -2.447053909301758, -2.3634679317474365, -2.2798819541931152, -2.196295976638794, -2.1127099990844727, -2.0291242599487305, -1.9455382823944092, -1.8619521856307983, -1.778366208076477, -1.6947802305221558, -1.611194372177124, -1.5276083946228027, -1.4440224170684814, -1.3604364395141602, -1.2768504619598389, -1.1932644844055176, -1.1096785068511963, -1.026092529296875, -0.9425066113471985, -0.858920693397522, -0.7753347158432007, -0.6917487382888794, -0.6081628203392029, -0.5245769023895264, -0.44099095463752747, -0.35740500688552856, -0.2738190293312073, -0.19023308157920837, -0.10664713382720947, -0.023061156272888184, 0.06052476167678833, 0.14411073923110962, 0.22769668698310852, 0.3112826347351074, 0.3948686122894287, 0.4784545600414276, 0.5620405077934265, 0.6456264853477478, 0.7292124032974243, 0.8127983808517456, 0.8963843584060669, 0.9799702763557434, 1.06355619430542, 1.1471421718597412, 1.2307281494140625, 1.3143141269683838, 1.397900104522705, 1.4814860820770264, 1.5650720596313477, 1.648658037185669, 1.7322440147399902, 1.815829873085022, 1.8994158506393433, 1.9830018281936646, 2.0665876865386963, 2.1501736640930176]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 5.0, 3.0, 3.0, 4.0, 4.0, 10.0, 18.0, 20.0, 16.0, 28.0, 37.0, 71.0, 88.0, 133.0, 226.0, 344.0, 610.0, 1104.0, 2405.0, 5647.0, 19052.0, 96586.0, 666151.0, 209208.0, 31882.0, 8447.0, 3077.0, 1394.0, 724.0, 445.0, 240.0, 174.0, 125.0, 71.0, 54.0, 37.0, 38.0, 21.0, 10.0, 4.0, 14.0, 13.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.0302734375, -1.0005645751953125, -0.970855712890625, -0.9411468505859375, -0.91143798828125, -0.8817291259765625, -0.852020263671875, -0.8223114013671875, -0.7926025390625, -0.7628936767578125, -0.733184814453125, -0.7034759521484375, -0.67376708984375, -0.6440582275390625, -0.614349365234375, -0.5846405029296875, -0.554931640625, -0.5252227783203125, -0.495513916015625, -0.4658050537109375, -0.43609619140625, -0.4063873291015625, -0.376678466796875, -0.3469696044921875, -0.3172607421875, -0.2875518798828125, -0.257843017578125, -0.2281341552734375, -0.19842529296875, -0.1687164306640625, -0.139007568359375, -0.1092987060546875, -0.07958984375, -0.0498809814453125, -0.020172119140625, 0.0095367431640625, 0.03924560546875, 0.0689544677734375, 0.098663330078125, 0.1283721923828125, 0.1580810546875, 0.1877899169921875, 0.217498779296875, 0.2472076416015625, 0.27691650390625, 0.3066253662109375, 0.336334228515625, 0.3660430908203125, 0.395751953125, 0.4254608154296875, 0.455169677734375, 0.4848785400390625, 0.51458740234375, 0.5442962646484375, 0.574005126953125, 0.6037139892578125, 0.6334228515625, 0.6631317138671875, 0.692840576171875, 0.7225494384765625, 0.75225830078125, 0.7819671630859375, 0.811676025390625, 0.8413848876953125, 0.87109375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 4.0, 9.0, 8.0, 16.0, 21.0, 29.0, 43.0, 37.0, 62.0, 71.0, 76.0, 116.0, 67.0, 84.0, 66.0, 74.0, 46.0, 45.0, 28.0, 33.0, 22.0, 18.0, 13.0, 10.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302001953125, -0.2931938171386719, -0.28438568115234375, -0.2755775451660156, -0.2667694091796875, -0.2579612731933594, -0.24915313720703125, -0.24034500122070312, -0.231536865234375, -0.22272872924804688, -0.21392059326171875, -0.20511245727539062, -0.1963043212890625, -0.18749618530273438, -0.17868804931640625, -0.16987991333007812, -0.16107177734375, -0.15226364135742188, -0.14345550537109375, -0.13464736938476562, -0.1258392333984375, -0.11703109741210938, -0.10822296142578125, -0.09941482543945312, -0.090606689453125, -0.08179855346679688, -0.07299041748046875, -0.06418228149414062, -0.0553741455078125, -0.046566009521484375, -0.03775787353515625, -0.028949737548828125, -0.0201416015625, -0.011333465576171875, -0.00252532958984375, 0.006282806396484375, 0.0150909423828125, 0.023899078369140625, 0.03270721435546875, 0.041515350341796875, 0.050323486328125, 0.059131622314453125, 0.06793975830078125, 0.07674789428710938, 0.0855560302734375, 0.09436416625976562, 0.10317230224609375, 0.11198043823242188, 0.12078857421875, 0.12959671020507812, 0.13840484619140625, 0.14721298217773438, 0.1560211181640625, 0.16482925415039062, 0.17363739013671875, 0.18244552612304688, 0.191253662109375, 0.20006179809570312, 0.20886993408203125, 0.21767807006835938, 0.2264862060546875, 0.23529434204101562, 0.24410247802734375, 0.2529106140136719, 0.26171875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 7.0, 9.0, 16.0, 13.0, 20.0, 35.0, 50.0, 70.0, 99.0, 156.0, 305.0, 512.0, 975.0, 2129.0, 5923.0, 18402.0, 76256.0, 468128.0, 386369.0, 63851.0, 15856.0, 5212.0, 2047.0, 896.0, 461.0, 272.0, 149.0, 100.0, 62.0, 48.0, 43.0, 23.0, 14.0, 16.0, 6.0, 3.0, 7.0, 7.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.580078125, -0.562469482421875, -0.54486083984375, -0.527252197265625, -0.5096435546875, -0.492034912109375, -0.47442626953125, -0.456817626953125, -0.439208984375, -0.421600341796875, -0.40399169921875, -0.386383056640625, -0.3687744140625, -0.351165771484375, -0.33355712890625, -0.315948486328125, -0.29833984375, -0.280731201171875, -0.26312255859375, -0.245513916015625, -0.2279052734375, -0.210296630859375, -0.19268798828125, -0.175079345703125, -0.157470703125, -0.139862060546875, -0.12225341796875, -0.104644775390625, -0.0870361328125, -0.069427490234375, -0.05181884765625, -0.034210205078125, -0.0166015625, 0.001007080078125, 0.01861572265625, 0.036224365234375, 0.0538330078125, 0.071441650390625, 0.08905029296875, 0.106658935546875, 0.124267578125, 0.141876220703125, 0.15948486328125, 0.177093505859375, 0.1947021484375, 0.212310791015625, 0.22991943359375, 0.247528076171875, 0.26513671875, 0.282745361328125, 0.30035400390625, 0.317962646484375, 0.3355712890625, 0.353179931640625, 0.37078857421875, 0.388397216796875, 0.406005859375, 0.423614501953125, 0.44122314453125, 0.458831787109375, 0.4764404296875, 0.494049072265625, 0.51165771484375, 0.529266357421875, 0.546875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 5.0, 6.0, 10.0, 12.0, 12.0, 15.0, 18.0, 19.0, 31.0, 23.0, 30.0, 36.0, 43.0, 43.0, 42.0, 46.0, 43.0, 39.0, 34.0, 47.0, 46.0, 35.0, 47.0, 42.0, 34.0, 42.0, 31.0, 27.0, 26.0, 23.0, 20.0, 16.0, 15.0, 11.0, 5.0, 8.0, 10.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6689453125, -0.649139404296875, -0.62933349609375, -0.609527587890625, -0.5897216796875, -0.569915771484375, -0.55010986328125, -0.530303955078125, -0.510498046875, -0.490692138671875, -0.47088623046875, -0.451080322265625, -0.4312744140625, -0.411468505859375, -0.39166259765625, -0.371856689453125, -0.35205078125, -0.332244873046875, -0.31243896484375, -0.292633056640625, -0.2728271484375, -0.253021240234375, -0.23321533203125, -0.213409423828125, -0.193603515625, -0.173797607421875, -0.15399169921875, -0.134185791015625, -0.1143798828125, -0.094573974609375, -0.07476806640625, -0.054962158203125, -0.03515625, -0.015350341796875, 0.00445556640625, 0.024261474609375, 0.0440673828125, 0.063873291015625, 0.08367919921875, 0.103485107421875, 0.123291015625, 0.143096923828125, 0.16290283203125, 0.182708740234375, 0.2025146484375, 0.222320556640625, 0.24212646484375, 0.261932373046875, 0.28173828125, 0.301544189453125, 0.32135009765625, 0.341156005859375, 0.3609619140625, 0.380767822265625, 0.40057373046875, 0.420379638671875, 0.440185546875, 0.459991455078125, 0.47979736328125, 0.499603271484375, 0.5194091796875, 0.539215087890625, 0.55902099609375, 0.578826904296875, 0.5986328125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 7.0, 3.0, 10.0, 23.0, 22.0, 44.0, 78.0, 151.0, 262.0, 532.0, 1014.0, 2393.0, 6419.0, 24129.0, 211515.0, 712925.0, 69224.0, 12630.0, 3945.0, 1609.0, 748.0, 395.0, 194.0, 119.0, 68.0, 33.0, 33.0, 10.0, 5.0, 12.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.361083984375, -0.35189056396484375, -0.3426971435546875, -0.33350372314453125, -0.324310302734375, -0.31511688232421875, -0.3059234619140625, -0.29673004150390625, -0.28753662109375, -0.27834320068359375, -0.2691497802734375, -0.25995635986328125, -0.250762939453125, -0.24156951904296875, -0.2323760986328125, -0.22318267822265625, -0.2139892578125, -0.20479583740234375, -0.1956024169921875, -0.18640899658203125, -0.177215576171875, -0.16802215576171875, -0.1588287353515625, -0.14963531494140625, -0.14044189453125, -0.13124847412109375, -0.1220550537109375, -0.11286163330078125, -0.103668212890625, -0.09447479248046875, -0.0852813720703125, -0.07608795166015625, -0.06689453125, -0.05770111083984375, -0.0485076904296875, -0.03931427001953125, -0.030120849609375, -0.02092742919921875, -0.0117340087890625, -0.00254058837890625, 0.00665283203125, 0.01584625244140625, 0.0250396728515625, 0.03423309326171875, 0.043426513671875, 0.05261993408203125, 0.0618133544921875, 0.07100677490234375, 0.0802001953125, 0.08939361572265625, 0.0985870361328125, 0.10778045654296875, 0.116973876953125, 0.12616729736328125, 0.1353607177734375, 0.14455413818359375, 0.15374755859375, 0.16294097900390625, 0.1721343994140625, 0.18132781982421875, 0.190521240234375, 0.19971466064453125, 0.2089080810546875, 0.21810150146484375, 0.227294921875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 8.0, 14.0, 9.0, 38.0, 52.0, 74.0, 128.0, 196.0, 181.0, 109.0, 83.0, 42.0, 24.0, 11.0, 4.0, 4.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.204843521118164e-05, -5.9645622968673706e-05, -5.724281072616577e-05, -5.483999848365784e-05, -5.24371862411499e-05, -5.003437399864197e-05, -4.763156175613403e-05, -4.52287495136261e-05, -4.2825937271118164e-05, -4.042312502861023e-05, -3.8020312786102295e-05, -3.561750054359436e-05, -3.3214688301086426e-05, -3.081187605857849e-05, -2.8409063816070557e-05, -2.6006251573562622e-05, -2.3603439331054688e-05, -2.1200627088546753e-05, -1.879781484603882e-05, -1.6395002603530884e-05, -1.399219036102295e-05, -1.1589378118515015e-05, -9.18656587600708e-06, -6.7837536334991455e-06, -4.380941390991211e-06, -1.9781291484832764e-06, 4.246830940246582e-07, 2.8274953365325928e-06, 5.230307579040527e-06, 7.633119821548462e-06, 1.0035932064056396e-05, 1.2438744306564331e-05, 1.4841556549072266e-05, 1.72443687915802e-05, 1.9647181034088135e-05, 2.204999327659607e-05, 2.4452805519104004e-05, 2.685561776161194e-05, 2.9258430004119873e-05, 3.166124224662781e-05, 3.406405448913574e-05, 3.646686673164368e-05, 3.886967897415161e-05, 4.1272491216659546e-05, 4.367530345916748e-05, 4.6078115701675415e-05, 4.848092794418335e-05, 5.0883740186691284e-05, 5.328655242919922e-05, 5.568936467170715e-05, 5.809217691421509e-05, 6.049498915672302e-05, 6.289780139923096e-05, 6.530061364173889e-05, 6.770342588424683e-05, 7.010623812675476e-05, 7.25090503692627e-05, 7.491186261177063e-05, 7.731467485427856e-05, 7.97174870967865e-05, 8.212029933929443e-05, 8.452311158180237e-05, 8.69259238243103e-05, 8.932873606681824e-05, 9.173154830932617e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 8.0, 11.0, 16.0, 18.0, 39.0, 51.0, 88.0, 110.0, 199.0, 332.0, 622.0, 1207.0, 2348.0, 5606.0, 17403.0, 93781.0, 708789.0, 178970.0, 25393.0, 7351.0, 3029.0, 1385.0, 738.0, 403.0, 218.0, 160.0, 99.0, 62.0, 39.0, 24.0, 19.0, 17.0, 1.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.28515625, -0.275848388671875, -0.26654052734375, -0.257232666015625, -0.2479248046875, -0.238616943359375, -0.22930908203125, -0.220001220703125, -0.210693359375, -0.201385498046875, -0.19207763671875, -0.182769775390625, -0.1734619140625, -0.164154052734375, -0.15484619140625, -0.145538330078125, -0.13623046875, -0.126922607421875, -0.11761474609375, -0.108306884765625, -0.0989990234375, -0.089691162109375, -0.08038330078125, -0.071075439453125, -0.061767578125, -0.052459716796875, -0.04315185546875, -0.033843994140625, -0.0245361328125, -0.015228271484375, -0.00592041015625, 0.003387451171875, 0.0126953125, 0.022003173828125, 0.03131103515625, 0.040618896484375, 0.0499267578125, 0.059234619140625, 0.06854248046875, 0.077850341796875, 0.087158203125, 0.096466064453125, 0.10577392578125, 0.115081787109375, 0.1243896484375, 0.133697509765625, 0.14300537109375, 0.152313232421875, 0.16162109375, 0.170928955078125, 0.18023681640625, 0.189544677734375, 0.1988525390625, 0.208160400390625, 0.21746826171875, 0.226776123046875, 0.236083984375, 0.245391845703125, 0.25469970703125, 0.264007568359375, 0.2733154296875, 0.282623291015625, 0.29193115234375, 0.301239013671875, 0.310546875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 8.0, 5.0, 16.0, 14.0, 21.0, 27.0, 36.0, 43.0, 78.0, 80.0, 107.0, 90.0, 102.0, 87.0, 71.0, 51.0, 44.0, 28.0, 20.0, 13.0, 8.0, 13.0, 8.0, 4.0, 7.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2091064453125, -0.2022686004638672, -0.19543075561523438, -0.18859291076660156, -0.18175506591796875, -0.17491722106933594, -0.16807937622070312, -0.1612415313720703, -0.1544036865234375, -0.1475658416748047, -0.14072799682617188, -0.13389015197753906, -0.12705230712890625, -0.12021446228027344, -0.11337661743164062, -0.10653877258300781, -0.099700927734375, -0.09286308288574219, -0.08602523803710938, -0.07918739318847656, -0.07234954833984375, -0.06551170349121094, -0.058673858642578125, -0.05183601379394531, -0.0449981689453125, -0.03816032409667969, -0.031322479248046875, -0.024484634399414062, -0.01764678955078125, -0.010808944702148438, -0.003971099853515625, 0.0028667449951171875, 0.00970458984375, 0.016542434692382812, 0.023380279541015625, 0.030218124389648438, 0.03705596923828125, 0.04389381408691406, 0.050731658935546875, 0.05756950378417969, 0.0644073486328125, 0.07124519348144531, 0.07808303833007812, 0.08492088317871094, 0.09175872802734375, 0.09859657287597656, 0.10543441772460938, 0.11227226257324219, 0.119110107421875, 0.1259479522705078, 0.13278579711914062, 0.13962364196777344, 0.14646148681640625, 0.15329933166503906, 0.16013717651367188, 0.1669750213623047, 0.1738128662109375, 0.1806507110595703, 0.18748855590820312, 0.19432640075683594, 0.20116424560546875, 0.20800209045410156, 0.21483993530273438, 0.2216777801513672, 0.228515625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 20.0, 107.0, 475.0, 323.0, 72.0, 11.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.858182907104492, -4.408928394317627, -3.9596736431121826, -3.5104188919067383, -3.061164379119873, -2.6119096279144287, -2.1626548767089844, -1.7134003639221191, -1.2641456127166748, -0.81489098072052, -0.36563628911972046, 0.0836184024810791, 0.5328730344772339, 0.9821276664733887, 1.431382417678833, 1.8806369304656982, 2.3298916816711426, 2.779146432876587, 3.228400945663452, 3.6776556968688965, 4.126910209655762, 4.576165199279785, 5.02541971206665, 5.474674224853516, 5.923929214477539, 6.373183727264404, 6.822438716888428, 7.271693229675293, 7.720947742462158, 8.170202255249023, 8.619457244873047, 9.06871223449707, 9.517966270446777, 9.9672212600708, 10.416475296020508, 10.865730285644531, 11.314985275268555, 11.764239311218262, 12.213494300842285, 12.662748336791992, 13.112003326416016, 13.561258316040039, 14.010512351989746, 14.45976734161377, 14.909022331237793, 15.3582763671875, 15.807531356811523, 16.256786346435547, 16.70604133605957, 17.155296325683594, 17.604551315307617, 18.05380630493164, 18.50305938720703, 18.952314376831055, 19.401569366455078, 19.8508243560791, 20.300077438354492, 20.749332427978516, 21.19858741760254, 21.647842407226562, 22.097095489501953, 22.546350479125977, 22.99560546875, 23.444860458374023, 23.894115447998047]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 4.0, 3.0, 5.0, 10.0, 9.0, 6.0, 11.0, 17.0, 15.0, 19.0, 20.0, 14.0, 32.0, 29.0, 40.0, 30.0, 45.0, 51.0, 56.0, 38.0, 45.0, 60.0, 50.0, 38.0, 51.0, 37.0, 34.0, 40.0, 26.0, 29.0, 16.0, 21.0, 18.0, 11.0, 10.0, 10.0, 9.0, 6.0, 5.0, 5.0, 3.0, 10.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.0028162002563477, -2.9053938388824463, -2.807971477508545, -2.7105491161346436, -2.613126754760742, -2.5157041549682617, -2.4182817935943604, -2.320859432220459, -2.2234370708465576, -2.1260147094726562, -2.028592348098755, -1.931169867515564, -1.8337475061416626, -1.7363251447677612, -1.6389026641845703, -1.541480302810669, -1.4440579414367676, -1.3466355800628662, -1.2492132186889648, -1.151790738105774, -1.0543683767318726, -0.9569460153579712, -0.859523594379425, -0.7621011734008789, -0.6646788120269775, -0.5672564506530762, -0.46983402967453003, -0.3724116384983063, -0.2749892473220825, -0.17756685614585876, -0.08014446496963501, 0.017277956008911133, 0.1147000789642334, 0.21212247014045715, 0.3095448613166809, 0.40696725249290466, 0.5043896436691284, 0.6018120050430298, 0.6992344260215759, 0.7966568470001221, 0.8940792083740234, 0.9915015697479248, 1.0889239311218262, 1.186346411705017, 1.2837687730789185, 1.3811911344528198, 1.4786136150360107, 1.576035976409912, 1.6734583377838135, 1.7708806991577148, 1.8683030605316162, 1.9657255411148071, 2.063148021697998, 2.1605703830718994, 2.257992744445801, 2.355415105819702, 2.4528374671936035, 2.550259828567505, 2.6476821899414062, 2.7451045513153076, 2.842526912689209, 2.9399495124816895, 3.037371873855591, 3.134794235229492, 3.2322165966033936]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 4.0, 6.0, 11.0, 7.0, 17.0, 43.0, 41.0, 86.0, 101.0, 233.0, 693.0, 6357.0, 4184468.0, 1452.0, 362.0, 146.0, 95.0, 42.0, 43.0, 19.0, 19.0, 11.0, 2.0, 6.0, 6.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.609375, -7.386962890625, -7.16455078125, -6.942138671875, -6.7197265625, -6.497314453125, -6.27490234375, -6.052490234375, -5.830078125, -5.607666015625, -5.38525390625, -5.162841796875, -4.9404296875, -4.718017578125, -4.49560546875, -4.273193359375, -4.05078125, -3.828369140625, -3.60595703125, -3.383544921875, -3.1611328125, -2.938720703125, -2.71630859375, -2.493896484375, -2.271484375, -2.049072265625, -1.82666015625, -1.604248046875, -1.3818359375, -1.159423828125, -0.93701171875, -0.714599609375, -0.4921875, -0.269775390625, -0.04736328125, 0.175048828125, 0.3974609375, 0.619873046875, 0.84228515625, 1.064697265625, 1.287109375, 1.509521484375, 1.73193359375, 1.954345703125, 2.1767578125, 2.399169921875, 2.62158203125, 2.843994140625, 3.06640625, 3.288818359375, 3.51123046875, 3.733642578125, 3.9560546875, 4.178466796875, 4.40087890625, 4.623291015625, 4.845703125, 5.068115234375, 5.29052734375, 5.512939453125, 5.7353515625, 5.957763671875, 6.18017578125, 6.402587890625, 6.625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 7.0, 14.0, 10.0, 30.0, 28.0, 37.0, 54.0, 62.0, 76.0, 84.0, 97.0, 90.0, 77.0, 57.0, 66.0, 45.0, 35.0, 44.0, 22.0, 10.0, 20.0, 19.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3046875, -0.29571533203125, -0.2867431640625, -0.27777099609375, -0.268798828125, -0.25982666015625, -0.2508544921875, -0.24188232421875, -0.23291015625, -0.22393798828125, -0.2149658203125, -0.20599365234375, -0.197021484375, -0.18804931640625, -0.1790771484375, -0.17010498046875, -0.1611328125, -0.15216064453125, -0.1431884765625, -0.13421630859375, -0.125244140625, -0.11627197265625, -0.1072998046875, -0.09832763671875, -0.08935546875, -0.08038330078125, -0.0714111328125, -0.06243896484375, -0.053466796875, -0.04449462890625, -0.0355224609375, -0.02655029296875, -0.017578125, -0.00860595703125, 0.0003662109375, 0.00933837890625, 0.018310546875, 0.02728271484375, 0.0362548828125, 0.04522705078125, 0.05419921875, 0.06317138671875, 0.0721435546875, 0.08111572265625, 0.090087890625, 0.09906005859375, 0.1080322265625, 0.11700439453125, 0.1259765625, 0.13494873046875, 0.1439208984375, 0.15289306640625, 0.161865234375, 0.17083740234375, 0.1798095703125, 0.18878173828125, 0.19775390625, 0.20672607421875, 0.2156982421875, 0.22467041015625, 0.233642578125, 0.24261474609375, 0.2515869140625, 0.26055908203125, 0.26953125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 2.0, 6.0, 7.0, 11.0, 8.0, 13.0, 22.0, 25.0, 29.0, 33.0, 51.0, 71.0, 131.0, 248.0, 434.0, 919.0, 2477.0, 19109.0, 4162955.0, 4982.0, 1341.0, 570.0, 289.0, 165.0, 117.0, 62.0, 43.0, 37.0, 26.0, 21.0, 14.0, 15.0, 8.0, 14.0, 5.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.134765625, -3.048248291015625, -2.96173095703125, -2.875213623046875, -2.7886962890625, -2.702178955078125, -2.61566162109375, -2.529144287109375, -2.442626953125, -2.356109619140625, -2.26959228515625, -2.183074951171875, -2.0965576171875, -2.010040283203125, -1.92352294921875, -1.837005615234375, -1.75048828125, -1.663970947265625, -1.57745361328125, -1.490936279296875, -1.4044189453125, -1.317901611328125, -1.23138427734375, -1.144866943359375, -1.058349609375, -0.971832275390625, -0.88531494140625, -0.798797607421875, -0.7122802734375, -0.625762939453125, -0.53924560546875, -0.452728271484375, -0.3662109375, -0.279693603515625, -0.19317626953125, -0.106658935546875, -0.0201416015625, 0.066375732421875, 0.15289306640625, 0.239410400390625, 0.325927734375, 0.412445068359375, 0.49896240234375, 0.585479736328125, 0.6719970703125, 0.758514404296875, 0.84503173828125, 0.931549072265625, 1.01806640625, 1.104583740234375, 1.19110107421875, 1.277618408203125, 1.3641357421875, 1.450653076171875, 1.53717041015625, 1.623687744140625, 1.710205078125, 1.796722412109375, 1.88323974609375, 1.969757080078125, 2.0562744140625, 2.142791748046875, 2.22930908203125, 2.315826416015625, 2.40234375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 9.0, 36.0, 3967.0, 38.0, 7.0, 6.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26611328125, -0.25247955322265625, -0.2388458251953125, -0.22521209716796875, -0.211578369140625, -0.19794464111328125, -0.1843109130859375, -0.17067718505859375, -0.15704345703125, -0.14340972900390625, -0.1297760009765625, -0.11614227294921875, -0.102508544921875, -0.08887481689453125, -0.0752410888671875, -0.06160736083984375, -0.0479736328125, -0.03433990478515625, -0.0207061767578125, -0.00707244873046875, 0.006561279296875, 0.02019500732421875, 0.0338287353515625, 0.04746246337890625, 0.06109619140625, 0.07472991943359375, 0.0883636474609375, 0.10199737548828125, 0.115631103515625, 0.12926483154296875, 0.1428985595703125, 0.15653228759765625, 0.170166015625, 0.18379974365234375, 0.1974334716796875, 0.21106719970703125, 0.224700927734375, 0.23833465576171875, 0.2519683837890625, 0.26560211181640625, 0.27923583984375, 0.29286956787109375, 0.3065032958984375, 0.32013702392578125, 0.333770751953125, 0.34740447998046875, 0.3610382080078125, 0.37467193603515625, 0.3883056640625, 0.40193939208984375, 0.4155731201171875, 0.42920684814453125, 0.442840576171875, 0.45647430419921875, 0.4701080322265625, 0.48374176025390625, 0.49737548828125, 0.5110092163085938, 0.5246429443359375, 0.5382766723632812, 0.551910400390625, 0.5655441284179688, 0.5791778564453125, 0.5928115844726562, 0.6064453125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 7.0, 16.0, 35.0, 49.0, 79.0, 213.0, 326.0, 151.0, 63.0, 27.0, 15.0, 10.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9659733772277832, -1.9196730852127075, -1.8733729124069214, -1.8270726203918457, -1.7807724475860596, -1.7344721555709839, -1.6881719827651978, -1.641871690750122, -1.595571517944336, -1.5492712259292603, -1.5029710531234741, -1.4566707611083984, -1.4103705883026123, -1.3640702962875366, -1.3177701234817505, -1.2714698314666748, -1.2251696586608887, -1.178869366645813, -1.1325691938400269, -1.0862689018249512, -1.039968729019165, -0.9936684966087341, -0.9473682641983032, -0.9010679721832275, -0.8547676801681519, -0.808467447757721, -0.76216721534729, -0.7158669829368591, -0.6695667505264282, -0.6232665181159973, -0.5769662857055664, -0.5306659936904907, -0.4843657612800598, -0.4380655288696289, -0.391765296459198, -0.3454650640487671, -0.2991648316383362, -0.2528645992279053, -0.20656433701515198, -0.16026410460472107, -0.11396387219429016, -0.06766363978385925, -0.021363399922847748, 0.024936839938163757, 0.07123707234859467, 0.11753730475902557, 0.16383755207061768, 0.21013778448104858, 0.2564380168914795, 0.3027382493019104, 0.3490384817123413, 0.3953387141227722, 0.4416389465332031, 0.48793917894363403, 0.5342394113540649, 0.5805397033691406, 0.6268398761749268, 0.6731401085853577, 0.7194403409957886, 0.7657405734062195, 0.8120408058166504, 0.8583410382270813, 0.9046412706375122, 0.9509415626525879, 0.9972417950630188]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 4.0, 7.0, 11.0, 11.0, 11.0, 13.0, 13.0, 17.0, 19.0, 16.0, 20.0, 23.0, 34.0, 38.0, 37.0, 39.0, 44.0, 55.0, 30.0, 39.0, 50.0, 43.0, 55.0, 40.0, 33.0, 36.0, 31.0, 35.0, 34.0, 28.0, 17.0, 25.0, 22.0, 11.0, 8.0, 7.0, 12.0, 7.0, 8.0, 7.0, 7.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.4631257653236389, -0.450195848941803, -0.43726593255996704, -0.4243360161781311, -0.41140609979629517, -0.39847618341445923, -0.3855462968349457, -0.37261638045310974, -0.3596864640712738, -0.34675654768943787, -0.33382663130760193, -0.320896714925766, -0.30796682834625244, -0.2950369119644165, -0.28210699558258057, -0.26917707920074463, -0.2562471628189087, -0.24331724643707275, -0.23038733005523682, -0.21745742857456207, -0.20452751219272614, -0.1915975958108902, -0.17866769433021545, -0.16573777794837952, -0.15280786156654358, -0.13987794518470764, -0.1269480288028717, -0.11401812732219696, -0.10108821094036102, -0.08815829455852509, -0.07522838562726974, -0.062298476696014404, -0.04936856031417847, -0.03643864765763283, -0.02350873500108719, -0.01057882234454155, 0.0023510903120040894, 0.015281006693840027, 0.028210915625095367, 0.04114082455635071, 0.054070740938186646, 0.06700065732002258, 0.07993056625127792, 0.09286047518253326, 0.1057903915643692, 0.11872030794620514, 0.13165020942687988, 0.14458012580871582, 0.15751004219055176, 0.1704399585723877, 0.18336987495422363, 0.19629977643489838, 0.20922969281673431, 0.22215960919857025, 0.235089510679245, 0.24801942706108093, 0.26094934344291687, 0.2738792598247528, 0.28680917620658875, 0.2997390925884247, 0.31266897916793823, 0.32559889554977417, 0.3385288119316101, 0.35145872831344604, 0.364388644695282]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 6.0, 9.0, 11.0, 12.0, 16.0, 27.0, 41.0, 55.0, 62.0, 85.0, 113.0, 157.0, 226.0, 337.0, 612.0, 1019.0, 1816.0, 3728.0, 7962.0, 20061.0, 59765.0, 227062.0, 485840.0, 164617.0, 45458.0, 15677.0, 6542.0, 3070.0, 1631.0, 890.0, 523.0, 333.0, 201.0, 155.0, 97.0, 80.0, 68.0, 43.0, 38.0, 27.0, 19.0, 19.0, 12.0, 8.0, 4.0, 6.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.479736328125, -0.4639472961425781, -0.44815826416015625, -0.4323692321777344, -0.4165802001953125, -0.4007911682128906, -0.38500213623046875, -0.3692131042480469, -0.353424072265625, -0.3376350402832031, -0.32184600830078125, -0.3060569763183594, -0.2902679443359375, -0.2744789123535156, -0.25868988037109375, -0.24290084838867188, -0.22711181640625, -0.21132278442382812, -0.19553375244140625, -0.17974472045898438, -0.1639556884765625, -0.14816665649414062, -0.13237762451171875, -0.11658859252929688, -0.100799560546875, -0.08501052856445312, -0.06922149658203125, -0.053432464599609375, -0.0376434326171875, -0.021854400634765625, -0.00606536865234375, 0.009723663330078125, 0.0255126953125, 0.041301727294921875, 0.05709075927734375, 0.07287979125976562, 0.0886688232421875, 0.10445785522460938, 0.12024688720703125, 0.13603591918945312, 0.151824951171875, 0.16761398315429688, 0.18340301513671875, 0.19919204711914062, 0.2149810791015625, 0.23077011108398438, 0.24655914306640625, 0.2623481750488281, 0.27813720703125, 0.2939262390136719, 0.30971527099609375, 0.3255043029785156, 0.3412933349609375, 0.3570823669433594, 0.37287139892578125, 0.3886604309082031, 0.404449462890625, 0.4202384948730469, 0.43602752685546875, 0.4518165588378906, 0.4676055908203125, 0.4833946228027344, 0.49918365478515625, 0.5149726867675781, 0.53076171875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 7.0, 13.0, 25.0, 29.0, 40.0, 48.0, 50.0, 62.0, 71.0, 75.0, 83.0, 63.0, 78.0, 71.0, 49.0, 43.0, 50.0, 38.0, 26.0, 22.0, 17.0, 8.0, 8.0, 8.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302490234375, -0.2935600280761719, -0.28462982177734375, -0.2756996154785156, -0.2667694091796875, -0.2578392028808594, -0.24890899658203125, -0.23997879028320312, -0.231048583984375, -0.22211837768554688, -0.21318817138671875, -0.20425796508789062, -0.1953277587890625, -0.18639755249023438, -0.17746734619140625, -0.16853713989257812, -0.15960693359375, -0.15067672729492188, -0.14174652099609375, -0.13281631469726562, -0.1238861083984375, -0.11495590209960938, -0.10602569580078125, -0.09709548950195312, -0.088165283203125, -0.07923507690429688, -0.07030487060546875, -0.061374664306640625, -0.0524444580078125, -0.043514251708984375, -0.03458404541015625, -0.025653839111328125, -0.0167236328125, -0.007793426513671875, 0.00113677978515625, 0.010066986083984375, 0.0189971923828125, 0.027927398681640625, 0.03685760498046875, 0.045787811279296875, 0.054718017578125, 0.06364822387695312, 0.07257843017578125, 0.08150863647460938, 0.0904388427734375, 0.09936904907226562, 0.10829925537109375, 0.11722946166992188, 0.12615966796875, 0.13508987426757812, 0.14402008056640625, 0.15295028686523438, 0.1618804931640625, 0.17081069946289062, 0.17974090576171875, 0.18867111206054688, 0.197601318359375, 0.20653152465820312, 0.21546173095703125, 0.22439193725585938, 0.2333221435546875, 0.24225234985351562, 0.25118255615234375, 0.2601127624511719, 0.26904296875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 6.0, 7.0, 6.0, 7.0, 8.0, 21.0, 26.0, 33.0, 45.0, 88.0, 176.0, 322.0, 598.0, 1172.0, 2931.0, 7485.0, 24501.0, 118728.0, 657310.0, 185615.0, 33379.0, 9634.0, 3467.0, 1456.0, 663.0, 346.0, 167.0, 129.0, 65.0, 44.0, 32.0, 27.0, 17.0, 8.0, 10.0, 9.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5693359375, -0.55010986328125, -0.5308837890625, -0.51165771484375, -0.492431640625, -0.47320556640625, -0.4539794921875, -0.43475341796875, -0.41552734375, -0.39630126953125, -0.3770751953125, -0.35784912109375, -0.338623046875, -0.31939697265625, -0.3001708984375, -0.28094482421875, -0.26171875, -0.24249267578125, -0.2232666015625, -0.20404052734375, -0.184814453125, -0.16558837890625, -0.1463623046875, -0.12713623046875, -0.10791015625, -0.08868408203125, -0.0694580078125, -0.05023193359375, -0.031005859375, -0.01177978515625, 0.0074462890625, 0.02667236328125, 0.0458984375, 0.06512451171875, 0.0843505859375, 0.10357666015625, 0.122802734375, 0.14202880859375, 0.1612548828125, 0.18048095703125, 0.19970703125, 0.21893310546875, 0.2381591796875, 0.25738525390625, 0.276611328125, 0.29583740234375, 0.3150634765625, 0.33428955078125, 0.353515625, 0.37274169921875, 0.3919677734375, 0.41119384765625, 0.430419921875, 0.44964599609375, 0.4688720703125, 0.48809814453125, 0.50732421875, 0.52655029296875, 0.5457763671875, 0.56500244140625, 0.584228515625, 0.60345458984375, 0.6226806640625, 0.64190673828125, 0.6611328125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 10.0, 6.0, 3.0, 9.0, 8.0, 15.0, 9.0, 23.0, 20.0, 16.0, 14.0, 26.0, 20.0, 20.0, 31.0, 36.0, 33.0, 27.0, 46.0, 41.0, 46.0, 42.0, 41.0, 37.0, 38.0, 34.0, 23.0, 24.0, 24.0, 26.0, 36.0, 25.0, 27.0, 20.0, 23.0, 21.0, 18.0, 10.0, 14.0, 14.0, 9.0, 7.0, 4.0, 4.0, 9.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0], "bins": [-0.65478515625, -0.6360092163085938, -0.6172332763671875, -0.5984573364257812, -0.579681396484375, -0.5609054565429688, -0.5421295166015625, -0.5233535766601562, -0.50457763671875, -0.48580169677734375, -0.4670257568359375, -0.44824981689453125, -0.429473876953125, -0.41069793701171875, -0.3919219970703125, -0.37314605712890625, -0.3543701171875, -0.33559417724609375, -0.3168182373046875, -0.29804229736328125, -0.279266357421875, -0.26049041748046875, -0.2417144775390625, -0.22293853759765625, -0.20416259765625, -0.18538665771484375, -0.1666107177734375, -0.14783477783203125, -0.129058837890625, -0.11028289794921875, -0.0915069580078125, -0.07273101806640625, -0.053955078125, -0.03517913818359375, -0.0164031982421875, 0.00237274169921875, 0.021148681640625, 0.03992462158203125, 0.0587005615234375, 0.07747650146484375, 0.09625244140625, 0.11502838134765625, 0.1338043212890625, 0.15258026123046875, 0.171356201171875, 0.19013214111328125, 0.2089080810546875, 0.22768402099609375, 0.2464599609375, 0.26523590087890625, 0.2840118408203125, 0.30278778076171875, 0.321563720703125, 0.34033966064453125, 0.3591156005859375, 0.37789154052734375, 0.39666748046875, 0.41544342041015625, 0.4342193603515625, 0.45299530029296875, 0.471771240234375, 0.49054718017578125, 0.5093231201171875, 0.5280990600585938, 0.546875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 5.0, 6.0, 9.0, 13.0, 25.0, 25.0, 67.0, 76.0, 95.0, 189.0, 329.0, 687.0, 1661.0, 4793.0, 20600.0, 164650.0, 734100.0, 99894.0, 14825.0, 3780.0, 1369.0, 565.0, 302.0, 183.0, 104.0, 65.0, 43.0, 28.0, 19.0, 18.0, 5.0, 9.0, 4.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25830078125, -0.25032806396484375, -0.2423553466796875, -0.23438262939453125, -0.226409912109375, -0.21843719482421875, -0.2104644775390625, -0.20249176025390625, -0.19451904296875, -0.18654632568359375, -0.1785736083984375, -0.17060089111328125, -0.162628173828125, -0.15465545654296875, -0.1466827392578125, -0.13871002197265625, -0.1307373046875, -0.12276458740234375, -0.1147918701171875, -0.10681915283203125, -0.098846435546875, -0.09087371826171875, -0.0829010009765625, -0.07492828369140625, -0.06695556640625, -0.05898284912109375, -0.0510101318359375, -0.04303741455078125, -0.035064697265625, -0.02709197998046875, -0.0191192626953125, -0.01114654541015625, -0.003173828125, 0.00479888916015625, 0.0127716064453125, 0.02074432373046875, 0.028717041015625, 0.03668975830078125, 0.0446624755859375, 0.05263519287109375, 0.06060791015625, 0.06858062744140625, 0.0765533447265625, 0.08452606201171875, 0.092498779296875, 0.10047149658203125, 0.1084442138671875, 0.11641693115234375, 0.1243896484375, 0.13236236572265625, 0.1403350830078125, 0.14830780029296875, 0.156280517578125, 0.16425323486328125, 0.1722259521484375, 0.18019866943359375, 0.18817138671875, 0.19614410400390625, 0.2041168212890625, 0.21208953857421875, 0.220062255859375, 0.22803497314453125, 0.2360076904296875, 0.24398040771484375, 0.251953125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 3.0, 2.0, 2.0, 5.0, 3.0, 7.0, 7.0, 22.0, 8.0, 16.0, 25.0, 19.0, 45.0, 48.0, 57.0, 88.0, 96.0, 122.0, 96.0, 86.0, 72.0, 34.0, 34.0, 22.0, 15.0, 22.0, 12.0, 7.0, 8.0, 7.0, 3.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.70280647277832e-05, -4.565343260765076e-05, -4.427880048751831e-05, -4.2904168367385864e-05, -4.152953624725342e-05, -4.015490412712097e-05, -3.8780272006988525e-05, -3.740563988685608e-05, -3.603100776672363e-05, -3.4656375646591187e-05, -3.328174352645874e-05, -3.1907111406326294e-05, -3.053247928619385e-05, -2.91578471660614e-05, -2.7783215045928955e-05, -2.640858292579651e-05, -2.5033950805664062e-05, -2.3659318685531616e-05, -2.228468656539917e-05, -2.0910054445266724e-05, -1.9535422325134277e-05, -1.816079020500183e-05, -1.6786158084869385e-05, -1.541152596473694e-05, -1.4036893844604492e-05, -1.2662261724472046e-05, -1.12876296043396e-05, -9.912997484207153e-06, -8.538365364074707e-06, -7.163733243942261e-06, -5.7891011238098145e-06, -4.414469003677368e-06, -3.039836883544922e-06, -1.6652047634124756e-06, -2.905726432800293e-07, 1.084059476852417e-06, 2.4586915969848633e-06, 3.8333237171173096e-06, 5.207955837249756e-06, 6.582587957382202e-06, 7.957220077514648e-06, 9.331852197647095e-06, 1.0706484317779541e-05, 1.2081116437911987e-05, 1.3455748558044434e-05, 1.483038067817688e-05, 1.6205012798309326e-05, 1.7579644918441772e-05, 1.895427703857422e-05, 2.0328909158706665e-05, 2.170354127883911e-05, 2.3078173398971558e-05, 2.4452805519104004e-05, 2.582743763923645e-05, 2.7202069759368896e-05, 2.8576701879501343e-05, 2.995133399963379e-05, 3.1325966119766235e-05, 3.270059823989868e-05, 3.407523036003113e-05, 3.5449862480163574e-05, 3.682449460029602e-05, 3.819912672042847e-05, 3.957375884056091e-05, 4.094839096069336e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 5.0, 12.0, 15.0, 27.0, 39.0, 54.0, 92.0, 201.0, 372.0, 875.0, 2672.0, 12509.0, 126276.0, 809475.0, 82736.0, 9483.0, 2155.0, 747.0, 347.0, 202.0, 91.0, 54.0, 35.0, 29.0, 17.0, 9.0, 8.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.268798828125, -0.2577934265136719, -0.24678802490234375, -0.23578262329101562, -0.2247772216796875, -0.21377182006835938, -0.20276641845703125, -0.19176101684570312, -0.180755615234375, -0.16975021362304688, -0.15874481201171875, -0.14773941040039062, -0.1367340087890625, -0.12572860717773438, -0.11472320556640625, -0.10371780395507812, -0.09271240234375, -0.08170700073242188, -0.07070159912109375, -0.059696197509765625, -0.0486907958984375, -0.037685394287109375, -0.02667999267578125, -0.015674591064453125, -0.004669189453125, 0.006336212158203125, 0.01734161376953125, 0.028347015380859375, 0.0393524169921875, 0.050357818603515625, 0.06136322021484375, 0.07236862182617188, 0.0833740234375, 0.09437942504882812, 0.10538482666015625, 0.11639022827148438, 0.1273956298828125, 0.13840103149414062, 0.14940643310546875, 0.16041183471679688, 0.171417236328125, 0.18242263793945312, 0.19342803955078125, 0.20443344116210938, 0.2154388427734375, 0.22644424438476562, 0.23744964599609375, 0.24845504760742188, 0.25946044921875, 0.2704658508300781, 0.28147125244140625, 0.2924766540527344, 0.3034820556640625, 0.3144874572753906, 0.32549285888671875, 0.3364982604980469, 0.347503662109375, 0.3585090637207031, 0.36951446533203125, 0.3805198669433594, 0.3915252685546875, 0.4025306701660156, 0.41353607177734375, 0.4245414733886719, 0.435546875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 13.0, 10.0, 18.0, 30.0, 56.0, 84.0, 104.0, 130.0, 128.0, 124.0, 99.0, 62.0, 48.0, 38.0, 24.0, 13.0, 8.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2265625, -0.2168731689453125, -0.207183837890625, -0.1974945068359375, -0.18780517578125, -0.1781158447265625, -0.168426513671875, -0.1587371826171875, -0.1490478515625, -0.1393585205078125, -0.129669189453125, -0.1199798583984375, -0.11029052734375, -0.1006011962890625, -0.090911865234375, -0.0812225341796875, -0.071533203125, -0.0618438720703125, -0.052154541015625, -0.0424652099609375, -0.03277587890625, -0.0230865478515625, -0.013397216796875, -0.0037078857421875, 0.0059814453125, 0.0156707763671875, 0.025360107421875, 0.0350494384765625, 0.04473876953125, 0.0544281005859375, 0.064117431640625, 0.0738067626953125, 0.08349609375, 0.0931854248046875, 0.102874755859375, 0.1125640869140625, 0.12225341796875, 0.1319427490234375, 0.141632080078125, 0.1513214111328125, 0.1610107421875, 0.1707000732421875, 0.180389404296875, 0.1900787353515625, 0.19976806640625, 0.2094573974609375, 0.219146728515625, 0.2288360595703125, 0.238525390625, 0.2482147216796875, 0.257904052734375, 0.2675933837890625, 0.27728271484375, 0.2869720458984375, 0.296661376953125, 0.3063507080078125, 0.3160400390625, 0.3257293701171875, 0.335418701171875, 0.3451080322265625, 0.35479736328125, 0.3644866943359375, 0.374176025390625, 0.3838653564453125, 0.3935546875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 11.0, 43.0, 181.0, 408.0, 269.0, 72.0, 18.0, 3.0, 3.0, 1.0, 1.0], "bins": [-22.551422119140625, -22.15372657775879, -21.756031036376953, -21.358335494995117, -20.96063995361328, -20.562944412231445, -20.16524887084961, -19.76755142211914, -19.369855880737305, -18.97216033935547, -18.574464797973633, -18.176769256591797, -17.77907371520996, -17.381378173828125, -16.983680725097656, -16.585987091064453, -16.188291549682617, -15.790596008300781, -15.392900466918945, -14.99520492553711, -14.597508430480957, -14.199812889099121, -13.802117347717285, -13.40442180633545, -13.006725311279297, -12.609029769897461, -12.211334228515625, -11.813638687133789, -11.415942192077637, -11.0182466506958, -10.620551109313965, -10.222855567932129, -9.825160026550293, -9.427464485168457, -9.029768943786621, -8.632072448730469, -8.234376907348633, -7.836681365966797, -7.438985824584961, -7.041290283203125, -6.643594741821289, -6.245899200439453, -5.848203182220459, -5.450507640838623, -5.052812099456787, -4.655116081237793, -4.257420539855957, -3.859724998474121, -3.462028980255127, -3.064333200454712, -2.666637659072876, -2.268941879272461, -1.8712462186813354, -1.47355055809021, -1.075854778289795, -0.678159236907959, -0.28046345710754395, 0.11723223328590393, 0.5149279236793518, 0.9126236438751221, 1.3103193044662476, 1.708014965057373, 2.105710744857788, 2.503406286239624, 2.901102066040039]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 6.0, 11.0, 6.0, 12.0, 8.0, 12.0, 15.0, 15.0, 39.0, 24.0, 21.0, 31.0, 36.0, 36.0, 51.0, 60.0, 52.0, 48.0, 74.0, 55.0, 53.0, 32.0, 41.0, 35.0, 43.0, 34.0, 27.0, 23.0, 16.0, 19.0, 20.0, 15.0, 12.0, 4.0, 6.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.799252510070801, -3.672935724258423, -3.546618938446045, -3.420302152633667, -3.293985366821289, -3.167668581008911, -3.041351795196533, -2.9150350093841553, -2.7887182235717773, -2.6624014377593994, -2.5360846519470215, -2.4097678661346436, -2.2834510803222656, -2.1571342945098877, -2.0308175086975098, -1.9045007228851318, -1.778183937072754, -1.651867151260376, -1.525550365447998, -1.3992335796356201, -1.2729167938232422, -1.1466000080108643, -1.0202832221984863, -0.8939664363861084, -0.7676496505737305, -0.6413328647613525, -0.5150160789489746, -0.3886992931365967, -0.26238250732421875, -0.13606572151184082, -0.00974893569946289, 0.11656785011291504, 0.24288511276245117, 0.3692018985748291, 0.49551868438720703, 0.621835470199585, 0.7481522560119629, 0.8744690418243408, 1.0007858276367188, 1.1271026134490967, 1.2534193992614746, 1.3797361850738525, 1.5060529708862305, 1.6323697566986084, 1.7586865425109863, 1.8850033283233643, 2.011320114135742, 2.13763689994812, 2.263953685760498, 2.390270471572876, 2.516587257385254, 2.642904043197632, 2.7692208290100098, 2.8955376148223877, 3.0218544006347656, 3.1481711864471436, 3.2744879722595215, 3.4008047580718994, 3.5271215438842773, 3.6534383296966553, 3.779755115509033, 3.906071901321411, 4.032388687133789, 4.158705711364746, 4.285022258758545]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 4.0, 6.0, 7.0, 10.0, 11.0, 19.0, 29.0, 39.0, 62.0, 107.0, 179.0, 312.0, 643.0, 1690.0, 4166612.0, 21849.0, 1360.0, 548.0, 301.0, 194.0, 95.0, 68.0, 39.0, 30.0, 17.0, 10.0, 11.0, 5.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.25, -4.124664306640625, -3.99932861328125, -3.873992919921875, -3.7486572265625, -3.623321533203125, -3.49798583984375, -3.372650146484375, -3.247314453125, -3.121978759765625, -2.99664306640625, -2.871307373046875, -2.7459716796875, -2.620635986328125, -2.49530029296875, -2.369964599609375, -2.24462890625, -2.119293212890625, -1.99395751953125, -1.868621826171875, -1.7432861328125, -1.617950439453125, -1.49261474609375, -1.367279052734375, -1.241943359375, -1.116607666015625, -0.99127197265625, -0.865936279296875, -0.7406005859375, -0.615264892578125, -0.48992919921875, -0.364593505859375, -0.2392578125, -0.113922119140625, 0.01141357421875, 0.136749267578125, 0.2620849609375, 0.387420654296875, 0.51275634765625, 0.638092041015625, 0.763427734375, 0.888763427734375, 1.01409912109375, 1.139434814453125, 1.2647705078125, 1.390106201171875, 1.51544189453125, 1.640777587890625, 1.76611328125, 1.891448974609375, 2.01678466796875, 2.142120361328125, 2.2674560546875, 2.392791748046875, 2.51812744140625, 2.643463134765625, 2.768798828125, 2.894134521484375, 3.01947021484375, 3.144805908203125, 3.2701416015625, 3.395477294921875, 3.52081298828125, 3.646148681640625, 3.771484375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 7.0, 11.0, 14.0, 22.0, 18.0, 26.0, 30.0, 55.0, 52.0, 81.0, 61.0, 78.0, 72.0, 85.0, 78.0, 60.0, 59.0, 41.0, 39.0, 24.0, 25.0, 19.0, 15.0, 9.0, 6.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.310546875, -0.30152130126953125, -0.2924957275390625, -0.28347015380859375, -0.274444580078125, -0.26541900634765625, -0.2563934326171875, -0.24736785888671875, -0.23834228515625, -0.22931671142578125, -0.2202911376953125, -0.21126556396484375, -0.202239990234375, -0.19321441650390625, -0.1841888427734375, -0.17516326904296875, -0.1661376953125, -0.15711212158203125, -0.1480865478515625, -0.13906097412109375, -0.130035400390625, -0.12100982666015625, -0.1119842529296875, -0.10295867919921875, -0.09393310546875, -0.08490753173828125, -0.0758819580078125, -0.06685638427734375, -0.057830810546875, -0.04880523681640625, -0.0397796630859375, -0.03075408935546875, -0.021728515625, -0.01270294189453125, -0.0036773681640625, 0.00534820556640625, 0.014373779296875, 0.02339935302734375, 0.0324249267578125, 0.04145050048828125, 0.05047607421875, 0.05950164794921875, 0.0685272216796875, 0.07755279541015625, 0.086578369140625, 0.09560394287109375, 0.1046295166015625, 0.11365509033203125, 0.1226806640625, 0.13170623779296875, 0.1407318115234375, 0.14975738525390625, 0.158782958984375, 0.16780853271484375, 0.1768341064453125, 0.18585968017578125, 0.19488525390625, 0.20391082763671875, 0.2129364013671875, 0.22196197509765625, 0.230987548828125, 0.24001312255859375, 0.2490386962890625, 0.25806427001953125, 0.26708984375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 5.0, 12.0, 13.0, 20.0, 12.0, 21.0, 22.0, 56.0, 69.0, 100.0, 144.0, 184.0, 320.0, 579.0, 944.0, 1824.0, 5297.0, 60337.0, 4110736.0, 8345.0, 2402.0, 1042.0, 685.0, 393.0, 218.0, 136.0, 105.0, 90.0, 43.0, 31.0, 21.0, 15.0, 19.0, 15.0, 12.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.52734375, -1.48126220703125, -1.4351806640625, -1.38909912109375, -1.343017578125, -1.29693603515625, -1.2508544921875, -1.20477294921875, -1.15869140625, -1.11260986328125, -1.0665283203125, -1.02044677734375, -0.974365234375, -0.92828369140625, -0.8822021484375, -0.83612060546875, -0.7900390625, -0.74395751953125, -0.6978759765625, -0.65179443359375, -0.605712890625, -0.55963134765625, -0.5135498046875, -0.46746826171875, -0.42138671875, -0.37530517578125, -0.3292236328125, -0.28314208984375, -0.237060546875, -0.19097900390625, -0.1448974609375, -0.09881591796875, -0.052734375, -0.00665283203125, 0.0394287109375, 0.08551025390625, 0.131591796875, 0.17767333984375, 0.2237548828125, 0.26983642578125, 0.31591796875, 0.36199951171875, 0.4080810546875, 0.45416259765625, 0.500244140625, 0.54632568359375, 0.5924072265625, 0.63848876953125, 0.6845703125, 0.73065185546875, 0.7767333984375, 0.82281494140625, 0.868896484375, 0.91497802734375, 0.9610595703125, 1.00714111328125, 1.05322265625, 1.09930419921875, 1.1453857421875, 1.19146728515625, 1.237548828125, 1.28363037109375, 1.3297119140625, 1.37579345703125, 1.421875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 13.0, 12.0, 46.0, 3814.0, 127.0, 26.0, 10.0, 9.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3037109375, -0.29384613037109375, -0.2839813232421875, -0.27411651611328125, -0.264251708984375, -0.25438690185546875, -0.2445220947265625, -0.23465728759765625, -0.22479248046875, -0.21492767333984375, -0.2050628662109375, -0.19519805908203125, -0.185333251953125, -0.17546844482421875, -0.1656036376953125, -0.15573883056640625, -0.1458740234375, -0.13600921630859375, -0.1261444091796875, -0.11627960205078125, -0.106414794921875, -0.09654998779296875, -0.0866851806640625, -0.07682037353515625, -0.06695556640625, -0.05709075927734375, -0.0472259521484375, -0.03736114501953125, -0.027496337890625, -0.01763153076171875, -0.0077667236328125, 0.00209808349609375, 0.011962890625, 0.02182769775390625, 0.0316925048828125, 0.04155731201171875, 0.051422119140625, 0.06128692626953125, 0.0711517333984375, 0.08101654052734375, 0.09088134765625, 0.10074615478515625, 0.1106109619140625, 0.12047576904296875, 0.130340576171875, 0.14020538330078125, 0.1500701904296875, 0.15993499755859375, 0.1697998046875, 0.17966461181640625, 0.1895294189453125, 0.19939422607421875, 0.209259033203125, 0.21912384033203125, 0.2289886474609375, 0.23885345458984375, 0.24871826171875, 0.25858306884765625, 0.2684478759765625, 0.27831268310546875, 0.288177490234375, 0.29804229736328125, 0.3079071044921875, 0.31777191162109375, 0.32763671875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 6.0, 7.0, 8.0, 18.0, 23.0, 50.0, 63.0, 119.0, 180.0, 159.0, 131.0, 74.0, 59.0, 36.0, 28.0, 13.0, 8.0, 7.0, 10.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4852113723754883, -0.45683056116104126, -0.42844974994659424, -0.4000689387321472, -0.3716881275177002, -0.3433073163032532, -0.31492650508880615, -0.28654569387435913, -0.2581648826599121, -0.2297840714454651, -0.20140326023101807, -0.17302244901657104, -0.14464163780212402, -0.116260826587677, -0.08788001537322998, -0.05949920415878296, -0.031118392944335938, -0.002737581729888916, 0.025643229484558105, 0.05402404069900513, 0.08240485191345215, 0.11078566312789917, 0.1391664743423462, 0.1675472855567932, 0.19592809677124023, 0.22430890798568726, 0.2526897192001343, 0.2810705304145813, 0.3094513416290283, 0.33783215284347534, 0.36621296405792236, 0.3945937752723694, 0.4229745864868164, 0.4513553977012634, 0.47973620891571045, 0.5081170201301575, 0.5364978313446045, 0.5648786425590515, 0.5932594537734985, 0.6216402649879456, 0.6500210762023926, 0.6784018874168396, 0.7067826986312866, 0.7351635098457336, 0.7635443210601807, 0.7919251322746277, 0.8203059434890747, 0.8486867547035217, 0.8770675659179688, 0.9054483771324158, 0.9338291883468628, 0.9622099995613098, 0.9905908107757568, 1.0189716815948486, 1.0473524332046509, 1.0757331848144531, 1.104114055633545, 1.1324949264526367, 1.160875678062439, 1.1892564296722412, 1.217637300491333, 1.2460181713104248, 1.274398922920227, 1.3027796745300293, 1.331160545349121]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 8.0, 4.0, 8.0, 7.0, 6.0, 15.0, 12.0, 7.0, 19.0, 15.0, 21.0, 22.0, 30.0, 26.0, 28.0, 39.0, 37.0, 34.0, 42.0, 35.0, 40.0, 42.0, 40.0, 33.0, 30.0, 30.0, 34.0, 38.0, 25.0, 30.0, 30.0, 27.0, 24.0, 20.0, 22.0, 16.0, 15.0, 19.0, 11.0, 10.0, 7.0, 13.0, 5.0, 3.0, 3.0, 7.0, 1.0, 4.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.34016501903533936, -0.33031991124153137, -0.320474773645401, -0.310629665851593, -0.30078455805778503, -0.29093945026397705, -0.2810943126678467, -0.2712492048740387, -0.2614040970802307, -0.25155898928642273, -0.24171386659145355, -0.23186874389648438, -0.2220236361026764, -0.21217851340770721, -0.20233339071273804, -0.19248828291893005, -0.18264314532279968, -0.1727980226278305, -0.16295291483402252, -0.15310779213905334, -0.14326268434524536, -0.13341756165027618, -0.123572438955307, -0.11372732371091843, -0.10388220846652985, -0.09403709322214127, -0.08419197797775269, -0.07434685528278351, -0.06450174003839493, -0.05465662479400635, -0.04481150582432747, -0.03496638685464859, -0.02512127161026001, -0.01527615450322628, -0.005431037396192551, 0.004414079710841179, 0.014259196817874908, 0.02410431206226349, 0.03394943103194237, 0.043794550001621246, 0.05363966524600983, 0.06348478049039841, 0.07332989573478699, 0.08317501842975616, 0.09302013367414474, 0.10286524891853333, 0.1127103716135025, 0.12255548685789108, 0.13240060210227966, 0.14224572479724884, 0.15209083259105682, 0.161935955286026, 0.17178106307983398, 0.18162618577480316, 0.19147130846977234, 0.20131641626358032, 0.2111615389585495, 0.22100666165351868, 0.23085176944732666, 0.24069689214229584, 0.250542014837265, 0.260387122631073, 0.270232230424881, 0.28007736802101135, 0.28992247581481934]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 5.0, 14.0, 21.0, 24.0, 61.0, 68.0, 115.0, 155.0, 248.0, 427.0, 816.0, 1759.0, 4511.0, 14534.0, 61365.0, 421278.0, 452784.0, 66588.0, 15277.0, 4665.0, 1802.0, 855.0, 421.0, 283.0, 144.0, 115.0, 69.0, 41.0, 35.0, 22.0, 10.0, 13.0, 4.0, 1.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.78076171875, -0.7578125, -0.73486328125, -0.7119140625, -0.68896484375, -0.666015625, -0.64306640625, -0.6201171875, -0.59716796875, -0.57421875, -0.55126953125, -0.5283203125, -0.50537109375, -0.482421875, -0.45947265625, -0.4365234375, -0.41357421875, -0.390625, -0.36767578125, -0.3447265625, -0.32177734375, -0.298828125, -0.27587890625, -0.2529296875, -0.22998046875, -0.20703125, -0.18408203125, -0.1611328125, -0.13818359375, -0.115234375, -0.09228515625, -0.0693359375, -0.04638671875, -0.0234375, -0.00048828125, 0.0224609375, 0.04541015625, 0.068359375, 0.09130859375, 0.1142578125, 0.13720703125, 0.16015625, 0.18310546875, 0.2060546875, 0.22900390625, 0.251953125, 0.27490234375, 0.2978515625, 0.32080078125, 0.34375, 0.36669921875, 0.3896484375, 0.41259765625, 0.435546875, 0.45849609375, 0.4814453125, 0.50439453125, 0.52734375, 0.55029296875, 0.5732421875, 0.59619140625, 0.619140625, 0.64208984375, 0.6650390625, 0.68798828125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 10.0, 10.0, 12.0, 22.0, 24.0, 20.0, 42.0, 42.0, 50.0, 70.0, 63.0, 66.0, 82.0, 67.0, 79.0, 74.0, 65.0, 41.0, 40.0, 16.0, 21.0, 26.0, 20.0, 12.0, 12.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.307861328125, -0.2989768981933594, -0.29009246826171875, -0.2812080383300781, -0.2723236083984375, -0.2634391784667969, -0.25455474853515625, -0.24567031860351562, -0.236785888671875, -0.22790145874023438, -0.21901702880859375, -0.21013259887695312, -0.2012481689453125, -0.19236373901367188, -0.18347930908203125, -0.17459487915039062, -0.16571044921875, -0.15682601928710938, -0.14794158935546875, -0.13905715942382812, -0.1301727294921875, -0.12128829956054688, -0.11240386962890625, -0.10351943969726562, -0.094635009765625, -0.08575057983398438, -0.07686614990234375, -0.06798171997070312, -0.0590972900390625, -0.050212860107421875, -0.04132843017578125, -0.032444000244140625, -0.0235595703125, -0.014675140380859375, -0.00579071044921875, 0.003093719482421875, 0.0119781494140625, 0.020862579345703125, 0.02974700927734375, 0.038631439208984375, 0.047515869140625, 0.056400299072265625, 0.06528472900390625, 0.07416915893554688, 0.0830535888671875, 0.09193801879882812, 0.10082244873046875, 0.10970687866210938, 0.11859130859375, 0.12747573852539062, 0.13636016845703125, 0.14524459838867188, 0.1541290283203125, 0.16301345825195312, 0.17189788818359375, 0.18078231811523438, 0.189666748046875, 0.19855117797851562, 0.20743560791015625, 0.21632003784179688, 0.2252044677734375, 0.23408889770507812, 0.24297332763671875, 0.2518577575683594, 0.2607421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 9.0, 3.0, 11.0, 3.0, 17.0, 20.0, 34.0, 39.0, 63.0, 94.0, 134.0, 223.0, 422.0, 854.0, 1890.0, 4965.0, 16378.0, 77947.0, 573480.0, 310119.0, 44370.0, 11010.0, 3480.0, 1433.0, 667.0, 327.0, 192.0, 115.0, 73.0, 50.0, 35.0, 26.0, 15.0, 18.0, 15.0, 5.0, 5.0, 1.0, 3.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.491943359375, -0.4742698669433594, -0.45659637451171875, -0.4389228820800781, -0.4212493896484375, -0.4035758972167969, -0.38590240478515625, -0.3682289123535156, -0.350555419921875, -0.3328819274902344, -0.31520843505859375, -0.2975349426269531, -0.2798614501953125, -0.2621879577636719, -0.24451446533203125, -0.22684097290039062, -0.20916748046875, -0.19149398803710938, -0.17382049560546875, -0.15614700317382812, -0.1384735107421875, -0.12080001831054688, -0.10312652587890625, -0.08545303344726562, -0.067779541015625, -0.050106048583984375, -0.03243255615234375, -0.014759063720703125, 0.0029144287109375, 0.020587921142578125, 0.03826141357421875, 0.055934906005859375, 0.0736083984375, 0.09128189086914062, 0.10895538330078125, 0.12662887573242188, 0.1443023681640625, 0.16197586059570312, 0.17964935302734375, 0.19732284545898438, 0.214996337890625, 0.23266983032226562, 0.25034332275390625, 0.2680168151855469, 0.2856903076171875, 0.3033638000488281, 0.32103729248046875, 0.3387107849121094, 0.35638427734375, 0.3740577697753906, 0.39173126220703125, 0.4094047546386719, 0.4270782470703125, 0.4447517395019531, 0.46242523193359375, 0.4800987243652344, 0.497772216796875, 0.5154457092285156, 0.5331192016601562, 0.5507926940917969, 0.5684661865234375, 0.5861396789550781, 0.6038131713867188, 0.6214866638183594, 0.63916015625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 9.0, 9.0, 13.0, 13.0, 23.0, 27.0, 26.0, 38.0, 38.0, 41.0, 40.0, 56.0, 44.0, 58.0, 67.0, 60.0, 42.0, 60.0, 48.0, 52.0, 36.0, 43.0, 20.0, 30.0, 33.0, 24.0, 13.0, 13.0, 7.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.662109375, -0.634796142578125, -0.60748291015625, -0.580169677734375, -0.5528564453125, -0.525543212890625, -0.49822998046875, -0.470916748046875, -0.443603515625, -0.416290283203125, -0.38897705078125, -0.361663818359375, -0.3343505859375, -0.307037353515625, -0.27972412109375, -0.252410888671875, -0.22509765625, -0.197784423828125, -0.17047119140625, -0.143157958984375, -0.1158447265625, -0.088531494140625, -0.06121826171875, -0.033905029296875, -0.006591796875, 0.020721435546875, 0.04803466796875, 0.075347900390625, 0.1026611328125, 0.129974365234375, 0.15728759765625, 0.184600830078125, 0.2119140625, 0.239227294921875, 0.26654052734375, 0.293853759765625, 0.3211669921875, 0.348480224609375, 0.37579345703125, 0.403106689453125, 0.430419921875, 0.457733154296875, 0.48504638671875, 0.512359619140625, 0.5396728515625, 0.566986083984375, 0.59429931640625, 0.621612548828125, 0.64892578125, 0.676239013671875, 0.70355224609375, 0.730865478515625, 0.7581787109375, 0.785491943359375, 0.81280517578125, 0.840118408203125, 0.867431640625, 0.894744873046875, 0.92205810546875, 0.949371337890625, 0.9766845703125, 1.003997802734375, 1.03131103515625, 1.058624267578125, 1.0859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 1.0, 7.0, 6.0, 9.0, 11.0, 17.0, 20.0, 28.0, 31.0, 51.0, 79.0, 126.0, 234.0, 434.0, 757.0, 1763.0, 4769.0, 16224.0, 78688.0, 558484.0, 322939.0, 46316.0, 10959.0, 3538.0, 1462.0, 674.0, 366.0, 184.0, 121.0, 78.0, 52.0, 41.0, 27.0, 17.0, 11.0, 9.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1673583984375, -0.16112518310546875, -0.1548919677734375, -0.14865875244140625, -0.142425537109375, -0.13619232177734375, -0.1299591064453125, -0.12372589111328125, -0.11749267578125, -0.11125946044921875, -0.1050262451171875, -0.09879302978515625, -0.092559814453125, -0.08632659912109375, -0.0800933837890625, -0.07386016845703125, -0.067626953125, -0.06139373779296875, -0.0551605224609375, -0.04892730712890625, -0.042694091796875, -0.03646087646484375, -0.0302276611328125, -0.02399444580078125, -0.01776123046875, -0.01152801513671875, -0.0052947998046875, 0.00093841552734375, 0.007171630859375, 0.01340484619140625, 0.0196380615234375, 0.02587127685546875, 0.0321044921875, 0.03833770751953125, 0.0445709228515625, 0.05080413818359375, 0.057037353515625, 0.06327056884765625, 0.0695037841796875, 0.07573699951171875, 0.08197021484375, 0.08820343017578125, 0.0944366455078125, 0.10066986083984375, 0.106903076171875, 0.11313629150390625, 0.1193695068359375, 0.12560272216796875, 0.1318359375, 0.13806915283203125, 0.1443023681640625, 0.15053558349609375, 0.156768798828125, 0.16300201416015625, 0.1692352294921875, 0.17546844482421875, 0.18170166015625, 0.18793487548828125, 0.1941680908203125, 0.20040130615234375, 0.206634521484375, 0.21286773681640625, 0.2191009521484375, 0.22533416748046875, 0.2315673828125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 13.0, 2.0, 5.0, 8.0, 3.0, 6.0, 13.0, 10.0, 18.0, 29.0, 32.0, 38.0, 58.0, 66.0, 81.0, 82.0, 94.0, 92.0, 70.0, 57.0, 54.0, 28.0, 25.0, 31.0, 29.0, 10.0, 10.0, 8.0, 5.0, 8.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-4.6193599700927734e-05, -4.501082003116608e-05, -4.382804036140442e-05, -4.264526069164276e-05, -4.1462481021881104e-05, -4.0279701352119446e-05, -3.909692168235779e-05, -3.791414201259613e-05, -3.673136234283447e-05, -3.5548582673072815e-05, -3.436580300331116e-05, -3.31830233335495e-05, -3.200024366378784e-05, -3.0817463994026184e-05, -2.9634684324264526e-05, -2.845190465450287e-05, -2.726912498474121e-05, -2.6086345314979553e-05, -2.4903565645217896e-05, -2.3720785975456238e-05, -2.253800630569458e-05, -2.1355226635932922e-05, -2.0172446966171265e-05, -1.8989667296409607e-05, -1.780688762664795e-05, -1.662410795688629e-05, -1.5441328287124634e-05, -1.4258548617362976e-05, -1.3075768947601318e-05, -1.189298927783966e-05, -1.0710209608078003e-05, -9.527429938316345e-06, -8.344650268554688e-06, -7.16187059879303e-06, -5.979090929031372e-06, -4.796311259269714e-06, -3.6135315895080566e-06, -2.430751919746399e-06, -1.2479722499847412e-06, -6.51925802230835e-08, 1.1175870895385742e-06, 2.300366759300232e-06, 3.4831464290618896e-06, 4.665926098823547e-06, 5.848705768585205e-06, 7.031485438346863e-06, 8.21426510810852e-06, 9.397044777870178e-06, 1.0579824447631836e-05, 1.1762604117393494e-05, 1.2945383787155151e-05, 1.4128163456916809e-05, 1.5310943126678467e-05, 1.6493722796440125e-05, 1.7676502466201782e-05, 1.885928213596344e-05, 2.0042061805725098e-05, 2.1224841475486755e-05, 2.2407621145248413e-05, 2.359040081501007e-05, 2.477318048477173e-05, 2.5955960154533386e-05, 2.7138739824295044e-05, 2.83215194940567e-05, 2.950429916381836e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 5.0, 7.0, 5.0, 7.0, 14.0, 21.0, 31.0, 43.0, 71.0, 91.0, 161.0, 271.0, 483.0, 905.0, 1818.0, 4266.0, 11965.0, 46413.0, 272185.0, 569473.0, 105691.0, 22309.0, 6855.0, 2630.0, 1235.0, 655.0, 364.0, 212.0, 121.0, 81.0, 66.0, 32.0, 23.0, 13.0, 13.0, 9.0, 5.0, 5.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18017578125, -0.17401504516601562, -0.16785430908203125, -0.16169357299804688, -0.1555328369140625, -0.14937210083007812, -0.14321136474609375, -0.13705062866210938, -0.130889892578125, -0.12472915649414062, -0.11856842041015625, -0.11240768432617188, -0.1062469482421875, -0.10008621215820312, -0.09392547607421875, -0.08776473999023438, -0.08160400390625, -0.07544326782226562, -0.06928253173828125, -0.06312179565429688, -0.0569610595703125, -0.050800323486328125, -0.04463958740234375, -0.038478851318359375, -0.032318115234375, -0.026157379150390625, -0.01999664306640625, -0.013835906982421875, -0.0076751708984375, -0.001514434814453125, 0.00464630126953125, 0.010807037353515625, 0.0169677734375, 0.023128509521484375, 0.02928924560546875, 0.035449981689453125, 0.0416107177734375, 0.047771453857421875, 0.05393218994140625, 0.060092926025390625, 0.066253662109375, 0.07241439819335938, 0.07857513427734375, 0.08473587036132812, 0.0908966064453125, 0.09705734252929688, 0.10321807861328125, 0.10937881469726562, 0.11553955078125, 0.12170028686523438, 0.12786102294921875, 0.13402175903320312, 0.1401824951171875, 0.14634323120117188, 0.15250396728515625, 0.15866470336914062, 0.164825439453125, 0.17098617553710938, 0.17714691162109375, 0.18330764770507812, 0.1894683837890625, 0.19562911987304688, 0.20178985595703125, 0.20795059204101562, 0.214111328125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 4.0, 9.0, 5.0, 9.0, 11.0, 20.0, 18.0, 23.0, 36.0, 42.0, 57.0, 69.0, 82.0, 86.0, 82.0, 86.0, 91.0, 50.0, 47.0, 45.0, 46.0, 16.0, 18.0, 16.0, 8.0, 7.0, 6.0, 6.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2374267578125, -0.23070144653320312, -0.22397613525390625, -0.21725082397460938, -0.2105255126953125, -0.20380020141601562, -0.19707489013671875, -0.19034957885742188, -0.183624267578125, -0.17689895629882812, -0.17017364501953125, -0.16344833374023438, -0.1567230224609375, -0.14999771118164062, -0.14327239990234375, -0.13654708862304688, -0.12982177734375, -0.12309646606445312, -0.11637115478515625, -0.10964584350585938, -0.1029205322265625, -0.09619522094726562, -0.08946990966796875, -0.08274459838867188, -0.076019287109375, -0.06929397583007812, -0.06256866455078125, -0.055843353271484375, -0.0491180419921875, -0.042392730712890625, -0.03566741943359375, -0.028942108154296875, -0.022216796875, -0.015491485595703125, -0.00876617431640625, -0.002040863037109375, 0.0046844482421875, 0.011409759521484375, 0.01813507080078125, 0.024860382080078125, 0.031585693359375, 0.038311004638671875, 0.04503631591796875, 0.051761627197265625, 0.0584869384765625, 0.06521224975585938, 0.07193756103515625, 0.07866287231445312, 0.08538818359375, 0.09211349487304688, 0.09883880615234375, 0.10556411743164062, 0.1122894287109375, 0.11901473999023438, 0.12574005126953125, 0.13246536254882812, 0.139190673828125, 0.14591598510742188, 0.15264129638671875, 0.15936660766601562, 0.1660919189453125, 0.17281723022460938, 0.17954254150390625, 0.18626785278320312, 0.1929931640625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 7.0, 11.0, 10.0, 10.0, 19.0, 29.0, 47.0, 73.0, 112.0, 130.0, 133.0, 128.0, 97.0, 68.0, 48.0, 31.0, 16.0, 7.0, 12.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.7198100090026855, -4.608731746673584, -4.497653484344482, -4.386575222015381, -4.275496959686279, -4.1644182205200195, -4.053339958190918, -3.9422619342803955, -3.831183433532715, -3.7201051712036133, -3.6090269088745117, -3.49794864654541, -3.3868701457977295, -3.275791883468628, -3.1647136211395264, -3.053635358810425, -2.9425570964813232, -2.8314788341522217, -2.72040057182312, -2.6093220710754395, -2.498243808746338, -2.3871655464172363, -2.2760872840881348, -2.165009021759033, -2.0539307594299316, -1.94285249710083, -1.831774115562439, -1.7206958532333374, -1.6096174716949463, -1.4985392093658447, -1.3874609470367432, -1.2763826847076416, -1.1653039455413818, -1.0542256832122803, -0.9431473016738892, -0.8320690393447876, -0.7209907174110413, -0.6099123954772949, -0.49883413314819336, -0.387755811214447, -0.2766774892807007, -0.16559918224811554, -0.054520875215530396, 0.056557416915893555, 0.1676357388496399, 0.27871406078338623, 0.3897923231124878, 0.5008706450462341, 0.6119489669799805, 0.7230272889137268, 0.8341056108474731, 0.9451838731765747, 1.0562622547149658, 1.1673405170440674, 1.278418779373169, 1.3894970417022705, 1.5005754232406616, 1.6116536855697632, 1.7227320671081543, 1.8338103294372559, 1.9448885917663574, 2.055966854095459, 2.1670451164245605, 2.278123617172241, 2.3892018795013428]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 2.0, 9.0, 6.0, 10.0, 17.0, 21.0, 16.0, 18.0, 18.0, 20.0, 38.0, 42.0, 41.0, 32.0, 42.0, 44.0, 60.0, 43.0, 55.0, 34.0, 41.0, 51.0, 36.0, 45.0, 43.0, 28.0, 28.0, 26.0, 20.0, 27.0, 16.0, 19.0, 9.0, 13.0, 6.0, 6.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.1822519302368164, -3.0799543857574463, -2.977656841278076, -2.875359296798706, -2.773061752319336, -2.670764446258545, -2.568466901779175, -2.4661693572998047, -2.3638718128204346, -2.2615742683410645, -2.1592767238616943, -2.056979179382324, -1.9546817541122437, -1.8523842096328735, -1.750086784362793, -1.6477892398834229, -1.5454916954040527, -1.4431941509246826, -1.3408966064453125, -1.238599181175232, -1.1363016366958618, -1.0340040922164917, -0.9317066073417664, -0.829409122467041, -0.7271115779876709, -0.6248140335083008, -0.5225165486335754, -0.4202190339565277, -0.31792151927948, -0.21562397480010986, -0.11332648992538452, -0.01102900505065918, 0.09126853942871094, 0.19356605410575867, 0.2958635687828064, 0.3981610834598541, 0.5004585981369019, 0.602756142616272, 0.7050536274909973, 0.8073511123657227, 0.9096486568450928, 1.011946201324463, 1.114243745803833, 1.2165411710739136, 1.3188387155532837, 1.4211362600326538, 1.5234336853027344, 1.6257312297821045, 1.7280287742614746, 1.8303263187408447, 1.9326238632202148, 2.034921407699585, 2.137218952178955, 2.239516258239746, 2.341813802719116, 2.4441113471984863, 2.5464088916778564, 2.6487064361572266, 2.7510039806365967, 2.853301525115967, 2.955598831176758, 3.057896614074707, 3.160193920135498, 3.262491464614868, 3.3647890090942383]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 5.0, 16.0, 12.0, 14.0, 22.0, 29.0, 37.0, 94.0, 143.0, 232.0, 656.0, 4187857.0, 4163.0, 458.0, 204.0, 103.0, 75.0, 55.0, 34.0, 24.0, 18.0, 3.0, 7.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8203125, -8.5596923828125, -8.299072265625, -8.0384521484375, -7.77783203125, -7.5172119140625, -7.256591796875, -6.9959716796875, -6.7353515625, -6.4747314453125, -6.214111328125, -5.9534912109375, -5.69287109375, -5.4322509765625, -5.171630859375, -4.9110107421875, -4.650390625, -4.3897705078125, -4.129150390625, -3.8685302734375, -3.60791015625, -3.3472900390625, -3.086669921875, -2.8260498046875, -2.5654296875, -2.3048095703125, -2.044189453125, -1.7835693359375, -1.52294921875, -1.2623291015625, -1.001708984375, -0.7410888671875, -0.48046875, -0.2198486328125, 0.040771484375, 0.3013916015625, 0.56201171875, 0.8226318359375, 1.083251953125, 1.3438720703125, 1.6044921875, 1.8651123046875, 2.125732421875, 2.3863525390625, 2.64697265625, 2.9075927734375, 3.168212890625, 3.4288330078125, 3.689453125, 3.9500732421875, 4.210693359375, 4.4713134765625, 4.73193359375, 4.9925537109375, 5.253173828125, 5.5137939453125, 5.7744140625, 6.0350341796875, 6.295654296875, 6.5562744140625, 6.81689453125, 7.0775146484375, 7.338134765625, 7.5987548828125, 7.859375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 1.0, 8.0, 11.0, 10.0, 20.0, 24.0, 31.0, 38.0, 44.0, 41.0, 66.0, 65.0, 54.0, 95.0, 71.0, 71.0, 67.0, 50.0, 65.0, 38.0, 33.0, 28.0, 23.0, 14.0, 10.0, 10.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.31005859375, -0.3011207580566406, -0.29218292236328125, -0.2832450866699219, -0.2743072509765625, -0.2653694152832031, -0.25643157958984375, -0.24749374389648438, -0.238555908203125, -0.22961807250976562, -0.22068023681640625, -0.21174240112304688, -0.2028045654296875, -0.19386672973632812, -0.18492889404296875, -0.17599105834960938, -0.16705322265625, -0.15811538696289062, -0.14917755126953125, -0.14023971557617188, -0.1313018798828125, -0.12236404418945312, -0.11342620849609375, -0.10448837280273438, -0.095550537109375, -0.08661270141601562, -0.07767486572265625, -0.06873703002929688, -0.0597991943359375, -0.050861358642578125, -0.04192352294921875, -0.032985687255859375, -0.0240478515625, -0.015110015869140625, -0.00617218017578125, 0.002765655517578125, 0.0117034912109375, 0.020641326904296875, 0.02957916259765625, 0.038516998291015625, 0.047454833984375, 0.056392669677734375, 0.06533050537109375, 0.07426834106445312, 0.0832061767578125, 0.09214401245117188, 0.10108184814453125, 0.11001968383789062, 0.11895751953125, 0.12789535522460938, 0.13683319091796875, 0.14577102661132812, 0.1547088623046875, 0.16364669799804688, 0.17258453369140625, 0.18152236938476562, 0.190460205078125, 0.19939804077148438, 0.20833587646484375, 0.21727371215820312, 0.2262115478515625, 0.23514938354492188, 0.24408721923828125, 0.2530250549316406, 0.261962890625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 8.0, 4.0, 6.0, 16.0, 16.0, 15.0, 34.0, 28.0, 60.0, 76.0, 107.0, 160.0, 239.0, 337.0, 490.0, 803.0, 2036.0, 30649.0, 4153439.0, 3016.0, 968.0, 584.0, 387.0, 246.0, 161.0, 105.0, 81.0, 60.0, 41.0, 29.0, 26.0, 14.0, 14.0, 11.0, 2.0, 9.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.814453125, -2.736541748046875, -2.65863037109375, -2.580718994140625, -2.5028076171875, -2.424896240234375, -2.34698486328125, -2.269073486328125, -2.191162109375, -2.113250732421875, -2.03533935546875, -1.957427978515625, -1.8795166015625, -1.801605224609375, -1.72369384765625, -1.645782470703125, -1.56787109375, -1.489959716796875, -1.41204833984375, -1.334136962890625, -1.2562255859375, -1.178314208984375, -1.10040283203125, -1.022491455078125, -0.944580078125, -0.866668701171875, -0.78875732421875, -0.710845947265625, -0.6329345703125, -0.555023193359375, -0.47711181640625, -0.399200439453125, -0.3212890625, -0.243377685546875, -0.16546630859375, -0.087554931640625, -0.0096435546875, 0.068267822265625, 0.14617919921875, 0.224090576171875, 0.302001953125, 0.379913330078125, 0.45782470703125, 0.535736083984375, 0.6136474609375, 0.691558837890625, 0.76947021484375, 0.847381591796875, 0.92529296875, 1.003204345703125, 1.08111572265625, 1.159027099609375, 1.2369384765625, 1.314849853515625, 1.39276123046875, 1.470672607421875, 1.548583984375, 1.626495361328125, 1.70440673828125, 1.782318115234375, 1.8602294921875, 1.938140869140625, 2.01605224609375, 2.093963623046875, 2.171875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 12.0, 17.0, 3940.0, 88.0, 10.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.459228515625, -0.4427452087402344, -0.42626190185546875, -0.4097785949707031, -0.3932952880859375, -0.3768119812011719, -0.36032867431640625, -0.3438453674316406, -0.327362060546875, -0.3108787536621094, -0.29439544677734375, -0.2779121398925781, -0.2614288330078125, -0.24494552612304688, -0.22846221923828125, -0.21197891235351562, -0.19549560546875, -0.17901229858398438, -0.16252899169921875, -0.14604568481445312, -0.1295623779296875, -0.11307907104492188, -0.09659576416015625, -0.08011245727539062, -0.063629150390625, -0.047145843505859375, -0.03066253662109375, -0.014179229736328125, 0.0023040771484375, 0.018787384033203125, 0.03527069091796875, 0.051753997802734375, 0.0682373046875, 0.08472061157226562, 0.10120391845703125, 0.11768722534179688, 0.1341705322265625, 0.15065383911132812, 0.16713714599609375, 0.18362045288085938, 0.200103759765625, 0.21658706665039062, 0.23307037353515625, 0.24955368041992188, 0.2660369873046875, 0.2825202941894531, 0.29900360107421875, 0.3154869079589844, 0.33197021484375, 0.3484535217285156, 0.36493682861328125, 0.3814201354980469, 0.3979034423828125, 0.4143867492675781, 0.43087005615234375, 0.4473533630371094, 0.463836669921875, 0.4803199768066406, 0.49680328369140625, 0.5132865905761719, 0.5297698974609375, 0.5462532043457031, 0.5627365112304688, 0.5792198181152344, 0.595703125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 8.0, 13.0, 11.0, 13.0, 15.0, 34.0, 38.0, 79.0, 123.0, 190.0, 155.0, 111.0, 63.0, 31.0, 32.0, 21.0, 15.0, 14.0, 12.0, 4.0, 3.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9294941425323486, -0.9010617733001709, -0.8726294040679932, -0.8441969752311707, -0.8157646059989929, -0.7873322367668152, -0.7588998675346375, -0.7304674386978149, -0.7020350694656372, -0.6736027002334595, -0.6451703310012817, -0.6167379021644592, -0.5883055329322815, -0.5598731637001038, -0.531440794467926, -0.5030083656311035, -0.47457602620124817, -0.44614365696907043, -0.4177112579345703, -0.3892788887023926, -0.36084648966789246, -0.3324141204357147, -0.3039817214012146, -0.27554935216903687, -0.24711696803569794, -0.218684583902359, -0.19025219976902008, -0.16181981563568115, -0.13338744640350342, -0.10495506227016449, -0.07652267813682556, -0.04809029400348663, -0.019657909870147705, 0.008774472400546074, 0.03720685467123985, 0.06563923507928848, 0.09407161921262741, 0.12250399589538574, 0.15093638002872467, 0.1793687641620636, 0.20780114829540253, 0.23623353242874146, 0.2646659016609192, 0.2930983006954193, 0.32153066992759705, 0.34996306896209717, 0.3783954381942749, 0.40682780742645264, 0.43526020646095276, 0.4636925756931305, 0.4921249747276306, 0.5205573439598083, 0.5489897131919861, 0.5774221420288086, 0.6058545112609863, 0.6342868804931641, 0.6627192497253418, 0.6911516189575195, 0.7195839881896973, 0.7480164170265198, 0.7764487862586975, 0.8048811554908752, 0.833313524723053, 0.8617459535598755, 0.8901783227920532]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 11.0, 12.0, 15.0, 12.0, 21.0, 24.0, 24.0, 32.0, 41.0, 30.0, 47.0, 35.0, 41.0, 42.0, 50.0, 64.0, 47.0, 43.0, 65.0, 48.0, 39.0, 35.0, 29.0, 32.0, 23.0, 26.0, 24.0, 17.0, 11.0, 12.0, 8.0, 9.0, 3.0, 4.0, 6.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5416792631149292, -0.5253645181655884, -0.5090497732162476, -0.49273499846458435, -0.47642025351524353, -0.4601054787635803, -0.4437907338142395, -0.4274759888648987, -0.41116124391555786, -0.39484649896621704, -0.37853172421455383, -0.362216979265213, -0.3459022343158722, -0.329587459564209, -0.31327271461486816, -0.29695796966552734, -0.28064319491386414, -0.2643284499645233, -0.2480136901140213, -0.2316989302635193, -0.21538418531417847, -0.19906942546367645, -0.18275466561317444, -0.16643992066383362, -0.1501251608133316, -0.1338104009628296, -0.11749565601348877, -0.10118089616298676, -0.08486614376306534, -0.06855139136314392, -0.05223663151264191, -0.03592187911272049, -0.019607126712799072, -0.003292372450232506, 0.01302238181233406, 0.029337137937545776, 0.045651890337467194, 0.06196664273738861, 0.07828140258789062, 0.09459615498781204, 0.11091090738773346, 0.12722566723823547, 0.1435404121875763, 0.1598551720380783, 0.17616993188858032, 0.19248467683792114, 0.20879943668842316, 0.22511419653892517, 0.241428941488266, 0.2577436864376068, 0.27405846118927, 0.29037320613861084, 0.30668795108795166, 0.3230026960372925, 0.3393174707889557, 0.3556322157382965, 0.3719469904899597, 0.38826173543930054, 0.40457651019096375, 0.42089125514030457, 0.4372060000896454, 0.4535207748413086, 0.4698355197906494, 0.48615026473999023, 0.502465009689331]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 7.0, 7.0, 15.0, 12.0, 25.0, 38.0, 53.0, 84.0, 143.0, 236.0, 360.0, 727.0, 1124.0, 2335.0, 5030.0, 15738.0, 124055.0, 777386.0, 97649.0, 13963.0, 4780.0, 2142.0, 1093.0, 597.0, 361.0, 202.0, 120.0, 105.0, 46.0, 40.0, 16.0, 15.0, 11.0, 14.0, 3.0, 5.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.86181640625, -0.8335189819335938, -0.8052215576171875, -0.7769241333007812, -0.748626708984375, -0.7203292846679688, -0.6920318603515625, -0.6637344360351562, -0.63543701171875, -0.6071395874023438, -0.5788421630859375, -0.5505447387695312, -0.522247314453125, -0.49394989013671875, -0.4656524658203125, -0.43735504150390625, -0.4090576171875, -0.38076019287109375, -0.3524627685546875, -0.32416534423828125, -0.295867919921875, -0.26757049560546875, -0.2392730712890625, -0.21097564697265625, -0.18267822265625, -0.15438079833984375, -0.1260833740234375, -0.09778594970703125, -0.069488525390625, -0.04119110107421875, -0.0128936767578125, 0.01540374755859375, 0.043701171875, 0.07199859619140625, 0.1002960205078125, 0.12859344482421875, 0.156890869140625, 0.18518829345703125, 0.2134857177734375, 0.24178314208984375, 0.27008056640625, 0.29837799072265625, 0.3266754150390625, 0.35497283935546875, 0.383270263671875, 0.41156768798828125, 0.4398651123046875, 0.46816253662109375, 0.4964599609375, 0.5247573852539062, 0.5530548095703125, 0.5813522338867188, 0.609649658203125, 0.6379470825195312, 0.6662445068359375, 0.6945419311523438, 0.72283935546875, 0.7511367797851562, 0.7794342041015625, 0.8077316284179688, 0.836029052734375, 0.8643264770507812, 0.8926239013671875, 0.9209213256835938, 0.94921875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 7.0, 9.0, 16.0, 21.0, 26.0, 28.0, 37.0, 47.0, 32.0, 65.0, 60.0, 63.0, 57.0, 67.0, 75.0, 64.0, 49.0, 49.0, 49.0, 43.0, 28.0, 27.0, 29.0, 11.0, 12.0, 7.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.303466796875, -0.29479217529296875, -0.2861175537109375, -0.27744293212890625, -0.268768310546875, -0.26009368896484375, -0.2514190673828125, -0.24274444580078125, -0.23406982421875, -0.22539520263671875, -0.2167205810546875, -0.20804595947265625, -0.199371337890625, -0.19069671630859375, -0.1820220947265625, -0.17334747314453125, -0.1646728515625, -0.15599822998046875, -0.1473236083984375, -0.13864898681640625, -0.129974365234375, -0.12129974365234375, -0.1126251220703125, -0.10395050048828125, -0.09527587890625, -0.08660125732421875, -0.0779266357421875, -0.06925201416015625, -0.060577392578125, -0.05190277099609375, -0.0432281494140625, -0.03455352783203125, -0.02587890625, -0.01720428466796875, -0.0085296630859375, 0.00014495849609375, 0.008819580078125, 0.01749420166015625, 0.0261688232421875, 0.03484344482421875, 0.04351806640625, 0.05219268798828125, 0.0608673095703125, 0.06954193115234375, 0.078216552734375, 0.08689117431640625, 0.0955657958984375, 0.10424041748046875, 0.1129150390625, 0.12158966064453125, 0.1302642822265625, 0.13893890380859375, 0.147613525390625, 0.15628814697265625, 0.1649627685546875, 0.17363739013671875, 0.18231201171875, 0.19098663330078125, 0.1996612548828125, 0.20833587646484375, 0.217010498046875, 0.22568511962890625, 0.2343597412109375, 0.24303436279296875, 0.251708984375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 2.0, 6.0, 9.0, 14.0, 30.0, 34.0, 35.0, 58.0, 69.0, 163.0, 298.0, 475.0, 975.0, 2329.0, 6839.0, 34427.0, 477630.0, 479825.0, 34053.0, 6821.0, 2244.0, 998.0, 490.0, 270.0, 167.0, 93.0, 63.0, 44.0, 24.0, 16.0, 8.0, 20.0, 4.0, 7.0, 4.0, 3.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63916015625, -0.6191864013671875, -0.599212646484375, -0.5792388916015625, -0.55926513671875, -0.5392913818359375, -0.519317626953125, -0.4993438720703125, -0.4793701171875, -0.4593963623046875, -0.439422607421875, -0.4194488525390625, -0.39947509765625, -0.3795013427734375, -0.359527587890625, -0.3395538330078125, -0.319580078125, -0.2996063232421875, -0.279632568359375, -0.2596588134765625, -0.23968505859375, -0.2197113037109375, -0.199737548828125, -0.1797637939453125, -0.1597900390625, -0.1398162841796875, -0.119842529296875, -0.0998687744140625, -0.07989501953125, -0.0599212646484375, -0.039947509765625, -0.0199737548828125, 0.0, 0.0199737548828125, 0.039947509765625, 0.0599212646484375, 0.07989501953125, 0.0998687744140625, 0.119842529296875, 0.1398162841796875, 0.1597900390625, 0.1797637939453125, 0.199737548828125, 0.2197113037109375, 0.23968505859375, 0.2596588134765625, 0.279632568359375, 0.2996063232421875, 0.319580078125, 0.3395538330078125, 0.359527587890625, 0.3795013427734375, 0.39947509765625, 0.4194488525390625, 0.439422607421875, 0.4593963623046875, 0.4793701171875, 0.4993438720703125, 0.519317626953125, 0.5392913818359375, 0.55926513671875, 0.5792388916015625, 0.599212646484375, 0.6191864013671875, 0.63916015625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 9.0, 11.0, 12.0, 17.0, 17.0, 18.0, 26.0, 32.0, 35.0, 30.0, 34.0, 34.0, 35.0, 47.0, 40.0, 45.0, 48.0, 51.0, 60.0, 44.0, 36.0, 29.0, 33.0, 31.0, 30.0, 28.0, 34.0, 24.0, 22.0, 20.0, 15.0, 14.0, 10.0, 8.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83642578125, -0.8123626708984375, -0.788299560546875, -0.7642364501953125, -0.74017333984375, -0.7161102294921875, -0.692047119140625, -0.6679840087890625, -0.6439208984375, -0.6198577880859375, -0.595794677734375, -0.5717315673828125, -0.54766845703125, -0.5236053466796875, -0.499542236328125, -0.4754791259765625, -0.451416015625, -0.4273529052734375, -0.403289794921875, -0.3792266845703125, -0.35516357421875, -0.3311004638671875, -0.307037353515625, -0.2829742431640625, -0.2589111328125, -0.2348480224609375, -0.210784912109375, -0.1867218017578125, -0.16265869140625, -0.1385955810546875, -0.114532470703125, -0.0904693603515625, -0.06640625, -0.0423431396484375, -0.018280029296875, 0.0057830810546875, 0.02984619140625, 0.0539093017578125, 0.077972412109375, 0.1020355224609375, 0.1260986328125, 0.1501617431640625, 0.174224853515625, 0.1982879638671875, 0.22235107421875, 0.2464141845703125, 0.270477294921875, 0.2945404052734375, 0.318603515625, 0.3426666259765625, 0.366729736328125, 0.3907928466796875, 0.41485595703125, 0.4389190673828125, 0.462982177734375, 0.4870452880859375, 0.5111083984375, 0.5351715087890625, 0.559234619140625, 0.5832977294921875, 0.60736083984375, 0.6314239501953125, 0.655487060546875, 0.6795501708984375, 0.70361328125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 4.0, 8.0, 9.0, 6.0, 8.0, 16.0, 31.0, 42.0, 110.0, 240.0, 528.0, 1741.0, 8147.0, 107670.0, 882273.0, 40842.0, 4893.0, 1193.0, 399.0, 165.0, 86.0, 54.0, 20.0, 11.0, 15.0, 12.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3017578125, -0.29111480712890625, -0.2804718017578125, -0.26982879638671875, -0.259185791015625, -0.24854278564453125, -0.2378997802734375, -0.22725677490234375, -0.21661376953125, -0.20597076416015625, -0.1953277587890625, -0.18468475341796875, -0.174041748046875, -0.16339874267578125, -0.1527557373046875, -0.14211273193359375, -0.1314697265625, -0.12082672119140625, -0.1101837158203125, -0.09954071044921875, -0.088897705078125, -0.07825469970703125, -0.0676116943359375, -0.05696868896484375, -0.04632568359375, -0.03568267822265625, -0.0250396728515625, -0.01439666748046875, -0.003753662109375, 0.00688934326171875, 0.0175323486328125, 0.02817535400390625, 0.038818359375, 0.04946136474609375, 0.0601043701171875, 0.07074737548828125, 0.081390380859375, 0.09203338623046875, 0.1026763916015625, 0.11331939697265625, 0.12396240234375, 0.13460540771484375, 0.1452484130859375, 0.15589141845703125, 0.166534423828125, 0.17717742919921875, 0.1878204345703125, 0.19846343994140625, 0.2091064453125, 0.21974945068359375, 0.2303924560546875, 0.24103546142578125, 0.251678466796875, 0.26232147216796875, 0.2729644775390625, 0.28360748291015625, 0.29425048828125, 0.30489349365234375, 0.3155364990234375, 0.32617950439453125, 0.336822509765625, 0.34746551513671875, 0.3581085205078125, 0.36875152587890625, 0.37939453125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 5.0, 8.0, 11.0, 9.0, 19.0, 27.0, 27.0, 41.0, 79.0, 89.0, 121.0, 133.0, 121.0, 82.0, 62.0, 31.0, 41.0, 22.0, 19.0, 14.0, 8.0, 4.0, 2.0, 4.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.398822784423828e-05, -4.2389146983623505e-05, -4.079006612300873e-05, -3.919098526239395e-05, -3.7591904401779175e-05, -3.59928235411644e-05, -3.439374268054962e-05, -3.2794661819934845e-05, -3.119558095932007e-05, -2.9596500098705292e-05, -2.7997419238090515e-05, -2.639833837747574e-05, -2.4799257516860962e-05, -2.3200176656246185e-05, -2.160109579563141e-05, -2.0002014935016632e-05, -1.8402934074401855e-05, -1.680385321378708e-05, -1.5204772353172302e-05, -1.3605691492557526e-05, -1.2006610631942749e-05, -1.0407529771327972e-05, -8.808448910713196e-06, -7.209368050098419e-06, -5.610287189483643e-06, -4.011206328868866e-06, -2.4121254682540894e-06, -8.130446076393127e-07, 7.860362529754639e-07, 2.3851171135902405e-06, 3.984197974205017e-06, 5.583278834819794e-06, 7.18235969543457e-06, 8.781440556049347e-06, 1.0380521416664124e-05, 1.19796022772789e-05, 1.3578683137893677e-05, 1.5177763998508453e-05, 1.677684485912323e-05, 1.8375925719738007e-05, 1.9975006580352783e-05, 2.157408744096756e-05, 2.3173168301582336e-05, 2.4772249162197113e-05, 2.637133002281189e-05, 2.7970410883426666e-05, 2.9569491744041443e-05, 3.116857260465622e-05, 3.2767653465270996e-05, 3.436673432588577e-05, 3.596581518650055e-05, 3.7564896047115326e-05, 3.91639769077301e-05, 4.076305776834488e-05, 4.2362138628959656e-05, 4.396121948957443e-05, 4.556030035018921e-05, 4.7159381210803986e-05, 4.875846207141876e-05, 5.035754293203354e-05, 5.1956623792648315e-05, 5.355570465326309e-05, 5.515478551387787e-05, 5.6753866374492645e-05, 5.835294723510742e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 8.0, 14.0, 25.0, 26.0, 49.0, 71.0, 152.0, 343.0, 901.0, 3333.0, 19528.0, 626234.0, 377821.0, 15650.0, 2937.0, 796.0, 335.0, 140.0, 71.0, 48.0, 22.0, 16.0, 14.0, 4.0, 4.0, 4.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.333251953125, -0.3204078674316406, -0.30756378173828125, -0.2947196960449219, -0.2818756103515625, -0.2690315246582031, -0.25618743896484375, -0.24334335327148438, -0.230499267578125, -0.21765518188476562, -0.20481109619140625, -0.19196701049804688, -0.1791229248046875, -0.16627883911132812, -0.15343475341796875, -0.14059066772460938, -0.12774658203125, -0.11490249633789062, -0.10205841064453125, -0.08921432495117188, -0.0763702392578125, -0.06352615356445312, -0.05068206787109375, -0.037837982177734375, -0.024993896484375, -0.012149810791015625, 0.00069427490234375, 0.013538360595703125, 0.0263824462890625, 0.039226531982421875, 0.05207061767578125, 0.06491470336914062, 0.0777587890625, 0.09060287475585938, 0.10344696044921875, 0.11629104614257812, 0.1291351318359375, 0.14197921752929688, 0.15482330322265625, 0.16766738891601562, 0.180511474609375, 0.19335556030273438, 0.20619964599609375, 0.21904373168945312, 0.2318878173828125, 0.24473190307617188, 0.25757598876953125, 0.2704200744628906, 0.28326416015625, 0.2961082458496094, 0.30895233154296875, 0.3217964172363281, 0.3346405029296875, 0.3474845886230469, 0.36032867431640625, 0.3731727600097656, 0.386016845703125, 0.3988609313964844, 0.41170501708984375, 0.4245491027832031, 0.4373931884765625, 0.4502372741699219, 0.46308135986328125, 0.4759254455566406, 0.48876953125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 7.0, 14.0, 15.0, 16.0, 23.0, 30.0, 65.0, 95.0, 112.0, 119.0, 118.0, 112.0, 88.0, 59.0, 31.0, 27.0, 23.0, 15.0, 11.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.23193359375, -0.223663330078125, -0.21539306640625, -0.207122802734375, -0.1988525390625, -0.190582275390625, -0.18231201171875, -0.174041748046875, -0.165771484375, -0.157501220703125, -0.14923095703125, -0.140960693359375, -0.1326904296875, -0.124420166015625, -0.11614990234375, -0.107879638671875, -0.099609375, -0.091339111328125, -0.08306884765625, -0.074798583984375, -0.0665283203125, -0.058258056640625, -0.04998779296875, -0.041717529296875, -0.033447265625, -0.025177001953125, -0.01690673828125, -0.008636474609375, -0.0003662109375, 0.007904052734375, 0.01617431640625, 0.024444580078125, 0.03271484375, 0.040985107421875, 0.04925537109375, 0.057525634765625, 0.0657958984375, 0.074066162109375, 0.08233642578125, 0.090606689453125, 0.098876953125, 0.107147216796875, 0.11541748046875, 0.123687744140625, 0.1319580078125, 0.140228271484375, 0.14849853515625, 0.156768798828125, 0.1650390625, 0.173309326171875, 0.18157958984375, 0.189849853515625, 0.1981201171875, 0.206390380859375, 0.21466064453125, 0.222930908203125, 0.231201171875, 0.239471435546875, 0.24774169921875, 0.256011962890625, 0.2642822265625, 0.272552490234375, 0.28082275390625, 0.289093017578125, 0.29736328125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 13.0, 16.0, 21.0, 54.0, 55.0, 77.0, 124.0, 130.0, 116.0, 108.0, 74.0, 56.0, 52.0, 36.0, 10.0, 10.0, 7.0, 4.0, 10.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4914488792419434, -3.399714708328247, -3.30798077583313, -3.2162466049194336, -3.1245126724243164, -3.03277850151062, -2.941044330596924, -2.8493103981018066, -2.7575762271881104, -2.665842056274414, -2.574108123779297, -2.4823739528656006, -2.3906397819519043, -2.298905849456787, -2.207171678543091, -2.1154375076293945, -2.0237035751342773, -1.9319695234298706, -1.8402354717254639, -1.7485013008117676, -1.6567672491073608, -1.565033197402954, -1.4732990264892578, -1.381564974784851, -1.2898309230804443, -1.1980968713760376, -1.1063628196716309, -1.0146286487579346, -0.9228945970535278, -0.8311605453491211, -0.7394264340400696, -0.6476923227310181, -0.5559585094451904, -0.4642244279384613, -0.3724903464317322, -0.28075626492500305, -0.18902218341827393, -0.0972881019115448, -0.005554020404815674, 0.08618009090423584, 0.17791414260864258, 0.2696482241153717, 0.36138230562210083, 0.45311638712882996, 0.5448504686355591, 0.6365845203399658, 0.7283186316490173, 0.8200527429580688, 0.9117867946624756, 1.0035208463668823, 1.095254898071289, 1.1869890689849854, 1.278723120689392, 1.3704571723937988, 1.4621913433074951, 1.5539253950119019, 1.6456594467163086, 1.7373934984207153, 1.829127550125122, 1.9208617210388184, 2.0125956535339355, 2.104329824447632, 2.196063995361328, 2.2877979278564453, 2.3795320987701416]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 3.0, 7.0, 7.0, 6.0, 5.0, 12.0, 13.0, 11.0, 18.0, 22.0, 26.0, 34.0, 50.0, 47.0, 52.0, 44.0, 59.0, 70.0, 59.0, 57.0, 61.0, 53.0, 35.0, 36.0, 31.0, 37.0, 32.0, 20.0, 20.0, 22.0, 14.0, 13.0, 7.0, 11.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9098610877990723, -2.780362367630005, -2.6508636474609375, -2.521364688873291, -2.3918659687042236, -2.2623672485351562, -2.132868528366089, -2.0033698081970215, -1.8738709688186646, -1.7443722486495972, -1.6148734092712402, -1.4853746891021729, -1.3558759689331055, -1.2263771295547485, -1.0968784093856812, -0.967379629611969, -0.8378808498382568, -0.7083820700645447, -0.5788832902908325, -0.44938457012176514, -0.319885790348053, -0.19038701057434082, -0.06088829040527344, 0.06861048936843872, 0.19810926914215088, 0.32760804891586304, 0.4571067988872528, 0.5866055488586426, 0.7161043286323547, 0.8456031084060669, 0.9751018285751343, 1.1046006679534912, 1.2340993881225586, 1.363598108291626, 1.493096947669983, 1.6225956678390503, 1.7520945072174072, 1.8815932273864746, 2.011091947555542, 2.1405906677246094, 2.270089626312256, 2.3995883464813232, 2.5290870666503906, 2.658586025238037, 2.7880847454071045, 2.917583465576172, 3.0470821857452393, 3.1765809059143066, 3.306079626083374, 3.4355783462524414, 3.565077066421509, 3.694575786590576, 3.8240747451782227, 3.95357346534729, 4.083072185516357, 4.212571144104004, 4.342069625854492, 4.471568584442139, 4.601067066192627, 4.730566024780273, 4.860064506530762, 4.989563465118408, 5.119062423706055, 5.248560905456543, 5.3780598640441895]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 12.0, 16.0, 14.0, 28.0, 41.0, 70.0, 82.0, 122.0, 366.0, 1524.0, 4188615.0, 2452.0, 465.0, 165.0, 97.0, 57.0, 40.0, 30.0, 26.0, 15.0, 8.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.47265625, -7.25018310546875, -7.0277099609375, -6.80523681640625, -6.582763671875, -6.36029052734375, -6.1378173828125, -5.91534423828125, -5.69287109375, -5.47039794921875, -5.2479248046875, -5.02545166015625, -4.802978515625, -4.58050537109375, -4.3580322265625, -4.13555908203125, -3.9130859375, -3.69061279296875, -3.4681396484375, -3.24566650390625, -3.023193359375, -2.80072021484375, -2.5782470703125, -2.35577392578125, -2.13330078125, -1.91082763671875, -1.6883544921875, -1.46588134765625, -1.243408203125, -1.02093505859375, -0.7984619140625, -0.57598876953125, -0.353515625, -0.13104248046875, 0.0914306640625, 0.31390380859375, 0.536376953125, 0.75885009765625, 0.9813232421875, 1.20379638671875, 1.42626953125, 1.64874267578125, 1.8712158203125, 2.09368896484375, 2.316162109375, 2.53863525390625, 2.7611083984375, 2.98358154296875, 3.2060546875, 3.42852783203125, 3.6510009765625, 3.87347412109375, 4.095947265625, 4.31842041015625, 4.5408935546875, 4.76336669921875, 4.98583984375, 5.20831298828125, 5.4307861328125, 5.65325927734375, 5.875732421875, 6.09820556640625, 6.3206787109375, 6.54315185546875, 6.765625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 11.0, 15.0, 11.0, 26.0, 26.0, 45.0, 55.0, 45.0, 84.0, 70.0, 69.0, 79.0, 93.0, 77.0, 56.0, 61.0, 37.0, 43.0, 31.0, 20.0, 12.0, 15.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.348876953125, -0.3389701843261719, -0.32906341552734375, -0.3191566467285156, -0.3092498779296875, -0.2993431091308594, -0.28943634033203125, -0.2795295715332031, -0.269622802734375, -0.2597160339355469, -0.24980926513671875, -0.23990249633789062, -0.2299957275390625, -0.22008895874023438, -0.21018218994140625, -0.20027542114257812, -0.19036865234375, -0.18046188354492188, -0.17055511474609375, -0.16064834594726562, -0.1507415771484375, -0.14083480834960938, -0.13092803955078125, -0.12102127075195312, -0.111114501953125, -0.10120773315429688, -0.09130096435546875, -0.08139419555664062, -0.0714874267578125, -0.061580657958984375, -0.05167388916015625, -0.041767120361328125, -0.0318603515625, -0.021953582763671875, -0.01204681396484375, -0.002140045166015625, 0.0077667236328125, 0.017673492431640625, 0.02758026123046875, 0.037487030029296875, 0.047393798828125, 0.057300567626953125, 0.06720733642578125, 0.07711410522460938, 0.0870208740234375, 0.09692764282226562, 0.10683441162109375, 0.11674118041992188, 0.12664794921875, 0.13655471801757812, 0.14646148681640625, 0.15636825561523438, 0.1662750244140625, 0.17618179321289062, 0.18608856201171875, 0.19599533081054688, 0.205902099609375, 0.21580886840820312, 0.22571563720703125, 0.23562240600585938, 0.2455291748046875, 0.2554359436035156, 0.26534271240234375, 0.2752494812011719, 0.28515625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 5.0, 3.0, 4.0, 8.0, 4.0, 7.0, 9.0, 10.0, 16.0, 19.0, 32.0, 48.0, 43.0, 71.0, 92.0, 132.0, 167.0, 261.0, 410.0, 716.0, 1273.0, 3110.0, 15251.0, 4143973.0, 21646.0, 3384.0, 1509.0, 724.0, 406.0, 275.0, 170.0, 119.0, 85.0, 58.0, 55.0, 41.0, 32.0, 29.0, 14.0, 19.0, 12.0, 11.0, 5.0, 7.0, 7.0, 0.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.2685546875, -1.22705078125, -1.185546875, -1.14404296875, -1.1025390625, -1.06103515625, -1.01953125, -0.97802734375, -0.9365234375, -0.89501953125, -0.853515625, -0.81201171875, -0.7705078125, -0.72900390625, -0.6875, -0.64599609375, -0.6044921875, -0.56298828125, -0.521484375, -0.47998046875, -0.4384765625, -0.39697265625, -0.35546875, -0.31396484375, -0.2724609375, -0.23095703125, -0.189453125, -0.14794921875, -0.1064453125, -0.06494140625, -0.0234375, 0.01806640625, 0.0595703125, 0.10107421875, 0.142578125, 0.18408203125, 0.2255859375, 0.26708984375, 0.30859375, 0.35009765625, 0.3916015625, 0.43310546875, 0.474609375, 0.51611328125, 0.5576171875, 0.59912109375, 0.640625, 0.68212890625, 0.7236328125, 0.76513671875, 0.806640625, 0.84814453125, 0.8896484375, 0.93115234375, 0.97265625, 1.01416015625, 1.0556640625, 1.09716796875, 1.138671875, 1.18017578125, 1.2216796875, 1.26318359375, 1.3046875, 1.34619140625, 1.3876953125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 14.0, 14.0, 68.0, 3707.0, 215.0, 25.0, 9.0, 6.0, 7.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.348388671875, -0.3308219909667969, -0.31325531005859375, -0.2956886291503906, -0.2781219482421875, -0.2605552673339844, -0.24298858642578125, -0.22542190551757812, -0.207855224609375, -0.19028854370117188, -0.17272186279296875, -0.15515518188476562, -0.1375885009765625, -0.12002182006835938, -0.10245513916015625, -0.08488845825195312, -0.06732177734375, -0.049755096435546875, -0.03218841552734375, -0.014621734619140625, 0.0029449462890625, 0.020511627197265625, 0.03807830810546875, 0.055644989013671875, 0.073211669921875, 0.09077835083007812, 0.10834503173828125, 0.12591171264648438, 0.1434783935546875, 0.16104507446289062, 0.17861175537109375, 0.19617843627929688, 0.2137451171875, 0.23131179809570312, 0.24887847900390625, 0.2664451599121094, 0.2840118408203125, 0.3015785217285156, 0.31914520263671875, 0.3367118835449219, 0.354278564453125, 0.3718452453613281, 0.38941192626953125, 0.4069786071777344, 0.4245452880859375, 0.4421119689941406, 0.45967864990234375, 0.4772453308105469, 0.49481201171875, 0.5123786926269531, 0.5299453735351562, 0.5475120544433594, 0.5650787353515625, 0.5826454162597656, 0.6002120971679688, 0.6177787780761719, 0.635345458984375, 0.6529121398925781, 0.6704788208007812, 0.6880455017089844, 0.7056121826171875, 0.7231788635253906, 0.7407455444335938, 0.7583122253417969, 0.77587890625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 7.0, 17.0, 36.0, 69.0, 152.0, 265.0, 229.0, 97.0, 46.0, 34.0, 20.0, 12.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0], "bins": [-3.4105446338653564, -3.3435423374176025, -3.2765402793884277, -3.209537982940674, -3.14253568649292, -3.075533390045166, -3.008531332015991, -2.9415290355682373, -2.8745269775390625, -2.8075246810913086, -2.740522623062134, -2.67352032661438, -2.606518030166626, -2.539515972137451, -2.4725136756896973, -2.4055113792419434, -2.3385090827941895, -2.2715067863464355, -2.2045047283172607, -2.137502431869507, -2.070500135421753, -2.003498077392578, -1.9364957809448242, -1.8694934844970703, -1.802491307258606, -1.7354891300201416, -1.6684868335723877, -1.6014846563339233, -1.534482479095459, -1.467480182647705, -1.4004780054092407, -1.3334758281707764, -1.2664732933044434, -1.199471116065979, -1.132468819618225, -1.0654666423797607, -0.9984644055366516, -0.9314621686935425, -0.8644599914550781, -0.797457754611969, -0.7304555773735046, -0.6634533405303955, -0.5964511632919312, -0.529448926448822, -0.4624466896057129, -0.39544445276260376, -0.328442245721817, -0.2614400386810303, -0.19443780183792114, -0.1274355798959732, -0.06043335795402527, 0.0065688639879226685, 0.0735710859298706, 0.14057332277297974, 0.20757552981376648, 0.2745777368545532, 0.34157997369766235, 0.4085822105407715, 0.4755844175815582, 0.542586624622345, 0.6095888614654541, 0.6765910983085632, 0.7435933351516724, 0.8105955123901367, 0.8775977492332458]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 7.0, 9.0, 10.0, 9.0, 14.0, 20.0, 12.0, 23.0, 30.0, 22.0, 39.0, 37.0, 34.0, 51.0, 50.0, 49.0, 49.0, 39.0, 52.0, 60.0, 52.0, 57.0, 54.0, 43.0, 28.0, 24.0, 19.0, 27.0, 18.0, 21.0, 14.0, 5.0, 8.0, 5.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8186982870101929, -0.7940117716789246, -0.769325315952301, -0.7446388006210327, -0.7199522852897644, -0.6952658295631409, -0.6705793142318726, -0.645892858505249, -0.6212063431739807, -0.5965198278427124, -0.5718333721160889, -0.5471468567848206, -0.5224603414535522, -0.4977738857269287, -0.4730873703956604, -0.4484008848667145, -0.42371436953544617, -0.39902788400650024, -0.37434136867523193, -0.349654883146286, -0.3249683976173401, -0.3002818822860718, -0.27559539675712585, -0.25090891122817993, -0.22622241079807281, -0.2015359103679657, -0.17684942483901978, -0.15216292440891266, -0.12747642397880554, -0.10278993844985962, -0.0781034380197525, -0.05341695249080658, -0.028730452060699463, -0.004043957218527794, 0.020642537623643875, 0.04532903432846069, 0.07001552730798721, 0.09470202028751373, 0.11938852071762085, 0.14407500624656677, 0.1687615066766739, 0.193448007106781, 0.21813449263572693, 0.24282099306583405, 0.26750749349594116, 0.2921939790248871, 0.316880464553833, 0.3415669798851013, 0.36625346541404724, 0.39093995094299316, 0.4156264662742615, 0.4403129518032074, 0.4649994373321533, 0.48968595266342163, 0.5143724679946899, 0.5390589237213135, 0.5637454390525818, 0.5884319543838501, 0.6131184101104736, 0.6378049254417419, 0.6624914407730103, 0.6871778964996338, 0.7118644118309021, 0.7365509271621704, 0.761237382888794]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 5.0, 9.0, 8.0, 5.0, 23.0, 14.0, 18.0, 27.0, 38.0, 44.0, 78.0, 106.0, 149.0, 224.0, 357.0, 608.0, 1107.0, 1952.0, 4059.0, 8820.0, 23217.0, 71617.0, 257381.0, 444464.0, 158660.0, 45984.0, 16048.0, 6534.0, 3011.0, 1601.0, 844.0, 514.0, 316.0, 226.0, 133.0, 103.0, 66.0, 47.0, 36.0, 19.0, 17.0, 15.0, 11.0, 7.0, 6.0, 7.0, 6.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.40869140625, -0.39642333984375, -0.3841552734375, -0.37188720703125, -0.359619140625, -0.34735107421875, -0.3350830078125, -0.32281494140625, -0.310546875, -0.29827880859375, -0.2860107421875, -0.27374267578125, -0.261474609375, -0.24920654296875, -0.2369384765625, -0.22467041015625, -0.21240234375, -0.20013427734375, -0.1878662109375, -0.17559814453125, -0.163330078125, -0.15106201171875, -0.1387939453125, -0.12652587890625, -0.1142578125, -0.10198974609375, -0.0897216796875, -0.07745361328125, -0.065185546875, -0.05291748046875, -0.0406494140625, -0.02838134765625, -0.01611328125, -0.00384521484375, 0.0084228515625, 0.02069091796875, 0.032958984375, 0.04522705078125, 0.0574951171875, 0.06976318359375, 0.08203125, 0.09429931640625, 0.1065673828125, 0.11883544921875, 0.131103515625, 0.14337158203125, 0.1556396484375, 0.16790771484375, 0.18017578125, 0.19244384765625, 0.2047119140625, 0.21697998046875, 0.229248046875, 0.24151611328125, 0.2537841796875, 0.26605224609375, 0.2783203125, 0.29058837890625, 0.3028564453125, 0.31512451171875, 0.327392578125, 0.33966064453125, 0.3519287109375, 0.36419677734375, 0.37646484375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 7.0, 7.0, 12.0, 15.0, 20.0, 32.0, 23.0, 31.0, 55.0, 65.0, 52.0, 77.0, 74.0, 78.0, 65.0, 69.0, 67.0, 59.0, 45.0, 43.0, 35.0, 25.0, 12.0, 14.0, 12.0, 8.0, 0.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.362548828125, -0.3525733947753906, -0.34259796142578125, -0.3326225280761719, -0.3226470947265625, -0.3126716613769531, -0.30269622802734375, -0.2927207946777344, -0.282745361328125, -0.2727699279785156, -0.26279449462890625, -0.2528190612792969, -0.2428436279296875, -0.23286819458007812, -0.22289276123046875, -0.21291732788085938, -0.20294189453125, -0.19296646118164062, -0.18299102783203125, -0.17301559448242188, -0.1630401611328125, -0.15306472778320312, -0.14308929443359375, -0.13311386108398438, -0.123138427734375, -0.11316299438476562, -0.10318756103515625, -0.09321212768554688, -0.0832366943359375, -0.07326126098632812, -0.06328582763671875, -0.053310394287109375, -0.0433349609375, -0.033359527587890625, -0.02338409423828125, -0.013408660888671875, -0.0034332275390625, 0.006542205810546875, 0.01651763916015625, 0.026493072509765625, 0.036468505859375, 0.046443939208984375, 0.05641937255859375, 0.06639480590820312, 0.0763702392578125, 0.08634567260742188, 0.09632110595703125, 0.10629653930664062, 0.11627197265625, 0.12624740600585938, 0.13622283935546875, 0.14619827270507812, 0.1561737060546875, 0.16614913940429688, 0.17612457275390625, 0.18610000610351562, 0.196075439453125, 0.20605087280273438, 0.21602630615234375, 0.22600173950195312, 0.2359771728515625, 0.24595260620117188, 0.25592803955078125, 0.2659034729003906, 0.27587890625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 6.0, 5.0, 13.0, 14.0, 19.0, 22.0, 51.0, 55.0, 71.0, 89.0, 131.0, 252.0, 432.0, 780.0, 1728.0, 4913.0, 19051.0, 147190.0, 732631.0, 117118.0, 16375.0, 4215.0, 1636.0, 666.0, 368.0, 250.0, 150.0, 94.0, 70.0, 45.0, 36.0, 16.0, 20.0, 13.0, 9.0, 4.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.513671875, -0.49680328369140625, -0.4799346923828125, -0.46306610107421875, -0.446197509765625, -0.42932891845703125, -0.4124603271484375, -0.39559173583984375, -0.37872314453125, -0.36185455322265625, -0.3449859619140625, -0.32811737060546875, -0.311248779296875, -0.29438018798828125, -0.2775115966796875, -0.26064300537109375, -0.2437744140625, -0.22690582275390625, -0.2100372314453125, -0.19316864013671875, -0.176300048828125, -0.15943145751953125, -0.1425628662109375, -0.12569427490234375, -0.10882568359375, -0.09195709228515625, -0.0750885009765625, -0.05821990966796875, -0.041351318359375, -0.02448272705078125, -0.0076141357421875, 0.00925445556640625, 0.026123046875, 0.04299163818359375, 0.0598602294921875, 0.07672882080078125, 0.093597412109375, 0.11046600341796875, 0.1273345947265625, 0.14420318603515625, 0.16107177734375, 0.17794036865234375, 0.1948089599609375, 0.21167755126953125, 0.228546142578125, 0.24541473388671875, 0.2622833251953125, 0.27915191650390625, 0.2960205078125, 0.31288909912109375, 0.3297576904296875, 0.34662628173828125, 0.363494873046875, 0.38036346435546875, 0.3972320556640625, 0.41410064697265625, 0.43096923828125, 0.44783782958984375, 0.4647064208984375, 0.48157501220703125, 0.498443603515625, 0.5153121948242188, 0.5321807861328125, 0.5490493774414062, 0.56591796875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 9.0, 7.0, 8.0, 12.0, 15.0, 15.0, 21.0, 32.0, 23.0, 25.0, 29.0, 38.0, 36.0, 37.0, 37.0, 53.0, 33.0, 40.0, 60.0, 48.0, 39.0, 55.0, 42.0, 33.0, 34.0, 30.0, 34.0, 19.0, 24.0, 20.0, 17.0, 14.0, 11.0, 8.0, 10.0, 4.0, 7.0, 9.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.64697265625, -0.6252517700195312, -0.6035308837890625, -0.5818099975585938, -0.560089111328125, -0.5383682250976562, -0.5166473388671875, -0.49492645263671875, -0.47320556640625, -0.45148468017578125, -0.4297637939453125, -0.40804290771484375, -0.386322021484375, -0.36460113525390625, -0.3428802490234375, -0.32115936279296875, -0.2994384765625, -0.27771759033203125, -0.2559967041015625, -0.23427581787109375, -0.212554931640625, -0.19083404541015625, -0.1691131591796875, -0.14739227294921875, -0.12567138671875, -0.10395050048828125, -0.0822296142578125, -0.06050872802734375, -0.038787841796875, -0.01706695556640625, 0.0046539306640625, 0.02637481689453125, 0.048095703125, 0.06981658935546875, 0.0915374755859375, 0.11325836181640625, 0.134979248046875, 0.15670013427734375, 0.1784210205078125, 0.20014190673828125, 0.22186279296875, 0.24358367919921875, 0.2653045654296875, 0.28702545166015625, 0.308746337890625, 0.33046722412109375, 0.3521881103515625, 0.37390899658203125, 0.3956298828125, 0.41735076904296875, 0.4390716552734375, 0.46079254150390625, 0.482513427734375, 0.5042343139648438, 0.5259552001953125, 0.5476760864257812, 0.56939697265625, 0.5911178588867188, 0.6128387451171875, 0.6345596313476562, 0.656280517578125, 0.6780014038085938, 0.6997222900390625, 0.7214431762695312, 0.7431640625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 4.0, 9.0, 9.0, 8.0, 10.0, 20.0, 20.0, 27.0, 42.0, 78.0, 98.0, 162.0, 274.0, 478.0, 931.0, 1944.0, 4784.0, 14552.0, 74693.0, 652046.0, 252257.0, 31720.0, 8246.0, 3110.0, 1327.0, 709.0, 365.0, 210.0, 146.0, 69.0, 57.0, 35.0, 28.0, 20.0, 11.0, 8.0, 7.0, 8.0, 9.0, 4.0, 3.0, 1.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.140625, -0.13590049743652344, -0.13117599487304688, -0.1264514923095703, -0.12172698974609375, -0.11700248718261719, -0.11227798461914062, -0.10755348205566406, -0.1028289794921875, -0.09810447692871094, -0.09337997436523438, -0.08865547180175781, -0.08393096923828125, -0.07920646667480469, -0.07448196411132812, -0.06975746154785156, -0.065032958984375, -0.06030845642089844, -0.055583953857421875, -0.05085945129394531, -0.04613494873046875, -0.04141044616699219, -0.036685943603515625, -0.03196144104003906, -0.0272369384765625, -0.022512435913085938, -0.017787933349609375, -0.013063430786132812, -0.00833892822265625, -0.0036144256591796875, 0.001110076904296875, 0.0058345794677734375, 0.01055908203125, 0.015283584594726562, 0.020008087158203125, 0.024732589721679688, 0.02945709228515625, 0.03418159484863281, 0.038906097412109375, 0.04363059997558594, 0.0483551025390625, 0.05307960510253906, 0.057804107666015625, 0.06252861022949219, 0.06725311279296875, 0.07197761535644531, 0.07670211791992188, 0.08142662048339844, 0.086151123046875, 0.09087562561035156, 0.09560012817382812, 0.10032463073730469, 0.10504913330078125, 0.10977363586425781, 0.11449813842773438, 0.11922264099121094, 0.1239471435546875, 0.12867164611816406, 0.13339614868164062, 0.1381206512451172, 0.14284515380859375, 0.1475696563720703, 0.15229415893554688, 0.15701866149902344, 0.1617431640625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 8.0, 4.0, 11.0, 21.0, 18.0, 24.0, 59.0, 73.0, 124.0, 156.0, 152.0, 136.0, 67.0, 50.0, 27.0, 20.0, 10.0, 13.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.4955482482910156e-05, -5.311984568834305e-05, -5.128420889377594e-05, -4.944857209920883e-05, -4.7612935304641724e-05, -4.5777298510074615e-05, -4.394166171550751e-05, -4.21060249209404e-05, -4.027038812637329e-05, -3.843475133180618e-05, -3.6599114537239075e-05, -3.4763477742671967e-05, -3.292784094810486e-05, -3.109220415353775e-05, -2.9256567358970642e-05, -2.7420930564403534e-05, -2.5585293769836426e-05, -2.3749656975269318e-05, -2.191402018070221e-05, -2.00783833861351e-05, -1.8242746591567993e-05, -1.6407109797000885e-05, -1.4571473002433777e-05, -1.2735836207866669e-05, -1.090019941329956e-05, -9.064562618732452e-06, -7.228925824165344e-06, -5.393289029598236e-06, -3.557652235031128e-06, -1.7220154404640198e-06, 1.1362135410308838e-07, 1.9492581486701965e-06, 3.7848949432373047e-06, 5.620531737804413e-06, 7.456168532371521e-06, 9.291805326938629e-06, 1.1127442121505737e-05, 1.2963078916072845e-05, 1.4798715710639954e-05, 1.6634352505207062e-05, 1.846998929977417e-05, 2.0305626094341278e-05, 2.2141262888908386e-05, 2.3976899683475494e-05, 2.5812536478042603e-05, 2.764817327260971e-05, 2.948381006717682e-05, 3.131944686174393e-05, 3.3155083656311035e-05, 3.499072045087814e-05, 3.682635724544525e-05, 3.866199404001236e-05, 4.049763083457947e-05, 4.2333267629146576e-05, 4.4168904423713684e-05, 4.600454121828079e-05, 4.78401780128479e-05, 4.967581480741501e-05, 5.151145160198212e-05, 5.3347088396549225e-05, 5.518272519111633e-05, 5.701836198568344e-05, 5.885399878025055e-05, 6.068963557481766e-05, 6.252527236938477e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 7.0, 10.0, 11.0, 11.0, 16.0, 18.0, 29.0, 35.0, 70.0, 110.0, 170.0, 354.0, 585.0, 1234.0, 3032.0, 8678.0, 36643.0, 431503.0, 510318.0, 40478.0, 9305.0, 3157.0, 1317.0, 660.0, 310.0, 191.0, 102.0, 71.0, 48.0, 21.0, 21.0, 17.0, 5.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2213134765625, -0.21480941772460938, -0.20830535888671875, -0.20180130004882812, -0.1952972412109375, -0.18879318237304688, -0.18228912353515625, -0.17578506469726562, -0.169281005859375, -0.16277694702148438, -0.15627288818359375, -0.14976882934570312, -0.1432647705078125, -0.13676071166992188, -0.13025665283203125, -0.12375259399414062, -0.11724853515625, -0.11074447631835938, -0.10424041748046875, -0.09773635864257812, -0.0912322998046875, -0.08472824096679688, -0.07822418212890625, -0.07172012329101562, -0.065216064453125, -0.058712005615234375, -0.05220794677734375, -0.045703887939453125, -0.0391998291015625, -0.032695770263671875, -0.02619171142578125, -0.019687652587890625, -0.01318359375, -0.006679534912109375, -0.00017547607421875, 0.006328582763671875, 0.0128326416015625, 0.019336700439453125, 0.02584075927734375, 0.032344818115234375, 0.038848876953125, 0.045352935791015625, 0.05185699462890625, 0.058361053466796875, 0.0648651123046875, 0.07136917114257812, 0.07787322998046875, 0.08437728881835938, 0.09088134765625, 0.09738540649414062, 0.10388946533203125, 0.11039352416992188, 0.1168975830078125, 0.12340164184570312, 0.12990570068359375, 0.13640975952148438, 0.142913818359375, 0.14941787719726562, 0.15592193603515625, 0.16242599487304688, 0.1689300537109375, 0.17543411254882812, 0.18193817138671875, 0.18844223022460938, 0.1949462890625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 3.0, 5.0, 8.0, 11.0, 11.0, 9.0, 6.0, 20.0, 29.0, 36.0, 55.0, 57.0, 68.0, 99.0, 107.0, 113.0, 76.0, 62.0, 54.0, 44.0, 25.0, 23.0, 19.0, 22.0, 10.0, 7.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2054443359375, -0.19953536987304688, -0.19362640380859375, -0.18771743774414062, -0.1818084716796875, -0.17589950561523438, -0.16999053955078125, -0.16408157348632812, -0.158172607421875, -0.15226364135742188, -0.14635467529296875, -0.14044570922851562, -0.1345367431640625, -0.12862777709960938, -0.12271881103515625, -0.11680984497070312, -0.11090087890625, -0.10499191284179688, -0.09908294677734375, -0.09317398071289062, -0.0872650146484375, -0.08135604858398438, -0.07544708251953125, -0.06953811645507812, -0.063629150390625, -0.057720184326171875, -0.05181121826171875, -0.045902252197265625, -0.0399932861328125, -0.034084320068359375, -0.02817535400390625, -0.022266387939453125, -0.016357421875, -0.010448455810546875, -0.00453948974609375, 0.001369476318359375, 0.0072784423828125, 0.013187408447265625, 0.01909637451171875, 0.025005340576171875, 0.030914306640625, 0.036823272705078125, 0.04273223876953125, 0.048641204833984375, 0.0545501708984375, 0.060459136962890625, 0.06636810302734375, 0.07227706909179688, 0.07818603515625, 0.08409500122070312, 0.09000396728515625, 0.09591293334960938, 0.1018218994140625, 0.10773086547851562, 0.11363983154296875, 0.11954879760742188, 0.125457763671875, 0.13136672973632812, 0.13727569580078125, 0.14318466186523438, 0.1490936279296875, 0.15500259399414062, 0.16091156005859375, 0.16682052612304688, 0.1727294921875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 14.0, 27.0, 81.0, 234.0, 344.0, 206.0, 64.0, 17.0, 20.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.736486434936523, -8.489704132080078, -8.242920875549316, -7.996138572692871, -7.749356269836426, -7.502573490142822, -7.255790710449219, -7.009008407592773, -6.762226104736328, -6.515443325042725, -6.268661022186279, -6.021878242492676, -5.7750959396362305, -5.528313159942627, -5.281530380249023, -5.034748077392578, -4.787965297698975, -4.541182518005371, -4.294400215148926, -4.047617435455322, -3.800835132598877, -3.5540523529052734, -3.307269811630249, -3.0604872703552246, -2.8137047290802, -2.566922187805176, -2.3201396465301514, -2.073357105255127, -1.826574444770813, -1.5797919034957886, -1.3330092430114746, -1.0862267017364502, -0.8394441604614258, -0.5926616191864014, -0.3458790183067322, -0.09909641742706299, 0.14768612384796143, 0.39446866512298584, 0.6412513256072998, 0.8880338668823242, 1.1348164081573486, 1.381598949432373, 1.6283814907073975, 1.8751641511917114, 2.1219468116760254, 2.3687291145324707, 2.615511894226074, 2.8622944355010986, 3.109076976776123, 3.3558595180511475, 3.602642059326172, 3.8494248390197754, 4.096207141876221, 4.342989921569824, 4.5897722244262695, 4.836555004119873, 5.083337783813477, 5.33012056350708, 5.576902866363525, 5.823685646057129, 6.070467948913574, 6.317250728607178, 6.564033508300781, 6.810815811157227, 7.057598114013672]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 2.0, 9.0, 9.0, 8.0, 17.0, 20.0, 24.0, 22.0, 18.0, 15.0, 32.0, 33.0, 40.0, 45.0, 45.0, 39.0, 50.0, 54.0, 58.0, 47.0, 38.0, 47.0, 41.0, 38.0, 37.0, 27.0, 29.0, 26.0, 17.0, 19.0, 17.0, 7.0, 16.0, 8.0, 11.0, 7.0, 9.0, 5.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.983551025390625, -2.8853437900543213, -2.7871365547180176, -2.688929319381714, -2.59072208404541, -2.4925146102905273, -2.3943073749542236, -2.29610013961792, -2.197892904281616, -2.0996856689453125, -2.001478433609009, -1.9032710790634155, -1.8050638437271118, -1.706856608390808, -1.6086492538452148, -1.5104420185089111, -1.4122347831726074, -1.3140275478363037, -1.2158203125, -1.1176129579544067, -1.019405722618103, -0.9211984872817993, -0.8229911923408508, -0.7247838973999023, -0.6265766620635986, -0.5283694267272949, -0.43016213178634644, -0.33195486664772034, -0.23374760150909424, -0.13554033637046814, -0.03733307123184204, 0.060874223709106445, 0.15908169746398926, 0.25728896260261536, 0.35549622774124146, 0.45370349287986755, 0.5519107580184937, 0.6501179933547974, 0.7483252882957458, 0.8465325832366943, 0.944739818572998, 1.0429470539093018, 1.1411542892456055, 1.2393616437911987, 1.3375688791275024, 1.4357761144638062, 1.5339834690093994, 1.6321907043457031, 1.7303979396820068, 1.8286051750183105, 1.9268124103546143, 2.025019645690918, 2.123227119445801, 2.2214343547821045, 2.319641590118408, 2.417848825454712, 2.5160560607910156, 2.6142632961273193, 2.712470531463623, 2.8106777667999268, 2.9088850021362305, 3.0070924758911133, 3.105299711227417, 3.2035069465637207, 3.3017141819000244]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 11.0, 11.0, 20.0, 18.0, 13.0, 20.0, 24.0, 35.0, 50.0, 57.0, 101.0, 116.0, 204.0, 348.0, 568.0, 986.0, 1907.0, 4048.0, 12191.0, 124223.0, 3987806.0, 45466.0, 8902.0, 3380.0, 1593.0, 910.0, 507.0, 278.0, 168.0, 113.0, 66.0, 40.0, 24.0, 19.0, 9.0, 9.0, 8.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.2802734375, -1.2429962158203125, -1.205718994140625, -1.1684417724609375, -1.13116455078125, -1.0938873291015625, -1.056610107421875, -1.0193328857421875, -0.9820556640625, -0.9447784423828125, -0.907501220703125, -0.8702239990234375, -0.83294677734375, -0.7956695556640625, -0.758392333984375, -0.7211151123046875, -0.683837890625, -0.6465606689453125, -0.609283447265625, -0.5720062255859375, -0.53472900390625, -0.4974517822265625, -0.460174560546875, -0.4228973388671875, -0.3856201171875, -0.3483428955078125, -0.311065673828125, -0.2737884521484375, -0.23651123046875, -0.1992340087890625, -0.161956787109375, -0.1246795654296875, -0.08740234375, -0.0501251220703125, -0.012847900390625, 0.0244293212890625, 0.06170654296875, 0.0989837646484375, 0.136260986328125, 0.1735382080078125, 0.2108154296875, 0.2480926513671875, 0.285369873046875, 0.3226470947265625, 0.35992431640625, 0.3972015380859375, 0.434478759765625, 0.4717559814453125, 0.509033203125, 0.5463104248046875, 0.583587646484375, 0.6208648681640625, 0.65814208984375, 0.6954193115234375, 0.732696533203125, 0.7699737548828125, 0.8072509765625, 0.8445281982421875, 0.881805419921875, 0.9190826416015625, 0.95635986328125, 0.9936370849609375, 1.030914306640625, 1.0681915283203125, 1.10546875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 5.0, 4.0, 5.0, 11.0, 9.0, 33.0, 32.0, 33.0, 38.0, 56.0, 80.0, 75.0, 81.0, 93.0, 70.0, 80.0, 76.0, 64.0, 42.0, 31.0, 26.0, 17.0, 17.0, 14.0, 9.0, 0.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.37060546875, -0.36067962646484375, -0.3507537841796875, -0.34082794189453125, -0.330902099609375, -0.32097625732421875, -0.3110504150390625, -0.30112457275390625, -0.29119873046875, -0.28127288818359375, -0.2713470458984375, -0.26142120361328125, -0.251495361328125, -0.24156951904296875, -0.2316436767578125, -0.22171783447265625, -0.2117919921875, -0.20186614990234375, -0.1919403076171875, -0.18201446533203125, -0.172088623046875, -0.16216278076171875, -0.1522369384765625, -0.14231109619140625, -0.13238525390625, -0.12245941162109375, -0.1125335693359375, -0.10260772705078125, -0.092681884765625, -0.08275604248046875, -0.0728302001953125, -0.06290435791015625, -0.052978515625, -0.04305267333984375, -0.0331268310546875, -0.02320098876953125, -0.013275146484375, -0.00334930419921875, 0.0065765380859375, 0.01650238037109375, 0.02642822265625, 0.03635406494140625, 0.0462799072265625, 0.05620574951171875, 0.066131591796875, 0.07605743408203125, 0.0859832763671875, 0.09590911865234375, 0.1058349609375, 0.11576080322265625, 0.1256866455078125, 0.13561248779296875, 0.145538330078125, 0.15546417236328125, 0.1653900146484375, 0.17531585693359375, 0.18524169921875, 0.19516754150390625, 0.2050933837890625, 0.21501922607421875, 0.224945068359375, 0.23487091064453125, 0.2447967529296875, 0.25472259521484375, 0.2646484375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 7.0, 9.0, 13.0, 23.0, 52.0, 122.0, 209.0, 693.0, 2581.0, 17549.0, 4061628.0, 103184.0, 6210.0, 1270.0, 403.0, 169.0, 72.0, 38.0, 22.0, 8.0, 13.0, 4.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8310546875, -1.7673797607421875, -1.703704833984375, -1.6400299072265625, -1.57635498046875, -1.5126800537109375, -1.449005126953125, -1.3853302001953125, -1.3216552734375, -1.2579803466796875, -1.194305419921875, -1.1306304931640625, -1.06695556640625, -1.0032806396484375, -0.939605712890625, -0.8759307861328125, -0.812255859375, -0.7485809326171875, -0.684906005859375, -0.6212310791015625, -0.55755615234375, -0.4938812255859375, -0.430206298828125, -0.3665313720703125, -0.3028564453125, -0.2391815185546875, -0.175506591796875, -0.1118316650390625, -0.04815673828125, 0.0155181884765625, 0.079193115234375, 0.1428680419921875, 0.20654296875, 0.2702178955078125, 0.333892822265625, 0.3975677490234375, 0.46124267578125, 0.5249176025390625, 0.588592529296875, 0.6522674560546875, 0.7159423828125, 0.7796173095703125, 0.843292236328125, 0.9069671630859375, 0.97064208984375, 1.0343170166015625, 1.097991943359375, 1.1616668701171875, 1.225341796875, 1.2890167236328125, 1.352691650390625, 1.4163665771484375, 1.48004150390625, 1.5437164306640625, 1.607391357421875, 1.6710662841796875, 1.7347412109375, 1.7984161376953125, 1.862091064453125, 1.9257659912109375, 1.98944091796875, 2.0531158447265625, 2.116790771484375, 2.1804656982421875, 2.244140625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 7.0, 10.0, 9.0, 15.0, 15.0, 22.0, 23.0, 56.0, 191.0, 1070.0, 2035.0, 358.0, 116.0, 49.0, 26.0, 13.0, 22.0, 11.0, 8.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5849609375, -0.5560302734375, -0.527099609375, -0.4981689453125, -0.46923828125, -0.4403076171875, -0.411376953125, -0.3824462890625, -0.353515625, -0.3245849609375, -0.295654296875, -0.2667236328125, -0.23779296875, -0.2088623046875, -0.179931640625, -0.1510009765625, -0.1220703125, -0.0931396484375, -0.064208984375, -0.0352783203125, -0.00634765625, 0.0225830078125, 0.051513671875, 0.0804443359375, 0.109375, 0.1383056640625, 0.167236328125, 0.1961669921875, 0.22509765625, 0.2540283203125, 0.282958984375, 0.3118896484375, 0.3408203125, 0.3697509765625, 0.398681640625, 0.4276123046875, 0.45654296875, 0.4854736328125, 0.514404296875, 0.5433349609375, 0.572265625, 0.6011962890625, 0.630126953125, 0.6590576171875, 0.68798828125, 0.7169189453125, 0.745849609375, 0.7747802734375, 0.8037109375, 0.8326416015625, 0.861572265625, 0.8905029296875, 0.91943359375, 0.9483642578125, 0.977294921875, 1.0062255859375, 1.03515625, 1.0640869140625, 1.093017578125, 1.1219482421875, 1.15087890625, 1.1798095703125, 1.208740234375, 1.2376708984375, 1.2666015625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 4.0, 5.0, 9.0, 17.0, 31.0, 51.0, 48.0, 106.0, 152.0, 177.0, 156.0, 80.0, 57.0, 25.0, 23.0, 10.0, 12.0, 13.0, 6.0, 4.0, 3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.085221767425537, -5.921083450317383, -5.7569451332092285, -5.592806816101074, -5.428668975830078, -5.264530658721924, -5.1003923416137695, -4.936254024505615, -4.772115707397461, -4.607977390289307, -4.443839073181152, -4.279700756072998, -4.115562438964844, -3.9514243602752686, -3.7872862815856934, -3.623147964477539, -3.4590096473693848, -3.2948713302612305, -3.130733013153076, -2.966594934463501, -2.8024566173553467, -2.6383183002471924, -2.474180221557617, -2.310041904449463, -2.1459035873413086, -1.9817652702331543, -1.8176270723342896, -1.6534888744354248, -1.4893505573272705, -1.3252122402191162, -1.1610740423202515, -0.9969358444213867, -0.8327970504760742, -0.6686587929725647, -0.5045205354690552, -0.34038227796554565, -0.17624402046203613, -0.012105762958526611, 0.1520324945449829, 0.31617069244384766, 0.48030900955200195, 0.6444472670555115, 0.808585524559021, 0.9727237820625305, 1.13686203956604, 1.3010003566741943, 1.465138554573059, 1.6292767524719238, 1.7934150695800781, 1.9575533866882324, 2.1216917037963867, 2.285829782485962, 2.449968099594116, 2.6141064167022705, 2.7782444953918457, 2.9423828125, 3.1065211296081543, 3.2706594467163086, 3.434797763824463, 3.598935842514038, 3.7630741596221924, 3.9272124767303467, 4.091350555419922, 4.255488872528076, 4.4196271896362305]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 1.0, 6.0, 5.0, 14.0, 10.0, 2.0, 13.0, 24.0, 22.0, 25.0, 34.0, 32.0, 30.0, 29.0, 49.0, 37.0, 57.0, 50.0, 52.0, 53.0, 40.0, 44.0, 36.0, 42.0, 45.0, 40.0, 38.0, 25.0, 29.0, 29.0, 12.0, 22.0, 9.0, 15.0, 3.0, 6.0, 5.0, 2.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.839420795440674, -2.7610788345336914, -2.682737112045288, -2.6043951511383057, -2.5260531902313232, -2.44771146774292, -2.3693695068359375, -2.291027545928955, -2.2126855850219727, -2.1343436241149902, -2.056001901626587, -1.9776599407196045, -1.899317979812622, -1.8209761381149292, -1.7426342964172363, -1.664292335510254, -1.5859506130218506, -1.5076087713241577, -1.4292668104171753, -1.3509249687194824, -1.2725830078125, -1.1942411661148071, -1.1158993244171143, -1.0375573635101318, -0.959215521812439, -0.8808736205101013, -0.8025317192077637, -0.7241898775100708, -0.6458479762077332, -0.5675060749053955, -0.48916420340538025, -0.410822331905365, -0.33248043060302734, -0.2541385293006897, -0.17579665780067444, -0.09745477139949799, -0.019112884998321533, 0.05922901630401611, 0.13757088780403137, 0.21591275930404663, 0.2942546606063843, 0.3725965619087219, 0.4509384334087372, 0.5292803049087524, 0.6076222062110901, 0.6859641075134277, 0.7643059492111206, 0.8426478505134583, 0.9209897518157959, 0.9993316531181335, 1.0776735544204712, 1.156015396118164, 1.2343573570251465, 1.3126991987228394, 1.3910410404205322, 1.4693830013275146, 1.5477248430252075, 1.6260666847229004, 1.7044086456298828, 1.7827504873275757, 1.8610923290252686, 1.939434289932251, 2.0177762508392334, 2.0961179733276367, 2.174459934234619]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 4.0, 7.0, 11.0, 9.0, 11.0, 11.0, 24.0, 43.0, 55.0, 73.0, 147.0, 181.0, 320.0, 591.0, 1080.0, 2228.0, 5402.0, 16695.0, 79457.0, 595013.0, 289882.0, 39534.0, 10389.0, 3722.0, 1631.0, 793.0, 450.0, 254.0, 175.0, 100.0, 63.0, 55.0, 40.0, 25.0, 18.0, 17.0, 9.0, 13.0, 6.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.9521484375, -0.9255523681640625, -0.898956298828125, -0.8723602294921875, -0.84576416015625, -0.8191680908203125, -0.792572021484375, -0.7659759521484375, -0.7393798828125, -0.7127838134765625, -0.686187744140625, -0.6595916748046875, -0.63299560546875, -0.6063995361328125, -0.579803466796875, -0.5532073974609375, -0.526611328125, -0.5000152587890625, -0.473419189453125, -0.4468231201171875, -0.42022705078125, -0.3936309814453125, -0.367034912109375, -0.3404388427734375, -0.3138427734375, -0.2872467041015625, -0.260650634765625, -0.2340545654296875, -0.20745849609375, -0.1808624267578125, -0.154266357421875, -0.1276702880859375, -0.10107421875, -0.0744781494140625, -0.047882080078125, -0.0212860107421875, 0.00531005859375, 0.0319061279296875, 0.058502197265625, 0.0850982666015625, 0.1116943359375, 0.1382904052734375, 0.164886474609375, 0.1914825439453125, 0.21807861328125, 0.2446746826171875, 0.271270751953125, 0.2978668212890625, 0.324462890625, 0.3510589599609375, 0.377655029296875, 0.4042510986328125, 0.43084716796875, 0.4574432373046875, 0.484039306640625, 0.5106353759765625, 0.5372314453125, 0.5638275146484375, 0.590423583984375, 0.6170196533203125, 0.64361572265625, 0.6702117919921875, 0.696807861328125, 0.7234039306640625, 0.75]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 6.0, 5.0, 13.0, 17.0, 38.0, 42.0, 42.0, 52.0, 50.0, 64.0, 67.0, 89.0, 78.0, 90.0, 77.0, 54.0, 53.0, 41.0, 38.0, 19.0, 26.0, 18.0, 11.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35595703125, -0.346038818359375, -0.33612060546875, -0.326202392578125, -0.3162841796875, -0.306365966796875, -0.29644775390625, -0.286529541015625, -0.276611328125, -0.266693115234375, -0.25677490234375, -0.246856689453125, -0.2369384765625, -0.227020263671875, -0.21710205078125, -0.207183837890625, -0.197265625, -0.187347412109375, -0.17742919921875, -0.167510986328125, -0.1575927734375, -0.147674560546875, -0.13775634765625, -0.127838134765625, -0.117919921875, -0.108001708984375, -0.09808349609375, -0.088165283203125, -0.0782470703125, -0.068328857421875, -0.05841064453125, -0.048492431640625, -0.03857421875, -0.028656005859375, -0.01873779296875, -0.008819580078125, 0.0010986328125, 0.011016845703125, 0.02093505859375, 0.030853271484375, 0.040771484375, 0.050689697265625, 0.06060791015625, 0.070526123046875, 0.0804443359375, 0.090362548828125, 0.10028076171875, 0.110198974609375, 0.1201171875, 0.130035400390625, 0.13995361328125, 0.149871826171875, 0.1597900390625, 0.169708251953125, 0.17962646484375, 0.189544677734375, 0.199462890625, 0.209381103515625, 0.21929931640625, 0.229217529296875, 0.2391357421875, 0.249053955078125, 0.25897216796875, 0.268890380859375, 0.27880859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 5.0, 5.0, 3.0, 5.0, 3.0, 9.0, 5.0, 22.0, 27.0, 27.0, 36.0, 57.0, 93.0, 112.0, 201.0, 336.0, 595.0, 1090.0, 2671.0, 8108.0, 42630.0, 729433.0, 233765.0, 20244.0, 5083.0, 1921.0, 825.0, 455.0, 273.0, 166.0, 104.0, 65.0, 53.0, 37.0, 28.0, 12.0, 15.0, 10.0, 7.0, 4.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.81396484375, -0.7875442504882812, -0.7611236572265625, -0.7347030639648438, -0.708282470703125, -0.6818618774414062, -0.6554412841796875, -0.6290206909179688, -0.60260009765625, -0.5761795043945312, -0.5497589111328125, -0.5233383178710938, -0.496917724609375, -0.47049713134765625, -0.4440765380859375, -0.41765594482421875, -0.3912353515625, -0.36481475830078125, -0.3383941650390625, -0.31197357177734375, -0.285552978515625, -0.25913238525390625, -0.2327117919921875, -0.20629119873046875, -0.17987060546875, -0.15345001220703125, -0.1270294189453125, -0.10060882568359375, -0.074188232421875, -0.04776763916015625, -0.0213470458984375, 0.00507354736328125, 0.031494140625, 0.05791473388671875, 0.0843353271484375, 0.11075592041015625, 0.137176513671875, 0.16359710693359375, 0.1900177001953125, 0.21643829345703125, 0.24285888671875, 0.26927947998046875, 0.2957000732421875, 0.32212066650390625, 0.348541259765625, 0.37496185302734375, 0.4013824462890625, 0.42780303955078125, 0.4542236328125, 0.48064422607421875, 0.5070648193359375, 0.5334854125976562, 0.559906005859375, 0.5863265991210938, 0.6127471923828125, 0.6391677856445312, 0.66558837890625, 0.6920089721679688, 0.7184295654296875, 0.7448501586914062, 0.771270751953125, 0.7976913452148438, 0.8241119384765625, 0.8505325317382812, 0.876953125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 1.0, 7.0, 4.0, 3.0, 5.0, 9.0, 9.0, 10.0, 11.0, 20.0, 18.0, 22.0, 30.0, 20.0, 33.0, 38.0, 58.0, 44.0, 46.0, 61.0, 43.0, 39.0, 54.0, 50.0, 41.0, 37.0, 24.0, 38.0, 34.0, 35.0, 23.0, 17.0, 30.0, 14.0, 15.0, 14.0, 13.0, 12.0, 7.0, 3.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6953125, -0.6734085083007812, -0.6515045166015625, -0.6296005249023438, -0.607696533203125, -0.5857925415039062, -0.5638885498046875, -0.5419845581054688, -0.52008056640625, -0.49817657470703125, -0.4762725830078125, -0.45436859130859375, -0.432464599609375, -0.41056060791015625, -0.3886566162109375, -0.36675262451171875, -0.3448486328125, -0.32294464111328125, -0.3010406494140625, -0.27913665771484375, -0.257232666015625, -0.23532867431640625, -0.2134246826171875, -0.19152069091796875, -0.16961669921875, -0.14771270751953125, -0.1258087158203125, -0.10390472412109375, -0.082000732421875, -0.06009674072265625, -0.0381927490234375, -0.01628875732421875, 0.005615234375, 0.02751922607421875, 0.0494232177734375, 0.07132720947265625, 0.093231201171875, 0.11513519287109375, 0.1370391845703125, 0.15894317626953125, 0.18084716796875, 0.20275115966796875, 0.2246551513671875, 0.24655914306640625, 0.268463134765625, 0.29036712646484375, 0.3122711181640625, 0.33417510986328125, 0.3560791015625, 0.37798309326171875, 0.3998870849609375, 0.42179107666015625, 0.443695068359375, 0.46559906005859375, 0.4875030517578125, 0.5094070434570312, 0.53131103515625, 0.5532150268554688, 0.5751190185546875, 0.5970230102539062, 0.618927001953125, 0.6408309936523438, 0.6627349853515625, 0.6846389770507812, 0.70654296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 10.0, 4.0, 6.0, 2.0, 11.0, 12.0, 9.0, 20.0, 29.0, 49.0, 74.0, 114.0, 125.0, 255.0, 467.0, 951.0, 2266.0, 6983.0, 40735.0, 845826.0, 131922.0, 12458.0, 3397.0, 1284.0, 590.0, 346.0, 202.0, 109.0, 86.0, 47.0, 40.0, 27.0, 24.0, 19.0, 14.0, 8.0, 10.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.36962890625, -0.3575897216796875, -0.345550537109375, -0.3335113525390625, -0.32147216796875, -0.3094329833984375, -0.297393798828125, -0.2853546142578125, -0.2733154296875, -0.2612762451171875, -0.249237060546875, -0.2371978759765625, -0.22515869140625, -0.2131195068359375, -0.201080322265625, -0.1890411376953125, -0.177001953125, -0.1649627685546875, -0.152923583984375, -0.1408843994140625, -0.12884521484375, -0.1168060302734375, -0.104766845703125, -0.0927276611328125, -0.0806884765625, -0.0686492919921875, -0.056610107421875, -0.0445709228515625, -0.03253173828125, -0.0204925537109375, -0.008453369140625, 0.0035858154296875, 0.015625, 0.0276641845703125, 0.039703369140625, 0.0517425537109375, 0.06378173828125, 0.0758209228515625, 0.087860107421875, 0.0998992919921875, 0.1119384765625, 0.1239776611328125, 0.136016845703125, 0.1480560302734375, 0.16009521484375, 0.1721343994140625, 0.184173583984375, 0.1962127685546875, 0.208251953125, 0.2202911376953125, 0.232330322265625, 0.2443695068359375, 0.25640869140625, 0.2684478759765625, 0.280487060546875, 0.2925262451171875, 0.3045654296875, 0.3166046142578125, 0.328643798828125, 0.3406829833984375, 0.35272216796875, 0.3647613525390625, 0.376800537109375, 0.3888397216796875, 0.40087890625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 9.0, 8.0, 12.0, 7.0, 14.0, 32.0, 51.0, 118.0, 273.0, 228.0, 121.0, 49.0, 20.0, 24.0, 12.0, 6.0, 7.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.894371032714844e-05, -9.481608867645264e-05, -9.068846702575684e-05, -8.656084537506104e-05, -8.243322372436523e-05, -7.830560207366943e-05, -7.417798042297363e-05, -7.005035877227783e-05, -6.592273712158203e-05, -6.179511547088623e-05, -5.766749382019043e-05, -5.353987216949463e-05, -4.941225051879883e-05, -4.528462886810303e-05, -4.1157007217407227e-05, -3.7029385566711426e-05, -3.2901763916015625e-05, -2.8774142265319824e-05, -2.4646520614624023e-05, -2.0518898963928223e-05, -1.6391277313232422e-05, -1.2263655662536621e-05, -8.13603401184082e-06, -4.0084123611450195e-06, 1.1920928955078125e-07, 4.246830940246582e-06, 8.374452590942383e-06, 1.2502074241638184e-05, 1.6629695892333984e-05, 2.0757317543029785e-05, 2.4884939193725586e-05, 2.9012560844421387e-05, 3.314018249511719e-05, 3.726780414581299e-05, 4.139542579650879e-05, 4.552304744720459e-05, 4.965066909790039e-05, 5.377829074859619e-05, 5.790591239929199e-05, 6.203353404998779e-05, 6.61611557006836e-05, 7.02887773513794e-05, 7.44163990020752e-05, 7.8544020652771e-05, 8.26716423034668e-05, 8.67992639541626e-05, 9.09268856048584e-05, 9.50545072555542e-05, 9.918212890625e-05, 0.0001033097505569458, 0.0001074373722076416, 0.0001115649938583374, 0.0001156926155090332, 0.000119820237159729, 0.0001239478588104248, 0.0001280754804611206, 0.0001322031021118164, 0.0001363307237625122, 0.000140458345413208, 0.0001445859670639038, 0.0001487135887145996, 0.0001528412103652954, 0.0001569688320159912, 0.000161096453666687, 0.0001652240753173828]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 12.0, 12.0, 32.0, 30.0, 45.0, 80.0, 101.0, 163.0, 291.0, 414.0, 794.0, 1483.0, 3193.0, 7703.0, 23175.0, 115486.0, 740753.0, 117027.0, 23256.0, 7718.0, 3245.0, 1544.0, 804.0, 436.0, 278.0, 146.0, 95.0, 68.0, 43.0, 38.0, 23.0, 21.0, 7.0, 6.0, 4.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.278076171875, -0.26924896240234375, -0.2604217529296875, -0.25159454345703125, -0.242767333984375, -0.23394012451171875, -0.2251129150390625, -0.21628570556640625, -0.20745849609375, -0.19863128662109375, -0.1898040771484375, -0.18097686767578125, -0.172149658203125, -0.16332244873046875, -0.1544952392578125, -0.14566802978515625, -0.1368408203125, -0.12801361083984375, -0.1191864013671875, -0.11035919189453125, -0.101531982421875, -0.09270477294921875, -0.0838775634765625, -0.07505035400390625, -0.06622314453125, -0.05739593505859375, -0.0485687255859375, -0.03974151611328125, -0.030914306640625, -0.02208709716796875, -0.0132598876953125, -0.00443267822265625, 0.00439453125, 0.01322174072265625, 0.0220489501953125, 0.03087615966796875, 0.039703369140625, 0.04853057861328125, 0.0573577880859375, 0.06618499755859375, 0.07501220703125, 0.08383941650390625, 0.0926666259765625, 0.10149383544921875, 0.110321044921875, 0.11914825439453125, 0.1279754638671875, 0.13680267333984375, 0.1456298828125, 0.15445709228515625, 0.1632843017578125, 0.17211151123046875, 0.180938720703125, 0.18976593017578125, 0.1985931396484375, 0.20742034912109375, 0.21624755859375, 0.22507476806640625, 0.2339019775390625, 0.24272918701171875, 0.251556396484375, 0.26038360595703125, 0.2692108154296875, 0.27803802490234375, 0.286865234375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 5.0, 5.0, 7.0, 10.0, 13.0, 14.0, 22.0, 31.0, 35.0, 55.0, 69.0, 93.0, 103.0, 111.0, 111.0, 80.0, 63.0, 46.0, 27.0, 18.0, 15.0, 12.0, 12.0, 12.0, 4.0, 7.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2205810546875, -0.2125225067138672, -0.20446395874023438, -0.19640541076660156, -0.18834686279296875, -0.18028831481933594, -0.17222976684570312, -0.1641712188720703, -0.1561126708984375, -0.1480541229248047, -0.13999557495117188, -0.13193702697753906, -0.12387847900390625, -0.11581993103027344, -0.10776138305664062, -0.09970283508300781, -0.091644287109375, -0.08358573913574219, -0.07552719116210938, -0.06746864318847656, -0.05941009521484375, -0.05135154724121094, -0.043292999267578125, -0.03523445129394531, -0.0271759033203125, -0.019117355346679688, -0.011058807373046875, -0.0030002593994140625, 0.00505828857421875, 0.013116836547851562, 0.021175384521484375, 0.029233932495117188, 0.03729248046875, 0.04535102844238281, 0.053409576416015625, 0.06146812438964844, 0.06952667236328125, 0.07758522033691406, 0.08564376831054688, 0.09370231628417969, 0.1017608642578125, 0.10981941223144531, 0.11787796020507812, 0.12593650817871094, 0.13399505615234375, 0.14205360412597656, 0.15011215209960938, 0.1581707000732422, 0.166229248046875, 0.1742877960205078, 0.18234634399414062, 0.19040489196777344, 0.19846343994140625, 0.20652198791503906, 0.21458053588867188, 0.2226390838623047, 0.2306976318359375, 0.2387561798095703, 0.24681472778320312, 0.25487327575683594, 0.26293182373046875, 0.27099037170410156, 0.2790489196777344, 0.2871074676513672, 0.295166015625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 21.0, 50.0, 113.0, 226.0, 229.0, 156.0, 77.0, 51.0, 29.0, 13.0, 11.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.145428657531738, -7.930696487426758, -7.715964317321777, -7.501232147216797, -7.286499977111816, -7.071767807006836, -6.8570356369018555, -6.642303466796875, -6.4275712966918945, -6.212839126586914, -5.998106956481934, -5.783374786376953, -5.568642616271973, -5.353910446166992, -5.139178276062012, -4.924446105957031, -4.709713935852051, -4.49498176574707, -4.28024959564209, -4.065517425537109, -3.850785255432129, -3.6360530853271484, -3.421320915222168, -3.2065887451171875, -2.991856575012207, -2.7771244049072266, -2.562392234802246, -2.3476600646972656, -2.132927894592285, -1.9181957244873047, -1.7034635543823242, -1.4887313842773438, -1.2739992141723633, -1.0592670440673828, -0.8445348739624023, -0.6298027038574219, -0.4150705337524414, -0.20033836364746094, 0.014393806457519531, 0.2291259765625, 0.44385814666748047, 0.6585903167724609, 0.8733224868774414, 1.0880546569824219, 1.3027868270874023, 1.5175189971923828, 1.7322511672973633, 1.9469833374023438, 2.161715507507324, 2.3764476776123047, 2.591179847717285, 2.8059120178222656, 3.020644187927246, 3.2353763580322266, 3.450108528137207, 3.6648406982421875, 3.879572868347168, 4.094305038452148, 4.309037208557129, 4.523769378662109, 4.73850154876709, 4.95323371887207, 5.167965888977051, 5.382698059082031, 5.597430229187012]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 3.0, 12.0, 13.0, 15.0, 16.0, 14.0, 27.0, 23.0, 27.0, 33.0, 27.0, 43.0, 45.0, 48.0, 40.0, 71.0, 66.0, 55.0, 46.0, 52.0, 31.0, 57.0, 43.0, 32.0, 33.0, 22.0, 26.0, 13.0, 11.0, 14.0, 10.0, 3.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9072117805480957, -2.81426739692688, -2.721323013305664, -2.6283786296844482, -2.5354342460632324, -2.4424898624420166, -2.349545478820801, -2.256601095199585, -2.163656711578369, -2.0707123279571533, -1.9777679443359375, -1.8848235607147217, -1.7918791770935059, -1.69893479347229, -1.6059904098510742, -1.5130460262298584, -1.4201016426086426, -1.3271572589874268, -1.234212875366211, -1.1412684917449951, -1.0483241081237793, -0.9553797245025635, -0.8624353408813477, -0.7694909572601318, -0.676546573638916, -0.5836021900177002, -0.4906578063964844, -0.39771342277526855, -0.30476903915405273, -0.21182465553283691, -0.1188802719116211, -0.025935888290405273, 0.06700849533081055, 0.15995287895202637, 0.2528972625732422, 0.345841646194458, 0.43878602981567383, 0.5317304134368896, 0.6246747970581055, 0.7176191806793213, 0.8105635643005371, 0.9035079479217529, 0.9964523315429688, 1.0893967151641846, 1.1823410987854004, 1.2752854824066162, 1.368229866027832, 1.4611742496490479, 1.5541186332702637, 1.6470630168914795, 1.7400074005126953, 1.8329517841339111, 1.925896167755127, 2.0188405513763428, 2.1117849349975586, 2.2047293186187744, 2.2976737022399902, 2.390618085861206, 2.483562469482422, 2.5765068531036377, 2.6694512367248535, 2.7623956203460693, 2.855340003967285, 2.948284387588501, 3.041228771209717]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 7.0, 2.0, 0.0, 5.0, 7.0, 8.0, 15.0, 17.0, 17.0, 26.0, 27.0, 41.0, 50.0, 93.0, 125.0, 213.0, 346.0, 696.0, 1418.0, 2919.0, 7946.0, 81814.0, 4040667.0, 45718.0, 6812.0, 2547.0, 1240.0, 667.0, 350.0, 204.0, 101.0, 67.0, 40.0, 28.0, 17.0, 16.0, 5.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.0216217041015625, -0.979766845703125, -0.9379119873046875, -0.89605712890625, -0.8542022705078125, -0.812347412109375, -0.7704925537109375, -0.7286376953125, -0.6867828369140625, -0.644927978515625, -0.6030731201171875, -0.56121826171875, -0.5193634033203125, -0.477508544921875, -0.4356536865234375, -0.393798828125, -0.3519439697265625, -0.310089111328125, -0.2682342529296875, -0.22637939453125, -0.1845245361328125, -0.142669677734375, -0.1008148193359375, -0.0589599609375, -0.0171051025390625, 0.024749755859375, 0.0666046142578125, 0.10845947265625, 0.1503143310546875, 0.192169189453125, 0.2340240478515625, 0.27587890625, 0.3177337646484375, 0.359588623046875, 0.4014434814453125, 0.44329833984375, 0.4851531982421875, 0.527008056640625, 0.5688629150390625, 0.6107177734375, 0.6525726318359375, 0.694427490234375, 0.7362823486328125, 0.77813720703125, 0.8199920654296875, 0.861846923828125, 0.9037017822265625, 0.945556640625, 0.9874114990234375, 1.029266357421875, 1.0711212158203125, 1.11297607421875, 1.1548309326171875, 1.196685791015625, 1.2385406494140625, 1.2803955078125, 1.3222503662109375, 1.364105224609375, 1.4059600830078125, 1.44781494140625, 1.4896697998046875, 1.531524658203125, 1.5733795166015625, 1.615234375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 10.0, 22.0, 31.0, 42.0, 48.0, 63.0, 74.0, 67.0, 73.0, 107.0, 93.0, 95.0, 50.0, 51.0, 52.0, 36.0, 26.0, 19.0, 14.0, 9.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4296875, -0.41900634765625, -0.4083251953125, -0.39764404296875, -0.386962890625, -0.37628173828125, -0.3656005859375, -0.35491943359375, -0.34423828125, -0.33355712890625, -0.3228759765625, -0.31219482421875, -0.301513671875, -0.29083251953125, -0.2801513671875, -0.26947021484375, -0.2587890625, -0.24810791015625, -0.2374267578125, -0.22674560546875, -0.216064453125, -0.20538330078125, -0.1947021484375, -0.18402099609375, -0.17333984375, -0.16265869140625, -0.1519775390625, -0.14129638671875, -0.130615234375, -0.11993408203125, -0.1092529296875, -0.09857177734375, -0.087890625, -0.07720947265625, -0.0665283203125, -0.05584716796875, -0.045166015625, -0.03448486328125, -0.0238037109375, -0.01312255859375, -0.00244140625, 0.00823974609375, 0.0189208984375, 0.02960205078125, 0.040283203125, 0.05096435546875, 0.0616455078125, 0.07232666015625, 0.0830078125, 0.09368896484375, 0.1043701171875, 0.11505126953125, 0.125732421875, 0.13641357421875, 0.1470947265625, 0.15777587890625, 0.16845703125, 0.17913818359375, 0.1898193359375, 0.20050048828125, 0.211181640625, 0.22186279296875, 0.2325439453125, 0.24322509765625, 0.25390625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 6.0, 7.0, 8.0, 14.0, 21.0, 28.0, 56.0, 54.0, 91.0, 125.0, 188.0, 389.0, 1004.0, 5264.0, 4022220.0, 159977.0, 2964.0, 737.0, 382.0, 220.0, 124.0, 104.0, 70.0, 56.0, 60.0, 38.0, 16.0, 17.0, 15.0, 5.0, 4.0, 4.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.005859375, -2.89801025390625, -2.7901611328125, -2.68231201171875, -2.574462890625, -2.46661376953125, -2.3587646484375, -2.25091552734375, -2.14306640625, -2.03521728515625, -1.9273681640625, -1.81951904296875, -1.711669921875, -1.60382080078125, -1.4959716796875, -1.38812255859375, -1.2802734375, -1.17242431640625, -1.0645751953125, -0.95672607421875, -0.848876953125, -0.74102783203125, -0.6331787109375, -0.52532958984375, -0.41748046875, -0.30963134765625, -0.2017822265625, -0.09393310546875, 0.013916015625, 0.12176513671875, 0.2296142578125, 0.33746337890625, 0.4453125, 0.55316162109375, 0.6610107421875, 0.76885986328125, 0.876708984375, 0.98455810546875, 1.0924072265625, 1.20025634765625, 1.30810546875, 1.41595458984375, 1.5238037109375, 1.63165283203125, 1.739501953125, 1.84735107421875, 1.9552001953125, 2.06304931640625, 2.1708984375, 2.27874755859375, 2.3865966796875, 2.49444580078125, 2.602294921875, 2.71014404296875, 2.8179931640625, 2.92584228515625, 3.03369140625, 3.14154052734375, 3.2493896484375, 3.35723876953125, 3.465087890625, 3.57293701171875, 3.6807861328125, 3.78863525390625, 3.896484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 10.0, 43.0, 63.0, 312.0, 3159.0, 359.0, 76.0, 29.0, 13.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91796875, -0.85003662109375, -0.7821044921875, -0.71417236328125, -0.646240234375, -0.57830810546875, -0.5103759765625, -0.44244384765625, -0.37451171875, -0.30657958984375, -0.2386474609375, -0.17071533203125, -0.102783203125, -0.03485107421875, 0.0330810546875, 0.10101318359375, 0.1689453125, 0.23687744140625, 0.3048095703125, 0.37274169921875, 0.440673828125, 0.50860595703125, 0.5765380859375, 0.64447021484375, 0.71240234375, 0.78033447265625, 0.8482666015625, 0.91619873046875, 0.984130859375, 1.05206298828125, 1.1199951171875, 1.18792724609375, 1.255859375, 1.32379150390625, 1.3917236328125, 1.45965576171875, 1.527587890625, 1.59552001953125, 1.6634521484375, 1.73138427734375, 1.79931640625, 1.86724853515625, 1.9351806640625, 2.00311279296875, 2.071044921875, 2.13897705078125, 2.2069091796875, 2.27484130859375, 2.3427734375, 2.41070556640625, 2.4786376953125, 2.54656982421875, 2.614501953125, 2.68243408203125, 2.7503662109375, 2.81829833984375, 2.88623046875, 2.95416259765625, 3.0220947265625, 3.09002685546875, 3.157958984375, 3.22589111328125, 3.2938232421875, 3.36175537109375, 3.4296875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 9.0, 29.0, 132.0, 551.0, 200.0, 35.0, 21.0, 7.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.79609489440918, -27.07457733154297, -26.353057861328125, -25.631540298461914, -24.910022735595703, -24.18850326538086, -23.46698570251465, -22.745468139648438, -22.023948669433594, -21.302431106567383, -20.58091163635254, -19.859394073486328, -19.137874603271484, -18.416357040405273, -17.694839477539062, -16.97332000732422, -16.251802444458008, -15.53028392791748, -14.808765411376953, -14.087247848510742, -13.365729331970215, -12.644210815429688, -11.922693252563477, -11.20117473602295, -10.479656219482422, -9.758137702941895, -9.036619186401367, -8.315101623535156, -7.593583106994629, -6.872064590454102, -6.150546550750732, -5.429028511047363, -4.707508087158203, -3.985989809036255, -3.2644715309143066, -2.5429532527923584, -1.8214349746704102, -1.099916696548462, -0.37839841842651367, 0.34311962127685547, 1.0646381378173828, 1.786156415939331, 2.5076746940612793, 3.2291929721832275, 3.950711250305176, 4.672229766845703, 5.393747806549072, 6.115265846252441, 6.836784362792969, 7.558302879333496, 8.279821395874023, 9.001338958740234, 9.722857475280762, 10.444375991821289, 11.1658935546875, 11.887412071228027, 12.608930587768555, 13.330449104309082, 14.05196762084961, 14.77348518371582, 15.495003700256348, 16.216522216796875, 16.938039779663086, 17.659557342529297, 18.38107681274414]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 5.0, 13.0, 25.0, 22.0, 16.0, 46.0, 54.0, 61.0, 72.0, 74.0, 90.0, 85.0, 83.0, 87.0, 73.0, 50.0, 37.0, 32.0, 23.0, 12.0, 8.0, 9.0, 5.0, 9.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.369791030883789, -8.162999153137207, -7.956207752227783, -7.749415874481201, -7.542623996734619, -7.335832595825195, -7.129040718078613, -6.922248840332031, -6.715456962585449, -6.508665084838867, -6.301873683929443, -6.095081806182861, -5.888289928436279, -5.6814985275268555, -5.474706649780273, -5.267914772033691, -5.061122894287109, -4.854331016540527, -4.6475396156311035, -4.4407477378845215, -4.2339558601379395, -4.027164459228516, -3.8203725814819336, -3.6135807037353516, -3.4067893028259277, -3.199997663497925, -2.9932057857513428, -2.78641414642334, -2.579622268676758, -2.372830629348755, -2.166038990020752, -1.95924711227417, -1.752455234527588, -1.5456634759902954, -1.338871717453003, -1.132080078125, -0.9252882599830627, -0.718496561050415, -0.5117048025131226, -0.3049130439758301, -0.0981212854385376, 0.10867045819759369, 0.315462201833725, 0.5222539305686951, 0.7290456891059875, 0.9358373880386353, 1.1426291465759277, 1.3494209051132202, 1.5562126636505127, 1.7630044221878052, 1.9697961807250977, 2.1765878200531006, 2.3833796977996826, 2.5901713371276855, 2.7969632148742676, 3.0037548542022705, 3.2105464935302734, 3.4173381328582764, 3.6241300106048584, 3.8309216499328613, 4.037713527679443, 4.244504928588867, 4.451296806335449, 4.658088684082031, 4.864880561828613]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 6.0, 11.0, 15.0, 11.0, 26.0, 40.0, 59.0, 61.0, 122.0, 181.0, 348.0, 583.0, 1140.0, 2395.0, 6110.0, 17792.0, 71389.0, 446748.0, 408442.0, 65688.0, 16684.0, 5777.0, 2420.0, 1093.0, 590.0, 315.0, 163.0, 94.0, 80.0, 50.0, 27.0, 27.0, 18.0, 13.0, 4.0, 9.0, 4.0, 6.0, 3.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.8515625, -0.8257369995117188, -0.7999114990234375, -0.7740859985351562, -0.748260498046875, -0.7224349975585938, -0.6966094970703125, -0.6707839965820312, -0.64495849609375, -0.6191329956054688, -0.5933074951171875, -0.5674819946289062, -0.541656494140625, -0.5158309936523438, -0.4900054931640625, -0.46417999267578125, -0.4383544921875, -0.41252899169921875, -0.3867034912109375, -0.36087799072265625, -0.335052490234375, -0.30922698974609375, -0.2834014892578125, -0.25757598876953125, -0.23175048828125, -0.20592498779296875, -0.1800994873046875, -0.15427398681640625, -0.128448486328125, -0.10262298583984375, -0.0767974853515625, -0.05097198486328125, -0.025146484375, 0.00067901611328125, 0.0265045166015625, 0.05233001708984375, 0.078155517578125, 0.10398101806640625, 0.1298065185546875, 0.15563201904296875, 0.18145751953125, 0.20728302001953125, 0.2331085205078125, 0.25893402099609375, 0.284759521484375, 0.31058502197265625, 0.3364105224609375, 0.36223602294921875, 0.3880615234375, 0.41388702392578125, 0.4397125244140625, 0.46553802490234375, 0.491363525390625, 0.5171890258789062, 0.5430145263671875, 0.5688400268554688, 0.59466552734375, 0.6204910278320312, 0.6463165283203125, 0.6721420288085938, 0.697967529296875, 0.7237930297851562, 0.7496185302734375, 0.7754440307617188, 0.80126953125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 9.0, 16.0, 20.0, 30.0, 22.0, 43.0, 49.0, 53.0, 71.0, 102.0, 93.0, 91.0, 70.0, 78.0, 68.0, 45.0, 35.0, 30.0, 28.0, 19.0, 12.0, 9.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57666015625, -0.5625267028808594, -0.5483932495117188, -0.5342597961425781, -0.5201263427734375, -0.5059928894042969, -0.49185943603515625, -0.4777259826660156, -0.463592529296875, -0.4494590759277344, -0.43532562255859375, -0.4211921691894531, -0.4070587158203125, -0.3929252624511719, -0.37879180908203125, -0.3646583557128906, -0.35052490234375, -0.3363914489746094, -0.32225799560546875, -0.3081245422363281, -0.2939910888671875, -0.2798576354980469, -0.26572418212890625, -0.2515907287597656, -0.237457275390625, -0.22332382202148438, -0.20919036865234375, -0.19505691528320312, -0.1809234619140625, -0.16679000854492188, -0.15265655517578125, -0.13852310180664062, -0.1243896484375, -0.11025619506835938, -0.09612274169921875, -0.08198928833007812, -0.0678558349609375, -0.053722381591796875, -0.03958892822265625, -0.025455474853515625, -0.011322021484375, 0.002811431884765625, 0.01694488525390625, 0.031078338623046875, 0.0452117919921875, 0.059345245361328125, 0.07347869873046875, 0.08761215209960938, 0.10174560546875, 0.11587905883789062, 0.13001251220703125, 0.14414596557617188, 0.1582794189453125, 0.17241287231445312, 0.18654632568359375, 0.20067977905273438, 0.214813232421875, 0.22894668579101562, 0.24308013916015625, 0.2572135925292969, 0.2713470458984375, 0.2854804992675781, 0.29961395263671875, 0.3137474060058594, 0.327880859375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 8.0, 5.0, 11.0, 16.0, 19.0, 36.0, 28.0, 46.0, 54.0, 79.0, 121.0, 201.0, 313.0, 554.0, 946.0, 1967.0, 5095.0, 16519.0, 87968.0, 682940.0, 208665.0, 29518.0, 7611.0, 2718.0, 1314.0, 707.0, 354.0, 225.0, 137.0, 108.0, 69.0, 43.0, 42.0, 24.0, 17.0, 21.0, 11.0, 12.0, 8.0, 5.0, 6.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.7509765625, -0.7286911010742188, -0.7064056396484375, -0.6841201782226562, -0.661834716796875, -0.6395492553710938, -0.6172637939453125, -0.5949783325195312, -0.57269287109375, -0.5504074096679688, -0.5281219482421875, -0.5058364868164062, -0.483551025390625, -0.46126556396484375, -0.4389801025390625, -0.41669464111328125, -0.3944091796875, -0.37212371826171875, -0.3498382568359375, -0.32755279541015625, -0.305267333984375, -0.28298187255859375, -0.2606964111328125, -0.23841094970703125, -0.21612548828125, -0.19384002685546875, -0.1715545654296875, -0.14926910400390625, -0.126983642578125, -0.10469818115234375, -0.0824127197265625, -0.06012725830078125, -0.037841796875, -0.01555633544921875, 0.0067291259765625, 0.02901458740234375, 0.051300048828125, 0.07358551025390625, 0.0958709716796875, 0.11815643310546875, 0.14044189453125, 0.16272735595703125, 0.1850128173828125, 0.20729827880859375, 0.229583740234375, 0.25186920166015625, 0.2741546630859375, 0.29644012451171875, 0.3187255859375, 0.34101104736328125, 0.3632965087890625, 0.38558197021484375, 0.407867431640625, 0.43015289306640625, 0.4524383544921875, 0.47472381591796875, 0.49700927734375, 0.5192947387695312, 0.5415802001953125, 0.5638656616210938, 0.586151123046875, 0.6084365844726562, 0.6307220458984375, 0.6530075073242188, 0.67529296875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 0.0, 6.0, 9.0, 9.0, 2.0, 10.0, 6.0, 12.0, 16.0, 19.0, 22.0, 18.0, 18.0, 25.0, 21.0, 36.0, 41.0, 26.0, 36.0, 42.0, 51.0, 45.0, 51.0, 32.0, 48.0, 37.0, 32.0, 35.0, 28.0, 39.0, 34.0, 32.0, 20.0, 14.0, 26.0, 18.0, 11.0, 10.0, 11.0, 11.0, 8.0, 7.0, 4.0, 4.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.72265625, -0.7006912231445312, -0.6787261962890625, -0.6567611694335938, -0.634796142578125, -0.6128311157226562, -0.5908660888671875, -0.5689010620117188, -0.54693603515625, -0.5249710083007812, -0.5030059814453125, -0.48104095458984375, -0.459075927734375, -0.43711090087890625, -0.4151458740234375, -0.39318084716796875, -0.3712158203125, -0.34925079345703125, -0.3272857666015625, -0.30532073974609375, -0.283355712890625, -0.26139068603515625, -0.2394256591796875, -0.21746063232421875, -0.19549560546875, -0.17353057861328125, -0.1515655517578125, -0.12960052490234375, -0.107635498046875, -0.08567047119140625, -0.0637054443359375, -0.04174041748046875, -0.019775390625, 0.00218963623046875, 0.0241546630859375, 0.04611968994140625, 0.068084716796875, 0.09004974365234375, 0.1120147705078125, 0.13397979736328125, 0.15594482421875, 0.17790985107421875, 0.1998748779296875, 0.22183990478515625, 0.243804931640625, 0.26576995849609375, 0.2877349853515625, 0.30970001220703125, 0.3316650390625, 0.35363006591796875, 0.3755950927734375, 0.39756011962890625, 0.419525146484375, 0.44149017333984375, 0.4634552001953125, 0.48542022705078125, 0.50738525390625, 0.5293502807617188, 0.5513153076171875, 0.5732803344726562, 0.595245361328125, 0.6172103881835938, 0.6391754150390625, 0.6611404418945312, 0.68310546875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 11.0, 16.0, 26.0, 58.0, 109.0, 208.0, 458.0, 1478.0, 7197.0, 92810.0, 908046.0, 32391.0, 4089.0, 979.0, 341.0, 155.0, 75.0, 38.0, 25.0, 12.0, 5.0, 11.0, 2.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64990234375, -0.62847900390625, -0.6070556640625, -0.58563232421875, -0.564208984375, -0.54278564453125, -0.5213623046875, -0.49993896484375, -0.478515625, -0.45709228515625, -0.4356689453125, -0.41424560546875, -0.392822265625, -0.37139892578125, -0.3499755859375, -0.32855224609375, -0.30712890625, -0.28570556640625, -0.2642822265625, -0.24285888671875, -0.221435546875, -0.20001220703125, -0.1785888671875, -0.15716552734375, -0.1357421875, -0.11431884765625, -0.0928955078125, -0.07147216796875, -0.050048828125, -0.02862548828125, -0.0072021484375, 0.01422119140625, 0.03564453125, 0.05706787109375, 0.0784912109375, 0.09991455078125, 0.121337890625, 0.14276123046875, 0.1641845703125, 0.18560791015625, 0.20703125, 0.22845458984375, 0.2498779296875, 0.27130126953125, 0.292724609375, 0.31414794921875, 0.3355712890625, 0.35699462890625, 0.37841796875, 0.39984130859375, 0.4212646484375, 0.44268798828125, 0.464111328125, 0.48553466796875, 0.5069580078125, 0.52838134765625, 0.5498046875, 0.57122802734375, 0.5926513671875, 0.61407470703125, 0.635498046875, 0.65692138671875, 0.6783447265625, 0.69976806640625, 0.72119140625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 4.0, 5.0, 10.0, 11.0, 18.0, 29.0, 45.0, 67.0, 101.0, 181.0, 213.0, 124.0, 78.0, 42.0, 20.0, 20.0, 8.0, 8.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010281801223754883, -9.903218597173691e-05, -9.524635970592499e-05, -9.146053344011307e-05, -8.767470717430115e-05, -8.388888090848923e-05, -8.010305464267731e-05, -7.631722837686539e-05, -7.253140211105347e-05, -6.874557584524155e-05, -6.495974957942963e-05, -6.11739233136177e-05, -5.7388097047805786e-05, -5.3602270781993866e-05, -4.9816444516181946e-05, -4.6030618250370026e-05, -4.2244791984558105e-05, -3.8458965718746185e-05, -3.4673139452934265e-05, -3.0887313187122345e-05, -2.7101486921310425e-05, -2.3315660655498505e-05, -1.9529834389686584e-05, -1.5744008123874664e-05, -1.1958181858062744e-05, -8.172355592250824e-06, -4.386529326438904e-06, -6.007030606269836e-07, 3.1851232051849365e-06, 6.970949470996857e-06, 1.0756775736808777e-05, 1.4542602002620697e-05, 1.8328428268432617e-05, 2.2114254534244537e-05, 2.5900080800056458e-05, 2.9685907065868378e-05, 3.34717333316803e-05, 3.725755959749222e-05, 4.104338586330414e-05, 4.482921212911606e-05, 4.861503839492798e-05, 5.24008646607399e-05, 5.618669092655182e-05, 5.997251719236374e-05, 6.375834345817566e-05, 6.754416972398758e-05, 7.13299959897995e-05, 7.511582225561142e-05, 7.890164852142334e-05, 8.268747478723526e-05, 8.647330105304718e-05, 9.02591273188591e-05, 9.404495358467102e-05, 9.783077985048294e-05, 0.00010161660611629486, 0.00010540243238210678, 0.0001091882586479187, 0.00011297408491373062, 0.00011675991117954254, 0.00012054573744535446, 0.00012433156371116638, 0.0001281173899769783, 0.00013190321624279022, 0.00013568904250860214, 0.00013947486877441406]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 15.0, 15.0, 15.0, 20.0, 36.0, 71.0, 90.0, 130.0, 189.0, 301.0, 515.0, 986.0, 1663.0, 3542.0, 8785.0, 27888.0, 160373.0, 710656.0, 98543.0, 20916.0, 7035.0, 3032.0, 1621.0, 851.0, 450.0, 267.0, 178.0, 109.0, 94.0, 48.0, 44.0, 20.0, 18.0, 8.0, 9.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32421875, -0.3135490417480469, -0.30287933349609375, -0.2922096252441406, -0.2815399169921875, -0.2708702087402344, -0.26020050048828125, -0.24953079223632812, -0.238861083984375, -0.22819137573242188, -0.21752166748046875, -0.20685195922851562, -0.1961822509765625, -0.18551254272460938, -0.17484283447265625, -0.16417312622070312, -0.15350341796875, -0.14283370971679688, -0.13216400146484375, -0.12149429321289062, -0.1108245849609375, -0.10015487670898438, -0.08948516845703125, -0.07881546020507812, -0.068145751953125, -0.057476043701171875, -0.04680633544921875, -0.036136627197265625, -0.0254669189453125, -0.014797210693359375, -0.00412750244140625, 0.006542205810546875, 0.0172119140625, 0.027881622314453125, 0.03855133056640625, 0.049221038818359375, 0.0598907470703125, 0.07056045532226562, 0.08123016357421875, 0.09189987182617188, 0.102569580078125, 0.11323928833007812, 0.12390899658203125, 0.13457870483398438, 0.1452484130859375, 0.15591812133789062, 0.16658782958984375, 0.17725753784179688, 0.18792724609375, 0.19859695434570312, 0.20926666259765625, 0.21993637084960938, 0.2306060791015625, 0.24127578735351562, 0.25194549560546875, 0.2626152038574219, 0.273284912109375, 0.2839546203613281, 0.29462432861328125, 0.3052940368652344, 0.3159637451171875, 0.3266334533691406, 0.33730316162109375, 0.3479728698730469, 0.358642578125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 4.0, 3.0, 9.0, 12.0, 11.0, 6.0, 21.0, 22.0, 22.0, 26.0, 47.0, 50.0, 61.0, 71.0, 86.0, 81.0, 81.0, 68.0, 58.0, 44.0, 34.0, 29.0, 30.0, 23.0, 14.0, 23.0, 15.0, 8.0, 9.0, 6.0, 5.0, 3.0, 3.0, 9.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.246337890625, -0.2389812469482422, -0.23162460327148438, -0.22426795959472656, -0.21691131591796875, -0.20955467224121094, -0.20219802856445312, -0.1948413848876953, -0.1874847412109375, -0.1801280975341797, -0.17277145385742188, -0.16541481018066406, -0.15805816650390625, -0.15070152282714844, -0.14334487915039062, -0.1359882354736328, -0.128631591796875, -0.12127494812011719, -0.11391830444335938, -0.10656166076660156, -0.09920501708984375, -0.09184837341308594, -0.08449172973632812, -0.07713508605957031, -0.0697784423828125, -0.06242179870605469, -0.055065155029296875, -0.04770851135253906, -0.04035186767578125, -0.03299522399902344, -0.025638580322265625, -0.018281936645507812, -0.01092529296875, -0.0035686492919921875, 0.003787994384765625, 0.011144638061523438, 0.01850128173828125, 0.025857925415039062, 0.033214569091796875, 0.04057121276855469, 0.0479278564453125, 0.05528450012207031, 0.06264114379882812, 0.06999778747558594, 0.07735443115234375, 0.08471107482910156, 0.09206771850585938, 0.09942436218261719, 0.106781005859375, 0.11413764953613281, 0.12149429321289062, 0.12885093688964844, 0.13620758056640625, 0.14356422424316406, 0.15092086791992188, 0.1582775115966797, 0.1656341552734375, 0.1729907989501953, 0.18034744262695312, 0.18770408630371094, 0.19506072998046875, 0.20241737365722656, 0.20977401733398438, 0.2171306610107422, 0.2244873046875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 14.0, 49.0, 107.0, 200.0, 292.0, 185.0, 79.0, 36.0, 17.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2016143798828125, -5.936796188354492, -5.671977519989014, -5.407158851623535, -5.142340660095215, -4.8775224685668945, -4.612703800201416, -4.3478851318359375, -4.083066940307617, -3.8182485103607178, -3.5534300804138184, -3.288611650466919, -3.0237932205200195, -2.75897479057312, -2.4941563606262207, -2.2293379306793213, -1.9645195007324219, -1.6997010707855225, -1.434882640838623, -1.1700642108917236, -0.9052457809448242, -0.6404273509979248, -0.3756089210510254, -0.11079049110412598, 0.15402793884277344, 0.41884636878967285, 0.6836647987365723, 0.9484832286834717, 1.213301658630371, 1.4781200885772705, 1.74293851852417, 2.0077569484710693, 2.2725744247436523, 2.5373928546905518, 2.802211284637451, 3.0670297145843506, 3.33184814453125, 3.5966665744781494, 3.861485004425049, 4.126303672790527, 4.391121864318848, 4.655940055847168, 4.9207587242126465, 5.185577392578125, 5.450395584106445, 5.715213775634766, 5.980032444000244, 6.244851112365723, 6.509669303894043, 6.774487495422363, 7.039306163787842, 7.30412483215332, 7.568943023681641, 7.833761215209961, 8.098579406738281, 8.363398551940918, 8.628216743469238, 8.893034934997559, 9.157854080200195, 9.422672271728516, 9.687490463256836, 9.952308654785156, 10.217126846313477, 10.481945991516113, 10.746764183044434]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 9.0, 8.0, 2.0, 15.0, 6.0, 11.0, 9.0, 15.0, 27.0, 28.0, 32.0, 36.0, 27.0, 60.0, 51.0, 43.0, 56.0, 53.0, 56.0, 72.0, 56.0, 34.0, 49.0, 32.0, 33.0, 24.0, 22.0, 20.0, 31.0, 16.0, 14.0, 13.0, 10.0, 6.0, 5.0, 9.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.831061840057373, -3.7147722244262695, -3.598482608795166, -3.4821929931640625, -3.365903615951538, -3.2496140003204346, -3.133324384689331, -3.0170347690582275, -2.900745391845703, -2.7844557762145996, -2.668166160583496, -2.5518765449523926, -2.435587167739868, -2.3192975521087646, -2.203007936477661, -2.0867183208465576, -1.970428705215454, -1.8541390895843506, -1.7378495931625366, -1.621559977531433, -1.5052704811096191, -1.3889808654785156, -1.272691249847412, -1.1564016342163086, -1.0401121377944946, -0.9238225817680359, -0.8075330257415771, -0.6912434101104736, -0.5749538540840149, -0.45866429805755615, -0.34237468242645264, -0.2260851263999939, -0.10979580879211426, 0.006493762135505676, 0.12278333306312561, 0.23907291889190674, 0.3553624749183655, 0.4716520309448242, 0.5879416465759277, 0.7042312026023865, 0.8205207586288452, 0.936810314655304, 1.0530998706817627, 1.1693894863128662, 1.2856791019439697, 1.4019685983657837, 1.5182582139968872, 1.6345477104187012, 1.7508373260498047, 1.8671269416809082, 1.9834164381027222, 2.0997061729431152, 2.2159955501556396, 2.332285165786743, 2.4485747814178467, 2.56486439704895, 2.6811537742614746, 2.797443389892578, 2.9137330055236816, 3.030022621154785, 3.1463119983673096, 3.262601613998413, 3.3788912296295166, 3.49518084526062, 3.6114704608917236]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 6.0, 7.0, 11.0, 17.0, 22.0, 18.0, 36.0, 43.0, 48.0, 65.0, 84.0, 128.0, 197.0, 320.0, 550.0, 1105.0, 2411.0, 6049.0, 17977.0, 213000.0, 3856355.0, 72142.0, 14755.0, 4823.0, 2102.0, 1004.0, 416.0, 254.0, 132.0, 75.0, 43.0, 38.0, 15.0, 9.0, 8.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6337890625, -1.5911865234375, -1.548583984375, -1.5059814453125, -1.46337890625, -1.4207763671875, -1.378173828125, -1.3355712890625, -1.29296875, -1.2503662109375, -1.207763671875, -1.1651611328125, -1.12255859375, -1.0799560546875, -1.037353515625, -0.9947509765625, -0.9521484375, -0.9095458984375, -0.866943359375, -0.8243408203125, -0.78173828125, -0.7391357421875, -0.696533203125, -0.6539306640625, -0.611328125, -0.5687255859375, -0.526123046875, -0.4835205078125, -0.44091796875, -0.3983154296875, -0.355712890625, -0.3131103515625, -0.2705078125, -0.2279052734375, -0.185302734375, -0.1427001953125, -0.10009765625, -0.0574951171875, -0.014892578125, 0.0277099609375, 0.0703125, 0.1129150390625, 0.155517578125, 0.1981201171875, 0.24072265625, 0.2833251953125, 0.325927734375, 0.3685302734375, 0.4111328125, 0.4537353515625, 0.496337890625, 0.5389404296875, 0.58154296875, 0.6241455078125, 0.666748046875, 0.7093505859375, 0.751953125, 0.7945556640625, 0.837158203125, 0.8797607421875, 0.92236328125, 0.9649658203125, 1.007568359375, 1.0501708984375, 1.0927734375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 11.0, 10.0, 20.0, 28.0, 24.0, 40.0, 53.0, 68.0, 62.0, 94.0, 90.0, 87.0, 87.0, 74.0, 66.0, 57.0, 37.0, 25.0, 30.0, 21.0, 8.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55322265625, -0.5396728515625, -0.526123046875, -0.5125732421875, -0.4990234375, -0.4854736328125, -0.471923828125, -0.4583740234375, -0.44482421875, -0.4312744140625, -0.417724609375, -0.4041748046875, -0.390625, -0.3770751953125, -0.363525390625, -0.3499755859375, -0.33642578125, -0.3228759765625, -0.309326171875, -0.2957763671875, -0.2822265625, -0.2686767578125, -0.255126953125, -0.2415771484375, -0.22802734375, -0.2144775390625, -0.200927734375, -0.1873779296875, -0.173828125, -0.1602783203125, -0.146728515625, -0.1331787109375, -0.11962890625, -0.1060791015625, -0.092529296875, -0.0789794921875, -0.0654296875, -0.0518798828125, -0.038330078125, -0.0247802734375, -0.01123046875, 0.0023193359375, 0.015869140625, 0.0294189453125, 0.04296875, 0.0565185546875, 0.070068359375, 0.0836181640625, 0.09716796875, 0.1107177734375, 0.124267578125, 0.1378173828125, 0.1513671875, 0.1649169921875, 0.178466796875, 0.1920166015625, 0.20556640625, 0.2191162109375, 0.232666015625, 0.2462158203125, 0.259765625, 0.2733154296875, 0.286865234375, 0.3004150390625, 0.31396484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 2.0, 5.0, 15.0, 16.0, 17.0, 38.0, 58.0, 100.0, 181.0, 497.0, 1812.0, 14568.0, 3967775.0, 200241.0, 6926.0, 1122.0, 339.0, 163.0, 110.0, 71.0, 66.0, 43.0, 34.0, 22.0, 23.0, 14.0, 12.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.22265625, -2.12939453125, -2.0361328125, -1.94287109375, -1.849609375, -1.75634765625, -1.6630859375, -1.56982421875, -1.4765625, -1.38330078125, -1.2900390625, -1.19677734375, -1.103515625, -1.01025390625, -0.9169921875, -0.82373046875, -0.73046875, -0.63720703125, -0.5439453125, -0.45068359375, -0.357421875, -0.26416015625, -0.1708984375, -0.07763671875, 0.015625, 0.10888671875, 0.2021484375, 0.29541015625, 0.388671875, 0.48193359375, 0.5751953125, 0.66845703125, 0.76171875, 0.85498046875, 0.9482421875, 1.04150390625, 1.134765625, 1.22802734375, 1.3212890625, 1.41455078125, 1.5078125, 1.60107421875, 1.6943359375, 1.78759765625, 1.880859375, 1.97412109375, 2.0673828125, 2.16064453125, 2.25390625, 2.34716796875, 2.4404296875, 2.53369140625, 2.626953125, 2.72021484375, 2.8134765625, 2.90673828125, 3.0, 3.09326171875, 3.1865234375, 3.27978515625, 3.373046875, 3.46630859375, 3.5595703125, 3.65283203125, 3.74609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 11.0, 13.0, 27.0, 53.0, 133.0, 673.0, 2426.0, 481.0, 118.0, 66.0, 33.0, 19.0, 12.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8447265625, -0.7819671630859375, -0.719207763671875, -0.6564483642578125, -0.59368896484375, -0.5309295654296875, -0.468170166015625, -0.4054107666015625, -0.3426513671875, -0.2798919677734375, -0.217132568359375, -0.1543731689453125, -0.09161376953125, -0.0288543701171875, 0.033905029296875, 0.0966644287109375, 0.159423828125, 0.2221832275390625, 0.284942626953125, 0.3477020263671875, 0.41046142578125, 0.4732208251953125, 0.535980224609375, 0.5987396240234375, 0.6614990234375, 0.7242584228515625, 0.787017822265625, 0.8497772216796875, 0.91253662109375, 0.9752960205078125, 1.038055419921875, 1.1008148193359375, 1.16357421875, 1.2263336181640625, 1.289093017578125, 1.3518524169921875, 1.41461181640625, 1.4773712158203125, 1.540130615234375, 1.6028900146484375, 1.6656494140625, 1.7284088134765625, 1.791168212890625, 1.8539276123046875, 1.91668701171875, 1.9794464111328125, 2.042205810546875, 2.1049652099609375, 2.167724609375, 2.2304840087890625, 2.293243408203125, 2.3560028076171875, 2.41876220703125, 2.4815216064453125, 2.544281005859375, 2.6070404052734375, 2.6697998046875, 2.7325592041015625, 2.795318603515625, 2.8580780029296875, 2.92083740234375, 2.9835968017578125, 3.046356201171875, 3.1091156005859375, 3.171875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 9.0, 17.0, 35.0, 54.0, 95.0, 226.0, 255.0, 138.0, 64.0, 32.0, 21.0, 15.0, 11.0, 7.0, 1.0, 2.0, 6.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7258501052856445, -7.362420558929443, -6.998991012573242, -6.635560989379883, -6.272131443023682, -5.9087018966674805, -5.545271873474121, -5.18184232711792, -4.818412780761719, -4.454983234405518, -4.091553688049316, -3.728123664855957, -3.364694118499756, -3.0012645721435547, -2.6378347873687744, -2.274405002593994, -1.910975456237793, -1.5475457906723022, -1.1841161251068115, -0.8206864595413208, -0.4572567939758301, -0.09382712841033936, 0.26960253715515137, 0.6330323219299316, 0.9964618682861328, 1.3598915338516235, 1.7233211994171143, 2.0867509841918945, 2.4501805305480957, 2.813610076904297, 3.177039861679077, 3.5404696464538574, 3.903900146484375, 4.267329692840576, 4.630759239196777, 4.994189262390137, 5.357618808746338, 5.721048355102539, 6.084478378295898, 6.4479079246521, 6.811337471008301, 7.174767017364502, 7.538196563720703, 7.9016265869140625, 8.265056610107422, 8.628485679626465, 8.991915702819824, 9.355344772338867, 9.718774795532227, 10.082204818725586, 10.445633888244629, 10.809063911437988, 11.172492980957031, 11.53592300415039, 11.89935302734375, 12.26278305053711, 12.626212120056152, 12.989642143249512, 13.353071212768555, 13.716501235961914, 14.079931259155273, 14.443360328674316, 14.806790351867676, 15.170219421386719, 15.533649444580078]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 1.0, 1.0, 6.0, 10.0, 12.0, 22.0, 18.0, 26.0, 28.0, 27.0, 50.0, 43.0, 45.0, 55.0, 71.0, 70.0, 62.0, 69.0, 69.0, 54.0, 40.0, 30.0, 39.0, 36.0, 36.0, 17.0, 20.0, 14.0, 10.0, 9.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.195430755615234, -4.047861576080322, -3.9002926349639893, -3.7527236938476562, -3.605154514312744, -3.457585573196411, -3.310016632080078, -3.162447452545166, -3.014878511428833, -2.8673095703125, -2.719740390777588, -2.572171449661255, -2.424602508544922, -2.2770333290100098, -2.1294643878936768, -1.9818953275680542, -1.8343262672424316, -1.686757206916809, -1.5391881465911865, -1.3916192054748535, -1.244050145149231, -1.0964810848236084, -0.9489120841026306, -0.8013430833816528, -0.6537740230560303, -0.5062049627304077, -0.35863596200942993, -0.21106693148612976, -0.06349790096282959, 0.08407115936279297, 0.23164016008377075, 0.37920916080474854, 0.5267786979675293, 0.6743477582931519, 0.8219167590141296, 0.9694857597351074, 1.11705482006073, 1.2646238803863525, 1.4121928215026855, 1.559761881828308, 1.7073309421539307, 1.8549000024795532, 2.002469062805176, 2.150038003921509, 2.297606945037842, 2.445176124572754, 2.592745065689087, 2.74031400680542, 2.887883186340332, 3.035452127456665, 3.183021306991577, 3.33059024810791, 3.4781594276428223, 3.6257283687591553, 3.7732973098754883, 3.9208664894104004, 4.0684356689453125, 4.216004848480225, 4.3635735511779785, 4.511142730712891, 4.658711910247803, 4.806281089782715, 4.953849792480469, 5.101418972015381, 5.248987674713135]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 15.0, 13.0, 5.0, 28.0, 34.0, 46.0, 75.0, 96.0, 207.0, 295.0, 543.0, 1127.0, 2528.0, 6605.0, 22451.0, 134162.0, 696438.0, 147758.0, 24014.0, 6862.0, 2597.0, 1189.0, 609.0, 307.0, 192.0, 114.0, 79.0, 50.0, 29.0, 20.0, 12.0, 10.0, 19.0, 8.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.0791015625, -1.0437469482421875, -1.008392333984375, -0.9730377197265625, -0.93768310546875, -0.9023284912109375, -0.866973876953125, -0.8316192626953125, -0.7962646484375, -0.7609100341796875, -0.725555419921875, -0.6902008056640625, -0.65484619140625, -0.6194915771484375, -0.584136962890625, -0.5487823486328125, -0.513427734375, -0.4780731201171875, -0.442718505859375, -0.4073638916015625, -0.37200927734375, -0.3366546630859375, -0.301300048828125, -0.2659454345703125, -0.2305908203125, -0.1952362060546875, -0.159881591796875, -0.1245269775390625, -0.08917236328125, -0.0538177490234375, -0.018463134765625, 0.0168914794921875, 0.05224609375, 0.0876007080078125, 0.122955322265625, 0.1583099365234375, 0.19366455078125, 0.2290191650390625, 0.264373779296875, 0.2997283935546875, 0.3350830078125, 0.3704376220703125, 0.405792236328125, 0.4411468505859375, 0.47650146484375, 0.5118560791015625, 0.547210693359375, 0.5825653076171875, 0.617919921875, 0.6532745361328125, 0.688629150390625, 0.7239837646484375, 0.75933837890625, 0.7946929931640625, 0.830047607421875, 0.8654022216796875, 0.9007568359375, 0.9361114501953125, 0.971466064453125, 1.0068206787109375, 1.04217529296875, 1.0775299072265625, 1.112884521484375, 1.1482391357421875, 1.18359375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 8.0, 8.0, 7.0, 19.0, 27.0, 31.0, 52.0, 48.0, 55.0, 57.0, 82.0, 88.0, 86.0, 82.0, 73.0, 62.0, 56.0, 52.0, 33.0, 24.0, 18.0, 8.0, 7.0, 5.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.61572265625, -0.6013717651367188, -0.5870208740234375, -0.5726699829101562, -0.558319091796875, -0.5439682006835938, -0.5296173095703125, -0.5152664184570312, -0.50091552734375, -0.48656463623046875, -0.4722137451171875, -0.45786285400390625, -0.443511962890625, -0.42916107177734375, -0.4148101806640625, -0.40045928955078125, -0.3861083984375, -0.37175750732421875, -0.3574066162109375, -0.34305572509765625, -0.328704833984375, -0.31435394287109375, -0.3000030517578125, -0.28565216064453125, -0.27130126953125, -0.25695037841796875, -0.2425994873046875, -0.22824859619140625, -0.213897705078125, -0.19954681396484375, -0.1851959228515625, -0.17084503173828125, -0.156494140625, -0.14214324951171875, -0.1277923583984375, -0.11344146728515625, -0.099090576171875, -0.08473968505859375, -0.0703887939453125, -0.05603790283203125, -0.04168701171875, -0.02733612060546875, -0.0129852294921875, 0.00136566162109375, 0.015716552734375, 0.03006744384765625, 0.0444183349609375, 0.05876922607421875, 0.0731201171875, 0.08747100830078125, 0.1018218994140625, 0.11617279052734375, 0.130523681640625, 0.14487457275390625, 0.1592254638671875, 0.17357635498046875, 0.18792724609375, 0.20227813720703125, 0.2166290283203125, 0.23097991943359375, 0.245330810546875, 0.25968170166015625, 0.2740325927734375, 0.28838348388671875, 0.302734375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 4.0, 9.0, 10.0, 12.0, 16.0, 16.0, 38.0, 53.0, 70.0, 118.0, 162.0, 235.0, 411.0, 696.0, 1440.0, 3220.0, 10951.0, 75998.0, 821737.0, 112050.0, 14000.0, 3809.0, 1548.0, 773.0, 413.0, 237.0, 157.0, 117.0, 65.0, 52.0, 34.0, 25.0, 20.0, 14.0, 11.0, 12.0, 4.0, 8.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.107421875, -1.069976806640625, -1.03253173828125, -0.995086669921875, -0.9576416015625, -0.920196533203125, -0.88275146484375, -0.845306396484375, -0.807861328125, -0.770416259765625, -0.73297119140625, -0.695526123046875, -0.6580810546875, -0.620635986328125, -0.58319091796875, -0.545745849609375, -0.50830078125, -0.470855712890625, -0.43341064453125, -0.395965576171875, -0.3585205078125, -0.321075439453125, -0.28363037109375, -0.246185302734375, -0.208740234375, -0.171295166015625, -0.13385009765625, -0.096405029296875, -0.0589599609375, -0.021514892578125, 0.01593017578125, 0.053375244140625, 0.0908203125, 0.128265380859375, 0.16571044921875, 0.203155517578125, 0.2406005859375, 0.278045654296875, 0.31549072265625, 0.352935791015625, 0.390380859375, 0.427825927734375, 0.46527099609375, 0.502716064453125, 0.5401611328125, 0.577606201171875, 0.61505126953125, 0.652496337890625, 0.68994140625, 0.727386474609375, 0.76483154296875, 0.802276611328125, 0.8397216796875, 0.877166748046875, 0.91461181640625, 0.952056884765625, 0.989501953125, 1.026947021484375, 1.06439208984375, 1.101837158203125, 1.1392822265625, 1.176727294921875, 1.21417236328125, 1.251617431640625, 1.2890625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 7.0, 8.0, 15.0, 17.0, 15.0, 25.0, 19.0, 27.0, 26.0, 34.0, 36.0, 45.0, 44.0, 50.0, 46.0, 52.0, 50.0, 36.0, 57.0, 37.0, 39.0, 43.0, 23.0, 32.0, 42.0, 30.0, 18.0, 19.0, 19.0, 21.0, 10.0, 8.0, 8.0, 7.0, 6.0, 2.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.0419921875, -1.0101547241210938, -0.9783172607421875, -0.9464797973632812, -0.914642333984375, -0.8828048706054688, -0.8509674072265625, -0.8191299438476562, -0.78729248046875, -0.7554550170898438, -0.7236175537109375, -0.6917800903320312, -0.659942626953125, -0.6281051635742188, -0.5962677001953125, -0.5644302368164062, -0.5325927734375, -0.5007553100585938, -0.4689178466796875, -0.43708038330078125, -0.405242919921875, -0.37340545654296875, -0.3415679931640625, -0.30973052978515625, -0.27789306640625, -0.24605560302734375, -0.2142181396484375, -0.18238067626953125, -0.150543212890625, -0.11870574951171875, -0.0868682861328125, -0.05503082275390625, -0.023193359375, 0.00864410400390625, 0.0404815673828125, 0.07231903076171875, 0.104156494140625, 0.13599395751953125, 0.1678314208984375, 0.19966888427734375, 0.23150634765625, 0.26334381103515625, 0.2951812744140625, 0.32701873779296875, 0.358856201171875, 0.39069366455078125, 0.4225311279296875, 0.45436859130859375, 0.4862060546875, 0.5180435180664062, 0.5498809814453125, 0.5817184448242188, 0.613555908203125, 0.6453933715820312, 0.6772308349609375, 0.7090682983398438, 0.74090576171875, 0.7727432250976562, 0.8045806884765625, 0.8364181518554688, 0.868255615234375, 0.9000930786132812, 0.9319305419921875, 0.9637680053710938, 0.99560546875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 5.0, 3.0, 4.0, 7.0, 19.0, 12.0, 24.0, 41.0, 48.0, 92.0, 129.0, 257.0, 418.0, 794.0, 1679.0, 3211.0, 7147.0, 18839.0, 88068.0, 831444.0, 66846.0, 16820.0, 6540.0, 2957.0, 1368.0, 731.0, 388.0, 245.0, 154.0, 81.0, 69.0, 42.0, 23.0, 8.0, 10.0, 5.0, 8.0, 6.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56201171875, -0.5452041625976562, -0.5283966064453125, -0.5115890502929688, -0.494781494140625, -0.47797393798828125, -0.4611663818359375, -0.44435882568359375, -0.42755126953125, -0.41074371337890625, -0.3939361572265625, -0.37712860107421875, -0.360321044921875, -0.34351348876953125, -0.3267059326171875, -0.30989837646484375, -0.2930908203125, -0.27628326416015625, -0.2594757080078125, -0.24266815185546875, -0.225860595703125, -0.20905303955078125, -0.1922454833984375, -0.17543792724609375, -0.15863037109375, -0.14182281494140625, -0.1250152587890625, -0.10820770263671875, -0.091400146484375, -0.07459259033203125, -0.0577850341796875, -0.04097747802734375, -0.024169921875, -0.00736236572265625, 0.0094451904296875, 0.02625274658203125, 0.043060302734375, 0.05986785888671875, 0.0766754150390625, 0.09348297119140625, 0.11029052734375, 0.12709808349609375, 0.1439056396484375, 0.16071319580078125, 0.177520751953125, 0.19432830810546875, 0.2111358642578125, 0.22794342041015625, 0.2447509765625, 0.26155853271484375, 0.2783660888671875, 0.29517364501953125, 0.311981201171875, 0.32878875732421875, 0.3455963134765625, 0.36240386962890625, 0.37921142578125, 0.39601898193359375, 0.4128265380859375, 0.42963409423828125, 0.446441650390625, 0.46324920654296875, 0.4800567626953125, 0.49686431884765625, 0.513671875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 6.0, 1.0, 3.0, 7.0, 11.0, 11.0, 15.0, 24.0, 31.0, 59.0, 117.0, 252.0, 216.0, 88.0, 45.0, 27.0, 14.0, 13.0, 13.0, 6.0, 6.0, 2.0, 4.0, 2.0, 4.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002143383026123047, -0.00020739808678627014, -0.0002004578709602356, -0.00019351765513420105, -0.0001865774393081665, -0.00017963722348213196, -0.0001726970076560974, -0.00016575679183006287, -0.00015881657600402832, -0.00015187636017799377, -0.00014493614435195923, -0.00013799592852592468, -0.00013105571269989014, -0.0001241154968738556, -0.00011717528104782104, -0.0001102350652217865, -0.00010329484939575195, -9.635463356971741e-05, -8.941441774368286e-05, -8.247420191764832e-05, -7.553398609161377e-05, -6.859377026557922e-05, -6.165355443954468e-05, -5.471333861351013e-05, -4.7773122787475586e-05, -4.083290696144104e-05, -3.3892691135406494e-05, -2.6952475309371948e-05, -2.0012259483337402e-05, -1.3072043657302856e-05, -6.1318278312683105e-06, 8.083879947662354e-07, 7.748603820800781e-06, 1.4688819646835327e-05, 2.1629035472869873e-05, 2.856925129890442e-05, 3.5509467124938965e-05, 4.244968295097351e-05, 4.938989877700806e-05, 5.63301146030426e-05, 6.327033042907715e-05, 7.02105462551117e-05, 7.715076208114624e-05, 8.409097790718079e-05, 9.103119373321533e-05, 9.797140955924988e-05, 0.00010491162538528442, 0.00011185184121131897, 0.00011879205703735352, 0.00012573227286338806, 0.0001326724886894226, 0.00013961270451545715, 0.0001465529203414917, 0.00015349313616752625, 0.0001604333519935608, 0.00016737356781959534, 0.00017431378364562988, 0.00018125399947166443, 0.00018819421529769897, 0.00019513443112373352, 0.00020207464694976807, 0.0002090148627758026, 0.00021595507860183716, 0.0002228952944278717, 0.00022983551025390625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 8.0, 9.0, 11.0, 21.0, 30.0, 40.0, 63.0, 129.0, 211.0, 529.0, 1219.0, 3145.0, 9224.0, 43423.0, 885788.0, 84416.0, 13485.0, 3954.0, 1496.0, 680.0, 288.0, 164.0, 83.0, 52.0, 21.0, 20.0, 17.0, 9.0, 8.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7646484375, -0.7412185668945312, -0.7177886962890625, -0.6943588256835938, -0.670928955078125, -0.6474990844726562, -0.6240692138671875, -0.6006393432617188, -0.57720947265625, -0.5537796020507812, -0.5303497314453125, -0.5069198608398438, -0.483489990234375, -0.46006011962890625, -0.4366302490234375, -0.41320037841796875, -0.3897705078125, -0.36634063720703125, -0.3429107666015625, -0.31948089599609375, -0.296051025390625, -0.27262115478515625, -0.2491912841796875, -0.22576141357421875, -0.20233154296875, -0.17890167236328125, -0.1554718017578125, -0.13204193115234375, -0.108612060546875, -0.08518218994140625, -0.0617523193359375, -0.03832244873046875, -0.014892578125, 0.00853729248046875, 0.0319671630859375, 0.05539703369140625, 0.078826904296875, 0.10225677490234375, 0.1256866455078125, 0.14911651611328125, 0.17254638671875, 0.19597625732421875, 0.2194061279296875, 0.24283599853515625, 0.266265869140625, 0.28969573974609375, 0.3131256103515625, 0.33655548095703125, 0.3599853515625, 0.38341522216796875, 0.4068450927734375, 0.43027496337890625, 0.453704833984375, 0.47713470458984375, 0.5005645751953125, 0.5239944458007812, 0.54742431640625, 0.5708541870117188, 0.5942840576171875, 0.6177139282226562, 0.641143798828125, 0.6645736694335938, 0.6880035400390625, 0.7114334106445312, 0.73486328125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 0.0, 4.0, 4.0, 0.0, 8.0, 7.0, 6.0, 15.0, 7.0, 7.0, 12.0, 17.0, 27.0, 41.0, 67.0, 87.0, 135.0, 158.0, 112.0, 71.0, 60.0, 32.0, 26.0, 16.0, 20.0, 13.0, 9.0, 7.0, 9.0, 9.0, 3.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42333984375, -0.4095458984375, -0.395751953125, -0.3819580078125, -0.3681640625, -0.3543701171875, -0.340576171875, -0.3267822265625, -0.31298828125, -0.2991943359375, -0.285400390625, -0.2716064453125, -0.2578125, -0.2440185546875, -0.230224609375, -0.2164306640625, -0.20263671875, -0.1888427734375, -0.175048828125, -0.1612548828125, -0.1474609375, -0.1336669921875, -0.119873046875, -0.1060791015625, -0.09228515625, -0.0784912109375, -0.064697265625, -0.0509033203125, -0.037109375, -0.0233154296875, -0.009521484375, 0.0042724609375, 0.01806640625, 0.0318603515625, 0.045654296875, 0.0594482421875, 0.0732421875, 0.0870361328125, 0.100830078125, 0.1146240234375, 0.12841796875, 0.1422119140625, 0.156005859375, 0.1697998046875, 0.18359375, 0.1973876953125, 0.211181640625, 0.2249755859375, 0.23876953125, 0.2525634765625, 0.266357421875, 0.2801513671875, 0.2939453125, 0.3077392578125, 0.321533203125, 0.3353271484375, 0.34912109375, 0.3629150390625, 0.376708984375, 0.3905029296875, 0.404296875, 0.4180908203125, 0.431884765625, 0.4456787109375, 0.45947265625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 4.0, 11.0, 29.0, 65.0, 208.0, 407.0, 179.0, 70.0, 20.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.929523468017578, -25.396299362182617, -24.863075256347656, -24.329849243164062, -23.7966251373291, -23.26340103149414, -22.73017692565918, -22.19695281982422, -21.663728713989258, -21.130504608154297, -20.597280502319336, -20.064056396484375, -19.53083038330078, -18.99760627746582, -18.46438217163086, -17.9311580657959, -17.397933959960938, -16.864709854125977, -16.331485748291016, -15.798260688781738, -15.265036582946777, -14.7318115234375, -14.198587417602539, -13.665363311767578, -13.132137298583984, -12.598913192749023, -12.065688133239746, -11.532464027404785, -10.999239921569824, -10.466014862060547, -9.932790756225586, -9.399566650390625, -8.866341590881348, -8.333117485046387, -7.799892902374268, -7.266668319702148, -6.7334442138671875, -6.200219631195068, -5.666995048522949, -5.133770942687988, -4.600546360015869, -4.06732177734375, -3.534097671508789, -3.00087308883667, -2.46764874458313, -1.9344244003295898, -1.4011998176574707, -0.8679754734039307, -0.3347511291503906, 0.1984732747077942, 0.731697678565979, 1.2649221420288086, 1.7981464862823486, 2.3313708305358887, 2.864595413208008, 3.397819757461548, 3.931044101715088, 4.464268684387207, 4.997492790222168, 5.530717372894287, 6.063941955566406, 6.597166061401367, 7.130390644073486, 7.6636152267456055, 8.196839332580566]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 5.0, 7.0, 13.0, 7.0, 12.0, 16.0, 28.0, 17.0, 24.0, 22.0, 23.0, 37.0, 27.0, 46.0, 44.0, 59.0, 80.0, 84.0, 78.0, 51.0, 44.0, 38.0, 36.0, 45.0, 19.0, 32.0, 22.0, 17.0, 13.0, 15.0, 11.0, 5.0, 5.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.990909576416016, -4.83718729019165, -4.683465480804443, -4.529743194580078, -4.376021385192871, -4.222299098968506, -4.068576812744141, -3.9148550033569336, -3.7611327171325684, -3.6074106693267822, -3.453688621520996, -3.299966335296631, -3.1462442874908447, -2.9925222396850586, -2.8388001918792725, -2.6850781440734863, -2.5313560962677, -2.377634048461914, -2.223912000656128, -2.070189952850342, -1.9164676666259766, -1.7627456188201904, -1.6090235710144043, -1.4553014039993286, -1.3015793561935425, -1.1478573083877563, -0.9941351413726807, -0.8404130935668945, -0.6866909861564636, -0.5329688787460327, -0.3792468309402466, -0.2255246639251709, -0.07180261611938477, 0.08191947638988495, 0.23564156889915466, 0.3893636465072632, 0.5430857539176941, 0.696807861328125, 0.8505299091339111, 1.0042520761489868, 1.157974123954773, 1.311696171760559, 1.4654183387756348, 1.619140386581421, 1.772862434387207, 1.9265846014022827, 2.0803065299987793, 2.2340288162231445, 2.3877508640289307, 2.541472911834717, 2.695194959640503, 2.848917007446289, 3.0026392936706543, 3.1563613414764404, 3.3100833892822266, 3.463805675506592, 3.617527484893799, 3.771249532699585, 3.924971580505371, 4.078693866729736, 4.232415676116943, 4.386137962341309, 4.539859771728516, 4.693582057952881, 4.847304344177246]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 7.0, 7.0, 3.0, 9.0, 16.0, 16.0, 24.0, 36.0, 48.0, 56.0, 89.0, 121.0, 186.0, 299.0, 522.0, 857.0, 1899.0, 4273.0, 14216.0, 234428.0, 3864308.0, 56304.0, 9919.0, 3397.0, 1455.0, 764.0, 383.0, 226.0, 122.0, 98.0, 61.0, 53.0, 29.0, 12.0, 5.0, 4.0, 3.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.111328125, -2.0589599609375, -2.006591796875, -1.9542236328125, -1.90185546875, -1.8494873046875, -1.797119140625, -1.7447509765625, -1.6923828125, -1.6400146484375, -1.587646484375, -1.5352783203125, -1.48291015625, -1.4305419921875, -1.378173828125, -1.3258056640625, -1.2734375, -1.2210693359375, -1.168701171875, -1.1163330078125, -1.06396484375, -1.0115966796875, -0.959228515625, -0.9068603515625, -0.8544921875, -0.8021240234375, -0.749755859375, -0.6973876953125, -0.64501953125, -0.5926513671875, -0.540283203125, -0.4879150390625, -0.435546875, -0.3831787109375, -0.330810546875, -0.2784423828125, -0.22607421875, -0.1737060546875, -0.121337890625, -0.0689697265625, -0.0166015625, 0.0357666015625, 0.088134765625, 0.1405029296875, 0.19287109375, 0.2452392578125, 0.297607421875, 0.3499755859375, 0.40234375, 0.4547119140625, 0.507080078125, 0.5594482421875, 0.61181640625, 0.6641845703125, 0.716552734375, 0.7689208984375, 0.8212890625, 0.8736572265625, 0.926025390625, 0.9783935546875, 1.03076171875, 1.0831298828125, 1.135498046875, 1.1878662109375, 1.240234375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 10.0, 12.0, 19.0, 42.0, 40.0, 62.0, 70.0, 90.0, 102.0, 113.0, 88.0, 90.0, 68.0, 64.0, 40.0, 33.0, 22.0, 14.0, 11.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53466796875, -0.51702880859375, -0.4993896484375, -0.48175048828125, -0.464111328125, -0.44647216796875, -0.4288330078125, -0.41119384765625, -0.3935546875, -0.37591552734375, -0.3582763671875, -0.34063720703125, -0.322998046875, -0.30535888671875, -0.2877197265625, -0.27008056640625, -0.25244140625, -0.23480224609375, -0.2171630859375, -0.19952392578125, -0.181884765625, -0.16424560546875, -0.1466064453125, -0.12896728515625, -0.111328125, -0.09368896484375, -0.0760498046875, -0.05841064453125, -0.040771484375, -0.02313232421875, -0.0054931640625, 0.01214599609375, 0.02978515625, 0.04742431640625, 0.0650634765625, 0.08270263671875, 0.100341796875, 0.11798095703125, 0.1356201171875, 0.15325927734375, 0.1708984375, 0.18853759765625, 0.2061767578125, 0.22381591796875, 0.241455078125, 0.25909423828125, 0.2767333984375, 0.29437255859375, 0.31201171875, 0.32965087890625, 0.3472900390625, 0.36492919921875, 0.382568359375, 0.40020751953125, 0.4178466796875, 0.43548583984375, 0.453125, 0.47076416015625, 0.4884033203125, 0.50604248046875, 0.523681640625, 0.54132080078125, 0.5589599609375, 0.57659912109375, 0.59423828125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 12.0, 14.0, 16.0, 34.0, 52.0, 89.0, 141.0, 205.0, 307.0, 496.0, 836.0, 1777.0, 5194.0, 23320.0, 684011.0, 3423800.0, 40647.0, 7872.0, 2557.0, 1140.0, 646.0, 382.0, 231.0, 198.0, 89.0, 64.0, 48.0, 32.0, 15.0, 9.0, 9.0, 9.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.82421875, -1.769134521484375, -1.71405029296875, -1.658966064453125, -1.6038818359375, -1.548797607421875, -1.49371337890625, -1.438629150390625, -1.383544921875, -1.328460693359375, -1.27337646484375, -1.218292236328125, -1.1632080078125, -1.108123779296875, -1.05303955078125, -0.997955322265625, -0.94287109375, -0.887786865234375, -0.83270263671875, -0.777618408203125, -0.7225341796875, -0.667449951171875, -0.61236572265625, -0.557281494140625, -0.502197265625, -0.447113037109375, -0.39202880859375, -0.336944580078125, -0.2818603515625, -0.226776123046875, -0.17169189453125, -0.116607666015625, -0.0615234375, -0.006439208984375, 0.04864501953125, 0.103729248046875, 0.1588134765625, 0.213897705078125, 0.26898193359375, 0.324066162109375, 0.379150390625, 0.434234619140625, 0.48931884765625, 0.544403076171875, 0.5994873046875, 0.654571533203125, 0.70965576171875, 0.764739990234375, 0.81982421875, 0.874908447265625, 0.92999267578125, 0.985076904296875, 1.0401611328125, 1.095245361328125, 1.15032958984375, 1.205413818359375, 1.260498046875, 1.315582275390625, 1.37066650390625, 1.425750732421875, 1.4808349609375, 1.535919189453125, 1.59100341796875, 1.646087646484375, 1.701171875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 8.0, 10.0, 15.0, 29.0, 34.0, 75.0, 205.0, 1052.0, 1820.0, 471.0, 151.0, 75.0, 49.0, 28.0, 17.0, 16.0, 9.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7451171875, -1.687530517578125, -1.62994384765625, -1.572357177734375, -1.5147705078125, -1.457183837890625, -1.39959716796875, -1.342010498046875, -1.284423828125, -1.226837158203125, -1.16925048828125, -1.111663818359375, -1.0540771484375, -0.996490478515625, -0.93890380859375, -0.881317138671875, -0.82373046875, -0.766143798828125, -0.70855712890625, -0.650970458984375, -0.5933837890625, -0.535797119140625, -0.47821044921875, -0.420623779296875, -0.363037109375, -0.305450439453125, -0.24786376953125, -0.190277099609375, -0.1326904296875, -0.075103759765625, -0.01751708984375, 0.040069580078125, 0.09765625, 0.155242919921875, 0.21282958984375, 0.270416259765625, 0.3280029296875, 0.385589599609375, 0.44317626953125, 0.500762939453125, 0.558349609375, 0.615936279296875, 0.67352294921875, 0.731109619140625, 0.7886962890625, 0.846282958984375, 0.90386962890625, 0.961456298828125, 1.01904296875, 1.076629638671875, 1.13421630859375, 1.191802978515625, 1.2493896484375, 1.306976318359375, 1.36456298828125, 1.422149658203125, 1.479736328125, 1.537322998046875, 1.59490966796875, 1.652496337890625, 1.7100830078125, 1.767669677734375, 1.82525634765625, 1.882843017578125, 1.9404296875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 7.0, 19.0, 38.0, 72.0, 162.0, 249.0, 214.0, 108.0, 56.0, 25.0, 17.0, 7.0, 8.0, 5.0, 1.0, 7.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.526615142822266, -10.020986557006836, -9.51535701751709, -9.009727478027344, -8.504098892211914, -7.998469829559326, -7.492840766906738, -6.98721170425415, -6.4815826416015625, -5.975953578948975, -5.470324516296387, -4.964695453643799, -4.459066390991211, -3.953437328338623, -3.447808265686035, -2.9421792030334473, -2.4365501403808594, -1.9309210777282715, -1.4252920150756836, -0.9196629524230957, -0.4140338897705078, 0.09159517288208008, 0.597224235534668, 1.1028532981872559, 1.6084823608398438, 2.1141114234924316, 2.6197404861450195, 3.1253695487976074, 3.6309986114501953, 4.136627674102783, 4.642256736755371, 5.147885799407959, 5.653514862060547, 6.159143924713135, 6.664772987365723, 7.1704020500183105, 7.676031112670898, 8.181659698486328, 8.687289237976074, 9.19291877746582, 9.69854736328125, 10.20417594909668, 10.709805488586426, 11.215435028076172, 11.721063613891602, 12.226692199707031, 12.732321739196777, 13.237951278686523, 13.743579864501953, 14.249208450317383, 14.754837989807129, 15.260467529296875, 15.766096115112305, 16.271724700927734, 16.777355194091797, 17.282983779907227, 17.788612365722656, 18.294240951538086, 18.799869537353516, 19.305500030517578, 19.811128616333008, 20.316757202148438, 20.8223876953125, 21.32801628112793, 21.83364486694336]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 5.0, 8.0, 6.0, 15.0, 23.0, 21.0, 23.0, 17.0, 28.0, 37.0, 31.0, 36.0, 36.0, 55.0, 44.0, 40.0, 56.0, 58.0, 40.0, 38.0, 42.0, 41.0, 37.0, 38.0, 31.0, 32.0, 19.0, 24.0, 19.0, 23.0, 13.0, 8.0, 13.0, 8.0, 7.0, 4.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.978796005249023, -4.825719833374023, -4.672643661499023, -4.519567489624023, -4.366491317749023, -4.213415145874023, -4.060338973999023, -3.9072625637054443, -3.7541863918304443, -3.6011102199554443, -3.4480340480804443, -3.2949578762054443, -3.1418814659118652, -2.9888052940368652, -2.8357291221618652, -2.6826529502868652, -2.5295767784118652, -2.3765006065368652, -2.2234244346618652, -2.0703482627868652, -1.9172719717025757, -1.7641957998275757, -1.6111195087432861, -1.4580433368682861, -1.3049671649932861, -1.1518909931182861, -0.9988147616386414, -0.8457385301589966, -0.6926623582839966, -0.5395861864089966, -0.3865099549293518, -0.23343372344970703, -0.08035802841186523, 0.07271817326545715, 0.22579437494277954, 0.37887057662010193, 0.5319467782974243, 0.6850229501724243, 0.8380991816520691, 0.9911754131317139, 1.1442515850067139, 1.2973277568817139, 1.4504039287567139, 1.6034802198410034, 1.7565563917160034, 1.9096325635910034, 2.062708854675293, 2.215785026550293, 2.368861198425293, 2.521937370300293, 2.675013542175293, 2.828089714050293, 2.981165885925293, 3.134242057800293, 3.287318468093872, 3.440394639968872, 3.593470811843872, 3.746546983718872, 3.899623155593872, 4.052699565887451, 4.205775737762451, 4.358851909637451, 4.511928081512451, 4.665004253387451, 4.818080425262451]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 11.0, 7.0, 12.0, 16.0, 20.0, 34.0, 32.0, 53.0, 101.0, 152.0, 203.0, 427.0, 928.0, 1956.0, 4974.0, 14466.0, 57231.0, 397565.0, 477623.0, 66548.0, 16591.0, 5382.0, 2098.0, 940.0, 479.0, 260.0, 151.0, 110.0, 57.0, 38.0, 32.0, 13.0, 11.0, 8.0, 4.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4775390625, -1.43414306640625, -1.3907470703125, -1.34735107421875, -1.303955078125, -1.26055908203125, -1.2171630859375, -1.17376708984375, -1.13037109375, -1.08697509765625, -1.0435791015625, -1.00018310546875, -0.956787109375, -0.91339111328125, -0.8699951171875, -0.82659912109375, -0.783203125, -0.73980712890625, -0.6964111328125, -0.65301513671875, -0.609619140625, -0.56622314453125, -0.5228271484375, -0.47943115234375, -0.43603515625, -0.39263916015625, -0.3492431640625, -0.30584716796875, -0.262451171875, -0.21905517578125, -0.1756591796875, -0.13226318359375, -0.0888671875, -0.04547119140625, -0.0020751953125, 0.04132080078125, 0.084716796875, 0.12811279296875, 0.1715087890625, 0.21490478515625, 0.25830078125, 0.30169677734375, 0.3450927734375, 0.38848876953125, 0.431884765625, 0.47528076171875, 0.5186767578125, 0.56207275390625, 0.60546875, 0.64886474609375, 0.6922607421875, 0.73565673828125, 0.779052734375, 0.82244873046875, 0.8658447265625, 0.90924072265625, 0.95263671875, 0.99603271484375, 1.0394287109375, 1.08282470703125, 1.126220703125, 1.16961669921875, 1.2130126953125, 1.25640869140625, 1.2998046875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 10.0, 12.0, 7.0, 12.0, 31.0, 36.0, 55.0, 55.0, 52.0, 60.0, 64.0, 69.0, 83.0, 81.0, 63.0, 56.0, 58.0, 42.0, 34.0, 24.0, 29.0, 17.0, 17.0, 13.0, 7.0, 4.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.642578125, -0.6265640258789062, -0.6105499267578125, -0.5945358276367188, -0.578521728515625, -0.5625076293945312, -0.5464935302734375, -0.5304794311523438, -0.51446533203125, -0.49845123291015625, -0.4824371337890625, -0.46642303466796875, -0.450408935546875, -0.43439483642578125, -0.4183807373046875, -0.40236663818359375, -0.3863525390625, -0.37033843994140625, -0.3543243408203125, -0.33831024169921875, -0.322296142578125, -0.30628204345703125, -0.2902679443359375, -0.27425384521484375, -0.25823974609375, -0.24222564697265625, -0.2262115478515625, -0.21019744873046875, -0.194183349609375, -0.17816925048828125, -0.1621551513671875, -0.14614105224609375, -0.130126953125, -0.11411285400390625, -0.0980987548828125, -0.08208465576171875, -0.066070556640625, -0.05005645751953125, -0.0340423583984375, -0.01802825927734375, -0.00201416015625, 0.01399993896484375, 0.0300140380859375, 0.04602813720703125, 0.062042236328125, 0.07805633544921875, 0.0940704345703125, 0.11008453369140625, 0.1260986328125, 0.14211273193359375, 0.1581268310546875, 0.17414093017578125, 0.190155029296875, 0.20616912841796875, 0.2221832275390625, 0.23819732666015625, 0.25421142578125, 0.27022552490234375, 0.2862396240234375, 0.30225372314453125, 0.318267822265625, 0.33428192138671875, 0.3502960205078125, 0.36631011962890625, 0.38232421875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 10.0, 14.0, 11.0, 16.0, 36.0, 29.0, 53.0, 64.0, 104.0, 173.0, 227.0, 319.0, 511.0, 896.0, 1583.0, 3257.0, 8172.0, 29125.0, 180690.0, 710863.0, 83629.0, 17286.0, 5774.0, 2455.0, 1230.0, 700.0, 441.0, 267.0, 195.0, 113.0, 96.0, 57.0, 41.0, 31.0, 20.0, 14.0, 9.0, 12.0, 11.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.365234375, -1.3229827880859375, -1.280731201171875, -1.2384796142578125, -1.19622802734375, -1.1539764404296875, -1.111724853515625, -1.0694732666015625, -1.0272216796875, -0.9849700927734375, -0.942718505859375, -0.9004669189453125, -0.85821533203125, -0.8159637451171875, -0.773712158203125, -0.7314605712890625, -0.689208984375, -0.6469573974609375, -0.604705810546875, -0.5624542236328125, -0.52020263671875, -0.4779510498046875, -0.435699462890625, -0.3934478759765625, -0.3511962890625, -0.3089447021484375, -0.266693115234375, -0.2244415283203125, -0.18218994140625, -0.1399383544921875, -0.097686767578125, -0.0554351806640625, -0.01318359375, 0.0290679931640625, 0.071319580078125, 0.1135711669921875, 0.15582275390625, 0.1980743408203125, 0.240325927734375, 0.2825775146484375, 0.3248291015625, 0.3670806884765625, 0.409332275390625, 0.4515838623046875, 0.49383544921875, 0.5360870361328125, 0.578338623046875, 0.6205902099609375, 0.662841796875, 0.7050933837890625, 0.747344970703125, 0.7895965576171875, 0.83184814453125, 0.8740997314453125, 0.916351318359375, 0.9586029052734375, 1.0008544921875, 1.0431060791015625, 1.085357666015625, 1.1276092529296875, 1.16986083984375, 1.2121124267578125, 1.254364013671875, 1.2966156005859375, 1.3388671875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 10.0, 7.0, 9.0, 14.0, 15.0, 14.0, 14.0, 24.0, 32.0, 27.0, 28.0, 40.0, 37.0, 37.0, 49.0, 40.0, 51.0, 67.0, 61.0, 59.0, 51.0, 45.0, 35.0, 46.0, 39.0, 22.0, 21.0, 23.0, 11.0, 15.0, 13.0, 8.0, 9.0, 4.0, 3.0, 8.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5517578125, -1.50665283203125, -1.4615478515625, -1.41644287109375, -1.371337890625, -1.32623291015625, -1.2811279296875, -1.23602294921875, -1.19091796875, -1.14581298828125, -1.1007080078125, -1.05560302734375, -1.010498046875, -0.96539306640625, -0.9202880859375, -0.87518310546875, -0.830078125, -0.78497314453125, -0.7398681640625, -0.69476318359375, -0.649658203125, -0.60455322265625, -0.5594482421875, -0.51434326171875, -0.46923828125, -0.42413330078125, -0.3790283203125, -0.33392333984375, -0.288818359375, -0.24371337890625, -0.1986083984375, -0.15350341796875, -0.1083984375, -0.06329345703125, -0.0181884765625, 0.02691650390625, 0.072021484375, 0.11712646484375, 0.1622314453125, 0.20733642578125, 0.25244140625, 0.29754638671875, 0.3426513671875, 0.38775634765625, 0.432861328125, 0.47796630859375, 0.5230712890625, 0.56817626953125, 0.61328125, 0.65838623046875, 0.7034912109375, 0.74859619140625, 0.793701171875, 0.83880615234375, 0.8839111328125, 0.92901611328125, 0.97412109375, 1.01922607421875, 1.0643310546875, 1.10943603515625, 1.154541015625, 1.19964599609375, 1.2447509765625, 1.28985595703125, 1.3349609375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 4.0, 4.0, 10.0, 19.0, 10.0, 31.0, 36.0, 88.0, 117.0, 239.0, 467.0, 974.0, 2257.0, 5605.0, 16768.0, 83533.0, 793557.0, 113665.0, 19964.0, 6389.0, 2575.0, 1083.0, 493.0, 284.0, 144.0, 99.0, 48.0, 29.0, 15.0, 12.0, 14.0, 6.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65966796875, -0.6387710571289062, -0.6178741455078125, -0.5969772338867188, -0.576080322265625, -0.5551834106445312, -0.5342864990234375, -0.5133895874023438, -0.49249267578125, -0.47159576416015625, -0.4506988525390625, -0.42980194091796875, -0.408905029296875, -0.38800811767578125, -0.3671112060546875, -0.34621429443359375, -0.3253173828125, -0.30442047119140625, -0.2835235595703125, -0.26262664794921875, -0.241729736328125, -0.22083282470703125, -0.1999359130859375, -0.17903900146484375, -0.15814208984375, -0.13724517822265625, -0.1163482666015625, -0.09545135498046875, -0.074554443359375, -0.05365753173828125, -0.0327606201171875, -0.01186370849609375, 0.009033203125, 0.02993011474609375, 0.0508270263671875, 0.07172393798828125, 0.092620849609375, 0.11351776123046875, 0.1344146728515625, 0.15531158447265625, 0.17620849609375, 0.19710540771484375, 0.2180023193359375, 0.23889923095703125, 0.259796142578125, 0.28069305419921875, 0.3015899658203125, 0.32248687744140625, 0.3433837890625, 0.36428070068359375, 0.3851776123046875, 0.40607452392578125, 0.426971435546875, 0.44786834716796875, 0.4687652587890625, 0.48966217041015625, 0.51055908203125, 0.5314559936523438, 0.5523529052734375, 0.5732498168945312, 0.594146728515625, 0.6150436401367188, 0.6359405517578125, 0.6568374633789062, 0.677734375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 10.0, 4.0, 6.0, 17.0, 17.0, 27.0, 51.0, 65.0, 156.0, 209.0, 155.0, 83.0, 59.0, 29.0, 17.0, 26.0, 8.0, 4.0, 9.0, 6.0, 4.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020360946655273438, -0.00019531697034835815, -0.00018702447414398193, -0.0001787319779396057, -0.0001704394817352295, -0.00016214698553085327, -0.00015385448932647705, -0.00014556199312210083, -0.0001372694969177246, -0.0001289770007133484, -0.00012068450450897217, -0.00011239200830459595, -0.00010409951210021973, -9.58070158958435e-05, -8.751451969146729e-05, -7.922202348709106e-05, -7.092952728271484e-05, -6.263703107833862e-05, -5.43445348739624e-05, -4.605203866958618e-05, -3.775954246520996e-05, -2.946704626083374e-05, -2.117455005645752e-05, -1.2882053852081299e-05, -4.589557647705078e-06, 3.7029385566711426e-06, 1.1995434761047363e-05, 2.0287930965423584e-05, 2.8580427169799805e-05, 3.6872923374176025e-05, 4.5165419578552246e-05, 5.345791578292847e-05, 6.175041198730469e-05, 7.004290819168091e-05, 7.833540439605713e-05, 8.662790060043335e-05, 9.492039680480957e-05, 0.00010321289300918579, 0.00011150538921356201, 0.00011979788541793823, 0.00012809038162231445, 0.00013638287782669067, 0.0001446753740310669, 0.00015296787023544312, 0.00016126036643981934, 0.00016955286264419556, 0.00017784535884857178, 0.000186137855052948, 0.00019443035125732422, 0.00020272284746170044, 0.00021101534366607666, 0.00021930783987045288, 0.0002276003360748291, 0.00023589283227920532, 0.00024418532848358154, 0.00025247782468795776, 0.000260770320892334, 0.0002690628170967102, 0.0002773553133010864, 0.00028564780950546265, 0.00029394030570983887, 0.0003022328019142151, 0.0003105252981185913, 0.00031881779432296753, 0.00032711029052734375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 6.0, 6.0, 11.0, 20.0, 35.0, 38.0, 77.0, 127.0, 257.0, 491.0, 915.0, 2176.0, 6055.0, 22128.0, 191263.0, 762552.0, 46467.0, 9992.0, 3204.0, 1357.0, 648.0, 285.0, 172.0, 109.0, 55.0, 35.0, 22.0, 23.0, 10.0, 8.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.009765625, -0.9846572875976562, -0.9595489501953125, -0.9344406127929688, -0.909332275390625, -0.8842239379882812, -0.8591156005859375, -0.8340072631835938, -0.80889892578125, -0.7837905883789062, -0.7586822509765625, -0.7335739135742188, -0.708465576171875, -0.6833572387695312, -0.6582489013671875, -0.6331405639648438, -0.6080322265625, -0.5829238891601562, -0.5578155517578125, -0.5327072143554688, -0.507598876953125, -0.48249053955078125, -0.4573822021484375, -0.43227386474609375, -0.40716552734375, -0.38205718994140625, -0.3569488525390625, -0.33184051513671875, -0.306732177734375, -0.28162384033203125, -0.2565155029296875, -0.23140716552734375, -0.206298828125, -0.18119049072265625, -0.1560821533203125, -0.13097381591796875, -0.105865478515625, -0.08075714111328125, -0.0556488037109375, -0.03054046630859375, -0.00543212890625, 0.01967620849609375, 0.0447845458984375, 0.06989288330078125, 0.095001220703125, 0.12010955810546875, 0.1452178955078125, 0.17032623291015625, 0.1954345703125, 0.22054290771484375, 0.2456512451171875, 0.27075958251953125, 0.295867919921875, 0.32097625732421875, 0.3460845947265625, 0.37119293212890625, 0.39630126953125, 0.42140960693359375, 0.4465179443359375, 0.47162628173828125, 0.496734619140625, 0.5218429565429688, 0.5469512939453125, 0.5720596313476562, 0.59716796875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 7.0, 0.0, 7.0, 6.0, 4.0, 8.0, 19.0, 8.0, 25.0, 42.0, 40.0, 49.0, 87.0, 115.0, 148.0, 109.0, 69.0, 68.0, 59.0, 35.0, 19.0, 10.0, 12.0, 10.0, 9.0, 8.0, 11.0, 3.0, 4.0, 0.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.471435546875, -0.4537773132324219, -0.43611907958984375, -0.4184608459472656, -0.4008026123046875, -0.3831443786621094, -0.36548614501953125, -0.3478279113769531, -0.330169677734375, -0.3125114440917969, -0.29485321044921875, -0.2771949768066406, -0.2595367431640625, -0.24187850952148438, -0.22422027587890625, -0.20656204223632812, -0.18890380859375, -0.17124557495117188, -0.15358734130859375, -0.13592910766601562, -0.1182708740234375, -0.10061264038085938, -0.08295440673828125, -0.06529617309570312, -0.047637939453125, -0.029979705810546875, -0.01232147216796875, 0.005336761474609375, 0.0229949951171875, 0.040653228759765625, 0.05831146240234375, 0.07596969604492188, 0.0936279296875, 0.11128616333007812, 0.12894439697265625, 0.14660263061523438, 0.1642608642578125, 0.18191909790039062, 0.19957733154296875, 0.21723556518554688, 0.234893798828125, 0.2525520324707031, 0.27021026611328125, 0.2878684997558594, 0.3055267333984375, 0.3231849670410156, 0.34084320068359375, 0.3585014343261719, 0.37615966796875, 0.3938179016113281, 0.41147613525390625, 0.4291343688964844, 0.4467926025390625, 0.4644508361816406, 0.48210906982421875, 0.4997673034667969, 0.517425537109375, 0.5350837707519531, 0.5527420043945312, 0.5704002380371094, 0.5880584716796875, 0.6057167053222656, 0.6233749389648438, 0.6410331726074219, 0.65869140625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 9.0, 13.0, 26.0, 58.0, 132.0, 317.0, 266.0, 113.0, 32.0, 24.0, 4.0, 7.0, 1.0, 0.0, 1.0, 1.0], "bins": [-29.480131149291992, -28.933151245117188, -28.386171340942383, -27.839191436767578, -27.292211532592773, -26.74523162841797, -26.198251724243164, -25.65127182006836, -25.104290008544922, -24.557310104370117, -24.010330200195312, -23.463350296020508, -22.916370391845703, -22.3693904876709, -21.822410583496094, -21.275428771972656, -20.728450775146484, -20.18147087097168, -19.634490966796875, -19.08751106262207, -18.540531158447266, -17.99355125427246, -17.446571350097656, -16.89958953857422, -16.352611541748047, -15.805631637573242, -15.258651733398438, -14.711671829223633, -14.164691925048828, -13.617712020874023, -13.070731163024902, -12.523751258850098, -11.976770401000977, -11.429790496826172, -10.882810592651367, -10.335830688476562, -9.788850784301758, -9.241870880126953, -8.694890022277832, -8.147910118103027, -7.600930690765381, -7.053950786590576, -6.506970405578613, -5.959990501403809, -5.413010597229004, -4.866030693054199, -4.3190507888793945, -3.7720704078674316, -3.225090503692627, -2.6781105995178223, -2.1311304569244385, -1.5841504335403442, -1.03717041015625, -0.4901905059814453, 0.05678963661193848, 0.6037697792053223, 1.150749683380127, 1.6977297067642212, 2.2447097301483154, 2.791689872741699, 3.338669776916504, 3.8856496810913086, 4.432629585266113, 4.979609966278076, 5.526589870452881]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 9.0, 4.0, 12.0, 3.0, 11.0, 15.0, 20.0, 18.0, 21.0, 29.0, 34.0, 39.0, 30.0, 39.0, 33.0, 41.0, 77.0, 78.0, 84.0, 65.0, 50.0, 53.0, 30.0, 27.0, 29.0, 28.0, 15.0, 20.0, 18.0, 15.0, 13.0, 8.0, 8.0, 10.0, 4.0, 4.0, 6.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.526603698730469, -6.309216499328613, -6.091829776763916, -5.874443054199219, -5.657055854797363, -5.439668655395508, -5.2222819328308105, -5.004895210266113, -4.787508010864258, -4.570120811462402, -4.352734088897705, -4.135347366333008, -3.9179601669311523, -3.700573205947876, -3.4831862449645996, -3.2657992839813232, -3.048412322998047, -2.8310253620147705, -2.613638401031494, -2.3962514400482178, -2.1788644790649414, -1.961477518081665, -1.7440905570983887, -1.5267035961151123, -1.309316635131836, -1.0919296741485596, -0.8745427131652832, -0.6571557521820068, -0.43976879119873047, -0.2223818302154541, -0.004994869232177734, 0.21239209175109863, 0.429779052734375, 0.6471660137176514, 0.8645529747009277, 1.081939935684204, 1.2993268966674805, 1.5167138576507568, 1.7341008186340332, 1.9514877796173096, 2.168874740600586, 2.3862617015838623, 2.6036486625671387, 2.821035623550415, 3.0384225845336914, 3.2558095455169678, 3.473196506500244, 3.6905834674835205, 3.907970428466797, 4.125357627868652, 4.34274435043335, 4.560131072998047, 4.777518272399902, 4.994905471801758, 5.212292194366455, 5.429678916931152, 5.647066116333008, 5.864453315734863, 6.0818400382995605, 6.299226760864258, 6.516613960266113, 6.734001159667969, 6.951387882232666, 7.168774604797363, 7.386161804199219]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 2.0, 8.0, 9.0, 9.0, 15.0, 25.0, 27.0, 39.0, 55.0, 90.0, 173.0, 320.0, 583.0, 1412.0, 4612.0, 47001.0, 4063892.0, 67461.0, 5641.0, 1528.0, 657.0, 319.0, 160.0, 100.0, 48.0, 30.0, 20.0, 16.0, 11.0, 8.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.216796875, -3.1374359130859375, -3.058074951171875, -2.9787139892578125, -2.89935302734375, -2.8199920654296875, -2.740631103515625, -2.6612701416015625, -2.5819091796875, -2.5025482177734375, -2.423187255859375, -2.3438262939453125, -2.26446533203125, -2.1851043701171875, -2.105743408203125, -2.0263824462890625, -1.947021484375, -1.8676605224609375, -1.788299560546875, -1.7089385986328125, -1.62957763671875, -1.5502166748046875, -1.470855712890625, -1.3914947509765625, -1.3121337890625, -1.2327728271484375, -1.153411865234375, -1.0740509033203125, -0.99468994140625, -0.9153289794921875, -0.835968017578125, -0.7566070556640625, -0.67724609375, -0.5978851318359375, -0.518524169921875, -0.4391632080078125, -0.35980224609375, -0.2804412841796875, -0.201080322265625, -0.1217193603515625, -0.0423583984375, 0.0370025634765625, 0.116363525390625, 0.1957244873046875, 0.27508544921875, 0.3544464111328125, 0.433807373046875, 0.5131683349609375, 0.592529296875, 0.6718902587890625, 0.751251220703125, 0.8306121826171875, 0.90997314453125, 0.9893341064453125, 1.068695068359375, 1.1480560302734375, 1.2274169921875, 1.3067779541015625, 1.386138916015625, 1.4654998779296875, 1.54486083984375, 1.6242218017578125, 1.703582763671875, 1.7829437255859375, 1.8623046875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 10.0, 15.0, 19.0, 18.0, 31.0, 30.0, 30.0, 42.0, 36.0, 41.0, 62.0, 53.0, 63.0, 52.0, 55.0, 53.0, 55.0, 66.0, 34.0, 41.0, 34.0, 31.0, 25.0, 20.0, 12.0, 16.0, 6.0, 7.0, 6.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.416259765625, -0.4051551818847656, -0.39405059814453125, -0.3829460144042969, -0.3718414306640625, -0.3607368469238281, -0.34963226318359375, -0.3385276794433594, -0.327423095703125, -0.3163185119628906, -0.30521392822265625, -0.2941093444824219, -0.2830047607421875, -0.2719001770019531, -0.26079559326171875, -0.24969100952148438, -0.23858642578125, -0.22748184204101562, -0.21637725830078125, -0.20527267456054688, -0.1941680908203125, -0.18306350708007812, -0.17195892333984375, -0.16085433959960938, -0.149749755859375, -0.13864517211914062, -0.12754058837890625, -0.11643600463867188, -0.1053314208984375, -0.09422683715820312, -0.08312225341796875, -0.07201766967773438, -0.0609130859375, -0.049808502197265625, -0.03870391845703125, -0.027599334716796875, -0.0164947509765625, -0.005390167236328125, 0.00571441650390625, 0.016819000244140625, 0.027923583984375, 0.039028167724609375, 0.05013275146484375, 0.061237335205078125, 0.0723419189453125, 0.08344650268554688, 0.09455108642578125, 0.10565567016601562, 0.11676025390625, 0.12786483764648438, 0.13896942138671875, 0.15007400512695312, 0.1611785888671875, 0.17228317260742188, 0.18338775634765625, 0.19449234008789062, 0.205596923828125, 0.21670150756835938, 0.22780609130859375, 0.23891067504882812, 0.2500152587890625, 0.2611198425292969, 0.27222442626953125, 0.2833290100097656, 0.29443359375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 3.0, 4.0, 7.0, 11.0, 18.0, 23.0, 42.0, 61.0, 107.0, 138.0, 245.0, 478.0, 1735.0, 21191.0, 4142755.0, 24600.0, 1818.0, 587.0, 206.0, 111.0, 68.0, 31.0, 21.0, 17.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5625, -4.40789794921875, -4.2532958984375, -4.09869384765625, -3.944091796875, -3.78948974609375, -3.6348876953125, -3.48028564453125, -3.32568359375, -3.17108154296875, -3.0164794921875, -2.86187744140625, -2.707275390625, -2.55267333984375, -2.3980712890625, -2.24346923828125, -2.0888671875, -1.93426513671875, -1.7796630859375, -1.62506103515625, -1.470458984375, -1.31585693359375, -1.1612548828125, -1.00665283203125, -0.85205078125, -0.69744873046875, -0.5428466796875, -0.38824462890625, -0.233642578125, -0.07904052734375, 0.0755615234375, 0.23016357421875, 0.384765625, 0.53936767578125, 0.6939697265625, 0.84857177734375, 1.003173828125, 1.15777587890625, 1.3123779296875, 1.46697998046875, 1.62158203125, 1.77618408203125, 1.9307861328125, 2.08538818359375, 2.239990234375, 2.39459228515625, 2.5491943359375, 2.70379638671875, 2.8583984375, 3.01300048828125, 3.1676025390625, 3.32220458984375, 3.476806640625, 3.63140869140625, 3.7860107421875, 3.94061279296875, 4.09521484375, 4.24981689453125, 4.4044189453125, 4.55902099609375, 4.713623046875, 4.86822509765625, 5.0228271484375, 5.17742919921875, 5.33203125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 16.0, 45.0, 154.0, 1932.0, 1670.0, 193.0, 40.0, 16.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.88671875, -6.748931884765625, -6.61114501953125, -6.473358154296875, -6.3355712890625, -6.197784423828125, -6.05999755859375, -5.922210693359375, -5.784423828125, -5.646636962890625, -5.50885009765625, -5.371063232421875, -5.2332763671875, -5.095489501953125, -4.95770263671875, -4.819915771484375, -4.68212890625, -4.544342041015625, -4.40655517578125, -4.268768310546875, -4.1309814453125, -3.993194580078125, -3.85540771484375, -3.717620849609375, -3.579833984375, -3.442047119140625, -3.30426025390625, -3.166473388671875, -3.0286865234375, -2.890899658203125, -2.75311279296875, -2.615325927734375, -2.4775390625, -2.339752197265625, -2.20196533203125, -2.064178466796875, -1.9263916015625, -1.788604736328125, -1.65081787109375, -1.513031005859375, -1.375244140625, -1.237457275390625, -1.09967041015625, -0.961883544921875, -0.8240966796875, -0.686309814453125, -0.54852294921875, -0.410736083984375, -0.27294921875, -0.135162353515625, 0.00262451171875, 0.140411376953125, 0.2781982421875, 0.415985107421875, 0.55377197265625, 0.691558837890625, 0.829345703125, 0.967132568359375, 1.10491943359375, 1.242706298828125, 1.3804931640625, 1.518280029296875, 1.65606689453125, 1.793853759765625, 1.931640625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 11.0, 34.0, 118.0, 361.0, 327.0, 96.0, 34.0, 16.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.317466735839844, -47.26463317871094, -46.21179962158203, -45.158966064453125, -44.10613250732422, -43.05329895019531, -42.000465393066406, -40.9476318359375, -39.894798278808594, -38.84196472167969, -37.78913116455078, -36.736297607421875, -35.68346405029297, -34.63063049316406, -33.577796936035156, -32.52496337890625, -31.472129821777344, -30.419296264648438, -29.36646270751953, -28.313629150390625, -27.26079559326172, -26.207962036132812, -25.155128479003906, -24.102294921875, -23.049461364746094, -21.996627807617188, -20.94379425048828, -19.890960693359375, -18.83812713623047, -17.785293579101562, -16.732460021972656, -15.67962646484375, -14.626789093017578, -13.573955535888672, -12.521121978759766, -11.46828842163086, -10.415454864501953, -9.362621307373047, -8.30978775024414, -7.256954193115234, -6.204120635986328, -5.151287078857422, -4.098453521728516, -3.0456199645996094, -1.9927864074707031, -0.9399528503417969, 0.11288070678710938, 1.1657142639160156, 2.218547821044922, 3.271381378173828, 4.324214935302734, 5.377048492431641, 6.429882049560547, 7.482715606689453, 8.53554916381836, 9.588382720947266, 10.641216278076172, 11.694049835205078, 12.746883392333984, 13.79971694946289, 14.852550506591797, 15.905384063720703, 16.95821762084961, 18.011051177978516, 19.063884735107422]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 3.0, 4.0, 8.0, 5.0, 14.0, 15.0, 22.0, 16.0, 23.0, 30.0, 29.0, 33.0, 33.0, 48.0, 47.0, 53.0, 44.0, 67.0, 46.0, 48.0, 59.0, 51.0, 45.0, 38.0, 40.0, 26.0, 25.0, 19.0, 16.0, 16.0, 15.0, 10.0, 11.0, 10.0, 5.0, 5.0, 7.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.96102237701416, -7.726656913757324, -7.492291450500488, -7.257925987243652, -7.023560523986816, -6.7891950607299805, -6.5548295974731445, -6.320464134216309, -6.086098670959473, -5.851733207702637, -5.617367744445801, -5.383002281188965, -5.148636817932129, -4.914271354675293, -4.679905891418457, -4.445540428161621, -4.211174488067627, -3.976809024810791, -3.742443561553955, -3.508078098297119, -3.273712635040283, -3.0393471717834473, -2.8049814701080322, -2.5706160068511963, -2.3362505435943604, -2.1018850803375244, -1.8675196170806885, -1.633154034614563, -1.398788571357727, -1.1644231081008911, -0.9300575256347656, -0.6956920623779297, -0.46132659912109375, -0.22696110606193542, 0.0074043869972229, 0.2417699098587036, 0.47613537311553955, 0.7105008363723755, 0.944866418838501, 1.179231882095337, 1.4135973453521729, 1.6479628086090088, 1.8823282718658447, 2.1166939735412598, 2.3510594367980957, 2.5854249000549316, 2.8197903633117676, 3.0541558265686035, 3.2885212898254395, 3.5228867530822754, 3.7572522163391113, 3.9916176795959473, 4.225983142852783, 4.460348606109619, 4.694714546203613, 4.929080009460449, 5.163445472717285, 5.397810935974121, 5.632176399230957, 5.866541862487793, 6.100907325744629, 6.335272789001465, 6.569638252258301, 6.804003715515137, 7.038369178771973]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 6.0, 5.0, 12.0, 15.0, 17.0, 30.0, 62.0, 105.0, 173.0, 346.0, 622.0, 1369.0, 3057.0, 7954.0, 23212.0, 82256.0, 334160.0, 430746.0, 116053.0, 31149.0, 10000.0, 3849.0, 1661.0, 762.0, 411.0, 205.0, 120.0, 79.0, 34.0, 29.0, 23.0, 10.0, 8.0, 4.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.84033203125, -0.8093490600585938, -0.7783660888671875, -0.7473831176757812, -0.716400146484375, -0.6854171752929688, -0.6544342041015625, -0.6234512329101562, -0.59246826171875, -0.5614852905273438, -0.5305023193359375, -0.49951934814453125, -0.468536376953125, -0.43755340576171875, -0.4065704345703125, -0.37558746337890625, -0.3446044921875, -0.31362152099609375, -0.2826385498046875, -0.25165557861328125, -0.220672607421875, -0.18968963623046875, -0.1587066650390625, -0.12772369384765625, -0.09674072265625, -0.06575775146484375, -0.0347747802734375, -0.00379180908203125, 0.027191162109375, 0.05817413330078125, 0.0891571044921875, 0.12014007568359375, 0.151123046875, 0.18210601806640625, 0.2130889892578125, 0.24407196044921875, 0.275054931640625, 0.30603790283203125, 0.3370208740234375, 0.36800384521484375, 0.39898681640625, 0.42996978759765625, 0.4609527587890625, 0.49193572998046875, 0.522918701171875, 0.5539016723632812, 0.5848846435546875, 0.6158676147460938, 0.6468505859375, 0.6778335571289062, 0.7088165283203125, 0.7397994995117188, 0.770782470703125, 0.8017654418945312, 0.8327484130859375, 0.8637313842773438, 0.89471435546875, 0.9256973266601562, 0.9566802978515625, 0.9876632690429688, 1.018646240234375, 1.0496292114257812, 1.0806121826171875, 1.1115951538085938, 1.142578125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 9.0, 5.0, 12.0, 19.0, 10.0, 18.0, 22.0, 29.0, 26.0, 25.0, 35.0, 48.0, 47.0, 42.0, 47.0, 47.0, 35.0, 47.0, 50.0, 46.0, 42.0, 36.0, 52.0, 31.0, 37.0, 29.0, 20.0, 24.0, 16.0, 18.0, 18.0, 8.0, 9.0, 10.0, 7.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.47705078125, -0.4634895324707031, -0.44992828369140625, -0.4363670349121094, -0.4228057861328125, -0.4092445373535156, -0.39568328857421875, -0.3821220397949219, -0.368560791015625, -0.3549995422363281, -0.34143829345703125, -0.3278770446777344, -0.3143157958984375, -0.3007545471191406, -0.28719329833984375, -0.2736320495605469, -0.26007080078125, -0.24650955200195312, -0.23294830322265625, -0.21938705444335938, -0.2058258056640625, -0.19226455688476562, -0.17870330810546875, -0.16514205932617188, -0.151580810546875, -0.13801956176757812, -0.12445831298828125, -0.11089706420898438, -0.0973358154296875, -0.08377456665039062, -0.07021331787109375, -0.056652069091796875, -0.0430908203125, -0.029529571533203125, -0.01596832275390625, -0.002407073974609375, 0.0111541748046875, 0.024715423583984375, 0.03827667236328125, 0.051837921142578125, 0.065399169921875, 0.07896041870117188, 0.09252166748046875, 0.10608291625976562, 0.1196441650390625, 0.13320541381835938, 0.14676666259765625, 0.16032791137695312, 0.17388916015625, 0.18745040893554688, 0.20101165771484375, 0.21457290649414062, 0.2281341552734375, 0.24169540405273438, 0.25525665283203125, 0.2688179016113281, 0.282379150390625, 0.2959403991699219, 0.30950164794921875, 0.3230628967285156, 0.3366241455078125, 0.3501853942871094, 0.36374664306640625, 0.3773078918457031, 0.390869140625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 15.0, 15.0, 20.0, 22.0, 32.0, 52.0, 79.0, 127.0, 233.0, 487.0, 1050.0, 2429.0, 8024.0, 35933.0, 261872.0, 652981.0, 66046.0, 12821.0, 3500.0, 1393.0, 625.0, 328.0, 195.0, 97.0, 58.0, 34.0, 30.0, 9.0, 14.0, 10.0, 10.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8369140625, -1.7846832275390625, -1.732452392578125, -1.6802215576171875, -1.62799072265625, -1.5757598876953125, -1.523529052734375, -1.4712982177734375, -1.4190673828125, -1.3668365478515625, -1.314605712890625, -1.2623748779296875, -1.21014404296875, -1.1579132080078125, -1.105682373046875, -1.0534515380859375, -1.001220703125, -0.9489898681640625, -0.896759033203125, -0.8445281982421875, -0.79229736328125, -0.7400665283203125, -0.687835693359375, -0.6356048583984375, -0.5833740234375, -0.5311431884765625, -0.478912353515625, -0.4266815185546875, -0.37445068359375, -0.3222198486328125, -0.269989013671875, -0.2177581787109375, -0.16552734375, -0.1132965087890625, -0.061065673828125, -0.0088348388671875, 0.04339599609375, 0.0956268310546875, 0.147857666015625, 0.2000885009765625, 0.2523193359375, 0.3045501708984375, 0.356781005859375, 0.4090118408203125, 0.46124267578125, 0.5134735107421875, 0.565704345703125, 0.6179351806640625, 0.670166015625, 0.7223968505859375, 0.774627685546875, 0.8268585205078125, 0.87908935546875, 0.9313201904296875, 0.983551025390625, 1.0357818603515625, 1.0880126953125, 1.1402435302734375, 1.192474365234375, 1.2447052001953125, 1.29693603515625, 1.3491668701171875, 1.401397705078125, 1.4536285400390625, 1.505859375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 9.0, 7.0, 10.0, 9.0, 20.0, 13.0, 12.0, 22.0, 23.0, 41.0, 39.0, 34.0, 32.0, 50.0, 49.0, 62.0, 61.0, 52.0, 47.0, 45.0, 39.0, 42.0, 46.0, 46.0, 42.0, 31.0, 22.0, 16.0, 25.0, 13.0, 6.0, 7.0, 11.0, 6.0, 3.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.84375, -1.781707763671875, -1.71966552734375, -1.657623291015625, -1.5955810546875, -1.533538818359375, -1.47149658203125, -1.409454345703125, -1.347412109375, -1.285369873046875, -1.22332763671875, -1.161285400390625, -1.0992431640625, -1.037200927734375, -0.97515869140625, -0.913116455078125, -0.85107421875, -0.789031982421875, -0.72698974609375, -0.664947509765625, -0.6029052734375, -0.540863037109375, -0.47882080078125, -0.416778564453125, -0.354736328125, -0.292694091796875, -0.23065185546875, -0.168609619140625, -0.1065673828125, -0.044525146484375, 0.01751708984375, 0.079559326171875, 0.1416015625, 0.203643798828125, 0.26568603515625, 0.327728271484375, 0.3897705078125, 0.451812744140625, 0.51385498046875, 0.575897216796875, 0.637939453125, 0.699981689453125, 0.76202392578125, 0.824066162109375, 0.8861083984375, 0.948150634765625, 1.01019287109375, 1.072235107421875, 1.13427734375, 1.196319580078125, 1.25836181640625, 1.320404052734375, 1.3824462890625, 1.444488525390625, 1.50653076171875, 1.568572998046875, 1.630615234375, 1.692657470703125, 1.75469970703125, 1.816741943359375, 1.8787841796875, 1.940826416015625, 2.00286865234375, 2.064910888671875, 2.126953125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 8.0, 9.0, 13.0, 30.0, 37.0, 55.0, 94.0, 201.0, 457.0, 1001.0, 2612.0, 8690.0, 42114.0, 667259.0, 285901.0, 29738.0, 6674.0, 2119.0, 785.0, 340.0, 171.0, 93.0, 58.0, 35.0, 21.0, 12.0, 5.0, 7.0, 7.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.123046875, -1.0889129638671875, -1.054779052734375, -1.0206451416015625, -0.98651123046875, -0.9523773193359375, -0.918243408203125, -0.8841094970703125, -0.8499755859375, -0.8158416748046875, -0.781707763671875, -0.7475738525390625, -0.71343994140625, -0.6793060302734375, -0.645172119140625, -0.6110382080078125, -0.576904296875, -0.5427703857421875, -0.508636474609375, -0.4745025634765625, -0.44036865234375, -0.4062347412109375, -0.372100830078125, -0.3379669189453125, -0.3038330078125, -0.2696990966796875, -0.235565185546875, -0.2014312744140625, -0.16729736328125, -0.1331634521484375, -0.099029541015625, -0.0648956298828125, -0.03076171875, 0.0033721923828125, 0.037506103515625, 0.0716400146484375, 0.10577392578125, 0.1399078369140625, 0.174041748046875, 0.2081756591796875, 0.2423095703125, 0.2764434814453125, 0.310577392578125, 0.3447113037109375, 0.37884521484375, 0.4129791259765625, 0.447113037109375, 0.4812469482421875, 0.515380859375, 0.5495147705078125, 0.583648681640625, 0.6177825927734375, 0.65191650390625, 0.6860504150390625, 0.720184326171875, 0.7543182373046875, 0.7884521484375, 0.8225860595703125, 0.856719970703125, 0.8908538818359375, 0.92498779296875, 0.9591217041015625, 0.993255615234375, 1.0273895263671875, 1.0615234375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 4.0, 3.0, 9.0, 16.0, 18.0, 22.0, 40.0, 43.0, 67.0, 81.0, 121.0, 162.0, 112.0, 73.0, 46.0, 36.0, 27.0, 29.0, 15.0, 19.0, 16.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00026535987854003906, -0.00025716423988342285, -0.00024896860122680664, -0.00024077296257019043, -0.00023257732391357422, -0.000224381685256958, -0.0002161860466003418, -0.00020799040794372559, -0.00019979476928710938, -0.00019159913063049316, -0.00018340349197387695, -0.00017520785331726074, -0.00016701221466064453, -0.00015881657600402832, -0.0001506209373474121, -0.0001424252986907959, -0.0001342296600341797, -0.00012603402137756348, -0.00011783838272094727, -0.00010964274406433105, -0.00010144710540771484, -9.325146675109863e-05, -8.505582809448242e-05, -7.686018943786621e-05, -6.866455078125e-05, -6.046891212463379e-05, -5.227327346801758e-05, -4.407763481140137e-05, -3.5881996154785156e-05, -2.7686357498168945e-05, -1.9490718841552734e-05, -1.1295080184936523e-05, -3.0994415283203125e-06, 5.0961971282958984e-06, 1.329183578491211e-05, 2.148747444152832e-05, 2.968311309814453e-05, 3.787875175476074e-05, 4.607439041137695e-05, 5.4270029067993164e-05, 6.246566772460938e-05, 7.066130638122559e-05, 7.88569450378418e-05, 8.705258369445801e-05, 9.524822235107422e-05, 0.00010344386100769043, 0.00011163949966430664, 0.00011983513832092285, 0.00012803077697753906, 0.00013622641563415527, 0.00014442205429077148, 0.0001526176929473877, 0.0001608133316040039, 0.00016900897026062012, 0.00017720460891723633, 0.00018540024757385254, 0.00019359588623046875, 0.00020179152488708496, 0.00020998716354370117, 0.00021818280220031738, 0.0002263784408569336, 0.0002345740795135498, 0.00024276971817016602, 0.0002509653568267822, 0.00025916099548339844]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 7.0, 17.0, 24.0, 31.0, 69.0, 91.0, 200.0, 416.0, 771.0, 1686.0, 4321.0, 13250.0, 53576.0, 493683.0, 406540.0, 53159.0, 13118.0, 4247.0, 1699.0, 757.0, 385.0, 203.0, 121.0, 57.0, 34.0, 18.0, 24.0, 11.0, 1.0, 4.0, 2.0, 2.0, 7.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63427734375, -0.6098785400390625, -0.585479736328125, -0.5610809326171875, -0.53668212890625, -0.5122833251953125, -0.487884521484375, -0.4634857177734375, -0.4390869140625, -0.4146881103515625, -0.390289306640625, -0.3658905029296875, -0.34149169921875, -0.3170928955078125, -0.292694091796875, -0.2682952880859375, -0.243896484375, -0.2194976806640625, -0.195098876953125, -0.1707000732421875, -0.14630126953125, -0.1219024658203125, -0.097503662109375, -0.0731048583984375, -0.0487060546875, -0.0243072509765625, 9.1552734375e-05, 0.0244903564453125, 0.04888916015625, 0.0732879638671875, 0.097686767578125, 0.1220855712890625, 0.146484375, 0.1708831787109375, 0.195281982421875, 0.2196807861328125, 0.24407958984375, 0.2684783935546875, 0.292877197265625, 0.3172760009765625, 0.3416748046875, 0.3660736083984375, 0.390472412109375, 0.4148712158203125, 0.43927001953125, 0.4636688232421875, 0.488067626953125, 0.5124664306640625, 0.536865234375, 0.5612640380859375, 0.585662841796875, 0.6100616455078125, 0.63446044921875, 0.6588592529296875, 0.683258056640625, 0.7076568603515625, 0.7320556640625, 0.7564544677734375, 0.780853271484375, 0.8052520751953125, 0.82965087890625, 0.8540496826171875, 0.878448486328125, 0.9028472900390625, 0.92724609375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 11.0, 5.0, 9.0, 10.0, 12.0, 13.0, 18.0, 21.0, 36.0, 57.0, 66.0, 81.0, 100.0, 124.0, 96.0, 86.0, 53.0, 59.0, 36.0, 22.0, 16.0, 16.0, 9.0, 6.0, 10.0, 7.0, 3.0, 0.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.67431640625, -0.6547927856445312, -0.6352691650390625, -0.6157455444335938, -0.596221923828125, -0.5766983032226562, -0.5571746826171875, -0.5376510620117188, -0.51812744140625, -0.49860382080078125, -0.4790802001953125, -0.45955657958984375, -0.440032958984375, -0.42050933837890625, -0.4009857177734375, -0.38146209716796875, -0.3619384765625, -0.34241485595703125, -0.3228912353515625, -0.30336761474609375, -0.283843994140625, -0.26432037353515625, -0.2447967529296875, -0.22527313232421875, -0.20574951171875, -0.18622589111328125, -0.1667022705078125, -0.14717864990234375, -0.127655029296875, -0.10813140869140625, -0.0886077880859375, -0.06908416748046875, -0.049560546875, -0.03003692626953125, -0.0105133056640625, 0.00901031494140625, 0.028533935546875, 0.04805755615234375, 0.0675811767578125, 0.08710479736328125, 0.10662841796875, 0.12615203857421875, 0.1456756591796875, 0.16519927978515625, 0.184722900390625, 0.20424652099609375, 0.2237701416015625, 0.24329376220703125, 0.2628173828125, 0.28234100341796875, 0.3018646240234375, 0.32138824462890625, 0.340911865234375, 0.36043548583984375, 0.3799591064453125, 0.39948272705078125, 0.41900634765625, 0.43852996826171875, 0.4580535888671875, 0.47757720947265625, 0.497100830078125, 0.5166244506835938, 0.5361480712890625, 0.5556716918945312, 0.5751953125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 7.0, 12.0, 13.0, 31.0, 78.0, 130.0, 258.0, 237.0, 119.0, 52.0, 27.0, 19.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.34766960144043, -14.835050582885742, -14.322432518005371, -13.809813499450684, -13.297195434570312, -12.784576416015625, -12.271957397460938, -11.75933837890625, -11.246720314025879, -10.734101295471191, -10.22148323059082, -9.708864212036133, -9.196245193481445, -8.683627128601074, -8.171008110046387, -7.658389568328857, -7.145771026611328, -6.633152484893799, -6.1205339431762695, -5.607914924621582, -5.095296382904053, -4.582677841186523, -4.070058822631836, -3.5574402809143066, -3.0448217391967773, -2.532203197479248, -2.0195844173431396, -1.5069657564163208, -0.994347095489502, -0.48172855377197266, 0.030890226364135742, 0.5435090065002441, 1.0561256408691406, 1.5687443017959595, 2.0813629627227783, 2.5939817428588867, 3.106600284576416, 3.6192188262939453, 4.131837844848633, 4.644456386566162, 5.157074928283691, 5.669693470001221, 6.18231201171875, 6.6949310302734375, 7.207549571990967, 7.720168113708496, 8.232787132263184, 8.745405197143555, 9.258024215698242, 9.77064323425293, 10.2832612991333, 10.795880317687988, 11.30849838256836, 11.821117401123047, 12.333736419677734, 12.846355438232422, 13.358973503112793, 13.87159252166748, 14.384210586547852, 14.896829605102539, 15.409448623657227, 15.922066688537598, 16.43468475341797, 16.947303771972656, 17.459922790527344]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 1.0, 3.0, 3.0, 3.0, 6.0, 11.0, 11.0, 15.0, 13.0, 16.0, 16.0, 25.0, 16.0, 31.0, 25.0, 40.0, 34.0, 33.0, 48.0, 64.0, 78.0, 71.0, 69.0, 51.0, 40.0, 37.0, 37.0, 22.0, 30.0, 12.0, 20.0, 20.0, 16.0, 15.0, 9.0, 9.0, 8.0, 12.0, 4.0, 8.0, 6.0, 3.0, 2.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-8.77496337890625, -8.524949073791504, -8.274934768676758, -8.024920463562012, -7.774906635284424, -7.524892330169678, -7.27487850189209, -7.024864196777344, -6.774849891662598, -6.524835586547852, -6.2748212814331055, -6.024807453155518, -5.7747931480407715, -5.524778842926025, -5.2747650146484375, -5.024750709533691, -4.774736404418945, -4.524722099304199, -4.274707794189453, -4.024693965911865, -3.774679660797119, -3.524665355682373, -3.274651288986206, -3.024637222290039, -2.774622917175293, -2.524608612060547, -2.27459454536438, -2.024580478668213, -1.7745661735534668, -1.5245519876480103, -1.2745378017425537, -1.0245236158370972, -0.7745099067687988, -0.5244957208633423, -0.27448153495788574, -0.0244673490524292, 0.22554683685302734, 0.4755610227584839, 0.7255752086639404, 0.975589394569397, 1.2256035804748535, 1.47561776638031, 1.7256319522857666, 1.9756461381912231, 2.2256603240966797, 2.475674629211426, 2.7256886959075928, 2.9757027626037598, 3.225717067718506, 3.475731372833252, 3.725745439529419, 3.975759506225586, 4.225773811340332, 4.475788116455078, 4.725802421569824, 4.975816249847412, 5.225830554962158, 5.475844860076904, 5.725858688354492, 5.975872993469238, 6.225887298583984, 6.4759016036987305, 6.725915908813477, 6.9759297370910645, 7.2259440422058105]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 4.0, 5.0, 5.0, 3.0, 9.0, 7.0, 16.0, 12.0, 20.0, 36.0, 41.0, 73.0, 106.0, 225.0, 329.0, 654.0, 1633.0, 5624.0, 50455.0, 3909323.0, 211631.0, 9709.0, 2385.0, 942.0, 447.0, 228.0, 129.0, 79.0, 52.0, 33.0, 23.0, 17.0, 15.0, 8.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.85546875, -2.78521728515625, -2.7149658203125, -2.64471435546875, -2.574462890625, -2.50421142578125, -2.4339599609375, -2.36370849609375, -2.29345703125, -2.22320556640625, -2.1529541015625, -2.08270263671875, -2.012451171875, -1.94219970703125, -1.8719482421875, -1.80169677734375, -1.7314453125, -1.66119384765625, -1.5909423828125, -1.52069091796875, -1.450439453125, -1.38018798828125, -1.3099365234375, -1.23968505859375, -1.16943359375, -1.09918212890625, -1.0289306640625, -0.95867919921875, -0.888427734375, -0.81817626953125, -0.7479248046875, -0.67767333984375, -0.607421875, -0.53717041015625, -0.4669189453125, -0.39666748046875, -0.326416015625, -0.25616455078125, -0.1859130859375, -0.11566162109375, -0.04541015625, 0.02484130859375, 0.0950927734375, 0.16534423828125, 0.235595703125, 0.30584716796875, 0.3760986328125, 0.44635009765625, 0.5166015625, 0.58685302734375, 0.6571044921875, 0.72735595703125, 0.797607421875, 0.86785888671875, 0.9381103515625, 1.00836181640625, 1.07861328125, 1.14886474609375, 1.2191162109375, 1.28936767578125, 1.359619140625, 1.42987060546875, 1.5001220703125, 1.57037353515625, 1.640625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 9.0, 9.0, 8.0, 15.0, 15.0, 22.0, 21.0, 25.0, 34.0, 37.0, 43.0, 50.0, 46.0, 65.0, 61.0, 69.0, 64.0, 50.0, 66.0, 45.0, 40.0, 39.0, 35.0, 26.0, 20.0, 19.0, 14.0, 11.0, 5.0, 10.0, 9.0, 9.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.6259765625, -0.6096229553222656, -0.5932693481445312, -0.5769157409667969, -0.5605621337890625, -0.5442085266113281, -0.5278549194335938, -0.5115013122558594, -0.495147705078125, -0.4787940979003906, -0.46244049072265625, -0.4460868835449219, -0.4297332763671875, -0.4133796691894531, -0.39702606201171875, -0.3806724548339844, -0.36431884765625, -0.3479652404785156, -0.33161163330078125, -0.3152580261230469, -0.2989044189453125, -0.2825508117675781, -0.26619720458984375, -0.24984359741210938, -0.233489990234375, -0.21713638305664062, -0.20078277587890625, -0.18442916870117188, -0.1680755615234375, -0.15172195434570312, -0.13536834716796875, -0.11901473999023438, -0.1026611328125, -0.08630752563476562, -0.06995391845703125, -0.053600311279296875, -0.0372467041015625, -0.020893096923828125, -0.00453948974609375, 0.011814117431640625, 0.028167724609375, 0.044521331787109375, 0.06087493896484375, 0.07722854614257812, 0.0935821533203125, 0.10993576049804688, 0.12628936767578125, 0.14264297485351562, 0.15899658203125, 0.17535018920898438, 0.19170379638671875, 0.20805740356445312, 0.2244110107421875, 0.24076461791992188, 0.25711822509765625, 0.2734718322753906, 0.289825439453125, 0.3061790466308594, 0.32253265380859375, 0.3388862609863281, 0.3552398681640625, 0.3715934753417969, 0.38794708251953125, 0.4043006896972656, 0.420654296875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 0.0, 4.0, 7.0, 9.0, 21.0, 29.0, 36.0, 64.0, 92.0, 171.0, 355.0, 866.0, 3130.0, 27713.0, 4080976.0, 74068.0, 4630.0, 1154.0, 415.0, 206.0, 143.0, 67.0, 48.0, 28.0, 21.0, 13.0, 7.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.26953125, -4.138671875, -4.0078125, -3.876953125, -3.74609375, -3.615234375, -3.484375, -3.353515625, -3.22265625, -3.091796875, -2.9609375, -2.830078125, -2.69921875, -2.568359375, -2.4375, -2.306640625, -2.17578125, -2.044921875, -1.9140625, -1.783203125, -1.65234375, -1.521484375, -1.390625, -1.259765625, -1.12890625, -0.998046875, -0.8671875, -0.736328125, -0.60546875, -0.474609375, -0.34375, -0.212890625, -0.08203125, 0.048828125, 0.1796875, 0.310546875, 0.44140625, 0.572265625, 0.703125, 0.833984375, 0.96484375, 1.095703125, 1.2265625, 1.357421875, 1.48828125, 1.619140625, 1.75, 1.880859375, 2.01171875, 2.142578125, 2.2734375, 2.404296875, 2.53515625, 2.666015625, 2.796875, 2.927734375, 3.05859375, 3.189453125, 3.3203125, 3.451171875, 3.58203125, 3.712890625, 3.84375, 3.974609375, 4.10546875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 6.0, 7.0, 12.0, 22.0, 59.0, 103.0, 424.0, 1872.0, 1188.0, 232.0, 81.0, 35.0, 14.0, 10.0, 5.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.94921875, -4.841094970703125, -4.73297119140625, -4.624847412109375, -4.5167236328125, -4.408599853515625, -4.30047607421875, -4.192352294921875, -4.084228515625, -3.976104736328125, -3.86798095703125, -3.759857177734375, -3.6517333984375, -3.543609619140625, -3.43548583984375, -3.327362060546875, -3.21923828125, -3.111114501953125, -3.00299072265625, -2.894866943359375, -2.7867431640625, -2.678619384765625, -2.57049560546875, -2.462371826171875, -2.354248046875, -2.246124267578125, -2.13800048828125, -2.029876708984375, -1.9217529296875, -1.813629150390625, -1.70550537109375, -1.597381591796875, -1.4892578125, -1.381134033203125, -1.27301025390625, -1.164886474609375, -1.0567626953125, -0.948638916015625, -0.84051513671875, -0.732391357421875, -0.624267578125, -0.516143798828125, -0.40802001953125, -0.299896240234375, -0.1917724609375, -0.083648681640625, 0.02447509765625, 0.132598876953125, 0.24072265625, 0.348846435546875, 0.45697021484375, 0.565093994140625, 0.6732177734375, 0.781341552734375, 0.88946533203125, 0.997589111328125, 1.105712890625, 1.213836669921875, 1.32196044921875, 1.430084228515625, 1.5382080078125, 1.646331787109375, 1.75445556640625, 1.862579345703125, 1.970703125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 2.0, 10.0, 12.0, 30.0, 41.0, 84.0, 130.0, 216.0, 190.0, 124.0, 77.0, 37.0, 21.0, 10.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.27149486541748, -13.719356536865234, -13.167217254638672, -12.615078926086426, -12.06294059753418, -11.510801315307617, -10.958662986755371, -10.406524658203125, -9.854385375976562, -9.302247047424316, -8.750107765197754, -8.197969436645508, -7.6458306312561035, -7.093691825866699, -6.541553497314453, -5.989414691925049, -5.4372758865356445, -4.88513708114624, -4.332998275756836, -3.78085994720459, -3.2287211418151855, -2.6765823364257812, -2.124443769454956, -1.5723052024841309, -1.0201663970947266, -0.4680277109146118, 0.08411097526550293, 0.6362496614456177, 1.1883883476257324, 1.7405271530151367, 2.292665719985962, 2.844804286956787, 3.396942138671875, 3.9490809440612793, 4.501219749450684, 5.05335807800293, 5.605496883392334, 6.157635688781738, 6.709774017333984, 7.261912822723389, 7.814051628112793, 8.366189956665039, 8.918329238891602, 9.470467567443848, 10.022605895996094, 10.574745178222656, 11.126883506774902, 11.679021835327148, 12.231161117553711, 12.783299446105957, 13.33543872833252, 13.887577056884766, 14.439716339111328, 14.991854667663574, 15.54399299621582, 16.096132278442383, 16.648269653320312, 17.200408935546875, 17.752546310424805, 18.304685592651367, 18.85682487487793, 19.40896224975586, 19.961101531982422, 20.513240814208984, 21.065380096435547]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 11.0, 9.0, 10.0, 7.0, 16.0, 21.0, 14.0, 17.0, 29.0, 29.0, 26.0, 35.0, 28.0, 33.0, 41.0, 39.0, 63.0, 56.0, 71.0, 63.0, 49.0, 47.0, 44.0, 35.0, 27.0, 29.0, 26.0, 22.0, 22.0, 20.0, 13.0, 10.0, 11.0, 3.0, 10.0, 3.0, 3.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.990432262420654, -6.754762649536133, -6.5190935134887695, -6.283424377441406, -6.047754764556885, -5.812085151672363, -5.576416015625, -5.340746879577637, -5.105077266693115, -4.869407653808594, -4.6337385177612305, -4.398069381713867, -4.162399768829346, -3.9267303943634033, -3.691061019897461, -3.4553916454315186, -3.219722270965576, -2.984052896499634, -2.7483835220336914, -2.512714147567749, -2.2770447731018066, -2.0413753986358643, -1.8057060241699219, -1.5700366497039795, -1.334367275238037, -1.0986979007720947, -0.8630285263061523, -0.62735915184021, -0.3916897773742676, -0.1560204029083252, 0.07964897155761719, 0.31531834602355957, 0.5509881973266602, 0.7866575717926025, 1.022326946258545, 1.2579963207244873, 1.4936656951904297, 1.729335069656372, 1.9650044441223145, 2.200673818588257, 2.436343193054199, 2.6720125675201416, 2.907681941986084, 3.1433513164520264, 3.3790206909179688, 3.614690065383911, 3.8503594398498535, 4.086029052734375, 4.321698188781738, 4.557367324829102, 4.793036937713623, 5.0287065505981445, 5.264375686645508, 5.500044822692871, 5.735714435577393, 5.971384048461914, 6.207053184509277, 6.442722320556641, 6.678391933441162, 6.914061546325684, 7.149730682373047, 7.38539981842041, 7.621069431304932, 7.856739044189453, 8.092408180236816]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 5.0, 6.0, 12.0, 13.0, 20.0, 24.0, 48.0, 79.0, 114.0, 194.0, 360.0, 553.0, 1060.0, 1999.0, 4006.0, 8065.0, 17660.0, 41354.0, 109146.0, 316606.0, 344854.0, 120220.0, 45260.0, 19038.0, 8897.0, 4226.0, 2117.0, 1122.0, 629.0, 326.0, 194.0, 133.0, 75.0, 54.0, 23.0, 25.0, 13.0, 12.0, 3.0, 7.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6171875, -0.591522216796875, -0.56585693359375, -0.540191650390625, -0.5145263671875, -0.488861083984375, -0.46319580078125, -0.437530517578125, -0.411865234375, -0.386199951171875, -0.36053466796875, -0.334869384765625, -0.3092041015625, -0.283538818359375, -0.25787353515625, -0.232208251953125, -0.20654296875, -0.180877685546875, -0.15521240234375, -0.129547119140625, -0.1038818359375, -0.078216552734375, -0.05255126953125, -0.026885986328125, -0.001220703125, 0.024444580078125, 0.05010986328125, 0.075775146484375, 0.1014404296875, 0.127105712890625, 0.15277099609375, 0.178436279296875, 0.2041015625, 0.229766845703125, 0.25543212890625, 0.281097412109375, 0.3067626953125, 0.332427978515625, 0.35809326171875, 0.383758544921875, 0.409423828125, 0.435089111328125, 0.46075439453125, 0.486419677734375, 0.5120849609375, 0.537750244140625, 0.56341552734375, 0.589080810546875, 0.61474609375, 0.640411376953125, 0.66607666015625, 0.691741943359375, 0.7174072265625, 0.743072509765625, 0.76873779296875, 0.794403076171875, 0.820068359375, 0.845733642578125, 0.87139892578125, 0.897064208984375, 0.9227294921875, 0.948394775390625, 0.97406005859375, 0.999725341796875, 1.025390625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 5.0, 5.0, 5.0, 8.0, 6.0, 6.0, 17.0, 20.0, 20.0, 23.0, 33.0, 49.0, 34.0, 41.0, 50.0, 49.0, 46.0, 58.0, 45.0, 58.0, 55.0, 50.0, 58.0, 46.0, 50.0, 39.0, 22.0, 22.0, 22.0, 14.0, 11.0, 11.0, 4.0, 3.0, 4.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.78173828125, -0.7617149353027344, -0.7416915893554688, -0.7216682434082031, -0.7016448974609375, -0.6816215515136719, -0.6615982055664062, -0.6415748596191406, -0.621551513671875, -0.6015281677246094, -0.5815048217773438, -0.5614814758300781, -0.5414581298828125, -0.5214347839355469, -0.5014114379882812, -0.4813880920410156, -0.46136474609375, -0.4413414001464844, -0.42131805419921875, -0.4012947082519531, -0.3812713623046875, -0.3612480163574219, -0.34122467041015625, -0.3212013244628906, -0.301177978515625, -0.2811546325683594, -0.26113128662109375, -0.24110794067382812, -0.2210845947265625, -0.20106124877929688, -0.18103790283203125, -0.16101455688476562, -0.1409912109375, -0.12096786499023438, -0.10094451904296875, -0.08092117309570312, -0.0608978271484375, -0.040874481201171875, -0.02085113525390625, -0.000827789306640625, 0.019195556640625, 0.039218902587890625, 0.05924224853515625, 0.07926559448242188, 0.0992889404296875, 0.11931228637695312, 0.13933563232421875, 0.15935897827148438, 0.17938232421875, 0.19940567016601562, 0.21942901611328125, 0.23945236206054688, 0.2594757080078125, 0.2794990539550781, 0.29952239990234375, 0.3195457458496094, 0.339569091796875, 0.3595924377441406, 0.37961578369140625, 0.3996391296386719, 0.4196624755859375, 0.4396858215332031, 0.45970916748046875, 0.4797325134277344, 0.499755859375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 4.0, 5.0, 7.0, 11.0, 12.0, 16.0, 13.0, 32.0, 33.0, 45.0, 70.0, 83.0, 137.0, 181.0, 292.0, 489.0, 874.0, 1725.0, 4340.0, 14180.0, 65679.0, 692736.0, 220223.0, 33101.0, 8267.0, 2864.0, 1289.0, 630.0, 387.0, 241.0, 174.0, 101.0, 99.0, 55.0, 34.0, 31.0, 19.0, 16.0, 14.0, 12.0, 7.0, 7.0, 7.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.806640625, -1.74981689453125, -1.6929931640625, -1.63616943359375, -1.579345703125, -1.52252197265625, -1.4656982421875, -1.40887451171875, -1.35205078125, -1.29522705078125, -1.2384033203125, -1.18157958984375, -1.124755859375, -1.06793212890625, -1.0111083984375, -0.95428466796875, -0.8974609375, -0.84063720703125, -0.7838134765625, -0.72698974609375, -0.670166015625, -0.61334228515625, -0.5565185546875, -0.49969482421875, -0.44287109375, -0.38604736328125, -0.3292236328125, -0.27239990234375, -0.215576171875, -0.15875244140625, -0.1019287109375, -0.04510498046875, 0.01171875, 0.06854248046875, 0.1253662109375, 0.18218994140625, 0.239013671875, 0.29583740234375, 0.3526611328125, 0.40948486328125, 0.46630859375, 0.52313232421875, 0.5799560546875, 0.63677978515625, 0.693603515625, 0.75042724609375, 0.8072509765625, 0.86407470703125, 0.9208984375, 0.97772216796875, 1.0345458984375, 1.09136962890625, 1.148193359375, 1.20501708984375, 1.2618408203125, 1.31866455078125, 1.37548828125, 1.43231201171875, 1.4891357421875, 1.54595947265625, 1.602783203125, 1.65960693359375, 1.7164306640625, 1.77325439453125, 1.830078125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 7.0, 7.0, 10.0, 10.0, 8.0, 12.0, 21.0, 15.0, 17.0, 29.0, 27.0, 42.0, 47.0, 51.0, 59.0, 51.0, 47.0, 63.0, 44.0, 53.0, 60.0, 51.0, 32.0, 38.0, 31.0, 26.0, 20.0, 26.0, 22.0, 16.0, 15.0, 13.0, 2.0, 11.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0], "bins": [-2.755859375, -2.6802978515625, -2.604736328125, -2.5291748046875, -2.45361328125, -2.3780517578125, -2.302490234375, -2.2269287109375, -2.1513671875, -2.0758056640625, -2.000244140625, -1.9246826171875, -1.84912109375, -1.7735595703125, -1.697998046875, -1.6224365234375, -1.546875, -1.4713134765625, -1.395751953125, -1.3201904296875, -1.24462890625, -1.1690673828125, -1.093505859375, -1.0179443359375, -0.9423828125, -0.8668212890625, -0.791259765625, -0.7156982421875, -0.64013671875, -0.5645751953125, -0.489013671875, -0.4134521484375, -0.337890625, -0.2623291015625, -0.186767578125, -0.1112060546875, -0.03564453125, 0.0399169921875, 0.115478515625, 0.1910400390625, 0.2666015625, 0.3421630859375, 0.417724609375, 0.4932861328125, 0.56884765625, 0.6444091796875, 0.719970703125, 0.7955322265625, 0.87109375, 0.9466552734375, 1.022216796875, 1.0977783203125, 1.17333984375, 1.2489013671875, 1.324462890625, 1.4000244140625, 1.4755859375, 1.5511474609375, 1.626708984375, 1.7022705078125, 1.77783203125, 1.8533935546875, 1.928955078125, 2.0045166015625, 2.080078125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 10.0, 14.0, 1.0, 16.0, 22.0, 19.0, 33.0, 50.0, 53.0, 77.0, 119.0, 118.0, 192.0, 316.0, 398.0, 710.0, 1012.0, 1733.0, 3217.0, 6787.0, 16653.0, 53484.0, 321055.0, 552090.0, 57176.0, 17677.0, 7100.0, 3387.0, 1769.0, 1063.0, 702.0, 428.0, 297.0, 219.0, 145.0, 102.0, 79.0, 47.0, 59.0, 34.0, 35.0, 20.0, 8.0, 8.0, 7.0, 4.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.79345703125, -0.7694320678710938, -0.7454071044921875, -0.7213821411132812, -0.697357177734375, -0.6733322143554688, -0.6493072509765625, -0.6252822875976562, -0.60125732421875, -0.5772323608398438, -0.5532073974609375, -0.5291824340820312, -0.505157470703125, -0.48113250732421875, -0.4571075439453125, -0.43308258056640625, -0.4090576171875, -0.38503265380859375, -0.3610076904296875, -0.33698272705078125, -0.312957763671875, -0.28893280029296875, -0.2649078369140625, -0.24088287353515625, -0.21685791015625, -0.19283294677734375, -0.1688079833984375, -0.14478302001953125, -0.120758056640625, -0.09673309326171875, -0.0727081298828125, -0.04868316650390625, -0.024658203125, -0.00063323974609375, 0.0233917236328125, 0.04741668701171875, 0.071441650390625, 0.09546661376953125, 0.1194915771484375, 0.14351654052734375, 0.16754150390625, 0.19156646728515625, 0.2155914306640625, 0.23961639404296875, 0.263641357421875, 0.28766632080078125, 0.3116912841796875, 0.33571624755859375, 0.3597412109375, 0.38376617431640625, 0.4077911376953125, 0.43181610107421875, 0.455841064453125, 0.47986602783203125, 0.5038909912109375, 0.5279159545898438, 0.55194091796875, 0.5759658813476562, 0.5999908447265625, 0.6240158081054688, 0.648040771484375, 0.6720657348632812, 0.6960906982421875, 0.7201156616210938, 0.744140625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 9.0, 8.0, 12.0, 18.0, 25.0, 27.0, 41.0, 78.0, 128.0, 248.0, 169.0, 91.0, 60.0, 23.0, 21.0, 11.0, 8.0, 7.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005178451538085938, -0.0005004033446311951, -0.0004829615354537964, -0.0004655197262763977, -0.000448077917098999, -0.00043063610792160034, -0.00041319429874420166, -0.000395752489566803, -0.0003783106803894043, -0.0003608688712120056, -0.00034342706203460693, -0.00032598525285720825, -0.00030854344367980957, -0.0002911016345024109, -0.0002736598253250122, -0.0002562180161476135, -0.00023877620697021484, -0.00022133439779281616, -0.00020389258861541748, -0.0001864507794380188, -0.00016900897026062012, -0.00015156716108322144, -0.00013412535190582275, -0.00011668354272842407, -9.924173355102539e-05, -8.179992437362671e-05, -6.435811519622803e-05, -4.6916306018829346e-05, -2.9474496841430664e-05, -1.2032687664031982e-05, 5.409121513366699e-06, 2.285093069076538e-05, 4.029273986816406e-05, 5.7734549045562744e-05, 7.517635822296143e-05, 9.261816740036011e-05, 0.00011005997657775879, 0.00012750178575515747, 0.00014494359493255615, 0.00016238540410995483, 0.00017982721328735352, 0.0001972690224647522, 0.00021471083164215088, 0.00023215264081954956, 0.00024959444999694824, 0.0002670362591743469, 0.0002844780683517456, 0.0003019198775291443, 0.00031936168670654297, 0.00033680349588394165, 0.00035424530506134033, 0.000371687114238739, 0.0003891289234161377, 0.0004065707325935364, 0.00042401254177093506, 0.00044145435094833374, 0.0004588961601257324, 0.0004763379693031311, 0.0004937797784805298, 0.0005112215876579285, 0.0005286633968353271, 0.0005461052060127258, 0.0005635470151901245, 0.0005809888243675232, 0.0005984306335449219]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 9.0, 2.0, 4.0, 11.0, 18.0, 28.0, 39.0, 71.0, 100.0, 177.0, 375.0, 774.0, 2002.0, 6425.0, 28169.0, 252772.0, 701438.0, 42924.0, 8739.0, 2523.0, 952.0, 464.0, 230.0, 102.0, 64.0, 37.0, 28.0, 21.0, 13.0, 14.0, 7.0, 8.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0712890625, -1.0331878662109375, -0.995086669921875, -0.9569854736328125, -0.91888427734375, -0.8807830810546875, -0.842681884765625, -0.8045806884765625, -0.7664794921875, -0.7283782958984375, -0.690277099609375, -0.6521759033203125, -0.61407470703125, -0.5759735107421875, -0.537872314453125, -0.4997711181640625, -0.461669921875, -0.4235687255859375, -0.385467529296875, -0.3473663330078125, -0.30926513671875, -0.2711639404296875, -0.233062744140625, -0.1949615478515625, -0.1568603515625, -0.1187591552734375, -0.080657958984375, -0.0425567626953125, -0.00445556640625, 0.0336456298828125, 0.071746826171875, 0.1098480224609375, 0.14794921875, 0.1860504150390625, 0.224151611328125, 0.2622528076171875, 0.30035400390625, 0.3384552001953125, 0.376556396484375, 0.4146575927734375, 0.4527587890625, 0.4908599853515625, 0.528961181640625, 0.5670623779296875, 0.60516357421875, 0.6432647705078125, 0.681365966796875, 0.7194671630859375, 0.757568359375, 0.7956695556640625, 0.833770751953125, 0.8718719482421875, 0.90997314453125, 0.9480743408203125, 0.986175537109375, 1.0242767333984375, 1.0623779296875, 1.1004791259765625, 1.138580322265625, 1.1766815185546875, 1.21478271484375, 1.2528839111328125, 1.290985107421875, 1.3290863037109375, 1.3671875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 8.0, 6.0, 9.0, 12.0, 25.0, 16.0, 26.0, 40.0, 47.0, 64.0, 107.0, 132.0, 116.0, 96.0, 72.0, 56.0, 35.0, 32.0, 21.0, 18.0, 13.0, 15.0, 8.0, 6.0, 8.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.123046875, -1.0950393676757812, -1.0670318603515625, -1.0390243530273438, -1.011016845703125, -0.9830093383789062, -0.9550018310546875, -0.9269943237304688, -0.89898681640625, -0.8709793090820312, -0.8429718017578125, -0.8149642944335938, -0.786956787109375, -0.7589492797851562, -0.7309417724609375, -0.7029342651367188, -0.6749267578125, -0.6469192504882812, -0.6189117431640625, -0.5909042358398438, -0.562896728515625, -0.5348892211914062, -0.5068817138671875, -0.47887420654296875, -0.45086669921875, -0.42285919189453125, -0.3948516845703125, -0.36684417724609375, -0.338836669921875, -0.31082916259765625, -0.2828216552734375, -0.25481414794921875, -0.226806640625, -0.19879913330078125, -0.1707916259765625, -0.14278411865234375, -0.114776611328125, -0.08676910400390625, -0.0587615966796875, -0.03075408935546875, -0.00274658203125, 0.02526092529296875, 0.0532684326171875, 0.08127593994140625, 0.109283447265625, 0.13729095458984375, 0.1652984619140625, 0.19330596923828125, 0.2213134765625, 0.24932098388671875, 0.2773284912109375, 0.30533599853515625, 0.333343505859375, 0.36135101318359375, 0.3893585205078125, 0.41736602783203125, 0.44537353515625, 0.47338104248046875, 0.5013885498046875, 0.5293960571289062, 0.557403564453125, 0.5854110717773438, 0.6134185791015625, 0.6414260864257812, 0.66943359375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 8.0, 16.0, 53.0, 140.0, 480.0, 232.0, 63.0, 5.0, 9.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.801151275634766, -45.6234245300293, -44.44569778442383, -43.26797103881836, -42.090248107910156, -40.91252136230469, -39.73479461669922, -38.55706787109375, -37.37934112548828, -36.20161437988281, -35.023887634277344, -33.846160888671875, -32.668434143066406, -31.49070930480957, -30.312984466552734, -29.135257720947266, -27.957530975341797, -26.779804229736328, -25.60207748413086, -24.424352645874023, -23.246625900268555, -22.068899154663086, -20.89117431640625, -19.71344757080078, -18.535720825195312, -17.357994079589844, -16.180267333984375, -15.002542495727539, -13.82481575012207, -12.647089004516602, -11.46936321258545, -10.291637420654297, -9.113910675048828, -7.936184406280518, -6.758458137512207, -5.5807318687438965, -4.403005599975586, -3.2252793312072754, -2.047553062438965, -0.8698272705078125, 0.30789947509765625, 1.4856257438659668, 2.6633520126342773, 3.841078281402588, 5.018804550170898, 6.196530818939209, 7.3742570877075195, 8.551982879638672, 9.72970962524414, 10.90743637084961, 12.085162162780762, 13.262887954711914, 14.440614700317383, 15.618341445922852, 16.796066284179688, 17.973793029785156, 19.151519775390625, 20.329246520996094, 21.506973266601562, 22.6846981048584, 23.862424850463867, 25.040151596069336, 26.217876434326172, 27.39560317993164, 28.57332992553711]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 6.0, 14.0, 10.0, 23.0, 12.0, 23.0, 30.0, 31.0, 21.0, 27.0, 27.0, 33.0, 30.0, 43.0, 56.0, 102.0, 110.0, 61.0, 49.0, 31.0, 33.0, 30.0, 26.0, 18.0, 19.0, 21.0, 12.0, 11.0, 17.0, 11.0, 17.0, 10.0, 5.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-9.112117767333984, -8.818464279174805, -8.524810791015625, -8.231157302856445, -7.937503814697266, -7.643850326538086, -7.350196838378906, -7.056543350219727, -6.762889862060547, -6.469236373901367, -6.1755828857421875, -5.881929397583008, -5.588275909423828, -5.294622421264648, -5.000968933105469, -4.707315444946289, -4.413661956787109, -4.12000846862793, -3.82635498046875, -3.5327014923095703, -3.2390480041503906, -2.945394515991211, -2.6517410278320312, -2.3580875396728516, -2.064434051513672, -1.7707805633544922, -1.4771270751953125, -1.1834735870361328, -0.8898200988769531, -0.5961666107177734, -0.30251312255859375, -0.008859634399414062, 0.2847938537597656, 0.5784473419189453, 0.872100830078125, 1.1657543182373047, 1.4594078063964844, 1.753061294555664, 2.0467147827148438, 2.3403682708740234, 2.634021759033203, 2.927675247192383, 3.2213287353515625, 3.514982223510742, 3.808635711669922, 4.102289199829102, 4.395942687988281, 4.689596176147461, 4.983249664306641, 5.27690315246582, 5.570556640625, 5.86421012878418, 6.157863616943359, 6.451517105102539, 6.745170593261719, 7.038824081420898, 7.332477569580078, 7.626131057739258, 7.9197845458984375, 8.213438034057617, 8.507091522216797, 8.800745010375977, 9.094398498535156, 9.388051986694336, 9.681705474853516]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 13.0, 7.0, 17.0, 14.0, 19.0, 25.0, 24.0, 43.0, 52.0, 92.0, 145.0, 221.0, 400.0, 629.0, 1079.0, 2005.0, 3759.0, 8700.0, 34004.0, 699625.0, 3214161.0, 196065.0, 19562.0, 6407.0, 3012.0, 1723.0, 955.0, 589.0, 348.0, 213.0, 146.0, 75.0, 44.0, 31.0, 22.0, 18.0, 9.0, 11.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.451171875, -1.4048309326171875, -1.358489990234375, -1.3121490478515625, -1.26580810546875, -1.2194671630859375, -1.173126220703125, -1.1267852783203125, -1.0804443359375, -1.0341033935546875, -0.987762451171875, -0.9414215087890625, -0.89508056640625, -0.8487396240234375, -0.802398681640625, -0.7560577392578125, -0.709716796875, -0.6633758544921875, -0.617034912109375, -0.5706939697265625, -0.52435302734375, -0.4780120849609375, -0.431671142578125, -0.3853302001953125, -0.3389892578125, -0.2926483154296875, -0.246307373046875, -0.1999664306640625, -0.15362548828125, -0.1072845458984375, -0.060943603515625, -0.0146026611328125, 0.03173828125, 0.0780792236328125, 0.124420166015625, 0.1707611083984375, 0.21710205078125, 0.2634429931640625, 0.309783935546875, 0.3561248779296875, 0.4024658203125, 0.4488067626953125, 0.495147705078125, 0.5414886474609375, 0.58782958984375, 0.6341705322265625, 0.680511474609375, 0.7268524169921875, 0.773193359375, 0.8195343017578125, 0.865875244140625, 0.9122161865234375, 0.95855712890625, 1.0048980712890625, 1.051239013671875, 1.0975799560546875, 1.1439208984375, 1.1902618408203125, 1.236602783203125, 1.2829437255859375, 1.32928466796875, 1.3756256103515625, 1.421966552734375, 1.4683074951171875, 1.5146484375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 4.0, 7.0, 5.0, 4.0, 14.0, 4.0, 12.0, 17.0, 19.0, 12.0, 19.0, 34.0, 30.0, 41.0, 27.0, 33.0, 39.0, 39.0, 42.0, 51.0, 32.0, 54.0, 46.0, 45.0, 45.0, 47.0, 49.0, 30.0, 35.0, 30.0, 24.0, 15.0, 23.0, 10.0, 20.0, 10.0, 7.0, 8.0, 5.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5263671875, -0.5102996826171875, -0.494232177734375, -0.4781646728515625, -0.46209716796875, -0.4460296630859375, -0.429962158203125, -0.4138946533203125, -0.3978271484375, -0.3817596435546875, -0.365692138671875, -0.3496246337890625, -0.33355712890625, -0.3174896240234375, -0.301422119140625, -0.2853546142578125, -0.269287109375, -0.2532196044921875, -0.237152099609375, -0.2210845947265625, -0.20501708984375, -0.1889495849609375, -0.172882080078125, -0.1568145751953125, -0.1407470703125, -0.1246795654296875, -0.108612060546875, -0.0925445556640625, -0.07647705078125, -0.0604095458984375, -0.044342041015625, -0.0282745361328125, -0.01220703125, 0.0038604736328125, 0.019927978515625, 0.0359954833984375, 0.05206298828125, 0.0681304931640625, 0.084197998046875, 0.1002655029296875, 0.1163330078125, 0.1324005126953125, 0.148468017578125, 0.1645355224609375, 0.18060302734375, 0.1966705322265625, 0.212738037109375, 0.2288055419921875, 0.244873046875, 0.2609405517578125, 0.277008056640625, 0.2930755615234375, 0.30914306640625, 0.3252105712890625, 0.341278076171875, 0.3573455810546875, 0.3734130859375, 0.3894805908203125, 0.405548095703125, 0.4216156005859375, 0.43768310546875, 0.4537506103515625, 0.469818115234375, 0.4858856201171875, 0.501953125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 4.0, 7.0, 4.0, 12.0, 27.0, 55.0, 126.0, 198.0, 477.0, 942.0, 3025.0, 33778.0, 4100633.0, 49277.0, 3687.0, 1091.0, 496.0, 222.0, 119.0, 40.0, 26.0, 19.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.953125, -4.79095458984375, -4.6287841796875, -4.46661376953125, -4.304443359375, -4.14227294921875, -3.9801025390625, -3.81793212890625, -3.65576171875, -3.49359130859375, -3.3314208984375, -3.16925048828125, -3.007080078125, -2.84490966796875, -2.6827392578125, -2.52056884765625, -2.3583984375, -2.19622802734375, -2.0340576171875, -1.87188720703125, -1.709716796875, -1.54754638671875, -1.3853759765625, -1.22320556640625, -1.06103515625, -0.89886474609375, -0.7366943359375, -0.57452392578125, -0.412353515625, -0.25018310546875, -0.0880126953125, 0.07415771484375, 0.236328125, 0.39849853515625, 0.5606689453125, 0.72283935546875, 0.885009765625, 1.04718017578125, 1.2093505859375, 1.37152099609375, 1.53369140625, 1.69586181640625, 1.8580322265625, 2.02020263671875, 2.182373046875, 2.34454345703125, 2.5067138671875, 2.66888427734375, 2.8310546875, 2.99322509765625, 3.1553955078125, 3.31756591796875, 3.479736328125, 3.64190673828125, 3.8040771484375, 3.96624755859375, 4.12841796875, 4.29058837890625, 4.4527587890625, 4.61492919921875, 4.777099609375, 4.93927001953125, 5.1014404296875, 5.26361083984375, 5.42578125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 7.0, 21.0, 48.0, 74.0, 201.0, 569.0, 1625.0, 1031.0, 277.0, 104.0, 45.0, 24.0, 15.0, 6.0, 7.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.861328125, -3.749908447265625, -3.63848876953125, -3.527069091796875, -3.4156494140625, -3.304229736328125, -3.19281005859375, -3.081390380859375, -2.969970703125, -2.858551025390625, -2.74713134765625, -2.635711669921875, -2.5242919921875, -2.412872314453125, -2.30145263671875, -2.190032958984375, -2.07861328125, -1.967193603515625, -1.85577392578125, -1.744354248046875, -1.6329345703125, -1.521514892578125, -1.41009521484375, -1.298675537109375, -1.187255859375, -1.075836181640625, -0.96441650390625, -0.852996826171875, -0.7415771484375, -0.630157470703125, -0.51873779296875, -0.407318115234375, -0.2958984375, -0.184478759765625, -0.07305908203125, 0.038360595703125, 0.1497802734375, 0.261199951171875, 0.37261962890625, 0.484039306640625, 0.595458984375, 0.706878662109375, 0.81829833984375, 0.929718017578125, 1.0411376953125, 1.152557373046875, 1.26397705078125, 1.375396728515625, 1.48681640625, 1.598236083984375, 1.70965576171875, 1.821075439453125, 1.9324951171875, 2.043914794921875, 2.15533447265625, 2.266754150390625, 2.378173828125, 2.489593505859375, 2.60101318359375, 2.712432861328125, 2.8238525390625, 2.935272216796875, 3.04669189453125, 3.158111572265625, 3.26953125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 13.0, 12.0, 20.0, 28.0, 50.0, 94.0, 140.0, 196.0, 157.0, 113.0, 65.0, 40.0, 27.0, 13.0, 8.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.471111297607422, -11.894577026367188, -11.318042755126953, -10.741509437561035, -10.1649751663208, -9.588440895080566, -9.011907577514648, -8.435373306274414, -7.85883903503418, -7.282304763793945, -6.705770969390869, -6.129237174987793, -5.552702903747559, -4.976168632507324, -4.399634838104248, -3.823101043701172, -3.2465667724609375, -2.6700327396392822, -2.093498706817627, -1.5169646739959717, -0.9404306411743164, -0.36389660835266113, 0.21263742446899414, 0.7891712188720703, 1.3657054901123047, 1.94223952293396, 2.5187735557556152, 3.0953075885772705, 3.671841621398926, 4.24837589263916, 4.824909687042236, 5.4014434814453125, 5.977977752685547, 6.554512023925781, 7.131045818328857, 7.707579612731934, 8.284113883972168, 8.860648155212402, 9.43718147277832, 10.013715744018555, 10.590250015258789, 11.166784286499023, 11.743318557739258, 12.319851875305176, 12.89638614654541, 13.472920417785645, 14.049453735351562, 14.625988006591797, 15.202522277832031, 15.779056549072266, 16.3555908203125, 16.932125091552734, 17.50865936279297, 18.08519172668457, 18.661725997924805, 19.23826026916504, 19.814794540405273, 20.391328811645508, 20.967863082885742, 21.544397354125977, 22.120929718017578, 22.697463989257812, 23.273998260498047, 23.85053253173828, 24.427066802978516]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 6.0, 3.0, 4.0, 8.0, 6.0, 17.0, 15.0, 15.0, 29.0, 26.0, 31.0, 18.0, 42.0, 44.0, 47.0, 65.0, 55.0, 68.0, 63.0, 71.0, 46.0, 46.0, 44.0, 35.0, 33.0, 33.0, 20.0, 19.0, 14.0, 18.0, 15.0, 8.0, 9.0, 6.0, 4.0, 5.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.278467178344727, -7.967028617858887, -7.655590057373047, -7.344151496887207, -7.032712936401367, -6.721274375915527, -6.409836292266846, -6.098397731781006, -5.786959171295166, -5.475520610809326, -5.164082050323486, -4.8526434898376465, -4.541205406188965, -4.229766845703125, -3.918328285217285, -3.6068897247314453, -3.2954511642456055, -2.9840126037597656, -2.672574043273926, -2.361135721206665, -2.049697160720825, -1.7382586002349854, -1.426820158958435, -1.1153817176818848, -0.8039431571960449, -0.49250465631484985, -0.18106615543365479, 0.13037234544754028, 0.44181084632873535, 0.7532494068145752, 1.0646878480911255, 1.3761262893676758, 1.6875648498535156, 1.9990034103393555, 2.3104419708251953, 2.621880292892456, 2.933318853378296, 3.2447574138641357, 3.5561957359313965, 3.8676342964172363, 4.179072856903076, 4.490511417388916, 4.801949977874756, 5.113388538360596, 5.424826622009277, 5.736265182495117, 6.047703742980957, 6.359142303466797, 6.670580863952637, 6.982019424438477, 7.293457984924316, 7.604896545410156, 7.916335105895996, 8.227773666381836, 8.539212226867676, 8.850650787353516, 9.162088394165039, 9.473526954650879, 9.784965515136719, 10.096404075622559, 10.407842636108398, 10.719281196594238, 11.030719757080078, 11.342157363891602, 11.653596878051758]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 4.0, 16.0, 18.0, 9.0, 24.0, 47.0, 44.0, 73.0, 119.0, 186.0, 288.0, 383.0, 651.0, 1083.0, 1654.0, 2944.0, 5004.0, 9176.0, 17209.0, 34868.0, 77354.0, 193205.0, 369175.0, 187694.0, 75087.0, 34241.0, 16599.0, 9069.0, 4878.0, 2906.0, 1709.0, 1028.0, 690.0, 397.0, 249.0, 152.0, 101.0, 73.0, 38.0, 32.0, 26.0, 13.0, 15.0, 9.0, 6.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.0, -0.9692153930664062, -0.9384307861328125, -0.9076461791992188, -0.876861572265625, -0.8460769653320312, -0.8152923583984375, -0.7845077514648438, -0.75372314453125, -0.7229385375976562, -0.6921539306640625, -0.6613693237304688, -0.630584716796875, -0.5998001098632812, -0.5690155029296875, -0.5382308959960938, -0.5074462890625, -0.47666168212890625, -0.4458770751953125, -0.41509246826171875, -0.384307861328125, -0.35352325439453125, -0.3227386474609375, -0.29195404052734375, -0.26116943359375, -0.23038482666015625, -0.1996002197265625, -0.16881561279296875, -0.138031005859375, -0.10724639892578125, -0.0764617919921875, -0.04567718505859375, -0.014892578125, 0.01589202880859375, 0.0466766357421875, 0.07746124267578125, 0.108245849609375, 0.13903045654296875, 0.1698150634765625, 0.20059967041015625, 0.23138427734375, 0.26216888427734375, 0.2929534912109375, 0.32373809814453125, 0.354522705078125, 0.38530731201171875, 0.4160919189453125, 0.44687652587890625, 0.4776611328125, 0.5084457397460938, 0.5392303466796875, 0.5700149536132812, 0.600799560546875, 0.6315841674804688, 0.6623687744140625, 0.6931533813476562, 0.72393798828125, 0.7547225952148438, 0.7855072021484375, 0.8162918090820312, 0.847076416015625, 0.8778610229492188, 0.9086456298828125, 0.9394302368164062, 0.97021484375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 8.0, 7.0, 5.0, 14.0, 9.0, 12.0, 12.0, 13.0, 18.0, 34.0, 25.0, 24.0, 41.0, 32.0, 31.0, 45.0, 42.0, 39.0, 37.0, 45.0, 52.0, 53.0, 51.0, 49.0, 29.0, 46.0, 22.0, 37.0, 40.0, 22.0, 19.0, 14.0, 12.0, 16.0, 9.0, 7.0, 8.0, 6.0, 4.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.72216796875, -0.70135498046875, -0.6805419921875, -0.65972900390625, -0.638916015625, -0.61810302734375, -0.5972900390625, -0.57647705078125, -0.5556640625, -0.53485107421875, -0.5140380859375, -0.49322509765625, -0.472412109375, -0.45159912109375, -0.4307861328125, -0.40997314453125, -0.38916015625, -0.36834716796875, -0.3475341796875, -0.32672119140625, -0.305908203125, -0.28509521484375, -0.2642822265625, -0.24346923828125, -0.22265625, -0.20184326171875, -0.1810302734375, -0.16021728515625, -0.139404296875, -0.11859130859375, -0.0977783203125, -0.07696533203125, -0.05615234375, -0.03533935546875, -0.0145263671875, 0.00628662109375, 0.027099609375, 0.04791259765625, 0.0687255859375, 0.08953857421875, 0.1103515625, 0.13116455078125, 0.1519775390625, 0.17279052734375, 0.193603515625, 0.21441650390625, 0.2352294921875, 0.25604248046875, 0.27685546875, 0.29766845703125, 0.3184814453125, 0.33929443359375, 0.360107421875, 0.38092041015625, 0.4017333984375, 0.42254638671875, 0.443359375, 0.46417236328125, 0.4849853515625, 0.50579833984375, 0.526611328125, 0.54742431640625, 0.5682373046875, 0.58905029296875, 0.60986328125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 8.0, 10.0, 9.0, 26.0, 23.0, 26.0, 48.0, 75.0, 76.0, 113.0, 171.0, 227.0, 320.0, 534.0, 884.0, 1715.0, 4233.0, 15703.0, 113338.0, 821190.0, 70932.0, 11658.0, 3388.0, 1502.0, 810.0, 512.0, 318.0, 195.0, 132.0, 108.0, 76.0, 53.0, 43.0, 21.0, 30.0, 20.0, 12.0, 13.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.09375, -3.008758544921875, -2.92376708984375, -2.838775634765625, -2.7537841796875, -2.668792724609375, -2.58380126953125, -2.498809814453125, -2.413818359375, -2.328826904296875, -2.24383544921875, -2.158843994140625, -2.0738525390625, -1.988861083984375, -1.90386962890625, -1.818878173828125, -1.73388671875, -1.648895263671875, -1.56390380859375, -1.478912353515625, -1.3939208984375, -1.308929443359375, -1.22393798828125, -1.138946533203125, -1.053955078125, -0.968963623046875, -0.88397216796875, -0.798980712890625, -0.7139892578125, -0.628997802734375, -0.54400634765625, -0.459014892578125, -0.3740234375, -0.289031982421875, -0.20404052734375, -0.119049072265625, -0.0340576171875, 0.050933837890625, 0.13592529296875, 0.220916748046875, 0.305908203125, 0.390899658203125, 0.47589111328125, 0.560882568359375, 0.6458740234375, 0.730865478515625, 0.81585693359375, 0.900848388671875, 0.98583984375, 1.070831298828125, 1.15582275390625, 1.240814208984375, 1.3258056640625, 1.410797119140625, 1.49578857421875, 1.580780029296875, 1.665771484375, 1.750762939453125, 1.83575439453125, 1.920745849609375, 2.0057373046875, 2.090728759765625, 2.17572021484375, 2.260711669921875, 2.345703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 3.0, 9.0, 10.0, 8.0, 8.0, 13.0, 12.0, 10.0, 19.0, 26.0, 22.0, 27.0, 44.0, 35.0, 44.0, 31.0, 60.0, 51.0, 48.0, 77.0, 61.0, 56.0, 44.0, 43.0, 38.0, 22.0, 25.0, 23.0, 21.0, 25.0, 15.0, 11.0, 6.0, 8.0, 8.0, 4.0, 4.0, 6.0, 2.0, 0.0, 5.0, 0.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.580078125, -2.4906005859375, -2.401123046875, -2.3116455078125, -2.22216796875, -2.1326904296875, -2.043212890625, -1.9537353515625, -1.8642578125, -1.7747802734375, -1.685302734375, -1.5958251953125, -1.50634765625, -1.4168701171875, -1.327392578125, -1.2379150390625, -1.1484375, -1.0589599609375, -0.969482421875, -0.8800048828125, -0.79052734375, -0.7010498046875, -0.611572265625, -0.5220947265625, -0.4326171875, -0.3431396484375, -0.253662109375, -0.1641845703125, -0.07470703125, 0.0147705078125, 0.104248046875, 0.1937255859375, 0.283203125, 0.3726806640625, 0.462158203125, 0.5516357421875, 0.64111328125, 0.7305908203125, 0.820068359375, 0.9095458984375, 0.9990234375, 1.0885009765625, 1.177978515625, 1.2674560546875, 1.35693359375, 1.4464111328125, 1.535888671875, 1.6253662109375, 1.71484375, 1.8043212890625, 1.893798828125, 1.9832763671875, 2.07275390625, 2.1622314453125, 2.251708984375, 2.3411865234375, 2.4306640625, 2.5201416015625, 2.609619140625, 2.6990966796875, 2.78857421875, 2.8780517578125, 2.967529296875, 3.0570068359375, 3.146484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 11.0, 6.0, 4.0, 11.0, 10.0, 19.0, 15.0, 39.0, 58.0, 83.0, 121.0, 216.0, 283.0, 571.0, 1039.0, 2161.0, 5190.0, 15881.0, 66861.0, 732081.0, 177286.0, 31089.0, 8895.0, 3268.0, 1460.0, 740.0, 449.0, 225.0, 162.0, 100.0, 58.0, 39.0, 31.0, 22.0, 23.0, 8.0, 7.0, 11.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.7900390625, -0.7651596069335938, -0.7402801513671875, -0.7154006958007812, -0.690521240234375, -0.6656417846679688, -0.6407623291015625, -0.6158828735351562, -0.59100341796875, -0.5661239624023438, -0.5412445068359375, -0.5163650512695312, -0.491485595703125, -0.46660614013671875, -0.4417266845703125, -0.41684722900390625, -0.3919677734375, -0.36708831787109375, -0.3422088623046875, -0.31732940673828125, -0.292449951171875, -0.26757049560546875, -0.2426910400390625, -0.21781158447265625, -0.19293212890625, -0.16805267333984375, -0.1431732177734375, -0.11829376220703125, -0.093414306640625, -0.06853485107421875, -0.0436553955078125, -0.01877593994140625, 0.006103515625, 0.03098297119140625, 0.0558624267578125, 0.08074188232421875, 0.105621337890625, 0.13050079345703125, 0.1553802490234375, 0.18025970458984375, 0.20513916015625, 0.23001861572265625, 0.2548980712890625, 0.27977752685546875, 0.304656982421875, 0.32953643798828125, 0.3544158935546875, 0.37929534912109375, 0.4041748046875, 0.42905426025390625, 0.4539337158203125, 0.47881317138671875, 0.503692626953125, 0.5285720825195312, 0.5534515380859375, 0.5783309936523438, 0.60321044921875, 0.6280899047851562, 0.6529693603515625, 0.6778488159179688, 0.702728271484375, 0.7276077270507812, 0.7524871826171875, 0.7773666381835938, 0.80224609375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 4.0, 4.0, 9.0, 8.0, 4.0, 10.0, 15.0, 20.0, 18.0, 28.0, 27.0, 55.0, 61.0, 79.0, 103.0, 163.0, 99.0, 61.0, 57.0, 37.0, 37.0, 19.0, 12.0, 6.0, 13.0, 10.0, 6.0, 6.0, 8.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00031447410583496094, -0.0003055669367313385, -0.00029665976762771606, -0.00028775259852409363, -0.0002788454294204712, -0.00026993826031684875, -0.0002610310912132263, -0.0002521239221096039, -0.00024321675300598145, -0.000234309583902359, -0.00022540241479873657, -0.00021649524569511414, -0.0002075880765914917, -0.00019868090748786926, -0.00018977373838424683, -0.0001808665692806244, -0.00017195940017700195, -0.00016305223107337952, -0.00015414506196975708, -0.00014523789286613464, -0.0001363307237625122, -0.00012742355465888977, -0.00011851638555526733, -0.0001096092164516449, -0.00010070204734802246, -9.179487824440002e-05, -8.288770914077759e-05, -7.398054003715515e-05, -6.507337093353271e-05, -5.616620182991028e-05, -4.725903272628784e-05, -3.8351863622665405e-05, -2.944469451904297e-05, -2.0537525415420532e-05, -1.1630356311798096e-05, -2.723187208175659e-06, 6.183981895446777e-06, 1.5091150999069214e-05, 2.399832010269165e-05, 3.290548920631409e-05, 4.1812658309936523e-05, 5.071982741355896e-05, 5.9626996517181396e-05, 6.853416562080383e-05, 7.744133472442627e-05, 8.63485038280487e-05, 9.525567293167114e-05, 0.00010416284203529358, 0.00011307001113891602, 0.00012197718024253845, 0.0001308843493461609, 0.00013979151844978333, 0.00014869868755340576, 0.0001576058566570282, 0.00016651302576065063, 0.00017542019486427307, 0.0001843273639678955, 0.00019323453307151794, 0.00020214170217514038, 0.00021104887127876282, 0.00021995604038238525, 0.0002288632094860077, 0.00023777037858963013, 0.00024667754769325256, 0.000255584716796875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 3.0, 4.0, 7.0, 11.0, 20.0, 24.0, 28.0, 33.0, 79.0, 107.0, 160.0, 224.0, 430.0, 844.0, 1668.0, 4315.0, 13870.0, 64100.0, 725720.0, 192955.0, 30673.0, 7777.0, 2772.0, 1163.0, 595.0, 332.0, 185.0, 150.0, 85.0, 71.0, 45.0, 25.0, 21.0, 16.0, 8.0, 6.0, 8.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.697265625, -0.67303466796875, -0.6488037109375, -0.62457275390625, -0.600341796875, -0.57611083984375, -0.5518798828125, -0.52764892578125, -0.50341796875, -0.47918701171875, -0.4549560546875, -0.43072509765625, -0.406494140625, -0.38226318359375, -0.3580322265625, -0.33380126953125, -0.3095703125, -0.28533935546875, -0.2611083984375, -0.23687744140625, -0.212646484375, -0.18841552734375, -0.1641845703125, -0.13995361328125, -0.11572265625, -0.09149169921875, -0.0672607421875, -0.04302978515625, -0.018798828125, 0.00543212890625, 0.0296630859375, 0.05389404296875, 0.078125, 0.10235595703125, 0.1265869140625, 0.15081787109375, 0.175048828125, 0.19927978515625, 0.2235107421875, 0.24774169921875, 0.27197265625, 0.29620361328125, 0.3204345703125, 0.34466552734375, 0.368896484375, 0.39312744140625, 0.4173583984375, 0.44158935546875, 0.4658203125, 0.49005126953125, 0.5142822265625, 0.53851318359375, 0.562744140625, 0.58697509765625, 0.6112060546875, 0.63543701171875, 0.65966796875, 0.68389892578125, 0.7081298828125, 0.73236083984375, 0.756591796875, 0.78082275390625, 0.8050537109375, 0.82928466796875, 0.853515625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 4.0, 5.0, 7.0, 4.0, 9.0, 10.0, 17.0, 25.0, 20.0, 28.0, 42.0, 37.0, 42.0, 58.0, 72.0, 109.0, 108.0, 85.0, 67.0, 51.0, 38.0, 34.0, 27.0, 15.0, 9.0, 15.0, 9.0, 13.0, 9.0, 15.0, 9.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.666015625, -0.6470413208007812, -0.6280670166015625, -0.6090927124023438, -0.590118408203125, -0.5711441040039062, -0.5521697998046875, -0.5331954956054688, -0.51422119140625, -0.49524688720703125, -0.4762725830078125, -0.45729827880859375, -0.438323974609375, -0.41934967041015625, -0.4003753662109375, -0.38140106201171875, -0.3624267578125, -0.34345245361328125, -0.3244781494140625, -0.30550384521484375, -0.286529541015625, -0.26755523681640625, -0.2485809326171875, -0.22960662841796875, -0.21063232421875, -0.19165802001953125, -0.1726837158203125, -0.15370941162109375, -0.134735107421875, -0.11576080322265625, -0.0967864990234375, -0.07781219482421875, -0.058837890625, -0.03986358642578125, -0.0208892822265625, -0.00191497802734375, 0.017059326171875, 0.03603363037109375, 0.0550079345703125, 0.07398223876953125, 0.09295654296875, 0.11193084716796875, 0.1309051513671875, 0.14987945556640625, 0.168853759765625, 0.18782806396484375, 0.2068023681640625, 0.22577667236328125, 0.2447509765625, 0.26372528076171875, 0.2826995849609375, 0.30167388916015625, 0.320648193359375, 0.33962249755859375, 0.3585968017578125, 0.37757110595703125, 0.39654541015625, 0.41551971435546875, 0.4344940185546875, 0.45346832275390625, 0.472442626953125, 0.49141693115234375, 0.5103912353515625, 0.5293655395507812, 0.54833984375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 13.0, 32.0, 113.0, 349.0, 320.0, 100.0, 45.0, 16.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.54279327392578, -41.529170989990234, -40.51555252075195, -39.501930236816406, -38.488311767578125, -37.47468948364258, -36.46106719970703, -35.44744873046875, -34.4338264465332, -33.420204162597656, -32.406585693359375, -31.392963409423828, -30.379343032836914, -29.36572265625, -28.352102279663086, -27.338481903076172, -26.324861526489258, -25.311241149902344, -24.29762077331543, -23.284000396728516, -22.27037811279297, -21.256757736206055, -20.24313735961914, -19.229516983032227, -18.215896606445312, -17.2022762298584, -16.188655853271484, -15.175034523010254, -14.161413192749023, -13.14779281616211, -12.134172439575195, -11.120552062988281, -10.106929779052734, -9.09330940246582, -8.07968807220459, -7.066067695617676, -6.0524468421936035, -5.038825988769531, -4.025205612182617, -3.011584758758545, -1.9979639053344727, -0.9843431711196899, 0.029277563095092773, 1.042898178100586, 2.056519031524658, 3.0701398849487305, 4.0837602615356445, 5.097381114959717, 6.111001968383789, 7.124622821807861, 8.138243675231934, 9.151864051818848, 10.165485382080078, 11.179105758666992, 12.192726135253906, 13.20634651184082, 14.21996784210205, 15.233588218688965, 16.247209548950195, 17.26082992553711, 18.274450302124023, 19.288070678710938, 20.301692962646484, 21.3153133392334, 22.328933715820312]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 5.0, 7.0, 9.0, 9.0, 11.0, 9.0, 15.0, 11.0, 14.0, 17.0, 15.0, 29.0, 35.0, 31.0, 35.0, 29.0, 38.0, 63.0, 180.0, 109.0, 45.0, 37.0, 29.0, 28.0, 24.0, 25.0, 24.0, 17.0, 18.0, 16.0, 19.0, 13.0, 5.0, 8.0, 7.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.030384063720703, -14.596818923950195, -14.163253784179688, -13.72968864440918, -13.296123504638672, -12.862558364868164, -12.42899227142334, -11.995427131652832, -11.561861991882324, -11.128296852111816, -10.694731712341309, -10.2611665725708, -9.827600479125977, -9.394035339355469, -8.960470199584961, -8.526905059814453, -8.093339920043945, -7.6597747802734375, -7.22620964050293, -6.792644023895264, -6.359078884124756, -5.925513744354248, -5.491948127746582, -5.058382987976074, -4.624817848205566, -4.191252708435059, -3.7576873302459717, -3.3241219520568848, -2.890556812286377, -2.456991672515869, -2.0234262943267822, -1.5898609161376953, -1.156296730041504, -0.7227314710617065, -0.2891662120819092, 0.14439904689788818, 0.5779643058776855, 1.0115294456481934, 1.4450948238372803, 1.8786602020263672, 2.312225341796875, 2.745790481567383, 3.1793558597564697, 3.6129212379455566, 4.0464863777160645, 4.480051517486572, 4.913617134094238, 5.347182273864746, 5.780747413635254, 6.214312553405762, 6.6478776931762695, 7.0814433097839355, 7.515008449554443, 7.948573589324951, 8.382139205932617, 8.815704345703125, 9.249269485473633, 9.68283462524414, 10.116399765014648, 10.549964904785156, 10.983530044555664, 11.417095184326172, 11.850661277770996, 12.284226417541504, 12.717791557312012]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 8.0, 11.0, 7.0, 7.0, 10.0, 22.0, 30.0, 29.0, 41.0, 59.0, 119.0, 180.0, 317.0, 513.0, 1034.0, 2205.0, 5265.0, 15154.0, 74637.0, 1331726.0, 2584543.0, 142533.0, 22917.0, 7263.0, 2837.0, 1274.0, 685.0, 328.0, 207.0, 103.0, 60.0, 59.0, 35.0, 19.0, 16.0, 9.0, 5.0, 5.0, 2.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.568359375, -2.501007080078125, -2.43365478515625, -2.366302490234375, -2.2989501953125, -2.231597900390625, -2.16424560546875, -2.096893310546875, -2.029541015625, -1.962188720703125, -1.89483642578125, -1.827484130859375, -1.7601318359375, -1.692779541015625, -1.62542724609375, -1.558074951171875, -1.49072265625, -1.423370361328125, -1.35601806640625, -1.288665771484375, -1.2213134765625, -1.153961181640625, -1.08660888671875, -1.019256591796875, -0.951904296875, -0.884552001953125, -0.81719970703125, -0.749847412109375, -0.6824951171875, -0.615142822265625, -0.54779052734375, -0.480438232421875, -0.4130859375, -0.345733642578125, -0.27838134765625, -0.211029052734375, -0.1436767578125, -0.076324462890625, -0.00897216796875, 0.058380126953125, 0.125732421875, 0.193084716796875, 0.26043701171875, 0.327789306640625, 0.3951416015625, 0.462493896484375, 0.52984619140625, 0.597198486328125, 0.66455078125, 0.731903076171875, 0.79925537109375, 0.866607666015625, 0.9339599609375, 1.001312255859375, 1.06866455078125, 1.136016845703125, 1.203369140625, 1.270721435546875, 1.33807373046875, 1.405426025390625, 1.4727783203125, 1.540130615234375, 1.60748291015625, 1.674835205078125, 1.7421875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 5.0, 5.0, 4.0, 10.0, 9.0, 13.0, 13.0, 15.0, 13.0, 32.0, 34.0, 31.0, 30.0, 38.0, 48.0, 51.0, 53.0, 40.0, 52.0, 54.0, 53.0, 44.0, 56.0, 31.0, 43.0, 39.0, 19.0, 26.0, 19.0, 30.0, 19.0, 11.0, 19.0, 8.0, 8.0, 9.0, 3.0, 4.0, 8.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.74072265625, -0.7195816040039062, -0.6984405517578125, -0.6772994995117188, -0.656158447265625, -0.6350173950195312, -0.6138763427734375, -0.5927352905273438, -0.57159423828125, -0.5504531860351562, -0.5293121337890625, -0.5081710815429688, -0.487030029296875, -0.46588897705078125, -0.4447479248046875, -0.42360687255859375, -0.4024658203125, -0.38132476806640625, -0.3601837158203125, -0.33904266357421875, -0.317901611328125, -0.29676055908203125, -0.2756195068359375, -0.25447845458984375, -0.23333740234375, -0.21219635009765625, -0.1910552978515625, -0.16991424560546875, -0.148773193359375, -0.12763214111328125, -0.1064910888671875, -0.08535003662109375, -0.064208984375, -0.04306793212890625, -0.0219268798828125, -0.00078582763671875, 0.020355224609375, 0.04149627685546875, 0.0626373291015625, 0.08377838134765625, 0.10491943359375, 0.12606048583984375, 0.1472015380859375, 0.16834259033203125, 0.189483642578125, 0.21062469482421875, 0.2317657470703125, 0.25290679931640625, 0.2740478515625, 0.29518890380859375, 0.3163299560546875, 0.33747100830078125, 0.358612060546875, 0.37975311279296875, 0.4008941650390625, 0.42203521728515625, 0.44317626953125, 0.46431732177734375, 0.4854583740234375, 0.5065994262695312, 0.527740478515625, 0.5488815307617188, 0.5700225830078125, 0.5911636352539062, 0.6123046875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 8.0, 17.0, 12.0, 15.0, 18.0, 39.0, 54.0, 87.0, 185.0, 309.0, 663.0, 1736.0, 7853.0, 210098.0, 3944732.0, 23254.0, 3145.0, 996.0, 405.0, 237.0, 131.0, 84.0, 52.0, 39.0, 32.0, 21.0, 9.0, 14.0, 6.0, 0.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.473388671875, -6.25927734375, -6.045166015625, -5.8310546875, -5.616943359375, -5.40283203125, -5.188720703125, -4.974609375, -4.760498046875, -4.54638671875, -4.332275390625, -4.1181640625, -3.904052734375, -3.68994140625, -3.475830078125, -3.26171875, -3.047607421875, -2.83349609375, -2.619384765625, -2.4052734375, -2.191162109375, -1.97705078125, -1.762939453125, -1.548828125, -1.334716796875, -1.12060546875, -0.906494140625, -0.6923828125, -0.478271484375, -0.26416015625, -0.050048828125, 0.1640625, 0.378173828125, 0.59228515625, 0.806396484375, 1.0205078125, 1.234619140625, 1.44873046875, 1.662841796875, 1.876953125, 2.091064453125, 2.30517578125, 2.519287109375, 2.7333984375, 2.947509765625, 3.16162109375, 3.375732421875, 3.58984375, 3.803955078125, 4.01806640625, 4.232177734375, 4.4462890625, 4.660400390625, 4.87451171875, 5.088623046875, 5.302734375, 5.516845703125, 5.73095703125, 5.945068359375, 6.1591796875, 6.373291015625, 6.58740234375, 6.801513671875, 7.015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 8.0, 10.0, 9.0, 18.0, 18.0, 25.0, 36.0, 56.0, 61.0, 115.0, 156.0, 211.0, 421.0, 724.0, 871.0, 497.0, 283.0, 176.0, 122.0, 76.0, 48.0, 36.0, 22.0, 18.0, 14.0, 11.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.076171875, -2.98046875, -2.884765625, -2.7890625, -2.693359375, -2.59765625, -2.501953125, -2.40625, -2.310546875, -2.21484375, -2.119140625, -2.0234375, -1.927734375, -1.83203125, -1.736328125, -1.640625, -1.544921875, -1.44921875, -1.353515625, -1.2578125, -1.162109375, -1.06640625, -0.970703125, -0.875, -0.779296875, -0.68359375, -0.587890625, -0.4921875, -0.396484375, -0.30078125, -0.205078125, -0.109375, -0.013671875, 0.08203125, 0.177734375, 0.2734375, 0.369140625, 0.46484375, 0.560546875, 0.65625, 0.751953125, 0.84765625, 0.943359375, 1.0390625, 1.134765625, 1.23046875, 1.326171875, 1.421875, 1.517578125, 1.61328125, 1.708984375, 1.8046875, 1.900390625, 1.99609375, 2.091796875, 2.1875, 2.283203125, 2.37890625, 2.474609375, 2.5703125, 2.666015625, 2.76171875, 2.857421875, 2.953125, 3.048828125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 13.0, 33.0, 71.0, 155.0, 333.0, 243.0, 90.0, 31.0, 14.0, 7.0, 5.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.54647827148438, -87.66806030273438, -85.78964233398438, -83.91122436523438, -82.03280639648438, -80.15438842773438, -78.27597045898438, -76.39754486083984, -74.51912689208984, -72.64070892333984, -70.76229095458984, -68.88387298583984, -67.00545501708984, -65.12702941894531, -63.24861526489258, -61.37019729614258, -59.49177932739258, -57.61336135864258, -55.73494338989258, -53.85652160644531, -51.97810363769531, -50.09968566894531, -48.22126770019531, -46.34284973144531, -44.46443176269531, -42.58601379394531, -40.70759582519531, -38.82917785644531, -36.95075607299805, -35.07233810424805, -33.19392013549805, -31.315502166748047, -29.437076568603516, -27.558658599853516, -25.680238723754883, -23.801820755004883, -21.92340087890625, -20.04498291015625, -18.16656494140625, -16.28814697265625, -14.409727096557617, -12.5313081741333, -10.652889251708984, -8.774471282958984, -6.896052360534668, -5.017633438110352, -3.1392154693603516, -1.2607965469360352, 0.6176223754882812, 2.4960410594940186, 4.374459743499756, 6.252878189086914, 8.13129711151123, 10.009716033935547, 11.888134002685547, 13.766552925109863, 15.64497184753418, 17.52338981628418, 19.401809692382812, 21.280227661132812, 23.158645629882812, 25.037065505981445, 26.915483474731445, 28.793903350830078, 30.672321319580078]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 9.0, 11.0, 10.0, 20.0, 13.0, 24.0, 21.0, 35.0, 35.0, 44.0, 50.0, 43.0, 50.0, 67.0, 76.0, 57.0, 76.0, 52.0, 50.0, 34.0, 44.0, 35.0, 29.0, 20.0, 32.0, 14.0, 11.0, 8.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-25.032047271728516, -24.416133880615234, -23.800222396850586, -23.184309005737305, -22.568397521972656, -21.952484130859375, -21.336570739746094, -20.720657348632812, -20.104745864868164, -19.488832473754883, -18.872920989990234, -18.257007598876953, -17.641094207763672, -17.025182723999023, -16.409269332885742, -15.793356895446777, -15.177444458007812, -14.561532020568848, -13.945619583129883, -13.329706192016602, -12.713793754577637, -12.097881317138672, -11.48196792602539, -10.866055488586426, -10.250143051147461, -9.634230613708496, -9.018318176269531, -8.40240478515625, -7.786492347717285, -7.17057991027832, -6.554666996002197, -5.938754081726074, -5.322840690612793, -4.706928253173828, -4.091015338897705, -3.475102663040161, -2.859189987182617, -2.2432773113250732, -1.6273646354675293, -1.0114517211914062, -0.3955392837524414, 0.22037339210510254, 0.8362860679626465, 1.4521987438201904, 2.0681114196777344, 2.6840240955352783, 3.2999367713928223, 3.9158496856689453, 4.53176212310791, 5.147674560546875, 5.763587474822998, 6.379500389099121, 6.995412826538086, 7.611325263977051, 8.227237701416016, 8.843151092529297, 9.459063529968262, 10.074975967407227, 10.690889358520508, 11.306801795959473, 11.922714233398438, 12.538626670837402, 13.154539108276367, 13.770452499389648, 14.386364936828613]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 7.0, 9.0, 5.0, 15.0, 23.0, 33.0, 48.0, 81.0, 121.0, 171.0, 276.0, 523.0, 1002.0, 1815.0, 3682.0, 8726.0, 24226.0, 99175.0, 709441.0, 147916.0, 31592.0, 10663.0, 4407.0, 2035.0, 1046.0, 585.0, 342.0, 202.0, 122.0, 77.0, 60.0, 27.0, 34.0, 14.0, 14.0, 16.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.37109375, -2.300537109375, -2.22998046875, -2.159423828125, -2.0888671875, -2.018310546875, -1.94775390625, -1.877197265625, -1.806640625, -1.736083984375, -1.66552734375, -1.594970703125, -1.5244140625, -1.453857421875, -1.38330078125, -1.312744140625, -1.2421875, -1.171630859375, -1.10107421875, -1.030517578125, -0.9599609375, -0.889404296875, -0.81884765625, -0.748291015625, -0.677734375, -0.607177734375, -0.53662109375, -0.466064453125, -0.3955078125, -0.324951171875, -0.25439453125, -0.183837890625, -0.11328125, -0.042724609375, 0.02783203125, 0.098388671875, 0.1689453125, 0.239501953125, 0.31005859375, 0.380615234375, 0.451171875, 0.521728515625, 0.59228515625, 0.662841796875, 0.7333984375, 0.803955078125, 0.87451171875, 0.945068359375, 1.015625, 1.086181640625, 1.15673828125, 1.227294921875, 1.2978515625, 1.368408203125, 1.43896484375, 1.509521484375, 1.580078125, 1.650634765625, 1.72119140625, 1.791748046875, 1.8623046875, 1.932861328125, 2.00341796875, 2.073974609375, 2.14453125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 9.0, 10.0, 10.0, 11.0, 28.0, 27.0, 23.0, 46.0, 50.0, 64.0, 64.0, 89.0, 88.0, 84.0, 79.0, 57.0, 61.0, 48.0, 38.0, 28.0, 22.0, 13.0, 13.0, 9.0, 8.0, 12.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8544921875, -1.80267333984375, -1.7508544921875, -1.69903564453125, -1.647216796875, -1.59539794921875, -1.5435791015625, -1.49176025390625, -1.43994140625, -1.38812255859375, -1.3363037109375, -1.28448486328125, -1.232666015625, -1.18084716796875, -1.1290283203125, -1.07720947265625, -1.025390625, -0.97357177734375, -0.9217529296875, -0.86993408203125, -0.818115234375, -0.76629638671875, -0.7144775390625, -0.66265869140625, -0.61083984375, -0.55902099609375, -0.5072021484375, -0.45538330078125, -0.403564453125, -0.35174560546875, -0.2999267578125, -0.24810791015625, -0.1962890625, -0.14447021484375, -0.0926513671875, -0.04083251953125, 0.010986328125, 0.06280517578125, 0.1146240234375, 0.16644287109375, 0.21826171875, 0.27008056640625, 0.3218994140625, 0.37371826171875, 0.425537109375, 0.47735595703125, 0.5291748046875, 0.58099365234375, 0.6328125, 0.68463134765625, 0.7364501953125, 0.78826904296875, 0.840087890625, 0.89190673828125, 0.9437255859375, 0.99554443359375, 1.04736328125, 1.09918212890625, 1.1510009765625, 1.20281982421875, 1.254638671875, 1.30645751953125, 1.3582763671875, 1.41009521484375, 1.4619140625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 1.0, 5.0, 5.0, 6.0, 2.0, 15.0, 18.0, 16.0, 20.0, 30.0, 41.0, 55.0, 83.0, 110.0, 155.0, 266.0, 459.0, 863.0, 2104.0, 6772.0, 34849.0, 886839.0, 96658.0, 12837.0, 3456.0, 1281.0, 580.0, 340.0, 201.0, 158.0, 99.0, 57.0, 44.0, 31.0, 17.0, 19.0, 13.0, 14.0, 9.0, 6.0, 8.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.697265625, -2.60650634765625, -2.5157470703125, -2.42498779296875, -2.334228515625, -2.24346923828125, -2.1527099609375, -2.06195068359375, -1.97119140625, -1.88043212890625, -1.7896728515625, -1.69891357421875, -1.608154296875, -1.51739501953125, -1.4266357421875, -1.33587646484375, -1.2451171875, -1.15435791015625, -1.0635986328125, -0.97283935546875, -0.882080078125, -0.79132080078125, -0.7005615234375, -0.60980224609375, -0.51904296875, -0.42828369140625, -0.3375244140625, -0.24676513671875, -0.156005859375, -0.06524658203125, 0.0255126953125, 0.11627197265625, 0.20703125, 0.29779052734375, 0.3885498046875, 0.47930908203125, 0.570068359375, 0.66082763671875, 0.7515869140625, 0.84234619140625, 0.93310546875, 1.02386474609375, 1.1146240234375, 1.20538330078125, 1.296142578125, 1.38690185546875, 1.4776611328125, 1.56842041015625, 1.6591796875, 1.74993896484375, 1.8406982421875, 1.93145751953125, 2.022216796875, 2.11297607421875, 2.2037353515625, 2.29449462890625, 2.38525390625, 2.47601318359375, 2.5667724609375, 2.65753173828125, 2.748291015625, 2.83905029296875, 2.9298095703125, 3.02056884765625, 3.111328125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 6.0, 6.0, 12.0, 14.0, 18.0, 19.0, 16.0, 21.0, 35.0, 26.0, 34.0, 33.0, 42.0, 70.0, 68.0, 91.0, 83.0, 46.0, 52.0, 54.0, 43.0, 30.0, 31.0, 17.0, 22.0, 17.0, 15.0, 13.0, 12.0, 6.0, 3.0, 7.0, 3.0, 6.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.59765625, -4.456298828125, -4.31494140625, -4.173583984375, -4.0322265625, -3.890869140625, -3.74951171875, -3.608154296875, -3.466796875, -3.325439453125, -3.18408203125, -3.042724609375, -2.9013671875, -2.760009765625, -2.61865234375, -2.477294921875, -2.3359375, -2.194580078125, -2.05322265625, -1.911865234375, -1.7705078125, -1.629150390625, -1.48779296875, -1.346435546875, -1.205078125, -1.063720703125, -0.92236328125, -0.781005859375, -0.6396484375, -0.498291015625, -0.35693359375, -0.215576171875, -0.07421875, 0.067138671875, 0.20849609375, 0.349853515625, 0.4912109375, 0.632568359375, 0.77392578125, 0.915283203125, 1.056640625, 1.197998046875, 1.33935546875, 1.480712890625, 1.6220703125, 1.763427734375, 1.90478515625, 2.046142578125, 2.1875, 2.328857421875, 2.47021484375, 2.611572265625, 2.7529296875, 2.894287109375, 3.03564453125, 3.177001953125, 3.318359375, 3.459716796875, 3.60107421875, 3.742431640625, 3.8837890625, 4.025146484375, 4.16650390625, 4.307861328125, 4.44921875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 8.0, 13.0, 12.0, 20.0, 22.0, 34.0, 42.0, 70.0, 113.0, 230.0, 479.0, 1263.0, 3541.0, 16883.0, 934494.0, 79128.0, 8301.0, 2332.0, 782.0, 354.0, 134.0, 91.0, 53.0, 33.0, 19.0, 23.0, 14.0, 13.0, 13.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.169921875, -1.131927490234375, -1.09393310546875, -1.055938720703125, -1.0179443359375, -0.979949951171875, -0.94195556640625, -0.903961181640625, -0.865966796875, -0.827972412109375, -0.78997802734375, -0.751983642578125, -0.7139892578125, -0.675994873046875, -0.63800048828125, -0.600006103515625, -0.56201171875, -0.524017333984375, -0.48602294921875, -0.448028564453125, -0.4100341796875, -0.372039794921875, -0.33404541015625, -0.296051025390625, -0.258056640625, -0.220062255859375, -0.18206787109375, -0.144073486328125, -0.1060791015625, -0.068084716796875, -0.03009033203125, 0.007904052734375, 0.0458984375, 0.083892822265625, 0.12188720703125, 0.159881591796875, 0.1978759765625, 0.235870361328125, 0.27386474609375, 0.311859130859375, 0.349853515625, 0.387847900390625, 0.42584228515625, 0.463836669921875, 0.5018310546875, 0.539825439453125, 0.57781982421875, 0.615814208984375, 0.65380859375, 0.691802978515625, 0.72979736328125, 0.767791748046875, 0.8057861328125, 0.843780517578125, 0.88177490234375, 0.919769287109375, 0.957763671875, 0.995758056640625, 1.03375244140625, 1.071746826171875, 1.1097412109375, 1.147735595703125, 1.18572998046875, 1.223724365234375, 1.26171875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 0.0, 2.0, 4.0, 5.0, 5.0, 7.0, 8.0, 18.0, 19.0, 23.0, 22.0, 32.0, 65.0, 132.0, 200.0, 162.0, 88.0, 60.0, 36.0, 27.0, 17.0, 11.0, 11.0, 11.0, 9.0, 3.0, 3.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00028586387634277344, -0.00027718767523765564, -0.00026851147413253784, -0.00025983527302742004, -0.00025115907192230225, -0.00024248287081718445, -0.00023380666971206665, -0.00022513046860694885, -0.00021645426750183105, -0.00020777806639671326, -0.00019910186529159546, -0.00019042566418647766, -0.00018174946308135986, -0.00017307326197624207, -0.00016439706087112427, -0.00015572085976600647, -0.00014704465866088867, -0.00013836845755577087, -0.00012969225645065308, -0.00012101605534553528, -0.00011233985424041748, -0.00010366365313529968, -9.498745203018188e-05, -8.631125092506409e-05, -7.763504981994629e-05, -6.895884871482849e-05, -6.028264760971069e-05, -5.1606446504592896e-05, -4.29302453994751e-05, -3.42540442943573e-05, -2.5577843189239502e-05, -1.6901642084121704e-05, -8.225440979003906e-06, 4.507601261138916e-07, 9.12696123123169e-06, 1.7803162336349487e-05, 2.6479363441467285e-05, 3.515556454658508e-05, 4.383176565170288e-05, 5.250796675682068e-05, 6.118416786193848e-05, 6.986036896705627e-05, 7.853657007217407e-05, 8.721277117729187e-05, 9.588897228240967e-05, 0.00010456517338752747, 0.00011324137449264526, 0.00012191757559776306, 0.00013059377670288086, 0.00013926997780799866, 0.00014794617891311646, 0.00015662238001823425, 0.00016529858112335205, 0.00017397478222846985, 0.00018265098333358765, 0.00019132718443870544, 0.00020000338554382324, 0.00020867958664894104, 0.00021735578775405884, 0.00022603198885917664, 0.00023470818996429443, 0.00024338439106941223, 0.00025206059217453003, 0.00026073679327964783, 0.0002694129943847656]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 7.0, 9.0, 6.0, 11.0, 20.0, 27.0, 35.0, 66.0, 95.0, 206.0, 432.0, 1523.0, 9170.0, 981434.0, 50518.0, 3640.0, 805.0, 283.0, 109.0, 59.0, 35.0, 20.0, 9.0, 11.0, 8.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.046875, -1.9879913330078125, -1.929107666015625, -1.8702239990234375, -1.81134033203125, -1.7524566650390625, -1.693572998046875, -1.6346893310546875, -1.5758056640625, -1.5169219970703125, -1.458038330078125, -1.3991546630859375, -1.34027099609375, -1.2813873291015625, -1.222503662109375, -1.1636199951171875, -1.104736328125, -1.0458526611328125, -0.986968994140625, -0.9280853271484375, -0.86920166015625, -0.8103179931640625, -0.751434326171875, -0.6925506591796875, -0.6336669921875, -0.5747833251953125, -0.515899658203125, -0.4570159912109375, -0.39813232421875, -0.3392486572265625, -0.280364990234375, -0.2214813232421875, -0.16259765625, -0.1037139892578125, -0.044830322265625, 0.0140533447265625, 0.07293701171875, 0.1318206787109375, 0.190704345703125, 0.2495880126953125, 0.3084716796875, 0.3673553466796875, 0.426239013671875, 0.4851226806640625, 0.54400634765625, 0.6028900146484375, 0.661773681640625, 0.7206573486328125, 0.779541015625, 0.8384246826171875, 0.897308349609375, 0.9561920166015625, 1.01507568359375, 1.0739593505859375, 1.132843017578125, 1.1917266845703125, 1.2506103515625, 1.3094940185546875, 1.368377685546875, 1.4272613525390625, 1.48614501953125, 1.5450286865234375, 1.603912353515625, 1.6627960205078125, 1.7216796875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 11.0, 3.0, 7.0, 9.0, 13.0, 11.0, 12.0, 17.0, 25.0, 48.0, 134.0, 235.0, 229.0, 82.0, 43.0, 30.0, 24.0, 12.0, 16.0, 15.0, 14.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.25390625, -1.2178497314453125, -1.181793212890625, -1.1457366943359375, -1.10968017578125, -1.0736236572265625, -1.037567138671875, -1.0015106201171875, -0.9654541015625, -0.9293975830078125, -0.893341064453125, -0.8572845458984375, -0.82122802734375, -0.7851715087890625, -0.749114990234375, -0.7130584716796875, -0.677001953125, -0.6409454345703125, -0.604888916015625, -0.5688323974609375, -0.53277587890625, -0.4967193603515625, -0.460662841796875, -0.4246063232421875, -0.3885498046875, -0.3524932861328125, -0.316436767578125, -0.2803802490234375, -0.24432373046875, -0.2082672119140625, -0.172210693359375, -0.1361541748046875, -0.10009765625, -0.0640411376953125, -0.027984619140625, 0.0080718994140625, 0.04412841796875, 0.0801849365234375, 0.116241455078125, 0.1522979736328125, 0.1883544921875, 0.2244110107421875, 0.260467529296875, 0.2965240478515625, 0.33258056640625, 0.3686370849609375, 0.404693603515625, 0.4407501220703125, 0.476806640625, 0.5128631591796875, 0.548919677734375, 0.5849761962890625, 0.62103271484375, 0.6570892333984375, 0.693145751953125, 0.7292022705078125, 0.7652587890625, 0.8013153076171875, 0.837371826171875, 0.8734283447265625, 0.90948486328125, 0.9455413818359375, 0.981597900390625, 1.0176544189453125, 1.0537109375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 20.0, 52.0, 78.0, 580.0, 144.0, 60.0, 33.0, 12.0, 10.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.29560852050781, -34.217350006103516, -33.13909149169922, -32.060829162597656, -30.98257064819336, -29.904312133789062, -28.826051712036133, -27.747791290283203, -26.669532775878906, -25.59127426147461, -24.51301383972168, -23.43475341796875, -22.356494903564453, -21.278236389160156, -20.199975967407227, -19.121715545654297, -18.04345703125, -16.965198516845703, -15.886938095092773, -14.80867862701416, -13.730419158935547, -12.652159690856934, -11.57390022277832, -10.495640754699707, -9.417381286621094, -8.33912181854248, -7.260862350463867, -6.182602882385254, -5.104343414306641, -4.026083946228027, -2.947824478149414, -1.8695650100708008, -0.7913093566894531, 0.28695011138916016, 1.3652095794677734, 2.4434690475463867, 3.521728515625, 4.599987983703613, 5.678247451782227, 6.75650691986084, 7.834766387939453, 8.913025856018066, 9.99128532409668, 11.069544792175293, 12.147804260253906, 13.22606372833252, 14.304323196411133, 15.382582664489746, 16.46084213256836, 17.539100646972656, 18.617361068725586, 19.695621490478516, 20.773880004882812, 21.85213851928711, 22.93039894104004, 24.00865936279297, 25.086917877197266, 26.165176391601562, 27.243436813354492, 28.321697235107422, 29.39995574951172, 30.478214263916016, 31.556474685668945, 32.634735107421875, 33.71299362182617]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 5.0, 13.0, 16.0, 6.0, 19.0, 14.0, 16.0, 31.0, 24.0, 14.0, 30.0, 36.0, 56.0, 325.0, 140.0, 31.0, 28.0, 25.0, 17.0, 20.0, 16.0, 24.0, 21.0, 8.0, 15.0, 12.0, 12.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-19.801328659057617, -19.290637969970703, -18.77994728088379, -18.269256591796875, -17.75856590270996, -17.247875213623047, -16.737184524536133, -16.22649383544922, -15.715802192687988, -15.205111503601074, -14.69442081451416, -14.183730125427246, -13.673038482666016, -13.162347793579102, -12.651657104492188, -12.140966415405273, -11.63027572631836, -11.119585037231445, -10.608894348144531, -10.098203659057617, -9.587512969970703, -9.076822280883789, -8.566130638122559, -8.055439949035645, -7.5447492599487305, -7.034058570861816, -6.523367881774902, -6.01267671585083, -5.501986026763916, -4.991295337677002, -4.48060417175293, -3.9699134826660156, -3.4592208862304688, -2.9485301971435547, -2.4378392696380615, -1.927148461341858, -1.4164576530456543, -0.9057669639587402, -0.39507603645324707, 0.1156148910522461, 0.6263055801391602, 1.1369963884353638, 1.6476871967315674, 2.1583781242370605, 2.6690688133239746, 3.1797595024108887, 3.690450429916382, 4.201141357421875, 4.711832046508789, 5.222522735595703, 5.733213424682617, 6.2439045906066895, 6.7545952796936035, 7.265285968780518, 7.77597713470459, 8.286667823791504, 8.797358512878418, 9.308049201965332, 9.818739891052246, 10.32943058013916, 10.84012222290039, 11.350812911987305, 11.861503601074219, 12.372194290161133, 12.882884979248047]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 4.0, 8.0, 1.0, 5.0, 20.0, 16.0, 31.0, 32.0, 62.0, 60.0, 99.0, 308.0, 117.0, 53.0, 52.0, 31.0, 21.0, 30.0, 17.0, 12.0, 10.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.306640625, -2.2437744140625, -2.180908203125, -2.1180419921875, -2.05517578125, -1.9923095703125, -1.929443359375, -1.8665771484375, -1.8037109375, -1.7408447265625, -1.677978515625, -1.6151123046875, -1.55224609375, -1.4893798828125, -1.426513671875, -1.3636474609375, -1.30078125, -1.2379150390625, -1.175048828125, -1.1121826171875, -1.04931640625, -0.9864501953125, -0.923583984375, -0.8607177734375, -0.7978515625, -0.7349853515625, -0.672119140625, -0.6092529296875, -0.54638671875, -0.4835205078125, -0.420654296875, -0.3577880859375, -0.294921875, -0.2320556640625, -0.169189453125, -0.1063232421875, -0.04345703125, 0.0194091796875, 0.082275390625, 0.1451416015625, 0.2080078125, 0.2708740234375, 0.333740234375, 0.3966064453125, 0.45947265625, 0.5223388671875, 0.585205078125, 0.6480712890625, 0.7109375, 0.7738037109375, 0.836669921875, 0.8995361328125, 0.96240234375, 1.0252685546875, 1.088134765625, 1.1510009765625, 1.2138671875, 1.2767333984375, 1.339599609375, 1.4024658203125, 1.46533203125, 1.5281982421875, 1.591064453125, 1.6539306640625, 1.716796875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 7.0, 5.0, 3.0, 5.0, 6.0, 13.0, 12.0, 11.0, 6.0, 19.0, 44.0, 35.0, 73.0, 113.0, 174.0, 297.0, 633.0, 1487.0, 4767.0, 43857.0, 8320232.0, 11859.0, 2777.0, 981.0, 453.0, 244.0, 128.0, 97.0, 61.0, 33.0, 30.0, 28.0, 16.0, 18.0, 8.0, 8.0, 5.0, 4.0, 5.0, 6.0, 4.0, 7.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0], "bins": [-9.084898948669434, -8.834385871887207, -8.583873748779297, -8.33336067199707, -8.082847595214844, -7.832334518432617, -7.581821918487549, -7.3313093185424805, -7.080796241760254, -6.830283164978027, -6.579770565032959, -6.329257965087891, -6.078744888305664, -5.8282318115234375, -5.577719211578369, -5.327206611633301, -5.076693534851074, -4.826180458068848, -4.575667858123779, -4.325155258178711, -4.074642181396484, -3.824129343032837, -3.5736165046691895, -3.323103666305542, -3.0725908279418945, -2.822077989578247, -2.5715651512145996, -2.321052312850952, -2.0705394744873047, -1.8200266361236572, -1.5695137977600098, -1.3190009593963623, -1.0684871673583984, -0.817974328994751, -0.5674614906311035, -0.31694865226745605, -0.0664358139038086, 0.18407702445983887, 0.43458986282348633, 0.6851027011871338, 0.9356155395507812, 1.1861283779144287, 1.4366412162780762, 1.6871540546417236, 1.937666893005371, 2.1881797313690186, 2.438692569732666, 2.6892054080963135, 2.939718246459961, 3.1902310848236084, 3.440743923187256, 3.6912567615509033, 3.941769599914551, 4.192282676696777, 4.442795276641846, 4.693307876586914, 4.943820953369141, 5.194334030151367, 5.4448466300964355, 5.695359230041504, 5.9458723068237305, 6.196385383605957, 6.446897983551025, 6.697410583496094, 6.94792366027832]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 6.0, 2.0, 2.0, 8.0, 8.0, 2.0, 3.0, 7.0, 7.0, 5.0, 8.0, 5.0, 3.0, 6.0, 5.0, 1.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.012498378753662, -5.805891036987305, -5.5992841720581055, -5.392677307128906, -5.186069965362549, -4.979462623596191, -4.772855758666992, -4.566248893737793, -4.3596415519714355, -4.153034210205078, -3.946427345275879, -3.7398202419281006, -3.5332131385803223, -3.326606035232544, -3.1199989318847656, -2.9133918285369873, -2.706784725189209, -2.5001776218414307, -2.2935705184936523, -2.086963415145874, -1.8803563117980957, -1.6737492084503174, -1.467142105102539, -1.2605350017547607, -1.0539278984069824, -0.8473207950592041, -0.6407136917114258, -0.43410658836364746, -0.22749948501586914, -0.02089238166809082, 0.1857147216796875, 0.3923218250274658, 0.5989289283752441, 0.8055360317230225, 1.0121431350708008, 1.218750238418579, 1.4253573417663574, 1.6319644451141357, 1.838571548461914, 2.0451786518096924, 2.2517857551574707, 2.458392858505249, 2.6649999618530273, 2.8716070652008057, 3.078214168548584, 3.2848212718963623, 3.4914283752441406, 3.698035478591919, 3.9046425819396973, 4.111249923706055, 4.317856788635254, 4.524463653564453, 4.7310709953308105, 4.937678337097168, 5.144285202026367, 5.350892066955566, 5.557499408721924, 5.764106750488281, 5.9707136154174805, 6.17732048034668, 6.383927822113037, 6.5905351638793945, 6.797142028808594, 7.003748893737793, 7.21035623550415]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 5.0, 19.0, 13.0, 28.0, 37.0, 52.0, 98.0, 129.0, 226.0, 395.0, 854.0, 1695.0, 4110.0, 11199.0, 39395.0, 167426.0, 218376.0, 55521.0, 15112.0, 5125.0, 2183.0, 1002.0, 485.0, 291.0, 167.0, 108.0, 76.0, 41.0, 24.0, 22.0, 9.0, 10.0, 5.0, 7.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3671875, -8.106689453125, -7.84619140625, -7.585693359375, -7.3251953125, -7.064697265625, -6.80419921875, -6.543701171875, -6.283203125, -6.022705078125, -5.76220703125, -5.501708984375, -5.2412109375, -4.980712890625, -4.72021484375, -4.459716796875, -4.19921875, -3.938720703125, -3.67822265625, -3.417724609375, -3.1572265625, -2.896728515625, -2.63623046875, -2.375732421875, -2.115234375, -1.854736328125, -1.59423828125, -1.333740234375, -1.0732421875, -0.812744140625, -0.55224609375, -0.291748046875, -0.03125, 0.229248046875, 0.48974609375, 0.750244140625, 1.0107421875, 1.271240234375, 1.53173828125, 1.792236328125, 2.052734375, 2.313232421875, 2.57373046875, 2.834228515625, 3.0947265625, 3.355224609375, 3.61572265625, 3.876220703125, 4.13671875, 4.397216796875, 4.65771484375, 4.918212890625, 5.1787109375, 5.439208984375, 5.69970703125, 5.960205078125, 6.220703125, 6.481201171875, 6.74169921875, 7.002197265625, 7.2626953125, 7.523193359375, 7.78369140625, 8.044189453125, 8.3046875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 7.0, 9.0, 9.0, 11.0, 13.0, 18.0, 26.0, 59.0, 50.0, 59.0, 67.0, 75.0, 90.0, 96.0, 98.0, 58.0, 62.0, 45.0, 46.0, 23.0, 14.0, 19.0, 9.0, 13.0, 5.0, 9.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.68359375, -1.6350860595703125, -1.586578369140625, -1.5380706787109375, -1.48956298828125, -1.4410552978515625, -1.392547607421875, -1.3440399169921875, -1.2955322265625, -1.2470245361328125, -1.198516845703125, -1.1500091552734375, -1.10150146484375, -1.0529937744140625, -1.004486083984375, -0.9559783935546875, -0.907470703125, -0.8589630126953125, -0.810455322265625, -0.7619476318359375, -0.71343994140625, -0.6649322509765625, -0.616424560546875, -0.5679168701171875, -0.5194091796875, -0.4709014892578125, -0.422393798828125, -0.3738861083984375, -0.32537841796875, -0.2768707275390625, -0.228363037109375, -0.1798553466796875, -0.13134765625, -0.0828399658203125, -0.034332275390625, 0.0141754150390625, 0.06268310546875, 0.1111907958984375, 0.159698486328125, 0.2082061767578125, 0.2567138671875, 0.3052215576171875, 0.353729248046875, 0.4022369384765625, 0.45074462890625, 0.4992523193359375, 0.547760009765625, 0.5962677001953125, 0.644775390625, 0.6932830810546875, 0.741790771484375, 0.7902984619140625, 0.83880615234375, 0.8873138427734375, 0.935821533203125, 0.9843292236328125, 1.0328369140625, 1.0813446044921875, 1.129852294921875, 1.1783599853515625, 1.22686767578125, 1.2753753662109375, 1.323883056640625, 1.3723907470703125, 1.4208984375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 6.0, 6.0, 14.0, 56.0, 96.0, 167.0, 67.0, 26.0, 17.0, 8.0, 10.0, 4.0, 5.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.818387985229492, -8.407612800598145, -7.9968366622924805, -7.586061477661133, -7.175285339355469, -6.764510154724121, -6.353734493255615, -5.942958831787109, -5.5321831703186035, -5.121407508850098, -4.710631847381592, -4.299856185913086, -3.889080762863159, -3.4783051013946533, -3.0675296783447266, -2.6567540168762207, -2.245978355407715, -1.835202693939209, -1.4244271516799927, -1.0136516094207764, -0.6028759479522705, -0.19210028648376465, 0.2186751365661621, 0.629450798034668, 1.0402264595031738, 1.4510021209716797, 1.861777663230896, 2.2725532054901123, 2.683328866958618, 3.094104528427124, 3.504879951477051, 3.9156556129455566, 4.3264312744140625, 4.737206935882568, 5.147982597351074, 5.558757781982422, 5.969533920288086, 6.380309104919434, 6.7910847663879395, 7.201860427856445, 7.612636089324951, 8.023411750793457, 8.434186935424805, 8.844963073730469, 9.255738258361816, 9.66651439666748, 10.077289581298828, 10.488065719604492, 10.89884090423584, 11.309616088867188, 11.720392227172852, 12.1311674118042, 12.541943550109863, 12.952718734741211, 13.363494873046875, 13.774270057678223, 14.18504524230957, 14.595820426940918, 15.006596565246582, 15.41737174987793, 15.828147888183594, 16.238924026489258, 16.64969825744629, 17.060474395751953, 17.471250534057617]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 1.0, 5.0, 6.0, 5.0, 5.0, 5.0, 9.0, 14.0, 20.0, 34.0, 89.0, 104.0, 78.0, 43.0, 18.0, 14.0, 3.0, 3.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.792799472808838, -7.552576065063477, -7.312352657318115, -7.072129249572754, -6.831905841827393, -6.591682434082031, -6.351458549499512, -6.111235618591309, -5.871011734008789, -5.630788326263428, -5.390564918518066, -5.150341510772705, -4.910118103027344, -4.669894695281982, -4.429671287536621, -4.189447402954102, -3.9492244720458984, -3.709001064300537, -3.468777656555176, -3.2285542488098145, -2.988330841064453, -2.748107433319092, -2.5078837871551514, -2.26766037940979, -2.0274369716644287, -1.7872135639190674, -1.546990156173706, -1.3067666292190552, -1.0665432214736938, -0.8263198137283325, -0.5860962867736816, -0.3458728790283203, -0.10564947128295898, 0.13457396626472473, 0.37479740381240845, 0.6150208711624146, 0.8552442789077759, 1.0954676866531372, 1.335691213607788, 1.5759146213531494, 1.8161380290985107, 2.056361436843872, 2.2965848445892334, 2.536808490753174, 2.777031898498535, 3.0172553062438965, 3.257478713989258, 3.497702121734619, 3.7379255294799805, 3.978148937225342, 4.218372344970703, 4.4585957527160645, 4.698819160461426, 4.939042568206787, 5.179265975952148, 5.419489860534668, 5.659712791442871, 5.899936199188232, 6.140159606933594, 6.380383014678955, 6.620606422424316, 6.860829830169678, 7.101053237915039, 7.341277122497559, 7.58150053024292]}, "eval/loss": 4.228886127471924, "eval/wer": 1.9632883776279255, "eval/runtime": 974.9232, "eval/samples_per_second": 2.71, "eval/steps_per_second": 0.34} \ No newline at end of file +{"train/loss": 4.0199, "train/learning_rate": 7.653061224489796e-08, "train/epoch": 1.0, "train/global_step": 892, "_runtime": 6364, "_timestamp": 1646057670, "_step": 893, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [2.0, 101.0, 880.0, 34.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.887240409851074, -9.418985366821289, -2.9507312774658203, 3.517523765563965, 9.985777854919434, 16.45403289794922, 22.922286987304688, 29.390541076660156, 35.858795166015625, 42.327049255371094, 48.79530334472656, 55.26355743408203, 61.7318115234375, 68.2000732421875, 74.66831970214844, 81.13658142089844, 87.6048355102539, 94.07308959960938, 100.54134368896484, 107.00959777832031, 113.47785186767578, 119.94610595703125, 126.41436767578125, 132.8826141357422, 139.3508758544922, 145.8191375732422, 152.28738403320312, 158.75564575195312, 165.22389221191406, 171.69215393066406, 178.160400390625, 184.628662109375, 191.09690856933594, 197.56517028808594, 204.03341674804688, 210.50167846679688, 216.9699249267578, 223.4381866455078, 229.90643310546875, 236.37469482421875, 242.8429412841797, 249.3112030029297, 255.77944946289062, 262.2477111816406, 268.7159729003906, 275.1842041015625, 281.6524658203125, 288.1207275390625, 294.5889892578125, 301.0572509765625, 307.5255126953125, 313.9937438964844, 320.4620056152344, 326.9302673339844, 333.3985290527344, 339.86676025390625, 346.33502197265625, 352.80328369140625, 359.27154541015625, 365.7397766113281, 372.2080383300781, 378.6763000488281, 385.1445617675781, 391.61279296875, 398.0810546875]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 6.0, 11.0, 5.0, 13.0, 5.0, 16.0, 23.0, 19.0, 22.0, 31.0, 42.0, 36.0, 35.0, 42.0, 39.0, 52.0, 63.0, 66.0, 56.0, 65.0, 65.0, 46.0, 40.0, 50.0, 26.0, 31.0, 19.0, 19.0, 17.0, 7.0, 11.0, 11.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.502586364746094, -29.423606872558594, -28.344627380371094, -27.265649795532227, -26.186670303344727, -25.107690811157227, -24.02871322631836, -22.94973373413086, -21.87075424194336, -20.79177474975586, -19.71279525756836, -18.633817672729492, -17.554838180541992, -16.475858688354492, -15.396880149841309, -14.317901611328125, -13.238922119140625, -12.159942626953125, -11.080964088439941, -10.001985549926758, -8.923006057739258, -7.844027042388916, -6.765048027038574, -5.686069011688232, -4.607089996337891, -3.528110980987549, -2.449131965637207, -1.3701529502868652, -0.29117393493652344, 0.7878050804138184, 1.8667840957641602, 2.945763111114502, 4.024742126464844, 5.1037211418151855, 6.182700157165527, 7.261679172515869, 8.340658187866211, 9.419637680053711, 10.498616218566895, 11.577594757080078, 12.656574249267578, 13.735553741455078, 14.814532279968262, 15.893510818481445, 16.972490310668945, 18.051469802856445, 19.130447387695312, 20.209426879882812, 21.288406372070312, 22.367385864257812, 23.446365356445312, 24.52534294128418, 25.60432243347168, 26.68330192565918, 27.762279510498047, 28.841259002685547, 29.920238494873047, 30.999217987060547, 32.07819747924805, 33.15717697143555, 34.23615264892578, 35.31513214111328, 36.39411163330078, 37.47309112548828, 38.55207061767578]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 9.0, 9.0, 10.0, 6.0, 13.0, 9.0, 17.0, 21.0, 26.0, 21.0, 20.0, 26.0, 45.0, 50.0, 43.0, 57.0, 31.0, 41.0, 60.0, 58.0, 55.0, 58.0, 46.0, 44.0, 38.0, 31.0, 27.0, 20.0, 15.0, 15.0, 20.0, 16.0, 11.0, 12.0, 7.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.990234375, -1.9337921142578125, -1.877349853515625, -1.8209075927734375, -1.76446533203125, -1.7080230712890625, -1.651580810546875, -1.5951385498046875, -1.5386962890625, -1.4822540283203125, -1.425811767578125, -1.3693695068359375, -1.31292724609375, -1.2564849853515625, -1.200042724609375, -1.1436004638671875, -1.087158203125, -1.0307159423828125, -0.974273681640625, -0.9178314208984375, -0.86138916015625, -0.8049468994140625, -0.748504638671875, -0.6920623779296875, -0.6356201171875, -0.5791778564453125, -0.522735595703125, -0.4662933349609375, -0.40985107421875, -0.3534088134765625, -0.296966552734375, -0.2405242919921875, -0.18408203125, -0.1276397705078125, -0.071197509765625, -0.0147552490234375, 0.04168701171875, 0.0981292724609375, 0.154571533203125, 0.2110137939453125, 0.2674560546875, 0.3238983154296875, 0.380340576171875, 0.4367828369140625, 0.49322509765625, 0.5496673583984375, 0.606109619140625, 0.6625518798828125, 0.718994140625, 0.7754364013671875, 0.831878662109375, 0.8883209228515625, 0.94476318359375, 1.0012054443359375, 1.057647705078125, 1.1140899658203125, 1.1705322265625, 1.2269744873046875, 1.283416748046875, 1.3398590087890625, 1.39630126953125, 1.4527435302734375, 1.509185791015625, 1.5656280517578125, 1.6220703125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 8.0, 8.0, 7.0, 17.0, 19.0, 31.0, 43.0, 46.0, 63.0, 102.0, 147.0, 232.0, 318.0, 463.0, 754.0, 1153.0, 2061.0, 3794.0, 8242.0, 23126.0, 90145.0, 629874.0, 2531855.0, 752435.0, 105746.0, 25547.0, 8820.0, 3836.0, 2137.0, 1182.0, 658.0, 450.0, 303.0, 210.0, 143.0, 120.0, 60.0, 32.0, 27.0, 32.0, 14.0, 9.0, 9.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.125, -3.98046875, -3.8359375, -3.69140625, -3.546875, -3.40234375, -3.2578125, -3.11328125, -2.96875, -2.82421875, -2.6796875, -2.53515625, -2.390625, -2.24609375, -2.1015625, -1.95703125, -1.8125, -1.66796875, -1.5234375, -1.37890625, -1.234375, -1.08984375, -0.9453125, -0.80078125, -0.65625, -0.51171875, -0.3671875, -0.22265625, -0.078125, 0.06640625, 0.2109375, 0.35546875, 0.5, 0.64453125, 0.7890625, 0.93359375, 1.078125, 1.22265625, 1.3671875, 1.51171875, 1.65625, 1.80078125, 1.9453125, 2.08984375, 2.234375, 2.37890625, 2.5234375, 2.66796875, 2.8125, 2.95703125, 3.1015625, 3.24609375, 3.390625, 3.53515625, 3.6796875, 3.82421875, 3.96875, 4.11328125, 4.2578125, 4.40234375, 4.546875, 4.69140625, 4.8359375, 4.98046875, 5.125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 5.0, 5.0, 19.0, 22.0, 41.0, 79.0, 139.0, 250.0, 500.0, 880.0, 859.0, 529.0, 309.0, 172.0, 104.0, 67.0, 34.0, 24.0, 10.0, 6.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.453125, -9.1148681640625, -8.776611328125, -8.4383544921875, -8.10009765625, -7.7618408203125, -7.423583984375, -7.0853271484375, -6.7470703125, -6.4088134765625, -6.070556640625, -5.7322998046875, -5.39404296875, -5.0557861328125, -4.717529296875, -4.3792724609375, -4.041015625, -3.7027587890625, -3.364501953125, -3.0262451171875, -2.68798828125, -2.3497314453125, -2.011474609375, -1.6732177734375, -1.3349609375, -0.9967041015625, -0.658447265625, -0.3201904296875, 0.01806640625, 0.3563232421875, 0.694580078125, 1.0328369140625, 1.37109375, 1.7093505859375, 2.047607421875, 2.3858642578125, 2.72412109375, 3.0623779296875, 3.400634765625, 3.7388916015625, 4.0771484375, 4.4154052734375, 4.753662109375, 5.0919189453125, 5.43017578125, 5.7684326171875, 6.106689453125, 6.4449462890625, 6.783203125, 7.1214599609375, 7.459716796875, 7.7979736328125, 8.13623046875, 8.4744873046875, 8.812744140625, 9.1510009765625, 9.4892578125, 9.8275146484375, 10.165771484375, 10.5040283203125, 10.84228515625, 11.1805419921875, 11.518798828125, 11.8570556640625, 12.1953125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 7.0, 16.0, 16.0, 20.0, 50.0, 76.0, 159.0, 269.0, 602.0, 1602.0, 8923.0, 3179612.0, 993909.0, 6244.0, 1496.0, 606.0, 279.0, 160.0, 84.0, 52.0, 28.0, 20.0, 14.0, 9.0, 6.0, 5.0, 3.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.96875, -27.93115234375, -26.8935546875, -25.85595703125, -24.818359375, -23.78076171875, -22.7431640625, -21.70556640625, -20.66796875, -19.63037109375, -18.5927734375, -17.55517578125, -16.517578125, -15.47998046875, -14.4423828125, -13.40478515625, -12.3671875, -11.32958984375, -10.2919921875, -9.25439453125, -8.216796875, -7.17919921875, -6.1416015625, -5.10400390625, -4.06640625, -3.02880859375, -1.9912109375, -0.95361328125, 0.083984375, 1.12158203125, 2.1591796875, 3.19677734375, 4.234375, 5.27197265625, 6.3095703125, 7.34716796875, 8.384765625, 9.42236328125, 10.4599609375, 11.49755859375, 12.53515625, 13.57275390625, 14.6103515625, 15.64794921875, 16.685546875, 17.72314453125, 18.7607421875, 19.79833984375, 20.8359375, 21.87353515625, 22.9111328125, 23.94873046875, 24.986328125, 26.02392578125, 27.0615234375, 28.09912109375, 29.13671875, 30.17431640625, 31.2119140625, 32.24951171875, 33.287109375, 34.32470703125, 35.3623046875, 36.39990234375, 37.4375]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 10.0, 599.0, 389.0, 14.0, 1.0, 1.0, 0.0, 1.0], "bins": [-297.2367858886719, -292.0941467285156, -286.9515075683594, -281.8088684082031, -276.6662292480469, -271.5235900878906, -266.3809509277344, -261.2383117675781, -256.0956726074219, -250.95303344726562, -245.81039428710938, -240.66775512695312, -235.52511596679688, -230.38247680664062, -225.23983764648438, -220.09718322753906, -214.95452880859375, -209.8118896484375, -204.66925048828125, -199.526611328125, -194.38397216796875, -189.2413330078125, -184.09869384765625, -178.95603942871094, -173.81341552734375, -168.6707763671875, -163.52813720703125, -158.385498046875, -153.24285888671875, -148.1002197265625, -142.95758056640625, -137.81492614746094, -132.67227172851562, -127.52963256835938, -122.38699340820312, -117.24435424804688, -112.1017074584961, -106.95906829833984, -101.8164291381836, -96.67378234863281, -91.5311508178711, -86.38851165771484, -81.2458724975586, -76.10322570800781, -70.96058654785156, -65.81794738769531, -60.67530822753906, -55.53266525268555, -50.39002227783203, -45.24738311767578, -40.104740142822266, -34.962100982666016, -29.819459915161133, -24.67681884765625, -19.5341796875, -14.391536712646484, -9.248899459838867, -4.106258869171143, 1.036381721496582, 6.179021835327148, 11.321662902832031, 16.464303970336914, 21.606943130493164, 26.74958610534668, 31.89222526550293]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 9.0, 9.0, 5.0, 3.0, 6.0, 13.0, 10.0, 13.0, 13.0, 22.0, 18.0, 24.0, 26.0, 26.0, 35.0, 33.0, 24.0, 38.0, 37.0, 43.0, 42.0, 56.0, 36.0, 44.0, 43.0, 49.0, 34.0, 33.0, 37.0, 33.0, 38.0, 26.0, 24.0, 22.0, 16.0, 10.0, 13.0, 9.0, 13.0, 6.0, 5.0, 3.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-30.77267074584961, -29.925748825073242, -29.078826904296875, -28.23190689086914, -27.384984970092773, -26.538063049316406, -25.691143035888672, -24.844221115112305, -23.997299194335938, -23.15037727355957, -22.303455352783203, -21.45653533935547, -20.6096134185791, -19.762691497802734, -18.915771484375, -18.068849563598633, -17.221927642822266, -16.3750057220459, -15.528084754943848, -14.681163787841797, -13.83424186706543, -12.987319946289062, -12.140398979187012, -11.293478012084961, -10.446556091308594, -9.599634170532227, -8.752713203430176, -7.905791759490967, -7.058870315551758, -6.211948871612549, -5.36502742767334, -4.518105983734131, -3.671182632446289, -2.82426118850708, -1.977339744567871, -1.130418300628662, -0.2834968566894531, 0.5634245872497559, 1.4103460311889648, 2.257267475128174, 3.104188919067383, 3.951110363006592, 4.798031806945801, 5.64495325088501, 6.491874694824219, 7.338796138763428, 8.185717582702637, 9.032638549804688, 9.879560470581055, 10.726482391357422, 11.573403358459473, 12.420324325561523, 13.26724624633789, 14.114168167114258, 14.961089134216309, 15.80801010131836, 16.654932022094727, 17.501853942871094, 18.348773956298828, 19.195695877075195, 20.042617797851562, 20.88953971862793, 21.736461639404297, 22.58338165283203, 23.4303035736084]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 5.0, 1.0, 5.0, 6.0, 10.0, 12.0, 11.0, 15.0, 21.0, 19.0, 23.0, 24.0, 20.0, 34.0, 44.0, 35.0, 41.0, 42.0, 37.0, 47.0, 54.0, 51.0, 45.0, 46.0, 49.0, 37.0, 43.0, 34.0, 22.0, 31.0, 25.0, 18.0, 29.0, 10.0, 11.0, 8.0, 13.0, 3.0, 5.0, 1.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5546875, -1.499847412109375, -1.44500732421875, -1.390167236328125, -1.3353271484375, -1.280487060546875, -1.22564697265625, -1.170806884765625, -1.115966796875, -1.061126708984375, -1.00628662109375, -0.951446533203125, -0.8966064453125, -0.841766357421875, -0.78692626953125, -0.732086181640625, -0.67724609375, -0.622406005859375, -0.56756591796875, -0.512725830078125, -0.4578857421875, -0.403045654296875, -0.34820556640625, -0.293365478515625, -0.238525390625, -0.183685302734375, -0.12884521484375, -0.074005126953125, -0.0191650390625, 0.035675048828125, 0.09051513671875, 0.145355224609375, 0.2001953125, 0.255035400390625, 0.30987548828125, 0.364715576171875, 0.4195556640625, 0.474395751953125, 0.52923583984375, 0.584075927734375, 0.638916015625, 0.693756103515625, 0.74859619140625, 0.803436279296875, 0.8582763671875, 0.913116455078125, 0.96795654296875, 1.022796630859375, 1.07763671875, 1.132476806640625, 1.18731689453125, 1.242156982421875, 1.2969970703125, 1.351837158203125, 1.40667724609375, 1.461517333984375, 1.516357421875, 1.571197509765625, 1.62603759765625, 1.680877685546875, 1.7357177734375, 1.790557861328125, 1.84539794921875, 1.900238037109375, 1.955078125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 14.0, 15.0, 17.0, 22.0, 40.0, 54.0, 88.0, 110.0, 148.0, 280.0, 350.0, 479.0, 804.0, 1204.0, 1724.0, 2618.0, 4032.0, 5900.0, 9354.0, 14738.0, 23585.0, 39743.0, 70557.0, 137214.0, 308373.0, 198468.0, 94899.0, 51644.0, 30078.0, 18486.0, 11625.0, 7476.0, 4740.0, 3281.0, 2010.0, 1463.0, 950.0, 596.0, 452.0, 325.0, 193.0, 119.0, 112.0, 67.0, 42.0, 30.0, 14.0, 8.0, 5.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.29345703125, -0.284210205078125, -0.27496337890625, -0.265716552734375, -0.2564697265625, -0.247222900390625, -0.23797607421875, -0.228729248046875, -0.219482421875, -0.210235595703125, -0.20098876953125, -0.191741943359375, -0.1824951171875, -0.173248291015625, -0.16400146484375, -0.154754638671875, -0.1455078125, -0.136260986328125, -0.12701416015625, -0.117767333984375, -0.1085205078125, -0.099273681640625, -0.09002685546875, -0.080780029296875, -0.071533203125, -0.062286376953125, -0.05303955078125, -0.043792724609375, -0.0345458984375, -0.025299072265625, -0.01605224609375, -0.006805419921875, 0.00244140625, 0.011688232421875, 0.02093505859375, 0.030181884765625, 0.0394287109375, 0.048675537109375, 0.05792236328125, 0.067169189453125, 0.076416015625, 0.085662841796875, 0.09490966796875, 0.104156494140625, 0.1134033203125, 0.122650146484375, 0.13189697265625, 0.141143798828125, 0.150390625, 0.159637451171875, 0.16888427734375, 0.178131103515625, 0.1873779296875, 0.196624755859375, 0.20587158203125, 0.215118408203125, 0.224365234375, 0.233612060546875, 0.24285888671875, 0.252105712890625, 0.2613525390625, 0.270599365234375, 0.27984619140625, 0.289093017578125, 0.29833984375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 2.0, 3.0, 8.0, 4.0, 14.0, 12.0, 11.0, 21.0, 13.0, 12.0, 25.0, 24.0, 33.0, 31.0, 23.0, 32.0, 45.0, 43.0, 40.0, 40.0, 44.0, 1081.0, 27.0, 39.0, 37.0, 32.0, 34.0, 36.0, 26.0, 27.0, 24.0, 25.0, 22.0, 32.0, 20.0, 20.0, 15.0, 15.0, 3.0, 7.0, 6.0, 7.0, 0.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0634765625, -1.03118896484375, -0.9989013671875, -0.96661376953125, -0.934326171875, -0.90203857421875, -0.8697509765625, -0.83746337890625, -0.80517578125, -0.77288818359375, -0.7406005859375, -0.70831298828125, -0.676025390625, -0.64373779296875, -0.6114501953125, -0.57916259765625, -0.546875, -0.51458740234375, -0.4822998046875, -0.45001220703125, -0.417724609375, -0.38543701171875, -0.3531494140625, -0.32086181640625, -0.28857421875, -0.25628662109375, -0.2239990234375, -0.19171142578125, -0.159423828125, -0.12713623046875, -0.0948486328125, -0.06256103515625, -0.0302734375, 0.00201416015625, 0.0343017578125, 0.06658935546875, 0.098876953125, 0.13116455078125, 0.1634521484375, 0.19573974609375, 0.22802734375, 0.26031494140625, 0.2926025390625, 0.32489013671875, 0.357177734375, 0.38946533203125, 0.4217529296875, 0.45404052734375, 0.486328125, 0.51861572265625, 0.5509033203125, 0.58319091796875, 0.615478515625, 0.64776611328125, 0.6800537109375, 0.71234130859375, 0.74462890625, 0.77691650390625, 0.8092041015625, 0.84149169921875, 0.873779296875, 0.90606689453125, 0.9383544921875, 0.97064208984375, 1.0029296875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 3.0, 9.0, 16.0, 14.0, 23.0, 41.0, 55.0, 63.0, 108.0, 153.0, 223.0, 340.0, 488.0, 654.0, 957.0, 1436.0, 1972.0, 2964.0, 4471.0, 6159.0, 8963.0, 12893.0, 18837.0, 27545.0, 41787.0, 66383.0, 116669.0, 1289573.0, 209407.0, 103500.0, 60285.0, 38497.0, 25841.0, 17584.0, 11864.0, 8388.0, 5704.0, 3864.0, 2744.0, 1912.0, 1381.0, 964.0, 705.0, 447.0, 370.0, 242.0, 189.0, 142.0, 94.0, 77.0, 43.0, 34.0, 29.0, 10.0, 10.0, 8.0, 5.0, 4.0, 0.0, 1.0], "bins": [-0.2288818359375, -0.22170639038085938, -0.21453094482421875, -0.20735549926757812, -0.2001800537109375, -0.19300460815429688, -0.18582916259765625, -0.17865371704101562, -0.171478271484375, -0.16430282592773438, -0.15712738037109375, -0.14995193481445312, -0.1427764892578125, -0.13560104370117188, -0.12842559814453125, -0.12125015258789062, -0.11407470703125, -0.10689926147460938, -0.09972381591796875, -0.09254837036132812, -0.0853729248046875, -0.07819747924804688, -0.07102203369140625, -0.06384658813476562, -0.056671142578125, -0.049495697021484375, -0.04232025146484375, -0.035144805908203125, -0.0279693603515625, -0.020793914794921875, -0.01361846923828125, -0.006443023681640625, 0.000732421875, 0.007907867431640625, 0.01508331298828125, 0.022258758544921875, 0.0294342041015625, 0.036609649658203125, 0.04378509521484375, 0.050960540771484375, 0.058135986328125, 0.06531143188476562, 0.07248687744140625, 0.07966232299804688, 0.0868377685546875, 0.09401321411132812, 0.10118865966796875, 0.10836410522460938, 0.11553955078125, 0.12271499633789062, 0.12989044189453125, 0.13706588745117188, 0.1442413330078125, 0.15141677856445312, 0.15859222412109375, 0.16576766967773438, 0.172943115234375, 0.18011856079101562, 0.18729400634765625, 0.19446945190429688, 0.2016448974609375, 0.20882034301757812, 0.21599578857421875, 0.22317123413085938, 0.2303466796875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 8.0, 4.0, 9.0, 9.0, 12.0, 14.0, 14.0, 12.0, 20.0, 26.0, 32.0, 39.0, 48.0, 50.0, 55.0, 53.0, 68.0, 71.0, 65.0, 54.0, 48.0, 52.0, 29.0, 41.0, 27.0, 33.0, 26.0, 10.0, 12.0, 10.0, 10.0, 3.0, 8.0, 9.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.937980651855469e-05, -6.724148988723755e-05, -6.510317325592041e-05, -6.296485662460327e-05, -6.082653999328613e-05, -5.8688223361968994e-05, -5.6549906730651855e-05, -5.441159009933472e-05, -5.227327346801758e-05, -5.013495683670044e-05, -4.79966402053833e-05, -4.585832357406616e-05, -4.3720006942749023e-05, -4.1581690311431885e-05, -3.9443373680114746e-05, -3.730505704879761e-05, -3.516674041748047e-05, -3.302842378616333e-05, -3.089010715484619e-05, -2.8751790523529053e-05, -2.6613473892211914e-05, -2.4475157260894775e-05, -2.2336840629577637e-05, -2.0198523998260498e-05, -1.806020736694336e-05, -1.592189073562622e-05, -1.3783574104309082e-05, -1.1645257472991943e-05, -9.506940841674805e-06, -7.368624210357666e-06, -5.230307579040527e-06, -3.0919909477233887e-06, -9.5367431640625e-07, 1.1846423149108887e-06, 3.3229589462280273e-06, 5.461275577545166e-06, 7.599592208862305e-06, 9.737908840179443e-06, 1.1876225471496582e-05, 1.401454210281372e-05, 1.615285873413086e-05, 1.8291175365447998e-05, 2.0429491996765137e-05, 2.2567808628082275e-05, 2.4706125259399414e-05, 2.6844441890716553e-05, 2.898275852203369e-05, 3.112107515335083e-05, 3.325939178466797e-05, 3.539770841598511e-05, 3.7536025047302246e-05, 3.9674341678619385e-05, 4.1812658309936523e-05, 4.395097494125366e-05, 4.60892915725708e-05, 4.822760820388794e-05, 5.036592483520508e-05, 5.250424146652222e-05, 5.4642558097839355e-05, 5.6780874729156494e-05, 5.891919136047363e-05, 6.105750799179077e-05, 6.319582462310791e-05, 6.533414125442505e-05, 6.747245788574219e-05]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 1.0, 7.0, 5.0, 11.0, 23.0, 16.0, 21.0, 22.0, 46.0, 32.0, 40.0, 47.0, 59.0, 98.0, 128.0, 149.0, 241.0, 317.0, 469.0, 865.0, 13397.0, 1028482.0, 1825.0, 682.0, 413.0, 285.0, 170.0, 147.0, 146.0, 88.0, 73.0, 44.0, 35.0, 24.0, 23.0, 21.0, 35.0, 9.0, 11.0, 10.0, 5.0, 6.0, 10.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0010995864868164062, -0.001063317060470581, -0.0010270476341247559, -0.0009907782077789307, -0.0009545087814331055, -0.0009182393550872803, -0.0008819699287414551, -0.0008457005023956299, -0.0008094310760498047, -0.0007731616497039795, -0.0007368922233581543, -0.0007006227970123291, -0.0006643533706665039, -0.0006280839443206787, -0.0005918145179748535, -0.0005555450916290283, -0.0005192756652832031, -0.00048300623893737793, -0.00044673681259155273, -0.00041046738624572754, -0.00037419795989990234, -0.00033792853355407715, -0.00030165910720825195, -0.00026538968086242676, -0.00022912025451660156, -0.00019285082817077637, -0.00015658140182495117, -0.00012031197547912598, -8.404254913330078e-05, -4.7773122787475586e-05, -1.150369644165039e-05, 2.4765729904174805e-05, 6.103515625e-05, 9.73045825958252e-05, 0.0001335740089416504, 0.00016984343528747559, 0.00020611286163330078, 0.00024238228797912598, 0.00027865171432495117, 0.00031492114067077637, 0.00035119056701660156, 0.00038745999336242676, 0.00042372941970825195, 0.00045999884605407715, 0.0004962682723999023, 0.0005325376987457275, 0.0005688071250915527, 0.0006050765514373779, 0.0006413459777832031, 0.0006776154041290283, 0.0007138848304748535, 0.0007501542568206787, 0.0007864236831665039, 0.0008226931095123291, 0.0008589625358581543, 0.0008952319622039795, 0.0009315013885498047, 0.0009677708148956299, 0.001004040241241455, 0.0010403096675872803, 0.0010765790939331055, 0.0011128485202789307, 0.0011491179466247559, 0.001185387372970581, 0.0012216567993164062]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 35.0, 888.0, 93.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001707318442640826, -0.00016243892605416477, -0.00015414600784424692, -0.00014585308963432908, -0.000137560156872496, -0.00012926723866257817, -0.00012097432045266032, -0.00011268140224274248, -0.00010438847675686702, -9.609555854694918e-05, -8.780263306107372e-05, -7.950971485115588e-05, -7.121679664123803e-05, -6.292387115536258e-05, -5.463095294544473e-05, -4.633803109754808e-05, -3.804510924965143e-05, -2.975218740175478e-05, -2.1459267372847535e-05, -1.3166347343940288e-05, -4.873425496043637e-06, 3.419496351853013e-06, 1.1712414561770856e-05, 2.0005336409667507e-05, 2.8298258257564157e-05, 3.659118010546081e-05, 4.488410195335746e-05, 5.31770201632753e-05, 6.146993837319314e-05, 6.97628638590686e-05, 7.805578206898645e-05, 8.63487075548619e-05, 9.464164031669497e-05, 0.00010293455852661282, 0.00011122748401248828, 0.00011952040222240612, 0.00012781332770828158, 0.00013610624591819942, 0.00014439916412811726, 0.0001526920823380351, 0.00016098501509986818, 0.00016927793330978602, 0.00017757085151970387, 0.00018586378428153694, 0.00019415670249145478, 0.00020244962070137262, 0.00021074253891129047, 0.0002190354571212083, 0.00022732837533112615, 0.000235621293541044, 0.00024391421175096184, 0.0002522071299608797, 0.00026050006272271276, 0.00026879296638071537, 0.00027708589914254844, 0.0002853788319043815, 0.00029367173556238413, 0.0003019646683242172, 0.0003102575719822198, 0.0003185505047440529, 0.0003268434084020555, 0.0003351363411638886, 0.00034342927392572165, 0.00035172217758372426, 0.00036001511034555733]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 7.0, 4.0, 7.0, 10.0, 15.0, 13.0, 15.0, 11.0, 13.0, 19.0, 27.0, 22.0, 32.0, 38.0, 26.0, 32.0, 28.0, 41.0, 27.0, 37.0, 38.0, 46.0, 49.0, 46.0, 37.0, 39.0, 33.0, 21.0, 31.0, 25.0, 15.0, 27.0, 17.0, 40.0, 22.0, 21.0, 14.0, 12.0, 6.0, 9.0, 7.0, 4.0, 5.0, 9.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.635883331298828e-05, -3.5315752029418945e-05, -3.427267074584961e-05, -3.3229589462280273e-05, -3.218650817871094e-05, -3.11434268951416e-05, -3.0100345611572266e-05, -2.905726432800293e-05, -2.8014183044433594e-05, -2.6971101760864258e-05, -2.5928020477294922e-05, -2.4884939193725586e-05, -2.384185791015625e-05, -2.2798776626586914e-05, -2.1755695343017578e-05, -2.0712614059448242e-05, -1.9669532775878906e-05, -1.862645149230957e-05, -1.7583370208740234e-05, -1.65402889251709e-05, -1.5497207641601562e-05, -1.4454126358032227e-05, -1.341104507446289e-05, -1.2367963790893555e-05, -1.1324882507324219e-05, -1.0281801223754883e-05, -9.238719940185547e-06, -8.195638656616211e-06, -7.152557373046875e-06, -6.109476089477539e-06, -5.066394805908203e-06, -4.023313522338867e-06, -2.9802322387695312e-06, -1.9371509552001953e-06, -8.940696716308594e-07, 1.4901161193847656e-07, 1.1920928955078125e-06, 2.2351741790771484e-06, 3.2782554626464844e-06, 4.32133674621582e-06, 5.364418029785156e-06, 6.407499313354492e-06, 7.450580596923828e-06, 8.493661880493164e-06, 9.5367431640625e-06, 1.0579824447631836e-05, 1.1622905731201172e-05, 1.2665987014770508e-05, 1.3709068298339844e-05, 1.475214958190918e-05, 1.5795230865478516e-05, 1.683831214904785e-05, 1.7881393432617188e-05, 1.8924474716186523e-05, 1.996755599975586e-05, 2.1010637283325195e-05, 2.205371856689453e-05, 2.3096799850463867e-05, 2.4139881134033203e-05, 2.518296241760254e-05, 2.6226043701171875e-05, 2.726912498474121e-05, 2.8312206268310547e-05, 2.9355287551879883e-05, 3.039836883544922e-05]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 5.0, 1.0, 5.0, 6.0, 10.0, 12.0, 11.0, 15.0, 21.0, 19.0, 23.0, 24.0, 20.0, 34.0, 44.0, 35.0, 41.0, 42.0, 37.0, 47.0, 54.0, 51.0, 45.0, 46.0, 49.0, 37.0, 43.0, 34.0, 22.0, 31.0, 25.0, 18.0, 29.0, 10.0, 11.0, 8.0, 13.0, 3.0, 5.0, 1.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5546875, -1.499847412109375, -1.44500732421875, -1.390167236328125, -1.3353271484375, -1.280487060546875, -1.22564697265625, -1.170806884765625, -1.115966796875, -1.061126708984375, -1.00628662109375, -0.951446533203125, -0.8966064453125, -0.841766357421875, -0.78692626953125, -0.732086181640625, -0.67724609375, -0.622406005859375, -0.56756591796875, -0.512725830078125, -0.4578857421875, -0.403045654296875, -0.34820556640625, -0.293365478515625, -0.238525390625, -0.183685302734375, -0.12884521484375, -0.074005126953125, -0.0191650390625, 0.035675048828125, 0.09051513671875, 0.145355224609375, 0.2001953125, 0.255035400390625, 0.30987548828125, 0.364715576171875, 0.4195556640625, 0.474395751953125, 0.52923583984375, 0.584075927734375, 0.638916015625, 0.693756103515625, 0.74859619140625, 0.803436279296875, 0.8582763671875, 0.913116455078125, 0.96795654296875, 1.022796630859375, 1.07763671875, 1.132476806640625, 1.18731689453125, 1.242156982421875, 1.2969970703125, 1.351837158203125, 1.40667724609375, 1.461517333984375, 1.516357421875, 1.571197509765625, 1.62603759765625, 1.680877685546875, 1.7357177734375, 1.790557861328125, 1.84539794921875, 1.900238037109375, 1.955078125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 5.0, 5.0, 5.0, 13.0, 17.0, 24.0, 24.0, 36.0, 54.0, 65.0, 93.0, 108.0, 167.0, 204.0, 284.0, 385.0, 512.0, 709.0, 1041.0, 1343.0, 1881.0, 2874.0, 4679.0, 8767.0, 20892.0, 101709.0, 672134.0, 176356.0, 27795.0, 10147.0, 5401.0, 3226.0, 2145.0, 1514.0, 1046.0, 707.0, 560.0, 471.0, 280.0, 213.0, 179.0, 129.0, 92.0, 70.0, 59.0, 44.0, 22.0, 19.0, 17.0, 15.0, 9.0, 7.0, 4.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.87109375, -6.63909912109375, -6.4071044921875, -6.17510986328125, -5.943115234375, -5.71112060546875, -5.4791259765625, -5.24713134765625, -5.01513671875, -4.78314208984375, -4.5511474609375, -4.31915283203125, -4.087158203125, -3.85516357421875, -3.6231689453125, -3.39117431640625, -3.1591796875, -2.92718505859375, -2.6951904296875, -2.46319580078125, -2.231201171875, -1.99920654296875, -1.7672119140625, -1.53521728515625, -1.30322265625, -1.07122802734375, -0.8392333984375, -0.60723876953125, -0.375244140625, -0.14324951171875, 0.0887451171875, 0.32073974609375, 0.552734375, 0.78472900390625, 1.0167236328125, 1.24871826171875, 1.480712890625, 1.71270751953125, 1.9447021484375, 2.17669677734375, 2.40869140625, 2.64068603515625, 2.8726806640625, 3.10467529296875, 3.336669921875, 3.56866455078125, 3.8006591796875, 4.03265380859375, 4.2646484375, 4.49664306640625, 4.7286376953125, 4.96063232421875, 5.192626953125, 5.42462158203125, 5.6566162109375, 5.88861083984375, 6.12060546875, 6.35260009765625, 6.5845947265625, 6.81658935546875, 7.048583984375, 7.28057861328125, 7.5125732421875, 7.74456787109375, 7.9765625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 7.0, 10.0, 15.0, 14.0, 17.0, 11.0, 15.0, 21.0, 25.0, 22.0, 30.0, 28.0, 40.0, 37.0, 41.0, 65.0, 113.0, 190.0, 276.0, 1370.0, 167.0, 92.0, 65.0, 62.0, 34.0, 34.0, 28.0, 26.0, 36.0, 17.0, 21.0, 20.0, 18.0, 10.0, 10.0, 10.0, 6.0, 9.0, 9.0, 3.0, 5.0, 2.0, 3.0, 4.0, 4.0, 0.0, 3.0, 2.0], "bins": [-5.6953125, -5.5328369140625, -5.370361328125, -5.2078857421875, -5.04541015625, -4.8829345703125, -4.720458984375, -4.5579833984375, -4.3955078125, -4.2330322265625, -4.070556640625, -3.9080810546875, -3.74560546875, -3.5831298828125, -3.420654296875, -3.2581787109375, -3.095703125, -2.9332275390625, -2.770751953125, -2.6082763671875, -2.44580078125, -2.2833251953125, -2.120849609375, -1.9583740234375, -1.7958984375, -1.6334228515625, -1.470947265625, -1.3084716796875, -1.14599609375, -0.9835205078125, -0.821044921875, -0.6585693359375, -0.49609375, -0.3336181640625, -0.171142578125, -0.0086669921875, 0.15380859375, 0.3162841796875, 0.478759765625, 0.6412353515625, 0.8037109375, 0.9661865234375, 1.128662109375, 1.2911376953125, 1.45361328125, 1.6160888671875, 1.778564453125, 1.9410400390625, 2.103515625, 2.2659912109375, 2.428466796875, 2.5909423828125, 2.75341796875, 2.9158935546875, 3.078369140625, 3.2408447265625, 3.4033203125, 3.5657958984375, 3.728271484375, 3.8907470703125, 4.05322265625, 4.2156982421875, 4.378173828125, 4.5406494140625, 4.703125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 10.0, 4.0, 6.0, 9.0, 8.0, 11.0, 9.0, 13.0, 16.0, 12.0, 25.0, 14.0, 27.0, 35.0, 35.0, 73.0, 102.0, 154.0, 274.0, 631.0, 2175.0, 68979.0, 3052408.0, 18001.0, 1447.0, 482.0, 242.0, 125.0, 69.0, 54.0, 35.0, 27.0, 39.0, 29.0, 21.0, 11.0, 14.0, 19.0, 11.0, 11.0, 9.0, 6.0, 4.0, 6.0, 1.0, 3.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-17.640625, -17.0400390625, -16.439453125, -15.8388671875, -15.23828125, -14.6376953125, -14.037109375, -13.4365234375, -12.8359375, -12.2353515625, -11.634765625, -11.0341796875, -10.43359375, -9.8330078125, -9.232421875, -8.6318359375, -8.03125, -7.4306640625, -6.830078125, -6.2294921875, -5.62890625, -5.0283203125, -4.427734375, -3.8271484375, -3.2265625, -2.6259765625, -2.025390625, -1.4248046875, -0.82421875, -0.2236328125, 0.376953125, 0.9775390625, 1.578125, 2.1787109375, 2.779296875, 3.3798828125, 3.98046875, 4.5810546875, 5.181640625, 5.7822265625, 6.3828125, 6.9833984375, 7.583984375, 8.1845703125, 8.78515625, 9.3857421875, 9.986328125, 10.5869140625, 11.1875, 11.7880859375, 12.388671875, 12.9892578125, 13.58984375, 14.1904296875, 14.791015625, 15.3916015625, 15.9921875, 16.5927734375, 17.193359375, 17.7939453125, 18.39453125, 18.9951171875, 19.595703125, 20.1962890625, 20.796875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 11.0, 169.0, 657.0, 167.0, 10.0, 0.0, 1.0], "bins": [-82.16666412353516, -80.78565216064453, -79.4046401977539, -78.02362823486328, -76.64261627197266, -75.26160430908203, -73.8805923461914, -72.49958038330078, -71.11856842041016, -69.73755645751953, -68.3565444946289, -66.97553253173828, -65.59452056884766, -64.21350860595703, -62.832496643066406, -61.45148468017578, -60.070472717285156, -58.68946075439453, -57.308448791503906, -55.92743682861328, -54.546424865722656, -53.16541290283203, -51.784400939941406, -50.40338897705078, -49.02237319946289, -47.641361236572266, -46.26034927368164, -44.879337310791016, -43.49832534790039, -42.117313385009766, -40.73630142211914, -39.355289459228516, -37.97427749633789, -36.593265533447266, -35.21225357055664, -33.831241607666016, -32.45022964477539, -31.069217681884766, -29.68820571899414, -28.307193756103516, -26.92618179321289, -25.545169830322266, -24.16415786743164, -22.783145904541016, -21.40213394165039, -20.021121978759766, -18.64011001586914, -17.259098052978516, -15.878084182739258, -14.497072219848633, -13.116060256958008, -11.735048294067383, -10.354036331176758, -8.973024368286133, -7.592011451721191, -6.210999488830566, -4.829987525939941, -3.4489755630493164, -2.0679633617401123, -0.6869511604309082, 0.6940608024597168, 2.075072765350342, 3.456085205078125, 4.83709716796875, 6.218109130859375]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 4.0, 6.0, 7.0, 9.0, 15.0, 6.0, 6.0, 16.0, 17.0, 16.0, 19.0, 15.0, 27.0, 13.0, 28.0, 30.0, 31.0, 27.0, 36.0, 43.0, 42.0, 28.0, 49.0, 37.0, 41.0, 37.0, 34.0, 43.0, 29.0, 33.0, 37.0, 25.0, 17.0, 39.0, 14.0, 22.0, 25.0, 12.0, 9.0, 16.0, 12.0, 7.0, 6.0, 2.0, 1.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-16.75569725036621, -16.251174926757812, -15.746650695800781, -15.242127418518066, -14.737604141235352, -14.233081817626953, -13.728558540344238, -13.224035263061523, -12.719511985778809, -12.214988708496094, -11.710465431213379, -11.205942153930664, -10.701419830322266, -10.196895599365234, -9.692373275756836, -9.187849998474121, -8.683326721191406, -8.178803443908691, -7.674280166625977, -7.16975736618042, -6.665234088897705, -6.16071081161499, -5.656188011169434, -5.151664733886719, -4.647141456604004, -4.142618179321289, -3.6380951404571533, -3.1335721015930176, -2.6290488243103027, -2.124525547027588, -1.6200025081634521, -1.1154794692993164, -0.6109542846679688, -0.10643112659454346, 0.39809203147888184, 0.9026151895523071, 1.4071383476257324, 1.9116616249084473, 2.416184663772583, 2.9207077026367188, 3.4252309799194336, 3.9297542572021484, 4.434277534484863, 4.93880033493042, 5.443323612213135, 5.94784688949585, 6.452369689941406, 6.956892967224121, 7.461416244506836, 7.965939521789551, 8.470462799072266, 8.97498607635498, 9.479509353637695, 9.984031677246094, 10.488554954528809, 10.993078231811523, 11.497601509094238, 12.002124786376953, 12.506648063659668, 13.011171340942383, 13.515693664550781, 14.020217895507812, 14.524740219116211, 15.029263496398926, 15.53378677368164]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 3.0, 10.0, 7.0, 5.0, 11.0, 10.0, 13.0, 19.0, 15.0, 20.0, 27.0, 26.0, 27.0, 31.0, 43.0, 43.0, 26.0, 47.0, 43.0, 47.0, 55.0, 53.0, 44.0, 42.0, 42.0, 45.0, 35.0, 33.0, 28.0, 30.0, 23.0, 17.0, 20.0, 12.0, 18.0, 6.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.74609375, -1.685760498046875, -1.62542724609375, -1.565093994140625, -1.5047607421875, -1.444427490234375, -1.38409423828125, -1.323760986328125, -1.263427734375, -1.203094482421875, -1.14276123046875, -1.082427978515625, -1.0220947265625, -0.961761474609375, -0.90142822265625, -0.841094970703125, -0.78076171875, -0.720428466796875, -0.66009521484375, -0.599761962890625, -0.5394287109375, -0.479095458984375, -0.41876220703125, -0.358428955078125, -0.298095703125, -0.237762451171875, -0.17742919921875, -0.117095947265625, -0.0567626953125, 0.003570556640625, 0.06390380859375, 0.124237060546875, 0.1845703125, 0.244903564453125, 0.30523681640625, 0.365570068359375, 0.4259033203125, 0.486236572265625, 0.54656982421875, 0.606903076171875, 0.667236328125, 0.727569580078125, 0.78790283203125, 0.848236083984375, 0.9085693359375, 0.968902587890625, 1.02923583984375, 1.089569091796875, 1.14990234375, 1.210235595703125, 1.27056884765625, 1.330902099609375, 1.3912353515625, 1.451568603515625, 1.51190185546875, 1.572235107421875, 1.632568359375, 1.692901611328125, 1.75323486328125, 1.813568115234375, 1.8739013671875, 1.934234619140625, 1.99456787109375, 2.054901123046875, 2.115234375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 7.0, 11.0, 6.0, 7.0, 15.0, 17.0, 22.0, 29.0, 47.0, 58.0, 89.0, 111.0, 138.0, 217.0, 327.0, 539.0, 925.0, 1530.0, 2854.0, 5924.0, 13750.0, 42170.0, 237811.0, 2545061.0, 1187643.0, 109444.0, 26385.0, 9608.0, 4283.0, 2172.0, 1148.0, 651.0, 391.0, 261.0, 177.0, 108.0, 92.0, 71.0, 41.0, 37.0, 29.0, 15.0, 13.0, 14.0, 6.0, 6.0, 3.0, 6.0, 1.0, 8.0, 2.0, 2.0, 2.0, 1.0], "bins": [-7.64453125, -7.41839599609375, -7.1922607421875, -6.96612548828125, -6.739990234375, -6.51385498046875, -6.2877197265625, -6.06158447265625, -5.83544921875, -5.60931396484375, -5.3831787109375, -5.15704345703125, -4.930908203125, -4.70477294921875, -4.4786376953125, -4.25250244140625, -4.0263671875, -3.80023193359375, -3.5740966796875, -3.34796142578125, -3.121826171875, -2.89569091796875, -2.6695556640625, -2.44342041015625, -2.21728515625, -1.99114990234375, -1.7650146484375, -1.53887939453125, -1.312744140625, -1.08660888671875, -0.8604736328125, -0.63433837890625, -0.408203125, -0.18206787109375, 0.0440673828125, 0.27020263671875, 0.496337890625, 0.72247314453125, 0.9486083984375, 1.17474365234375, 1.40087890625, 1.62701416015625, 1.8531494140625, 2.07928466796875, 2.305419921875, 2.53155517578125, 2.7576904296875, 2.98382568359375, 3.2099609375, 3.43609619140625, 3.6622314453125, 3.88836669921875, 4.114501953125, 4.34063720703125, 4.5667724609375, 4.79290771484375, 5.01904296875, 5.24517822265625, 5.4713134765625, 5.69744873046875, 5.923583984375, 6.14971923828125, 6.3758544921875, 6.60198974609375, 6.828125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 12.0, 11.0, 19.0, 43.0, 66.0, 92.0, 180.0, 266.0, 498.0, 779.0, 794.0, 508.0, 348.0, 197.0, 102.0, 69.0, 43.0, 18.0, 15.0, 10.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.890625, -6.5302734375, -6.169921875, -5.8095703125, -5.44921875, -5.0888671875, -4.728515625, -4.3681640625, -4.0078125, -3.6474609375, -3.287109375, -2.9267578125, -2.56640625, -2.2060546875, -1.845703125, -1.4853515625, -1.125, -0.7646484375, -0.404296875, -0.0439453125, 0.31640625, 0.6767578125, 1.037109375, 1.3974609375, 1.7578125, 2.1181640625, 2.478515625, 2.8388671875, 3.19921875, 3.5595703125, 3.919921875, 4.2802734375, 4.640625, 5.0009765625, 5.361328125, 5.7216796875, 6.08203125, 6.4423828125, 6.802734375, 7.1630859375, 7.5234375, 7.8837890625, 8.244140625, 8.6044921875, 8.96484375, 9.3251953125, 9.685546875, 10.0458984375, 10.40625, 10.7666015625, 11.126953125, 11.4873046875, 11.84765625, 12.2080078125, 12.568359375, 12.9287109375, 13.2890625, 13.6494140625, 14.009765625, 14.3701171875, 14.73046875, 15.0908203125, 15.451171875, 15.8115234375, 16.171875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 10.0, 7.0, 15.0, 28.0, 41.0, 72.0, 140.0, 280.0, 878.0, 13716.0, 4160214.0, 17197.0, 1008.0, 329.0, 131.0, 75.0, 54.0, 36.0, 13.0, 17.0, 8.0, 4.0, 5.0, 3.0, 0.0, 3.0], "bins": [-70.9375, -69.475341796875, -68.01318359375, -66.551025390625, -65.0888671875, -63.626708984375, -62.16455078125, -60.702392578125, -59.240234375, -57.778076171875, -56.31591796875, -54.853759765625, -53.3916015625, -51.929443359375, -50.46728515625, -49.005126953125, -47.54296875, -46.080810546875, -44.61865234375, -43.156494140625, -41.6943359375, -40.232177734375, -38.77001953125, -37.307861328125, -35.845703125, -34.383544921875, -32.92138671875, -31.459228515625, -29.9970703125, -28.534912109375, -27.07275390625, -25.610595703125, -24.1484375, -22.686279296875, -21.22412109375, -19.761962890625, -18.2998046875, -16.837646484375, -15.37548828125, -13.913330078125, -12.451171875, -10.989013671875, -9.52685546875, -8.064697265625, -6.6025390625, -5.140380859375, -3.67822265625, -2.216064453125, -0.75390625, 0.708251953125, 2.17041015625, 3.632568359375, 5.0947265625, 6.556884765625, 8.01904296875, 9.481201171875, 10.943359375, 12.405517578125, 13.86767578125, 15.329833984375, 16.7919921875, 18.254150390625, 19.71630859375, 21.178466796875, 22.640625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 31.0, 631.0, 349.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-173.17491149902344, -168.1968994140625, -163.2188720703125, -158.24085998535156, -153.26283264160156, -148.28482055664062, -143.30679321289062, -138.3287811279297, -133.35076904296875, -128.3727569580078, -123.39472961425781, -118.41670989990234, -113.43869018554688, -108.46067810058594, -103.48265838623047, -98.504638671875, -93.526611328125, -88.54859161376953, -83.57057189941406, -78.5925521850586, -73.61453247070312, -68.63652038574219, -63.65850067138672, -58.68048095703125, -53.70246124267578, -48.72444152832031, -43.746421813964844, -38.76840591430664, -33.79038619995117, -28.812366485595703, -23.834348678588867, -18.85633087158203, -13.878326416015625, -8.900307655334473, -3.9222888946533203, 1.055729866027832, 6.033748626708984, 11.011768341064453, 15.989786148071289, 20.967803955078125, 25.945823669433594, 30.923843383789062, 35.90186309814453, 40.879878997802734, 45.8578987121582, 50.83591842651367, 55.813934326171875, 60.791954040527344, 65.76997375488281, 70.74799346923828, 75.72601318359375, 80.70403289794922, 85.68205261230469, 90.66006469726562, 95.6380844116211, 100.61610412597656, 105.59412384033203, 110.5721435546875, 115.55016326904297, 120.52818298339844, 125.50619506835938, 130.48422241210938, 135.4622344970703, 140.44024658203125, 145.41827392578125]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 9.0, 8.0, 18.0, 6.0, 15.0, 17.0, 21.0, 25.0, 26.0, 25.0, 29.0, 31.0, 34.0, 49.0, 41.0, 52.0, 48.0, 38.0, 49.0, 35.0, 62.0, 38.0, 27.0, 33.0, 36.0, 33.0, 33.0, 26.0, 22.0, 18.0, 15.0, 11.0, 10.0, 9.0, 12.0, 7.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-29.26920509338379, -28.47728157043457, -27.68535804748535, -26.893434524536133, -26.101511001586914, -25.309587478637695, -24.517663955688477, -23.725740432739258, -22.93381690979004, -22.14189338684082, -21.3499698638916, -20.558046340942383, -19.766122817993164, -18.974199295043945, -18.182275772094727, -17.390352249145508, -16.59842872619629, -15.80650520324707, -15.014581680297852, -14.222658157348633, -13.430734634399414, -12.638811111450195, -11.846887588500977, -11.054964065551758, -10.263040542602539, -9.47111701965332, -8.679193496704102, -7.887269973754883, -7.095346450805664, -6.303422927856445, -5.511499404907227, -4.719575881958008, -3.927654266357422, -3.135730743408203, -2.3438072204589844, -1.5518836975097656, -0.7599601745605469, 0.031963348388671875, 0.8238868713378906, 1.6158103942871094, 2.407733917236328, 3.199657440185547, 3.9915809631347656, 4.783504486083984, 5.575428009033203, 6.367351531982422, 7.159275054931641, 7.951198577880859, 8.743122100830078, 9.535045623779297, 10.326969146728516, 11.118892669677734, 11.910816192626953, 12.702739715576172, 13.49466323852539, 14.28658676147461, 15.078510284423828, 15.870433807373047, 16.662357330322266, 17.454280853271484, 18.246204376220703, 19.038127899169922, 19.83005142211914, 20.62197494506836, 21.413898468017578]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 3.0, 3.0, 1.0, 10.0, 11.0, 6.0, 7.0, 12.0, 12.0, 18.0, 21.0, 14.0, 22.0, 30.0, 26.0, 29.0, 29.0, 33.0, 28.0, 35.0, 37.0, 43.0, 40.0, 61.0, 50.0, 41.0, 46.0, 40.0, 44.0, 38.0, 29.0, 33.0, 25.0, 20.0, 21.0, 11.0, 20.0, 17.0, 11.0, 5.0, 6.0, 2.0, 3.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0, -1.9409942626953125, -1.881988525390625, -1.8229827880859375, -1.76397705078125, -1.7049713134765625, -1.645965576171875, -1.5869598388671875, -1.5279541015625, -1.4689483642578125, -1.409942626953125, -1.3509368896484375, -1.29193115234375, -1.2329254150390625, -1.173919677734375, -1.1149139404296875, -1.055908203125, -0.9969024658203125, -0.937896728515625, -0.8788909912109375, -0.81988525390625, -0.7608795166015625, -0.701873779296875, -0.6428680419921875, -0.5838623046875, -0.5248565673828125, -0.465850830078125, -0.4068450927734375, -0.34783935546875, -0.2888336181640625, -0.229827880859375, -0.1708221435546875, -0.11181640625, -0.0528106689453125, 0.006195068359375, 0.0652008056640625, 0.12420654296875, 0.1832122802734375, 0.242218017578125, 0.3012237548828125, 0.3602294921875, 0.4192352294921875, 0.478240966796875, 0.5372467041015625, 0.59625244140625, 0.6552581787109375, 0.714263916015625, 0.7732696533203125, 0.832275390625, 0.8912811279296875, 0.950286865234375, 1.0092926025390625, 1.06829833984375, 1.1273040771484375, 1.186309814453125, 1.2453155517578125, 1.3043212890625, 1.3633270263671875, 1.422332763671875, 1.4813385009765625, 1.54034423828125, 1.5993499755859375, 1.658355712890625, 1.7173614501953125, 1.7763671875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 9.0, 12.0, 31.0, 28.0, 43.0, 74.0, 102.0, 127.0, 212.0, 341.0, 445.0, 710.0, 988.0, 1548.0, 2371.0, 3366.0, 5271.0, 8430.0, 13109.0, 21275.0, 35288.0, 59312.0, 105862.0, 240259.0, 273999.0, 113601.0, 62751.0, 37111.0, 22422.0, 13931.0, 8684.0, 5610.0, 3744.0, 2474.0, 1596.0, 1085.0, 741.0, 505.0, 351.0, 235.0, 169.0, 103.0, 75.0, 50.0, 41.0, 27.0, 13.0, 9.0, 7.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.329833984375, -0.3192138671875, -0.30859375, -0.2979736328125, -0.287353515625, -0.2767333984375, -0.26611328125, -0.2554931640625, -0.244873046875, -0.2342529296875, -0.2236328125, -0.2130126953125, -0.202392578125, -0.1917724609375, -0.18115234375, -0.1705322265625, -0.159912109375, -0.1492919921875, -0.138671875, -0.1280517578125, -0.117431640625, -0.1068115234375, -0.09619140625, -0.0855712890625, -0.074951171875, -0.0643310546875, -0.0537109375, -0.0430908203125, -0.032470703125, -0.0218505859375, -0.01123046875, -0.0006103515625, 0.010009765625, 0.0206298828125, 0.03125, 0.0418701171875, 0.052490234375, 0.0631103515625, 0.07373046875, 0.0843505859375, 0.094970703125, 0.1055908203125, 0.1162109375, 0.1268310546875, 0.137451171875, 0.1480712890625, 0.15869140625, 0.1693115234375, 0.179931640625, 0.1905517578125, 0.201171875, 0.2117919921875, 0.222412109375, 0.2330322265625, 0.24365234375, 0.2542724609375, 0.264892578125, 0.2755126953125, 0.2861328125, 0.2967529296875, 0.307373046875, 0.3179931640625, 0.32861328125, 0.3392333984375, 0.349853515625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 1.0, 4.0, 3.0, 4.0, 12.0, 10.0, 9.0, 16.0, 19.0, 20.0, 22.0, 12.0, 14.0, 16.0, 25.0, 29.0, 25.0, 31.0, 30.0, 32.0, 24.0, 40.0, 38.0, 34.0, 1064.0, 31.0, 37.0, 37.0, 46.0, 37.0, 29.0, 34.0, 24.0, 25.0, 28.0, 22.0, 22.0, 18.0, 21.0, 10.0, 16.0, 9.0, 8.0, 8.0, 9.0, 7.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.0498046875, -1.0162506103515625, -0.982696533203125, -0.9491424560546875, -0.91558837890625, -0.8820343017578125, -0.848480224609375, -0.8149261474609375, -0.7813720703125, -0.7478179931640625, -0.714263916015625, -0.6807098388671875, -0.64715576171875, -0.6136016845703125, -0.580047607421875, -0.5464935302734375, -0.512939453125, -0.4793853759765625, -0.445831298828125, -0.4122772216796875, -0.37872314453125, -0.3451690673828125, -0.311614990234375, -0.2780609130859375, -0.2445068359375, -0.2109527587890625, -0.177398681640625, -0.1438446044921875, -0.11029052734375, -0.0767364501953125, -0.043182373046875, -0.0096282958984375, 0.02392578125, 0.0574798583984375, 0.091033935546875, 0.1245880126953125, 0.15814208984375, 0.1916961669921875, 0.225250244140625, 0.2588043212890625, 0.2923583984375, 0.3259124755859375, 0.359466552734375, 0.3930206298828125, 0.42657470703125, 0.4601287841796875, 0.493682861328125, 0.5272369384765625, 0.560791015625, 0.5943450927734375, 0.627899169921875, 0.6614532470703125, 0.69500732421875, 0.7285614013671875, 0.762115478515625, 0.7956695556640625, 0.8292236328125, 0.8627777099609375, 0.896331787109375, 0.9298858642578125, 0.96343994140625, 0.9969940185546875, 1.030548095703125, 1.0641021728515625, 1.09765625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 3.0, 8.0, 12.0, 21.0, 39.0, 57.0, 64.0, 90.0, 132.0, 174.0, 280.0, 414.0, 514.0, 696.0, 1026.0, 1412.0, 1910.0, 2671.0, 3779.0, 5171.0, 7078.0, 9874.0, 13753.0, 19038.0, 26981.0, 39583.0, 60424.0, 98990.0, 186081.0, 1275836.0, 119936.0, 69929.0, 45029.0, 30523.0, 21165.0, 15086.0, 10726.0, 7912.0, 5685.0, 4233.0, 3059.0, 2216.0, 1686.0, 1137.0, 793.0, 578.0, 401.0, 275.0, 209.0, 136.0, 111.0, 72.0, 56.0, 25.0, 25.0, 11.0, 7.0, 3.0, 3.0, 2.0, 3.0], "bins": [-0.2374267578125, -0.23004531860351562, -0.22266387939453125, -0.21528244018554688, -0.2079010009765625, -0.20051956176757812, -0.19313812255859375, -0.18575668334960938, -0.178375244140625, -0.17099380493164062, -0.16361236572265625, -0.15623092651367188, -0.1488494873046875, -0.14146804809570312, -0.13408660888671875, -0.12670516967773438, -0.11932373046875, -0.11194229125976562, -0.10456085205078125, -0.09717941284179688, -0.0897979736328125, -0.08241653442382812, -0.07503509521484375, -0.06765365600585938, -0.060272216796875, -0.052890777587890625, -0.04550933837890625, -0.038127899169921875, -0.0307464599609375, -0.023365020751953125, -0.01598358154296875, -0.008602142333984375, -0.001220703125, 0.006160736083984375, 0.01354217529296875, 0.020923614501953125, 0.0283050537109375, 0.035686492919921875, 0.04306793212890625, 0.050449371337890625, 0.057830810546875, 0.06521224975585938, 0.07259368896484375, 0.07997512817382812, 0.0873565673828125, 0.09473800659179688, 0.10211944580078125, 0.10950088500976562, 0.11688232421875, 0.12426376342773438, 0.13164520263671875, 0.13902664184570312, 0.1464080810546875, 0.15378952026367188, 0.16117095947265625, 0.16855239868164062, 0.175933837890625, 0.18331527709960938, 0.19069671630859375, 0.19807815551757812, 0.2054595947265625, 0.21284103393554688, 0.22022247314453125, 0.22760391235351562, 0.2349853515625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 1.0, 3.0, 8.0, 9.0, 10.0, 12.0, 20.0, 21.0, 29.0, 40.0, 47.0, 52.0, 59.0, 66.0, 65.0, 81.0, 82.0, 66.0, 49.0, 49.0, 51.0, 39.0, 33.0, 24.0, 18.0, 14.0, 9.0, 6.0, 5.0, 2.0, 5.0, 7.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.578466415405273e-05, -9.315088391304016e-05, -9.051710367202759e-05, -8.788332343101501e-05, -8.524954319000244e-05, -8.261576294898987e-05, -7.99819827079773e-05, -7.734820246696472e-05, -7.471442222595215e-05, -7.208064198493958e-05, -6.9446861743927e-05, -6.681308150291443e-05, -6.417930126190186e-05, -6.154552102088928e-05, -5.891174077987671e-05, -5.6277960538864136e-05, -5.364418029785156e-05, -5.101040005683899e-05, -4.8376619815826416e-05, -4.574283957481384e-05, -4.310905933380127e-05, -4.0475279092788696e-05, -3.784149885177612e-05, -3.520771861076355e-05, -3.2573938369750977e-05, -2.9940158128738403e-05, -2.730637788772583e-05, -2.4672597646713257e-05, -2.2038817405700684e-05, -1.940503716468811e-05, -1.6771256923675537e-05, -1.4137476682662964e-05, -1.150369644165039e-05, -8.869916200637817e-06, -6.236135959625244e-06, -3.602355718612671e-06, -9.685754776000977e-07, 1.6652047634124756e-06, 4.298985004425049e-06, 6.932765245437622e-06, 9.566545486450195e-06, 1.2200325727462769e-05, 1.4834105968475342e-05, 1.7467886209487915e-05, 2.0101666450500488e-05, 2.273544669151306e-05, 2.5369226932525635e-05, 2.8003007173538208e-05, 3.063678741455078e-05, 3.3270567655563354e-05, 3.590434789657593e-05, 3.85381281375885e-05, 4.1171908378601074e-05, 4.380568861961365e-05, 4.643946886062622e-05, 4.9073249101638794e-05, 5.170702934265137e-05, 5.434080958366394e-05, 5.6974589824676514e-05, 5.960837006568909e-05, 6.224215030670166e-05, 6.487593054771423e-05, 6.75097107887268e-05, 7.014349102973938e-05, 7.277727127075195e-05]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 4.0, 7.0, 7.0, 7.0, 16.0, 15.0, 23.0, 29.0, 45.0, 60.0, 72.0, 123.0, 158.0, 264.0, 505.0, 1214.0, 978979.0, 64951.0, 910.0, 400.0, 219.0, 147.0, 98.0, 105.0, 57.0, 45.0, 23.0, 19.0, 11.0, 12.0, 8.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015001296997070312, -0.0014442652463912964, -0.0013884007930755615, -0.0013325363397598267, -0.0012766718864440918, -0.001220807433128357, -0.001164942979812622, -0.0011090785264968872, -0.0010532140731811523, -0.0009973496198654175, -0.0009414851665496826, -0.0008856207132339478, -0.0008297562599182129, -0.000773891806602478, -0.0007180273532867432, -0.0006621628999710083, -0.0006062984466552734, -0.0005504339933395386, -0.0004945695400238037, -0.00043870508670806885, -0.000382840633392334, -0.0003269761800765991, -0.00027111172676086426, -0.0002152472734451294, -0.00015938282012939453, -0.00010351836681365967, -4.7653913497924805e-05, 8.210539817810059e-06, 6.407499313354492e-05, 0.00011993944644927979, 0.00017580389976501465, 0.0002316683530807495, 0.0002875328063964844, 0.00034339725971221924, 0.0003992617130279541, 0.00045512616634368896, 0.0005109906196594238, 0.0005668550729751587, 0.0006227195262908936, 0.0006785839796066284, 0.0007344484329223633, 0.0007903128862380981, 0.000846177339553833, 0.0009020417928695679, 0.0009579062461853027, 0.0010137706995010376, 0.0010696351528167725, 0.0011254996061325073, 0.0011813640594482422, 0.001237228512763977, 0.001293092966079712, 0.0013489574193954468, 0.0014048218727111816, 0.0014606863260269165, 0.0015165507793426514, 0.0015724152326583862, 0.001628279685974121, 0.001684144139289856, 0.0017400085926055908, 0.0017958730459213257, 0.0018517374992370605, 0.0019076019525527954, 0.0019634664058685303, 0.002019330859184265, 0.0020751953125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 81.0, 663.0, 255.0, 11.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003224206157028675, -0.0003155171580146998, -0.0003086137003265321, -0.00030171024263836443, -0.00029480678495019674, -0.00028790332726202905, -0.00028099986957386136, -0.00027409641188569367, -0.000267192954197526, -0.0002602894965093583, -0.0002533860388211906, -0.0002464825811330229, -0.0002395791234448552, -0.00023267566575668752, -0.00022577220806851983, -0.00021886876493226737, -0.0002119653217960149, -0.00020506186410784721, -0.00019815840641967952, -0.00019125494873151183, -0.00018435149104334414, -0.00017744803335517645, -0.00017054457566700876, -0.0001636411325307563, -0.00015673766029067338, -0.00014983420260250568, -0.000142930744914338, -0.0001360272872261703, -0.0001291238295380026, -0.00012222037184983492, -0.00011531692143762484, -0.00010841347102541476, -0.00010151002061320469, -9.4606562925037e-05, -8.77031052368693e-05, -8.079965482465923e-05, -7.389619713649154e-05, -6.699273944832385e-05, -6.0089281760156155e-05, -5.318582770996727e-05, -4.628237002179958e-05, -3.937891233363189e-05, -3.2475458283443004e-05, -2.5572000595275313e-05, -1.8668544726097025e-05, -1.1765088856918737e-05, -4.861631168751046e-06, 2.041822881437838e-06, 8.94528056960553e-06, 1.5848736438783817e-05, 2.2752192307962105e-05, 2.9655649996129796e-05, 3.655910404631868e-05, 4.346256173448637e-05, 5.036601942265406e-05, 5.726947347284295e-05, 6.417292752303183e-05, 7.107638521119952e-05, 7.797984289936721e-05, 8.48833005875349e-05, 9.178675099974498e-05, 9.869020868791267e-05, 0.00010559366637608036, 0.00011249711678829044, 0.00011940058175241575]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 0.0, 6.0, 8.0, 2.0, 7.0, 9.0, 16.0, 10.0, 15.0, 16.0, 11.0, 14.0, 19.0, 29.0, 34.0, 32.0, 24.0, 38.0, 35.0, 39.0, 51.0, 50.0, 46.0, 49.0, 35.0, 37.0, 32.0, 35.0, 31.0, 43.0, 30.0, 37.0, 27.0, 11.0, 28.0, 22.0, 20.0, 11.0, 8.0, 7.0, 12.0, 3.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.62396240234375e-05, -3.496836870908737e-05, -3.3697113394737244e-05, -3.2425858080387115e-05, -3.115460276603699e-05, -2.988334745168686e-05, -2.861209213733673e-05, -2.7340836822986603e-05, -2.6069581508636475e-05, -2.4798326194286346e-05, -2.3527070879936218e-05, -2.225581556558609e-05, -2.0984560251235962e-05, -1.9713304936885834e-05, -1.8442049622535706e-05, -1.7170794308185577e-05, -1.589953899383545e-05, -1.4628283679485321e-05, -1.3357028365135193e-05, -1.2085773050785065e-05, -1.0814517736434937e-05, -9.543262422084808e-06, -8.27200710773468e-06, -7.000751793384552e-06, -5.729496479034424e-06, -4.458241164684296e-06, -3.1869858503341675e-06, -1.9157305359840393e-06, -6.444752216339111e-07, 6.26780092716217e-07, 1.8980354070663452e-06, 3.1692907214164734e-06, 4.4405460357666016e-06, 5.71180135011673e-06, 6.983056664466858e-06, 8.254311978816986e-06, 9.525567293167114e-06, 1.0796822607517242e-05, 1.206807792186737e-05, 1.3339333236217499e-05, 1.4610588550567627e-05, 1.5881843864917755e-05, 1.7153099179267883e-05, 1.842435449361801e-05, 1.969560980796814e-05, 2.0966865122318268e-05, 2.2238120436668396e-05, 2.3509375751018524e-05, 2.4780631065368652e-05, 2.605188637971878e-05, 2.732314169406891e-05, 2.8594397008419037e-05, 2.9865652322769165e-05, 3.113690763711929e-05, 3.240816295146942e-05, 3.367941826581955e-05, 3.495067358016968e-05, 3.6221928894519806e-05, 3.7493184208869934e-05, 3.876443952322006e-05, 4.003569483757019e-05, 4.130695015192032e-05, 4.257820546627045e-05, 4.3849460780620575e-05, 4.51207160949707e-05]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 3.0, 3.0, 1.0, 10.0, 11.0, 6.0, 7.0, 12.0, 12.0, 18.0, 21.0, 14.0, 22.0, 30.0, 26.0, 29.0, 29.0, 33.0, 28.0, 35.0, 37.0, 43.0, 40.0, 61.0, 50.0, 41.0, 46.0, 40.0, 44.0, 38.0, 29.0, 33.0, 25.0, 20.0, 21.0, 11.0, 20.0, 17.0, 11.0, 5.0, 6.0, 2.0, 3.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0, -1.9409942626953125, -1.881988525390625, -1.8229827880859375, -1.76397705078125, -1.7049713134765625, -1.645965576171875, -1.5869598388671875, -1.5279541015625, -1.4689483642578125, -1.409942626953125, -1.3509368896484375, -1.29193115234375, -1.2329254150390625, -1.173919677734375, -1.1149139404296875, -1.055908203125, -0.9969024658203125, -0.937896728515625, -0.8788909912109375, -0.81988525390625, -0.7608795166015625, -0.701873779296875, -0.6428680419921875, -0.5838623046875, -0.5248565673828125, -0.465850830078125, -0.4068450927734375, -0.34783935546875, -0.2888336181640625, -0.229827880859375, -0.1708221435546875, -0.11181640625, -0.0528106689453125, 0.006195068359375, 0.0652008056640625, 0.12420654296875, 0.1832122802734375, 0.242218017578125, 0.3012237548828125, 0.3602294921875, 0.4192352294921875, 0.478240966796875, 0.5372467041015625, 0.59625244140625, 0.6552581787109375, 0.714263916015625, 0.7732696533203125, 0.832275390625, 0.8912811279296875, 0.950286865234375, 1.0092926025390625, 1.06829833984375, 1.1273040771484375, 1.186309814453125, 1.2453155517578125, 1.3043212890625, 1.3633270263671875, 1.422332763671875, 1.4813385009765625, 1.54034423828125, 1.5993499755859375, 1.658355712890625, 1.7173614501953125, 1.7763671875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 3.0, 10.0, 8.0, 23.0, 24.0, 22.0, 36.0, 58.0, 81.0, 97.0, 151.0, 199.0, 298.0, 420.0, 718.0, 1287.0, 2288.0, 4678.0, 9991.0, 23459.0, 62141.0, 169298.0, 344182.0, 259544.0, 102242.0, 37395.0, 15451.0, 6761.0, 3280.0, 1712.0, 945.0, 562.0, 366.0, 226.0, 156.0, 124.0, 91.0, 62.0, 54.0, 28.0, 29.0, 13.0, 18.0, 11.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.37109375, -2.3028564453125, -2.234619140625, -2.1663818359375, -2.09814453125, -2.0299072265625, -1.961669921875, -1.8934326171875, -1.8251953125, -1.7569580078125, -1.688720703125, -1.6204833984375, -1.55224609375, -1.4840087890625, -1.415771484375, -1.3475341796875, -1.279296875, -1.2110595703125, -1.142822265625, -1.0745849609375, -1.00634765625, -0.9381103515625, -0.869873046875, -0.8016357421875, -0.7333984375, -0.6651611328125, -0.596923828125, -0.5286865234375, -0.46044921875, -0.3922119140625, -0.323974609375, -0.2557373046875, -0.1875, -0.1192626953125, -0.051025390625, 0.0172119140625, 0.08544921875, 0.1536865234375, 0.221923828125, 0.2901611328125, 0.3583984375, 0.4266357421875, 0.494873046875, 0.5631103515625, 0.63134765625, 0.6995849609375, 0.767822265625, 0.8360595703125, 0.904296875, 0.9725341796875, 1.040771484375, 1.1090087890625, 1.17724609375, 1.2454833984375, 1.313720703125, 1.3819580078125, 1.4501953125, 1.5184326171875, 1.586669921875, 1.6549072265625, 1.72314453125, 1.7913818359375, 1.859619140625, 1.9278564453125, 1.99609375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 6.0, 11.0, 5.0, 12.0, 12.0, 14.0, 15.0, 17.0, 21.0, 31.0, 44.0, 43.0, 36.0, 53.0, 64.0, 91.0, 164.0, 1512.0, 318.0, 136.0, 81.0, 49.0, 44.0, 34.0, 36.0, 36.0, 30.0, 26.0, 26.0, 18.0, 16.0, 6.0, 12.0, 9.0, 2.0, 1.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.390625, -7.1583251953125, -6.926025390625, -6.6937255859375, -6.46142578125, -6.2291259765625, -5.996826171875, -5.7645263671875, -5.5322265625, -5.2999267578125, -5.067626953125, -4.8353271484375, -4.60302734375, -4.3707275390625, -4.138427734375, -3.9061279296875, -3.673828125, -3.4415283203125, -3.209228515625, -2.9769287109375, -2.74462890625, -2.5123291015625, -2.280029296875, -2.0477294921875, -1.8154296875, -1.5831298828125, -1.350830078125, -1.1185302734375, -0.88623046875, -0.6539306640625, -0.421630859375, -0.1893310546875, 0.04296875, 0.2752685546875, 0.507568359375, 0.7398681640625, 0.97216796875, 1.2044677734375, 1.436767578125, 1.6690673828125, 1.9013671875, 2.1336669921875, 2.365966796875, 2.5982666015625, 2.83056640625, 3.0628662109375, 3.295166015625, 3.5274658203125, 3.759765625, 3.9920654296875, 4.224365234375, 4.4566650390625, 4.68896484375, 4.9212646484375, 5.153564453125, 5.3858642578125, 5.6181640625, 5.8504638671875, 6.082763671875, 6.3150634765625, 6.54736328125, 6.7796630859375, 7.011962890625, 7.2442626953125, 7.4765625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 2.0, 2.0, 5.0, 3.0, 9.0, 7.0, 11.0, 11.0, 24.0, 18.0, 28.0, 39.0, 47.0, 59.0, 66.0, 119.0, 197.0, 369.0, 1019.0, 5349.0, 451560.0, 2672278.0, 11843.0, 1452.0, 450.0, 239.0, 121.0, 89.0, 68.0, 43.0, 47.0, 25.0, 17.0, 18.0, 18.0, 10.0, 8.0, 10.0, 14.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-14.46875, -14.004150390625, -13.53955078125, -13.074951171875, -12.6103515625, -12.145751953125, -11.68115234375, -11.216552734375, -10.751953125, -10.287353515625, -9.82275390625, -9.358154296875, -8.8935546875, -8.428955078125, -7.96435546875, -7.499755859375, -7.03515625, -6.570556640625, -6.10595703125, -5.641357421875, -5.1767578125, -4.712158203125, -4.24755859375, -3.782958984375, -3.318359375, -2.853759765625, -2.38916015625, -1.924560546875, -1.4599609375, -0.995361328125, -0.53076171875, -0.066162109375, 0.3984375, 0.863037109375, 1.32763671875, 1.792236328125, 2.2568359375, 2.721435546875, 3.18603515625, 3.650634765625, 4.115234375, 4.579833984375, 5.04443359375, 5.509033203125, 5.9736328125, 6.438232421875, 6.90283203125, 7.367431640625, 7.83203125, 8.296630859375, 8.76123046875, 9.225830078125, 9.6904296875, 10.155029296875, 10.61962890625, 11.084228515625, 11.548828125, 12.013427734375, 12.47802734375, 12.942626953125, 13.4072265625, 13.871826171875, 14.33642578125, 14.801025390625, 15.265625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 31.0, 299.0, 569.0, 97.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-73.2428207397461, -71.9386215209961, -70.63442993164062, -69.33023071289062, -68.02603149414062, -66.72183227539062, -65.41764068603516, -64.11344146728516, -62.80924606323242, -61.50505065917969, -60.20085144042969, -58.89665603637695, -57.59245681762695, -56.28826141357422, -54.98406219482422, -53.679866790771484, -52.37567138671875, -51.071475982666016, -49.767276763916016, -48.46308135986328, -47.15888214111328, -45.85468673706055, -44.55049133300781, -43.24629211425781, -41.94209289550781, -40.63789749145508, -39.33369827270508, -38.029502868652344, -36.725303649902344, -35.42110824584961, -34.116912841796875, -32.812713623046875, -31.508520126342773, -30.204322814941406, -28.90012550354004, -27.595928192138672, -26.291732788085938, -24.98753547668457, -23.683338165283203, -22.37914276123047, -21.07494354248047, -19.7707462310791, -18.466548919677734, -17.162353515625, -15.858156204223633, -14.553958892822266, -13.249761581420898, -11.945565223693848, -10.641368865966797, -9.33717155456543, -8.032975196838379, -6.728777885437012, -5.424581050872803, -4.120384216308594, -2.8161869049072266, -1.5119905471801758, -0.2077932357788086, 1.09640371799469, 2.4006006717681885, 3.7047977447509766, 5.0089945793151855, 6.3131914138793945, 7.617388725280762, 8.921585083007812, 10.22578239440918]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 6.0, 6.0, 5.0, 12.0, 8.0, 7.0, 12.0, 11.0, 12.0, 24.0, 21.0, 28.0, 23.0, 25.0, 30.0, 37.0, 43.0, 45.0, 51.0, 58.0, 47.0, 40.0, 45.0, 37.0, 44.0, 32.0, 38.0, 36.0, 28.0, 32.0, 27.0, 21.0, 25.0, 13.0, 22.0, 13.0, 7.0, 7.0, 6.0, 5.0, 6.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.31951141357422, -22.629880905151367, -21.940250396728516, -21.250619888305664, -20.560989379882812, -19.871360778808594, -19.18172836303711, -18.49209976196289, -17.80246925354004, -17.112838745117188, -16.423208236694336, -15.733577728271484, -15.04394817352295, -14.354317665100098, -13.664687156677246, -12.975057601928711, -12.285426139831543, -11.595795631408691, -10.90616512298584, -10.216535568237305, -9.526905059814453, -8.837274551391602, -8.14764404296875, -7.458014011383057, -6.768383502960205, -6.0787529945373535, -5.38912296295166, -4.699492454528809, -4.009861946105957, -3.3202319145202637, -2.630601406097412, -1.9409713745117188, -1.2513408660888672, -0.56171053647995, 0.12791979312896729, 0.8175501823425293, 1.5071804523468018, 2.196810722351074, 2.886441230773926, 3.576071262359619, 4.265701770782471, 4.955332279205322, 5.644962310791016, 6.334592819213867, 7.024223327636719, 7.713853359222412, 8.403484344482422, 9.093113899230957, 9.782744407653809, 10.47237491607666, 11.162005424499512, 11.851634979248047, 12.541265487670898, 13.23089599609375, 13.920526504516602, 14.610157012939453, 15.299787521362305, 15.989418029785156, 16.679048538208008, 17.36867904663086, 18.05830955505371, 18.747940063476562, 19.43756866455078, 20.127199172973633, 20.816829681396484]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 9.0, 8.0, 9.0, 7.0, 12.0, 16.0, 14.0, 26.0, 23.0, 28.0, 23.0, 30.0, 30.0, 34.0, 31.0, 34.0, 42.0, 42.0, 49.0, 56.0, 55.0, 45.0, 66.0, 35.0, 29.0, 42.0, 39.0, 35.0, 24.0, 18.0, 18.0, 15.0, 9.0, 7.0, 13.0, 10.0, 5.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.30859375, -2.2423858642578125, -2.176177978515625, -2.1099700927734375, -2.04376220703125, -1.9775543212890625, -1.911346435546875, -1.8451385498046875, -1.7789306640625, -1.7127227783203125, -1.646514892578125, -1.5803070068359375, -1.51409912109375, -1.4478912353515625, -1.381683349609375, -1.3154754638671875, -1.249267578125, -1.1830596923828125, -1.116851806640625, -1.0506439208984375, -0.98443603515625, -0.9182281494140625, -0.852020263671875, -0.7858123779296875, -0.7196044921875, -0.6533966064453125, -0.587188720703125, -0.5209808349609375, -0.45477294921875, -0.3885650634765625, -0.322357177734375, -0.2561492919921875, -0.18994140625, -0.1237335205078125, -0.057525634765625, 0.0086822509765625, 0.07489013671875, 0.1410980224609375, 0.207305908203125, 0.2735137939453125, 0.3397216796875, 0.4059295654296875, 0.472137451171875, 0.5383453369140625, 0.60455322265625, 0.6707611083984375, 0.736968994140625, 0.8031768798828125, 0.869384765625, 0.9355926513671875, 1.001800537109375, 1.0680084228515625, 1.13421630859375, 1.2004241943359375, 1.266632080078125, 1.3328399658203125, 1.3990478515625, 1.4652557373046875, 1.531463623046875, 1.5976715087890625, 1.66387939453125, 1.7300872802734375, 1.796295166015625, 1.8625030517578125, 1.9287109375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 9.0, 12.0, 16.0, 19.0, 24.0, 18.0, 20.0, 38.0, 60.0, 86.0, 107.0, 178.0, 270.0, 542.0, 1348.0, 4361.0, 21695.0, 170462.0, 1976015.0, 1832545.0, 159411.0, 20266.0, 4177.0, 1245.0, 549.0, 256.0, 157.0, 106.0, 69.0, 44.0, 33.0, 27.0, 30.0, 21.0, 15.0, 7.0, 9.0, 8.0, 5.0, 5.0, 7.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-6.62109375, -6.43182373046875, -6.2425537109375, -6.05328369140625, -5.864013671875, -5.67474365234375, -5.4854736328125, -5.29620361328125, -5.10693359375, -4.91766357421875, -4.7283935546875, -4.53912353515625, -4.349853515625, -4.16058349609375, -3.9713134765625, -3.78204345703125, -3.5927734375, -3.40350341796875, -3.2142333984375, -3.02496337890625, -2.835693359375, -2.64642333984375, -2.4571533203125, -2.26788330078125, -2.07861328125, -1.88934326171875, -1.7000732421875, -1.51080322265625, -1.321533203125, -1.13226318359375, -0.9429931640625, -0.75372314453125, -0.564453125, -0.37518310546875, -0.1859130859375, 0.00335693359375, 0.192626953125, 0.38189697265625, 0.5711669921875, 0.76043701171875, 0.94970703125, 1.13897705078125, 1.3282470703125, 1.51751708984375, 1.706787109375, 1.89605712890625, 2.0853271484375, 2.27459716796875, 2.4638671875, 2.65313720703125, 2.8424072265625, 3.03167724609375, 3.220947265625, 3.41021728515625, 3.5994873046875, 3.78875732421875, 3.97802734375, 4.16729736328125, 4.3565673828125, 4.54583740234375, 4.735107421875, 4.92437744140625, 5.1136474609375, 5.30291748046875, 5.4921875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 14.0, 6.0, 14.0, 15.0, 22.0, 41.0, 48.0, 53.0, 80.0, 92.0, 138.0, 184.0, 221.0, 318.0, 404.0, 398.0, 419.0, 337.0, 286.0, 227.0, 174.0, 137.0, 118.0, 76.0, 69.0, 42.0, 35.0, 25.0, 19.0, 18.0, 5.0, 7.0, 8.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.33984375, -6.1593017578125, -5.978759765625, -5.7982177734375, -5.61767578125, -5.4371337890625, -5.256591796875, -5.0760498046875, -4.8955078125, -4.7149658203125, -4.534423828125, -4.3538818359375, -4.17333984375, -3.9927978515625, -3.812255859375, -3.6317138671875, -3.451171875, -3.2706298828125, -3.090087890625, -2.9095458984375, -2.72900390625, -2.5484619140625, -2.367919921875, -2.1873779296875, -2.0068359375, -1.8262939453125, -1.645751953125, -1.4652099609375, -1.28466796875, -1.1041259765625, -0.923583984375, -0.7430419921875, -0.5625, -0.3819580078125, -0.201416015625, -0.0208740234375, 0.15966796875, 0.3402099609375, 0.520751953125, 0.7012939453125, 0.8818359375, 1.0623779296875, 1.242919921875, 1.4234619140625, 1.60400390625, 1.7845458984375, 1.965087890625, 2.1456298828125, 2.326171875, 2.5067138671875, 2.687255859375, 2.8677978515625, 3.04833984375, 3.2288818359375, 3.409423828125, 3.5899658203125, 3.7705078125, 3.9510498046875, 4.131591796875, 4.3121337890625, 4.49267578125, 4.6732177734375, 4.853759765625, 5.0343017578125, 5.21484375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 15.0, 18.0, 34.0, 44.0, 87.0, 143.0, 261.0, 557.0, 2170.0, 62725.0, 3959119.0, 164549.0, 3235.0, 659.0, 286.0, 133.0, 91.0, 52.0, 35.0, 21.0, 14.0, 10.0, 8.0, 1.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.96875, -29.192138671875, -28.41552734375, -27.638916015625, -26.8623046875, -26.085693359375, -25.30908203125, -24.532470703125, -23.755859375, -22.979248046875, -22.20263671875, -21.426025390625, -20.6494140625, -19.872802734375, -19.09619140625, -18.319580078125, -17.54296875, -16.766357421875, -15.98974609375, -15.213134765625, -14.4365234375, -13.659912109375, -12.88330078125, -12.106689453125, -11.330078125, -10.553466796875, -9.77685546875, -9.000244140625, -8.2236328125, -7.447021484375, -6.67041015625, -5.893798828125, -5.1171875, -4.340576171875, -3.56396484375, -2.787353515625, -2.0107421875, -1.234130859375, -0.45751953125, 0.319091796875, 1.095703125, 1.872314453125, 2.64892578125, 3.425537109375, 4.2021484375, 4.978759765625, 5.75537109375, 6.531982421875, 7.30859375, 8.085205078125, 8.86181640625, 9.638427734375, 10.4150390625, 11.191650390625, 11.96826171875, 12.744873046875, 13.521484375, 14.298095703125, 15.07470703125, 15.851318359375, 16.6279296875, 17.404541015625, 18.18115234375, 18.957763671875, 19.734375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 90.0, 256.0, 334.0, 239.0, 68.0, 11.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.97063446044922, -34.863502502441406, -32.756370544433594, -30.64923858642578, -28.54210662841797, -26.434974670410156, -24.327842712402344, -22.22071075439453, -20.11357879638672, -18.006446838378906, -15.899314880371094, -13.792182922363281, -11.685050964355469, -9.577919006347656, -7.470787048339844, -5.363655090332031, -3.2565231323242188, -1.1493911743164062, 0.9577407836914062, 3.0648727416992188, 5.172004699707031, 7.279136657714844, 9.386268615722656, 11.493400573730469, 13.600532531738281, 15.707664489746094, 17.814796447753906, 19.92192840576172, 22.02906036376953, 24.136192321777344, 26.243324279785156, 28.35045623779297, 30.45758056640625, 32.56471252441406, 34.671844482421875, 36.77897644042969, 38.8861083984375, 40.99324035644531, 43.100372314453125, 45.20750427246094, 47.31463623046875, 49.42176818847656, 51.528900146484375, 53.63603210449219, 55.7431640625, 57.85029602050781, 59.957427978515625, 62.06455993652344, 64.17169189453125, 66.27882385253906, 68.38595581054688, 70.49308776855469, 72.6002197265625, 74.70735168457031, 76.81448364257812, 78.92161560058594, 81.02874755859375, 83.13587951660156, 85.24301147460938, 87.35014343261719, 89.457275390625, 91.56440734863281, 93.67153930664062, 95.77867126464844, 97.88580322265625]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 6.0, 7.0, 10.0, 7.0, 11.0, 19.0, 19.0, 25.0, 16.0, 22.0, 25.0, 37.0, 30.0, 48.0, 46.0, 39.0, 52.0, 45.0, 34.0, 49.0, 44.0, 41.0, 40.0, 44.0, 40.0, 29.0, 30.0, 23.0, 21.0, 13.0, 21.0, 14.0, 16.0, 13.0, 11.0, 10.0, 8.0, 7.0, 9.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.987842559814453, -19.301700592041016, -18.61556053161621, -17.929418563842773, -17.243276596069336, -16.5571346282959, -15.870994567871094, -15.184852600097656, -14.498710632324219, -13.812569618225098, -13.12642765045166, -12.440286636352539, -11.754144668579102, -11.06800365447998, -10.38186264038086, -9.695720672607422, -9.0095796585083, -8.32343864440918, -7.637296676635742, -6.951155662536621, -6.265013694763184, -5.5788726806640625, -4.892731189727783, -4.206589698791504, -3.5204482078552246, -2.8343067169189453, -2.148165225982666, -1.4620239734649658, -0.7758824825286865, -0.08974099159240723, 0.596400260925293, 1.2825417518615723, 1.9686832427978516, 2.654824733734131, 3.34096622467041, 4.027107238769531, 4.713249206542969, 5.39939022064209, 6.085531711578369, 6.771673202514648, 7.457814693450928, 8.143956184387207, 8.830097198486328, 9.516239166259766, 10.202380180358887, 10.888522148132324, 11.574663162231445, 12.260805130004883, 12.946946144104004, 13.633087158203125, 14.319229125976562, 15.005370140075684, 15.691512107849121, 16.377653121948242, 17.06379508972168, 17.749935150146484, 18.436077117919922, 19.12221908569336, 19.808359146118164, 20.4945011138916, 21.18064308166504, 21.866785049438477, 22.55292510986328, 23.23906707763672, 23.925209045410156]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 1.0, 9.0, 13.0, 7.0, 20.0, 17.0, 7.0, 14.0, 16.0, 15.0, 25.0, 23.0, 33.0, 23.0, 30.0, 30.0, 35.0, 36.0, 50.0, 45.0, 47.0, 53.0, 53.0, 40.0, 43.0, 28.0, 39.0, 37.0, 33.0, 29.0, 31.0, 26.0, 18.0, 12.0, 10.0, 10.0, 8.0, 6.0, 5.0, 3.0, 7.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.185546875, -2.123687744140625, -2.06182861328125, -1.999969482421875, -1.9381103515625, -1.876251220703125, -1.81439208984375, -1.752532958984375, -1.690673828125, -1.628814697265625, -1.56695556640625, -1.505096435546875, -1.4432373046875, -1.381378173828125, -1.31951904296875, -1.257659912109375, -1.19580078125, -1.133941650390625, -1.07208251953125, -1.010223388671875, -0.9483642578125, -0.886505126953125, -0.82464599609375, -0.762786865234375, -0.700927734375, -0.639068603515625, -0.57720947265625, -0.515350341796875, -0.4534912109375, -0.391632080078125, -0.32977294921875, -0.267913818359375, -0.2060546875, -0.144195556640625, -0.08233642578125, -0.020477294921875, 0.0413818359375, 0.103240966796875, 0.16510009765625, 0.226959228515625, 0.288818359375, 0.350677490234375, 0.41253662109375, 0.474395751953125, 0.5362548828125, 0.598114013671875, 0.65997314453125, 0.721832275390625, 0.78369140625, 0.845550537109375, 0.90740966796875, 0.969268798828125, 1.0311279296875, 1.092987060546875, 1.15484619140625, 1.216705322265625, 1.278564453125, 1.340423583984375, 1.40228271484375, 1.464141845703125, 1.5260009765625, 1.587860107421875, 1.64971923828125, 1.711578369140625, 1.7734375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 8.0, 4.0, 5.0, 13.0, 16.0, 20.0, 25.0, 57.0, 76.0, 104.0, 197.0, 303.0, 494.0, 809.0, 1291.0, 2260.0, 3831.0, 6446.0, 11170.0, 19550.0, 35809.0, 68235.0, 146490.0, 357552.0, 205752.0, 86932.0, 44285.0, 23964.0, 13536.0, 7808.0, 4631.0, 2632.0, 1650.0, 982.0, 592.0, 352.0, 238.0, 135.0, 95.0, 74.0, 47.0, 29.0, 25.0, 14.0, 9.0, 2.0, 7.0, 3.0, 7.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.379638671875, -0.3659210205078125, -0.352203369140625, -0.3384857177734375, -0.32476806640625, -0.3110504150390625, -0.297332763671875, -0.2836151123046875, -0.2698974609375, -0.2561798095703125, -0.242462158203125, -0.2287445068359375, -0.21502685546875, -0.2013092041015625, -0.187591552734375, -0.1738739013671875, -0.16015625, -0.1464385986328125, -0.132720947265625, -0.1190032958984375, -0.10528564453125, -0.0915679931640625, -0.077850341796875, -0.0641326904296875, -0.0504150390625, -0.0366973876953125, -0.022979736328125, -0.0092620849609375, 0.00445556640625, 0.0181732177734375, 0.031890869140625, 0.0456085205078125, 0.059326171875, 0.0730438232421875, 0.086761474609375, 0.1004791259765625, 0.11419677734375, 0.1279144287109375, 0.141632080078125, 0.1553497314453125, 0.1690673828125, 0.1827850341796875, 0.196502685546875, 0.2102203369140625, 0.22393798828125, 0.2376556396484375, 0.251373291015625, 0.2650909423828125, 0.27880859375, 0.2925262451171875, 0.306243896484375, 0.3199615478515625, 0.33367919921875, 0.3473968505859375, 0.361114501953125, 0.3748321533203125, 0.3885498046875, 0.4022674560546875, 0.415985107421875, 0.4297027587890625, 0.44342041015625, 0.4571380615234375, 0.470855712890625, 0.4845733642578125, 0.498291015625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 3.0, 3.0, 11.0, 14.0, 8.0, 13.0, 21.0, 17.0, 22.0, 27.0, 27.0, 32.0, 19.0, 43.0, 43.0, 41.0, 27.0, 38.0, 40.0, 1065.0, 46.0, 40.0, 45.0, 46.0, 23.0, 48.0, 42.0, 32.0, 30.0, 28.0, 29.0, 18.0, 15.0, 13.0, 6.0, 11.0, 6.0, 8.0, 6.0, 9.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.37890625, -1.3394775390625, -1.300048828125, -1.2606201171875, -1.22119140625, -1.1817626953125, -1.142333984375, -1.1029052734375, -1.0634765625, -1.0240478515625, -0.984619140625, -0.9451904296875, -0.90576171875, -0.8663330078125, -0.826904296875, -0.7874755859375, -0.748046875, -0.7086181640625, -0.669189453125, -0.6297607421875, -0.59033203125, -0.5509033203125, -0.511474609375, -0.4720458984375, -0.4326171875, -0.3931884765625, -0.353759765625, -0.3143310546875, -0.27490234375, -0.2354736328125, -0.196044921875, -0.1566162109375, -0.1171875, -0.0777587890625, -0.038330078125, 0.0010986328125, 0.04052734375, 0.0799560546875, 0.119384765625, 0.1588134765625, 0.1982421875, 0.2376708984375, 0.277099609375, 0.3165283203125, 0.35595703125, 0.3953857421875, 0.434814453125, 0.4742431640625, 0.513671875, 0.5531005859375, 0.592529296875, 0.6319580078125, 0.67138671875, 0.7108154296875, 0.750244140625, 0.7896728515625, 0.8291015625, 0.8685302734375, 0.907958984375, 0.9473876953125, 0.98681640625, 1.0262451171875, 1.065673828125, 1.1051025390625, 1.14453125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 6.0, 2.0, 11.0, 11.0, 22.0, 37.0, 47.0, 47.0, 92.0, 141.0, 178.0, 276.0, 424.0, 608.0, 858.0, 1186.0, 1766.0, 2576.0, 3894.0, 5707.0, 8644.0, 13402.0, 20189.0, 31498.0, 49860.0, 83676.0, 158735.0, 1333063.0, 156420.0, 82359.0, 50357.0, 31328.0, 19893.0, 12890.0, 8660.0, 5788.0, 3969.0, 2713.0, 1864.0, 1203.0, 892.0, 557.0, 389.0, 281.0, 201.0, 119.0, 100.0, 72.0, 31.0, 33.0, 18.0, 18.0, 16.0, 7.0, 5.0, 6.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.287353515625, -0.278228759765625, -0.26910400390625, -0.259979248046875, -0.2508544921875, -0.241729736328125, -0.23260498046875, -0.223480224609375, -0.21435546875, -0.205230712890625, -0.19610595703125, -0.186981201171875, -0.1778564453125, -0.168731689453125, -0.15960693359375, -0.150482177734375, -0.141357421875, -0.132232666015625, -0.12310791015625, -0.113983154296875, -0.1048583984375, -0.095733642578125, -0.08660888671875, -0.077484130859375, -0.068359375, -0.059234619140625, -0.05010986328125, -0.040985107421875, -0.0318603515625, -0.022735595703125, -0.01361083984375, -0.004486083984375, 0.004638671875, 0.013763427734375, 0.02288818359375, 0.032012939453125, 0.0411376953125, 0.050262451171875, 0.05938720703125, 0.068511962890625, 0.07763671875, 0.086761474609375, 0.09588623046875, 0.105010986328125, 0.1141357421875, 0.123260498046875, 0.13238525390625, 0.141510009765625, 0.150634765625, 0.159759521484375, 0.16888427734375, 0.178009033203125, 0.1871337890625, 0.196258544921875, 0.20538330078125, 0.214508056640625, 0.2236328125, 0.232757568359375, 0.24188232421875, 0.251007080078125, 0.2601318359375, 0.269256591796875, 0.27838134765625, 0.287506103515625, 0.296630859375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 7.0, 3.0, 8.0, 8.0, 6.0, 8.0, 15.0, 22.0, 23.0, 27.0, 42.0, 37.0, 39.0, 43.0, 77.0, 70.0, 69.0, 62.0, 61.0, 59.0, 56.0, 47.0, 36.0, 34.0, 32.0, 24.0, 19.0, 16.0, 9.0, 7.0, 12.0, 6.0, 2.0, 3.0, 3.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.128715515136719e-05, -6.90976157784462e-05, -6.690807640552521e-05, -6.471853703260422e-05, -6.252899765968323e-05, -6.033945828676224e-05, -5.814991891384125e-05, -5.596037954092026e-05, -5.377084016799927e-05, -5.158130079507828e-05, -4.939176142215729e-05, -4.72022220492363e-05, -4.501268267631531e-05, -4.282314330339432e-05, -4.063360393047333e-05, -3.844406455755234e-05, -3.625452518463135e-05, -3.406498581171036e-05, -3.187544643878937e-05, -2.9685907065868378e-05, -2.7496367692947388e-05, -2.5306828320026398e-05, -2.3117288947105408e-05, -2.0927749574184418e-05, -1.8738210201263428e-05, -1.6548670828342438e-05, -1.4359131455421448e-05, -1.2169592082500458e-05, -9.980052709579468e-06, -7.790513336658478e-06, -5.600973963737488e-06, -3.411434590816498e-06, -1.2218952178955078e-06, 9.676441550254822e-07, 3.157183527946472e-06, 5.346722900867462e-06, 7.536262273788452e-06, 9.725801646709442e-06, 1.1915341019630432e-05, 1.4104880392551422e-05, 1.6294419765472412e-05, 1.8483959138393402e-05, 2.0673498511314392e-05, 2.2863037884235382e-05, 2.5052577257156372e-05, 2.7242116630077362e-05, 2.9431656002998352e-05, 3.162119537591934e-05, 3.381073474884033e-05, 3.600027412176132e-05, 3.818981349468231e-05, 4.03793528676033e-05, 4.256889224052429e-05, 4.475843161344528e-05, 4.694797098636627e-05, 4.913751035928726e-05, 5.132704973220825e-05, 5.351658910512924e-05, 5.570612847805023e-05, 5.789566785097122e-05, 6.008520722389221e-05, 6.22747465968132e-05, 6.446428596973419e-05, 6.665382534265518e-05, 6.884336471557617e-05]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 6.0, 9.0, 9.0, 9.0, 13.0, 23.0, 30.0, 32.0, 36.0, 59.0, 66.0, 100.0, 149.0, 168.0, 299.0, 497.0, 1532.0, 669083.0, 373763.0, 1201.0, 456.0, 248.0, 194.0, 156.0, 104.0, 83.0, 63.0, 44.0, 26.0, 18.0, 18.0, 12.0, 14.0, 6.0, 6.0, 2.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0014019012451171875, -0.0013606101274490356, -0.0013193190097808838, -0.001278027892112732, -0.00123673677444458, -0.0011954456567764282, -0.0011541545391082764, -0.0011128634214401245, -0.0010715723037719727, -0.0010302811861038208, -0.000988990068435669, -0.0009476989507675171, -0.0009064078330993652, -0.0008651167154312134, -0.0008238255977630615, -0.0007825344800949097, -0.0007412433624267578, -0.000699952244758606, -0.0006586611270904541, -0.0006173700094223022, -0.0005760788917541504, -0.0005347877740859985, -0.0004934966564178467, -0.0004522055387496948, -0.00041091442108154297, -0.0003696233034133911, -0.00032833218574523926, -0.0002870410680770874, -0.00024574995040893555, -0.0002044588327407837, -0.00016316771507263184, -0.00012187659740447998, -8.058547973632812e-05, -3.929436206817627e-05, 1.996755599975586e-06, 4.328787326812744e-05, 8.45789909362793e-05, 0.00012587010860443115, 0.000167161226272583, 0.00020845234394073486, 0.0002497434616088867, 0.0002910345792770386, 0.00033232569694519043, 0.0003736168146133423, 0.00041490793228149414, 0.000456199049949646, 0.0004974901676177979, 0.0005387812852859497, 0.0005800724029541016, 0.0006213635206222534, 0.0006626546382904053, 0.0007039457559585571, 0.000745236873626709, 0.0007865279912948608, 0.0008278191089630127, 0.0008691102266311646, 0.0009104013442993164, 0.0009516924619674683, 0.0009929835796356201, 0.001034274697303772, 0.0010755658149719238, 0.0011168569326400757, 0.0011581480503082275, 0.0011994391679763794, 0.0012407302856445312]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 15.0, 33.0, 100.0, 184.0, 265.0, 209.0, 117.0, 56.0, 13.0, 10.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44899157830514e-05, -5.185039117350243e-05, -4.921086292597465e-05, -4.657133831642568e-05, -4.39318100688979e-05, -4.129228545934893e-05, -3.865276084979996e-05, -3.601323260227218e-05, -3.337370799272321e-05, -3.073418338317424e-05, -2.8094655135646462e-05, -2.545513052609749e-05, -2.2815604097559117e-05, -2.0176077669020742e-05, -1.753655305947177e-05, -1.4897026630933397e-05, -1.2257500202395022e-05, -9.617973773856647e-06, -6.9784482548129745e-06, -4.338922735769302e-06, -1.699396307230927e-06, 9.401301213074476e-07, 3.5796547308564186e-06, 6.219181159394793e-06, 8.858707587933168e-06, 1.1498234016471542e-05, 1.4137759535515215e-05, 1.6777285054558888e-05, 1.9416811483097263e-05, 2.2056337911635637e-05, 2.469586252118461e-05, 2.7335388949722983e-05, 2.9974922654218972e-05, 3.261444726376794e-05, 3.525397551129572e-05, 3.789350012084469e-05, 4.053302836837247e-05, 4.317255297792144e-05, 4.581207758747041e-05, 4.845160583499819e-05, 5.109113044454716e-05, 5.373065505409613e-05, 5.637018330162391e-05, 5.900970791117288e-05, 6.164923252072185e-05, 6.428876076824963e-05, 6.692828901577741e-05, 6.956780998734757e-05, 7.220733823487535e-05, 7.484686648240313e-05, 7.74863874539733e-05, 8.012591570150107e-05, 8.276544394902885e-05, 8.540497219655663e-05, 8.804449316812679e-05, 9.068402141565457e-05, 9.332354238722473e-05, 9.596307063475251e-05, 9.860259160632268e-05, 0.00010124211985385045, 0.00010388164810137823, 0.0001065211690729484, 0.00010916069732047617, 0.00011180022556800395, 0.00011443975381553173]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 5.0, 4.0, 11.0, 9.0, 9.0, 23.0, 17.0, 22.0, 21.0, 31.0, 30.0, 44.0, 36.0, 34.0, 48.0, 60.0, 43.0, 49.0, 54.0, 36.0, 52.0, 41.0, 35.0, 41.0, 29.0, 29.0, 28.0, 27.0, 22.0, 19.0, 22.0, 18.0, 15.0, 10.0, 8.0, 2.0, 5.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.13060188293457e-05, -4.010181874036789e-05, -3.8897618651390076e-05, -3.769341856241226e-05, -3.648921847343445e-05, -3.5285018384456635e-05, -3.408081829547882e-05, -3.287661820650101e-05, -3.167241811752319e-05, -3.046821802854538e-05, -2.9264017939567566e-05, -2.8059817850589752e-05, -2.685561776161194e-05, -2.5651417672634125e-05, -2.444721758365631e-05, -2.3243017494678497e-05, -2.2038817405700684e-05, -2.083461731672287e-05, -1.9630417227745056e-05, -1.8426217138767242e-05, -1.722201704978943e-05, -1.6017816960811615e-05, -1.4813616871833801e-05, -1.3609416782855988e-05, -1.2405216693878174e-05, -1.120101660490036e-05, -9.996816515922546e-06, -8.792616426944733e-06, -7.588416337966919e-06, -6.384216248989105e-06, -5.1800161600112915e-06, -3.975816071033478e-06, -2.771615982055664e-06, -1.5674158930778503e-06, -3.632158041000366e-07, 8.409842848777771e-07, 2.045184373855591e-06, 3.2493844628334045e-06, 4.453584551811218e-06, 5.657784640789032e-06, 6.861984729766846e-06, 8.06618481874466e-06, 9.270384907722473e-06, 1.0474584996700287e-05, 1.16787850856781e-05, 1.2882985174655914e-05, 1.4087185263633728e-05, 1.5291385352611542e-05, 1.6495585441589355e-05, 1.769978553056717e-05, 1.8903985619544983e-05, 2.0108185708522797e-05, 2.131238579750061e-05, 2.2516585886478424e-05, 2.3720785975456238e-05, 2.492498606443405e-05, 2.6129186153411865e-05, 2.733338624238968e-05, 2.8537586331367493e-05, 2.9741786420345306e-05, 3.094598650932312e-05, 3.2150186598300934e-05, 3.335438668727875e-05, 3.455858677625656e-05, 3.5762786865234375e-05]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 1.0, 9.0, 13.0, 7.0, 20.0, 17.0, 7.0, 14.0, 15.0, 16.0, 25.0, 23.0, 33.0, 23.0, 30.0, 30.0, 35.0, 36.0, 50.0, 45.0, 47.0, 53.0, 53.0, 40.0, 43.0, 28.0, 39.0, 37.0, 33.0, 29.0, 31.0, 26.0, 18.0, 12.0, 10.0, 10.0, 8.0, 6.0, 5.0, 3.0, 7.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.185546875, -2.123687744140625, -2.06182861328125, -1.999969482421875, -1.9381103515625, -1.876251220703125, -1.81439208984375, -1.752532958984375, -1.690673828125, -1.628814697265625, -1.56695556640625, -1.505096435546875, -1.4432373046875, -1.381378173828125, -1.31951904296875, -1.257659912109375, -1.19580078125, -1.133941650390625, -1.07208251953125, -1.010223388671875, -0.9483642578125, -0.886505126953125, -0.82464599609375, -0.762786865234375, -0.700927734375, -0.639068603515625, -0.57720947265625, -0.515350341796875, -0.4534912109375, -0.391632080078125, -0.32977294921875, -0.267913818359375, -0.2060546875, -0.144195556640625, -0.08233642578125, -0.020477294921875, 0.0413818359375, 0.103240966796875, 0.16510009765625, 0.226959228515625, 0.288818359375, 0.350677490234375, 0.41253662109375, 0.474395751953125, 0.5362548828125, 0.598114013671875, 0.65997314453125, 0.721832275390625, 0.78369140625, 0.845550537109375, 0.90740966796875, 0.969268798828125, 1.0311279296875, 1.092987060546875, 1.15484619140625, 1.216705322265625, 1.278564453125, 1.340423583984375, 1.40228271484375, 1.464141845703125, 1.5260009765625, 1.587860107421875, 1.64971923828125, 1.711578369140625, 1.7734375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 12.0, 10.0, 14.0, 18.0, 41.0, 54.0, 56.0, 96.0, 136.0, 196.0, 274.0, 474.0, 716.0, 1276.0, 2094.0, 3836.0, 7437.0, 15460.0, 34927.0, 98178.0, 328634.0, 368591.0, 112101.0, 39093.0, 16698.0, 8121.0, 4238.0, 2287.0, 1267.0, 817.0, 446.0, 304.0, 196.0, 138.0, 102.0, 73.0, 58.0, 32.0, 17.0, 8.0, 9.0, 8.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9072265625, -1.8392486572265625, -1.771270751953125, -1.7032928466796875, -1.63531494140625, -1.5673370361328125, -1.499359130859375, -1.4313812255859375, -1.3634033203125, -1.2954254150390625, -1.227447509765625, -1.1594696044921875, -1.09149169921875, -1.0235137939453125, -0.955535888671875, -0.8875579833984375, -0.819580078125, -0.7516021728515625, -0.683624267578125, -0.6156463623046875, -0.54766845703125, -0.4796905517578125, -0.411712646484375, -0.3437347412109375, -0.2757568359375, -0.2077789306640625, -0.139801025390625, -0.0718231201171875, -0.00384521484375, 0.0641326904296875, 0.132110595703125, 0.2000885009765625, 0.26806640625, 0.3360443115234375, 0.404022216796875, 0.4720001220703125, 0.53997802734375, 0.6079559326171875, 0.675933837890625, 0.7439117431640625, 0.8118896484375, 0.8798675537109375, 0.947845458984375, 1.0158233642578125, 1.08380126953125, 1.1517791748046875, 1.219757080078125, 1.2877349853515625, 1.355712890625, 1.4236907958984375, 1.491668701171875, 1.5596466064453125, 1.62762451171875, 1.6956024169921875, 1.763580322265625, 1.8315582275390625, 1.8995361328125, 1.9675140380859375, 2.035491943359375, 2.1034698486328125, 2.17144775390625, 2.2394256591796875, 2.307403564453125, 2.3753814697265625, 2.443359375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 7.0, 14.0, 13.0, 13.0, 14.0, 16.0, 21.0, 25.0, 26.0, 32.0, 34.0, 40.0, 53.0, 51.0, 48.0, 76.0, 129.0, 1543.0, 382.0, 99.0, 63.0, 44.0, 36.0, 37.0, 33.0, 34.0, 22.0, 25.0, 18.0, 18.0, 18.0, 19.0, 11.0, 4.0, 10.0, 2.0, 5.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.515625, -7.27984619140625, -7.0440673828125, -6.80828857421875, -6.572509765625, -6.33673095703125, -6.1009521484375, -5.86517333984375, -5.62939453125, -5.39361572265625, -5.1578369140625, -4.92205810546875, -4.686279296875, -4.45050048828125, -4.2147216796875, -3.97894287109375, -3.7431640625, -3.50738525390625, -3.2716064453125, -3.03582763671875, -2.800048828125, -2.56427001953125, -2.3284912109375, -2.09271240234375, -1.85693359375, -1.62115478515625, -1.3853759765625, -1.14959716796875, -0.913818359375, -0.67803955078125, -0.4422607421875, -0.20648193359375, 0.029296875, 0.26507568359375, 0.5008544921875, 0.73663330078125, 0.972412109375, 1.20819091796875, 1.4439697265625, 1.67974853515625, 1.91552734375, 2.15130615234375, 2.3870849609375, 2.62286376953125, 2.858642578125, 3.09442138671875, 3.3302001953125, 3.56597900390625, 3.8017578125, 4.03753662109375, 4.2733154296875, 4.50909423828125, 4.744873046875, 4.98065185546875, 5.2164306640625, 5.45220947265625, 5.68798828125, 5.92376708984375, 6.1595458984375, 6.39532470703125, 6.631103515625, 6.86688232421875, 7.1026611328125, 7.33843994140625, 7.57421875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 8.0, 7.0, 14.0, 12.0, 17.0, 21.0, 24.0, 22.0, 39.0, 43.0, 48.0, 66.0, 116.0, 181.0, 342.0, 843.0, 5185.0, 157199.0, 2945351.0, 32345.0, 2371.0, 563.0, 283.0, 147.0, 120.0, 62.0, 53.0, 35.0, 34.0, 37.0, 29.0, 20.0, 11.0, 17.0, 12.0, 2.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.4609375, -12.06298828125, -11.6650390625, -11.26708984375, -10.869140625, -10.47119140625, -10.0732421875, -9.67529296875, -9.27734375, -8.87939453125, -8.4814453125, -8.08349609375, -7.685546875, -7.28759765625, -6.8896484375, -6.49169921875, -6.09375, -5.69580078125, -5.2978515625, -4.89990234375, -4.501953125, -4.10400390625, -3.7060546875, -3.30810546875, -2.91015625, -2.51220703125, -2.1142578125, -1.71630859375, -1.318359375, -0.92041015625, -0.5224609375, -0.12451171875, 0.2734375, 0.67138671875, 1.0693359375, 1.46728515625, 1.865234375, 2.26318359375, 2.6611328125, 3.05908203125, 3.45703125, 3.85498046875, 4.2529296875, 4.65087890625, 5.048828125, 5.44677734375, 5.8447265625, 6.24267578125, 6.640625, 7.03857421875, 7.4365234375, 7.83447265625, 8.232421875, 8.63037109375, 9.0283203125, 9.42626953125, 9.82421875, 10.22216796875, 10.6201171875, 11.01806640625, 11.416015625, 11.81396484375, 12.2119140625, 12.60986328125, 13.0078125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 9.0, 19.0, 62.0, 130.0, 184.0, 228.0, 187.0, 93.0, 62.0, 19.0, 9.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.176681518554688, -19.700082778930664, -19.22348403930664, -18.746885299682617, -18.270286560058594, -17.793685913085938, -17.317087173461914, -16.84048843383789, -16.363889694213867, -15.887290954589844, -15.41069221496582, -14.93409252166748, -14.457493782043457, -13.980895042419434, -13.504295349121094, -13.02769660949707, -12.551097869873047, -12.074499130249023, -11.597900390625, -11.12130069732666, -10.644701957702637, -10.168103218078613, -9.691503524780273, -9.21490478515625, -8.738306045532227, -8.261707305908203, -7.7851080894470215, -7.30850887298584, -6.831910133361816, -6.355311393737793, -5.878712177276611, -5.40211296081543, -4.925515174865723, -4.448916435241699, -3.9723172187805176, -3.495718240737915, -3.0191192626953125, -2.54252028465271, -2.0659213066101074, -1.5893223285675049, -1.1127233505249023, -0.6361243724822998, -0.15952539443969727, 0.3170735836029053, 0.7936725616455078, 1.2702715396881104, 1.746870517730713, 2.2234694957733154, 2.700068473815918, 3.1766674518585205, 3.653266429901123, 4.129865646362305, 4.606464385986328, 5.083063125610352, 5.559662342071533, 6.036261558532715, 6.512860298156738, 6.989459037780762, 7.466058254241943, 7.942657470703125, 8.419256210327148, 8.895854949951172, 9.372453689575195, 9.849053382873535, 10.325652122497559]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 4.0, 6.0, 7.0, 7.0, 9.0, 8.0, 14.0, 15.0, 15.0, 22.0, 17.0, 33.0, 31.0, 20.0, 26.0, 33.0, 36.0, 39.0, 40.0, 34.0, 44.0, 43.0, 46.0, 53.0, 51.0, 42.0, 46.0, 32.0, 29.0, 27.0, 24.0, 32.0, 29.0, 14.0, 20.0, 10.0, 12.0, 7.0, 8.0, 3.0, 3.0, 7.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.622669219970703, -21.874195098876953, -21.125720977783203, -20.377248764038086, -19.628774642944336, -18.880300521850586, -18.13182830810547, -17.38335418701172, -16.63488006591797, -15.886405944824219, -15.137932777404785, -14.389459609985352, -13.640985488891602, -12.892511367797852, -12.144038200378418, -11.395565032958984, -10.647090911865234, -9.898616790771484, -9.15014362335205, -8.401670455932617, -7.653196334838867, -6.904722690582275, -6.156249046325684, -5.407775402069092, -4.6593017578125, -3.910828113555908, -3.1623544692993164, -2.4138808250427246, -1.6654071807861328, -0.916933536529541, -0.16845989227294922, 0.5800137519836426, 1.3284893035888672, 2.076962947845459, 2.825436592102051, 3.5739102363586426, 4.322383880615234, 5.070857524871826, 5.819331169128418, 6.56780481338501, 7.316278457641602, 8.064752578735352, 8.813225746154785, 9.561698913574219, 10.310173034667969, 11.058647155761719, 11.807120323181152, 12.555593490600586, 13.304067611694336, 14.052541732788086, 14.80101490020752, 15.549488067626953, 16.297962188720703, 17.046436309814453, 17.794910430908203, 18.54338264465332, 19.29185676574707, 20.04033088684082, 20.788803100585938, 21.537277221679688, 22.285751342773438, 23.034225463867188, 23.782699584960938, 24.531171798706055, 25.279645919799805]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 5.0, 12.0, 11.0, 9.0, 13.0, 17.0, 12.0, 14.0, 15.0, 13.0, 29.0, 24.0, 35.0, 33.0, 27.0, 40.0, 39.0, 37.0, 53.0, 39.0, 49.0, 36.0, 49.0, 45.0, 40.0, 51.0, 43.0, 27.0, 32.0, 32.0, 26.0, 18.0, 15.0, 9.0, 11.0, 5.0, 5.0, 9.0, 6.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.435546875, -2.3675994873046875, -2.299652099609375, -2.2317047119140625, -2.16375732421875, -2.0958099365234375, -2.027862548828125, -1.9599151611328125, -1.8919677734375, -1.8240203857421875, -1.756072998046875, -1.6881256103515625, -1.62017822265625, -1.5522308349609375, -1.484283447265625, -1.4163360595703125, -1.348388671875, -1.2804412841796875, -1.212493896484375, -1.1445465087890625, -1.07659912109375, -1.0086517333984375, -0.940704345703125, -0.8727569580078125, -0.8048095703125, -0.7368621826171875, -0.668914794921875, -0.6009674072265625, -0.53302001953125, -0.4650726318359375, -0.397125244140625, -0.3291778564453125, -0.26123046875, -0.1932830810546875, -0.125335693359375, -0.0573883056640625, 0.01055908203125, 0.0785064697265625, 0.146453857421875, 0.2144012451171875, 0.2823486328125, 0.3502960205078125, 0.418243408203125, 0.4861907958984375, 0.55413818359375, 0.6220855712890625, 0.690032958984375, 0.7579803466796875, 0.825927734375, 0.8938751220703125, 0.961822509765625, 1.0297698974609375, 1.09771728515625, 1.1656646728515625, 1.233612060546875, 1.3015594482421875, 1.3695068359375, 1.4374542236328125, 1.505401611328125, 1.5733489990234375, 1.64129638671875, 1.7092437744140625, 1.777191162109375, 1.8451385498046875, 1.9130859375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 5.0, 4.0, 6.0, 2.0, 11.0, 7.0, 5.0, 10.0, 10.0, 10.0, 20.0, 14.0, 19.0, 25.0, 21.0, 26.0, 33.0, 50.0, 65.0, 104.0, 330.0, 1407.0, 11399.0, 273402.0, 3590325.0, 302869.0, 11961.0, 1402.0, 272.0, 125.0, 68.0, 48.0, 26.0, 29.0, 29.0, 23.0, 24.0, 20.0, 12.0, 18.0, 10.0, 4.0, 11.0, 5.0, 4.0, 2.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.5859375, -10.27001953125, -9.9541015625, -9.63818359375, -9.322265625, -9.00634765625, -8.6904296875, -8.37451171875, -8.05859375, -7.74267578125, -7.4267578125, -7.11083984375, -6.794921875, -6.47900390625, -6.1630859375, -5.84716796875, -5.53125, -5.21533203125, -4.8994140625, -4.58349609375, -4.267578125, -3.95166015625, -3.6357421875, -3.31982421875, -3.00390625, -2.68798828125, -2.3720703125, -2.05615234375, -1.740234375, -1.42431640625, -1.1083984375, -0.79248046875, -0.4765625, -0.16064453125, 0.1552734375, 0.47119140625, 0.787109375, 1.10302734375, 1.4189453125, 1.73486328125, 2.05078125, 2.36669921875, 2.6826171875, 2.99853515625, 3.314453125, 3.63037109375, 3.9462890625, 4.26220703125, 4.578125, 4.89404296875, 5.2099609375, 5.52587890625, 5.841796875, 6.15771484375, 6.4736328125, 6.78955078125, 7.10546875, 7.42138671875, 7.7373046875, 8.05322265625, 8.369140625, 8.68505859375, 9.0009765625, 9.31689453125, 9.6328125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 2.0, 11.0, 20.0, 43.0, 59.0, 100.0, 185.0, 286.0, 506.0, 699.0, 767.0, 560.0, 353.0, 184.0, 137.0, 67.0, 48.0, 19.0, 17.0, 8.0, 6.0, 4.0], "bins": [-16.46875, -16.152923583984375, -15.83709716796875, -15.521270751953125, -15.2054443359375, -14.889617919921875, -14.57379150390625, -14.257965087890625, -13.942138671875, -13.626312255859375, -13.31048583984375, -12.994659423828125, -12.6788330078125, -12.363006591796875, -12.04718017578125, -11.731353759765625, -11.41552734375, -11.099700927734375, -10.78387451171875, -10.468048095703125, -10.1522216796875, -9.836395263671875, -9.52056884765625, -9.204742431640625, -8.888916015625, -8.573089599609375, -8.25726318359375, -7.941436767578125, -7.6256103515625, -7.309783935546875, -6.99395751953125, -6.678131103515625, -6.3623046875, -6.046478271484375, -5.73065185546875, -5.414825439453125, -5.0989990234375, -4.783172607421875, -4.46734619140625, -4.151519775390625, -3.835693359375, -3.519866943359375, -3.20404052734375, -2.888214111328125, -2.5723876953125, -2.256561279296875, -1.94073486328125, -1.624908447265625, -1.30908203125, -0.993255615234375, -0.67742919921875, -0.361602783203125, -0.0457763671875, 0.270050048828125, 0.58587646484375, 0.901702880859375, 1.217529296875, 1.533355712890625, 1.84918212890625, 2.165008544921875, 2.4808349609375, 2.796661376953125, 3.11248779296875, 3.428314208984375, 3.744140625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 18.0, 31.0, 46.0, 96.0, 148.0, 220.0, 400.0, 984.0, 10297.0, 2416651.0, 1755167.0, 8335.0, 930.0, 382.0, 227.0, 135.0, 86.0, 36.0, 34.0, 13.0, 15.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6171875, -13.8038330078125, -12.990478515625, -12.1771240234375, -11.36376953125, -10.5504150390625, -9.737060546875, -8.9237060546875, -8.1103515625, -7.2969970703125, -6.483642578125, -5.6702880859375, -4.85693359375, -4.0435791015625, -3.230224609375, -2.4168701171875, -1.603515625, -0.7901611328125, 0.023193359375, 0.8365478515625, 1.64990234375, 2.4632568359375, 3.276611328125, 4.0899658203125, 4.9033203125, 5.7166748046875, 6.530029296875, 7.3433837890625, 8.15673828125, 8.9700927734375, 9.783447265625, 10.5968017578125, 11.41015625, 12.2235107421875, 13.036865234375, 13.8502197265625, 14.66357421875, 15.4769287109375, 16.290283203125, 17.1036376953125, 17.9169921875, 18.7303466796875, 19.543701171875, 20.3570556640625, 21.17041015625, 21.9837646484375, 22.797119140625, 23.6104736328125, 24.423828125, 25.2371826171875, 26.050537109375, 26.8638916015625, 27.67724609375, 28.4906005859375, 29.303955078125, 30.1173095703125, 30.9306640625, 31.7440185546875, 32.557373046875, 33.3707275390625, 34.18408203125, 34.9974365234375, 35.810791015625, 36.6241455078125, 37.4375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 11.0, 44.0, 100.0, 231.0, 245.0, 220.0, 109.0, 38.0, 11.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.50689697265625, -67.70074462890625, -65.89459228515625, -64.08843994140625, -62.28228759765625, -60.47613525390625, -58.66998291015625, -56.863834381103516, -55.057682037353516, -53.251529693603516, -51.445377349853516, -49.639225006103516, -47.833072662353516, -46.02692413330078, -44.22077178955078, -42.41461944580078, -40.60846710205078, -38.80231475830078, -36.99616241455078, -35.19001007080078, -33.38385772705078, -31.577707290649414, -29.771554946899414, -27.965404510498047, -26.15924835205078, -24.35309600830078, -22.54694366455078, -20.74079132080078, -18.934640884399414, -17.128488540649414, -15.322336196899414, -13.51618480682373, -11.710033416748047, -9.903881072998047, -8.097729682922363, -6.291577339172363, -4.4854254722595215, -2.6792736053466797, -0.8731212615966797, 0.9330301284790039, 2.739182472229004, 4.545334339141846, 6.3514862060546875, 8.157638549804688, 9.963790893554688, 11.769942283630371, 13.576094627380371, 15.382246017456055, 17.188398361206055, 18.994550704956055, 20.800703048706055, 22.606853485107422, 24.413005828857422, 26.219158172607422, 28.025310516357422, 29.831462860107422, 31.637615203857422, 33.44376754760742, 35.24991989135742, 37.05607223510742, 38.86222457885742, 40.668373107910156, 42.474525451660156, 44.280677795410156, 46.086830139160156]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 14.0, 6.0, 8.0, 9.0, 14.0, 11.0, 11.0, 18.0, 21.0, 23.0, 31.0, 21.0, 31.0, 26.0, 27.0, 36.0, 34.0, 30.0, 43.0, 44.0, 37.0, 38.0, 52.0, 35.0, 28.0, 22.0, 30.0, 29.0, 38.0, 28.0, 26.0, 18.0, 27.0, 16.0, 17.0, 13.0, 12.0, 12.0, 10.0, 7.0, 4.0, 7.0, 11.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-17.114425659179688, -16.55829620361328, -16.002166748046875, -15.446037292480469, -14.889907836914062, -14.333778381347656, -13.77764892578125, -13.221519470214844, -12.665390014648438, -12.109260559082031, -11.553131103515625, -10.997001647949219, -10.440872192382812, -9.884742736816406, -9.32861328125, -8.772483825683594, -8.216355323791504, -7.660225868225098, -7.104096412658691, -6.547966957092285, -5.991837501525879, -5.435708045959473, -4.879579067230225, -4.323449611663818, -3.767320156097412, -3.211190700531006, -2.6550612449645996, -2.0989320278167725, -1.5428025722503662, -0.98667311668396, -0.4305438995361328, 0.12558555603027344, 0.6817150115966797, 1.237844467163086, 1.7939738035202026, 2.3501031398773193, 2.9062325954437256, 3.462362051010132, 4.018491268157959, 4.574620723724365, 5.1307501792907715, 5.686879634857178, 6.243009090423584, 6.799138069152832, 7.355267524719238, 7.9113969802856445, 8.46752643585205, 9.023655891418457, 9.579785346984863, 10.13591480255127, 10.692044258117676, 11.248173713684082, 11.804303169250488, 12.360432624816895, 12.916561126708984, 13.47269058227539, 14.028820037841797, 14.584949493408203, 15.14107894897461, 15.697208404541016, 16.253337860107422, 16.809467315673828, 17.365596771240234, 17.92172622680664, 18.477855682373047]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 6.0, 5.0, 8.0, 3.0, 12.0, 16.0, 17.0, 10.0, 16.0, 14.0, 18.0, 19.0, 17.0, 29.0, 23.0, 38.0, 50.0, 39.0, 50.0, 43.0, 44.0, 49.0, 35.0, 41.0, 55.0, 39.0, 36.0, 33.0, 46.0, 38.0, 27.0, 29.0, 18.0, 21.0, 7.0, 14.0, 10.0, 4.0, 5.0, 7.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-2.662109375, -2.590667724609375, -2.51922607421875, -2.447784423828125, -2.3763427734375, -2.304901123046875, -2.23345947265625, -2.162017822265625, -2.090576171875, -2.019134521484375, -1.94769287109375, -1.876251220703125, -1.8048095703125, -1.733367919921875, -1.66192626953125, -1.590484619140625, -1.51904296875, -1.447601318359375, -1.37615966796875, -1.304718017578125, -1.2332763671875, -1.161834716796875, -1.09039306640625, -1.018951416015625, -0.947509765625, -0.876068115234375, -0.80462646484375, -0.733184814453125, -0.6617431640625, -0.590301513671875, -0.51885986328125, -0.447418212890625, -0.3759765625, -0.304534912109375, -0.23309326171875, -0.161651611328125, -0.0902099609375, -0.018768310546875, 0.05267333984375, 0.124114990234375, 0.195556640625, 0.266998291015625, 0.33843994140625, 0.409881591796875, 0.4813232421875, 0.552764892578125, 0.62420654296875, 0.695648193359375, 0.76708984375, 0.838531494140625, 0.90997314453125, 0.981414794921875, 1.0528564453125, 1.124298095703125, 1.19573974609375, 1.267181396484375, 1.338623046875, 1.410064697265625, 1.48150634765625, 1.552947998046875, 1.6243896484375, 1.695831298828125, 1.76727294921875, 1.838714599609375, 1.91015625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 8.0, 12.0, 20.0, 33.0, 41.0, 56.0, 114.0, 171.0, 288.0, 485.0, 770.0, 1301.0, 2218.0, 3646.0, 6347.0, 10521.0, 17924.0, 31885.0, 60797.0, 127073.0, 320745.0, 245575.0, 102906.0, 50152.0, 27372.0, 15777.0, 9015.0, 5336.0, 3225.0, 1850.0, 1138.0, 693.0, 437.0, 244.0, 139.0, 88.0, 43.0, 46.0, 21.0, 16.0, 10.0, 11.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50634765625, -0.4909400939941406, -0.47553253173828125, -0.4601249694824219, -0.4447174072265625, -0.4293098449707031, -0.41390228271484375, -0.3984947204589844, -0.383087158203125, -0.3676795959472656, -0.35227203369140625, -0.3368644714355469, -0.3214569091796875, -0.3060493469238281, -0.29064178466796875, -0.2752342224121094, -0.25982666015625, -0.24441909790039062, -0.22901153564453125, -0.21360397338867188, -0.1981964111328125, -0.18278884887695312, -0.16738128662109375, -0.15197372436523438, -0.136566162109375, -0.12115859985351562, -0.10575103759765625, -0.09034347534179688, -0.0749359130859375, -0.059528350830078125, -0.04412078857421875, -0.028713226318359375, -0.0133056640625, 0.002101898193359375, 0.01750946044921875, 0.032917022705078125, 0.0483245849609375, 0.06373214721679688, 0.07913970947265625, 0.09454727172851562, 0.109954833984375, 0.12536239624023438, 0.14076995849609375, 0.15617752075195312, 0.1715850830078125, 0.18699264526367188, 0.20240020751953125, 0.21780776977539062, 0.23321533203125, 0.24862289428710938, 0.26403045654296875, 0.2794380187988281, 0.2948455810546875, 0.3102531433105469, 0.32566070556640625, 0.3410682678222656, 0.356475830078125, 0.3718833923339844, 0.38729095458984375, 0.4026985168457031, 0.4181060791015625, 0.4335136413574219, 0.44892120361328125, 0.4643287658691406, 0.479736328125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 9.0, 10.0, 10.0, 7.0, 10.0, 13.0, 22.0, 12.0, 14.0, 23.0, 25.0, 26.0, 30.0, 35.0, 37.0, 37.0, 31.0, 43.0, 35.0, 32.0, 37.0, 1064.0, 27.0, 32.0, 44.0, 37.0, 33.0, 29.0, 36.0, 24.0, 28.0, 25.0, 25.0, 23.0, 17.0, 16.0, 16.0, 6.0, 6.0, 9.0, 11.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3583984375, -1.3172760009765625, -1.276153564453125, -1.2350311279296875, -1.19390869140625, -1.1527862548828125, -1.111663818359375, -1.0705413818359375, -1.0294189453125, -0.9882965087890625, -0.947174072265625, -0.9060516357421875, -0.86492919921875, -0.8238067626953125, -0.782684326171875, -0.7415618896484375, -0.700439453125, -0.6593170166015625, -0.618194580078125, -0.5770721435546875, -0.53594970703125, -0.4948272705078125, -0.453704833984375, -0.4125823974609375, -0.3714599609375, -0.3303375244140625, -0.289215087890625, -0.2480926513671875, -0.20697021484375, -0.1658477783203125, -0.124725341796875, -0.0836029052734375, -0.04248046875, -0.0013580322265625, 0.039764404296875, 0.0808868408203125, 0.12200927734375, 0.1631317138671875, 0.204254150390625, 0.2453765869140625, 0.2864990234375, 0.3276214599609375, 0.368743896484375, 0.4098663330078125, 0.45098876953125, 0.4921112060546875, 0.533233642578125, 0.5743560791015625, 0.615478515625, 0.6566009521484375, 0.697723388671875, 0.7388458251953125, 0.77996826171875, 0.8210906982421875, 0.862213134765625, 0.9033355712890625, 0.9444580078125, 0.9855804443359375, 1.026702880859375, 1.0678253173828125, 1.10894775390625, 1.1500701904296875, 1.191192626953125, 1.2323150634765625, 1.2734375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 5.0, 4.0, 5.0, 9.0, 15.0, 22.0, 35.0, 40.0, 63.0, 110.0, 152.0, 190.0, 331.0, 440.0, 642.0, 885.0, 1219.0, 1738.0, 2416.0, 3516.0, 4800.0, 6669.0, 9396.0, 13324.0, 18943.0, 27182.0, 40491.0, 61636.0, 100250.0, 189570.0, 1277059.0, 118268.0, 69913.0, 45503.0, 30412.0, 20984.0, 14722.0, 10340.0, 7371.0, 5184.0, 3813.0, 2759.0, 1913.0, 1351.0, 1088.0, 655.0, 506.0, 395.0, 252.0, 173.0, 116.0, 83.0, 57.0, 39.0, 30.0, 22.0, 14.0, 9.0, 13.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.2744140625, -0.26560211181640625, -0.2567901611328125, -0.24797821044921875, -0.239166259765625, -0.23035430908203125, -0.2215423583984375, -0.21273040771484375, -0.20391845703125, -0.19510650634765625, -0.1862945556640625, -0.17748260498046875, -0.168670654296875, -0.15985870361328125, -0.1510467529296875, -0.14223480224609375, -0.1334228515625, -0.12461090087890625, -0.1157989501953125, -0.10698699951171875, -0.098175048828125, -0.08936309814453125, -0.0805511474609375, -0.07173919677734375, -0.06292724609375, -0.05411529541015625, -0.0453033447265625, -0.03649139404296875, -0.027679443359375, -0.01886749267578125, -0.0100555419921875, -0.00124359130859375, 0.007568359375, 0.01638031005859375, 0.0251922607421875, 0.03400421142578125, 0.042816162109375, 0.05162811279296875, 0.0604400634765625, 0.06925201416015625, 0.07806396484375, 0.08687591552734375, 0.0956878662109375, 0.10449981689453125, 0.113311767578125, 0.12212371826171875, 0.1309356689453125, 0.13974761962890625, 0.1485595703125, 0.15737152099609375, 0.1661834716796875, 0.17499542236328125, 0.183807373046875, 0.19261932373046875, 0.2014312744140625, 0.21024322509765625, 0.21905517578125, 0.22786712646484375, 0.2366790771484375, 0.24549102783203125, 0.254302978515625, 0.26311492919921875, 0.2719268798828125, 0.28073883056640625, 0.28955078125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 6.0, 10.0, 10.0, 8.0, 16.0, 18.0, 21.0, 39.0, 27.0, 33.0, 42.0, 68.0, 55.0, 53.0, 64.0, 69.0, 54.0, 63.0, 48.0, 50.0, 37.0, 27.0, 43.0, 19.0, 21.0, 16.0, 14.0, 16.0, 12.0, 8.0, 8.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.920099258422852e-05, -6.668083369731903e-05, -6.416067481040955e-05, -6.164051592350006e-05, -5.9120357036590576e-05, -5.660019814968109e-05, -5.4080039262771606e-05, -5.155988037586212e-05, -4.903972148895264e-05, -4.651956260204315e-05, -4.399940371513367e-05, -4.147924482822418e-05, -3.89590859413147e-05, -3.643892705440521e-05, -3.391876816749573e-05, -3.139860928058624e-05, -2.8878450393676758e-05, -2.6358291506767273e-05, -2.3838132619857788e-05, -2.1317973732948303e-05, -1.879781484603882e-05, -1.6277655959129333e-05, -1.3757497072219849e-05, -1.1237338185310364e-05, -8.717179298400879e-06, -6.197020411491394e-06, -3.676861524581909e-06, -1.1567026376724243e-06, 1.3634562492370605e-06, 3.883615136146545e-06, 6.40377402305603e-06, 8.923932909965515e-06, 1.1444091796875e-05, 1.3964250683784485e-05, 1.648440957069397e-05, 1.9004568457603455e-05, 2.152472734451294e-05, 2.4044886231422424e-05, 2.656504511833191e-05, 2.9085204005241394e-05, 3.160536289215088e-05, 3.4125521779060364e-05, 3.664568066596985e-05, 3.9165839552879333e-05, 4.168599843978882e-05, 4.42061573266983e-05, 4.672631621360779e-05, 4.924647510051727e-05, 5.176663398742676e-05, 5.428679287433624e-05, 5.680695176124573e-05, 5.932711064815521e-05, 6.18472695350647e-05, 6.436742842197418e-05, 6.688758730888367e-05, 6.940774619579315e-05, 7.192790508270264e-05, 7.444806396961212e-05, 7.69682228565216e-05, 7.948838174343109e-05, 8.200854063034058e-05, 8.452869951725006e-05, 8.704885840415955e-05, 8.956901729106903e-05, 9.208917617797852e-05]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 8.0, 9.0, 8.0, 10.0, 20.0, 33.0, 35.0, 57.0, 65.0, 75.0, 111.0, 171.0, 286.0, 469.0, 899.0, 135450.0, 907729.0, 1677.0, 511.0, 252.0, 213.0, 92.0, 111.0, 64.0, 47.0, 42.0, 22.0, 17.0, 12.0, 16.0, 11.0, 8.0, 3.0, 3.0, 1.0, 6.0, 1.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0017881393432617188, -0.001735791563987732, -0.0016834437847137451, -0.0016310960054397583, -0.0015787482261657715, -0.0015264004468917847, -0.0014740526676177979, -0.001421704888343811, -0.0013693571090698242, -0.0013170093297958374, -0.0012646615505218506, -0.0012123137712478638, -0.001159965991973877, -0.0011076182126998901, -0.0010552704334259033, -0.0010029226541519165, -0.0009505748748779297, -0.0008982270956039429, -0.0008458793163299561, -0.0007935315370559692, -0.0007411837577819824, -0.0006888359785079956, -0.0006364881992340088, -0.000584140419960022, -0.0005317926406860352, -0.00047944486141204834, -0.0004270970821380615, -0.0003747493028640747, -0.0003224015235900879, -0.0002700537443161011, -0.00021770596504211426, -0.00016535818576812744, -0.00011301040649414062, -6.066262722015381e-05, -8.314847946166992e-06, 4.4032931327819824e-05, 9.638071060180664e-05, 0.00014872848987579346, 0.00020107626914978027, 0.0002534240484237671, 0.0003057718276977539, 0.0003581196069717407, 0.00041046738624572754, 0.00046281516551971436, 0.0005151629447937012, 0.000567510724067688, 0.0006198585033416748, 0.0006722062826156616, 0.0007245540618896484, 0.0007769018411636353, 0.0008292496204376221, 0.0008815973997116089, 0.0009339451789855957, 0.0009862929582595825, 0.0010386407375335693, 0.0010909885168075562, 0.001143336296081543, 0.0011956840753555298, 0.0012480318546295166, 0.0013003796339035034, 0.0013527274131774902, 0.001405075192451477, 0.0014574229717254639, 0.0015097707509994507, 0.0015621185302734375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 18.0, 74.0, 200.0, 315.0, 251.0, 106.0, 32.0, 9.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014139461563900113, -0.00013720209244638681, -0.0001330095692537725, -0.00012881704606115818, -0.00012462452286854386, -0.00012043199967592955, -0.00011623947648331523, -0.00011204695329070091, -0.0001078544300980866, -0.00010366190690547228, -9.946938371285796e-05, -9.527686052024364e-05, -9.108433732762933e-05, -8.689181413501501e-05, -8.26992909424007e-05, -7.850676774978638e-05, -7.431424455717206e-05, -7.012172136455774e-05, -6.592919817194343e-05, -6.173667497932911e-05, -5.754415178671479e-05, -5.3351628594100475e-05, -4.915910540148616e-05, -4.496658220887184e-05, -4.0774059016257524e-05, -3.658153582364321e-05, -3.238901263102889e-05, -2.8196489438414574e-05, -2.4003966245800257e-05, -1.981144305318594e-05, -1.5618919860571623e-05, -1.1426396667957306e-05, -7.233888027258217e-06, -3.0413648346439004e-06, 1.1511583579704165e-06, 5.3436815505847335e-06, 9.53620474319905e-06, 1.3728727935813367e-05, 1.7921251128427684e-05, 2.2113774321042e-05, 2.6306297513656318e-05, 3.0498820706270635e-05, 3.469134389888495e-05, 3.888386709149927e-05, 4.3076390284113586e-05, 4.72689134767279e-05, 5.146143666934222e-05, 5.565395986195654e-05, 5.9846483054570854e-05, 6.403900624718517e-05, 6.823152943979949e-05, 7.24240526324138e-05, 7.661657582502812e-05, 8.080909901764244e-05, 8.500162221025676e-05, 8.919414540287107e-05, 9.338666859548539e-05, 9.75791917880997e-05, 0.00010177171498071402, 0.00010596423817332834, 0.00011015676136594266, 0.00011434928455855697, 0.00011854180775117129, 0.0001227343309437856, 0.00012692685413639992]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 7.0, 4.0, 7.0, 7.0, 11.0, 12.0, 15.0, 12.0, 16.0, 13.0, 24.0, 24.0, 40.0, 29.0, 30.0, 36.0, 43.0, 35.0, 39.0, 40.0, 44.0, 20.0, 42.0, 46.0, 39.0, 36.0, 38.0, 39.0, 37.0, 27.0, 33.0, 29.0, 19.0, 19.0, 16.0, 14.0, 14.0, 8.0, 8.0, 7.0, 9.0, 6.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.993511199951172e-05, -3.862474113702774e-05, -3.731437027454376e-05, -3.6003999412059784e-05, -3.4693628549575806e-05, -3.338325768709183e-05, -3.207288682460785e-05, -3.076251596212387e-05, -2.9452145099639893e-05, -2.8141774237155914e-05, -2.6831403374671936e-05, -2.5521032512187958e-05, -2.421066164970398e-05, -2.290029078722e-05, -2.1589919924736023e-05, -2.0279549062252045e-05, -1.8969178199768066e-05, -1.7658807337284088e-05, -1.634843647480011e-05, -1.5038065612316132e-05, -1.3727694749832153e-05, -1.2417323887348175e-05, -1.1106953024864197e-05, -9.796582162380219e-06, -8.48621129989624e-06, -7.175840437412262e-06, -5.865469574928284e-06, -4.555098712444305e-06, -3.244727849960327e-06, -1.934356987476349e-06, -6.239861249923706e-07, 6.863847374916077e-07, 1.996755599975586e-06, 3.307126462459564e-06, 4.6174973249435425e-06, 5.927868187427521e-06, 7.238239049911499e-06, 8.548609912395477e-06, 9.858980774879456e-06, 1.1169351637363434e-05, 1.2479722499847412e-05, 1.379009336233139e-05, 1.5100464224815369e-05, 1.6410835087299347e-05, 1.7721205949783325e-05, 1.9031576812267303e-05, 2.0341947674751282e-05, 2.165231853723526e-05, 2.2962689399719238e-05, 2.4273060262203217e-05, 2.5583431124687195e-05, 2.6893801987171173e-05, 2.820417284965515e-05, 2.951454371213913e-05, 3.082491457462311e-05, 3.2135285437107086e-05, 3.3445656299591064e-05, 3.475602716207504e-05, 3.606639802455902e-05, 3.7376768887043e-05, 3.868713974952698e-05, 3.9997510612010956e-05, 4.1307881474494934e-05, 4.261825233697891e-05, 4.392862319946289e-05]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 6.0, 5.0, 8.0, 3.0, 12.0, 16.0, 17.0, 10.0, 16.0, 14.0, 18.0, 19.0, 17.0, 29.0, 23.0, 38.0, 50.0, 39.0, 50.0, 43.0, 44.0, 49.0, 35.0, 41.0, 55.0, 39.0, 36.0, 33.0, 46.0, 38.0, 27.0, 29.0, 18.0, 21.0, 7.0, 14.0, 10.0, 4.0, 5.0, 7.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-2.662109375, -2.590667724609375, -2.51922607421875, -2.447784423828125, -2.3763427734375, -2.304901123046875, -2.23345947265625, -2.162017822265625, -2.090576171875, -2.019134521484375, -1.94769287109375, -1.876251220703125, -1.8048095703125, -1.733367919921875, -1.66192626953125, -1.590484619140625, -1.51904296875, -1.447601318359375, -1.37615966796875, -1.304718017578125, -1.2332763671875, -1.161834716796875, -1.09039306640625, -1.018951416015625, -0.947509765625, -0.876068115234375, -0.80462646484375, -0.733184814453125, -0.6617431640625, -0.590301513671875, -0.51885986328125, -0.447418212890625, -0.3759765625, -0.304534912109375, -0.23309326171875, -0.161651611328125, -0.0902099609375, -0.018768310546875, 0.05267333984375, 0.124114990234375, 0.195556640625, 0.266998291015625, 0.33843994140625, 0.409881591796875, 0.4813232421875, 0.552764892578125, 0.62420654296875, 0.695648193359375, 0.76708984375, 0.838531494140625, 0.90997314453125, 0.981414794921875, 1.0528564453125, 1.124298095703125, 1.19573974609375, 1.267181396484375, 1.338623046875, 1.410064697265625, 1.48150634765625, 1.552947998046875, 1.6243896484375, 1.695831298828125, 1.76727294921875, 1.838714599609375, 1.91015625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 5.0, 9.0, 5.0, 7.0, 20.0, 24.0, 28.0, 44.0, 46.0, 83.0, 89.0, 124.0, 160.0, 265.0, 432.0, 600.0, 1161.0, 2082.0, 4168.0, 9598.0, 27434.0, 103100.0, 415593.0, 357992.0, 84778.0, 23181.0, 8720.0, 3802.0, 1931.0, 1132.0, 624.0, 429.0, 267.0, 180.0, 126.0, 94.0, 60.0, 42.0, 32.0, 20.0, 17.0, 17.0, 10.0, 6.0, 8.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.767578125, -2.6883544921875, -2.609130859375, -2.5299072265625, -2.45068359375, -2.3714599609375, -2.292236328125, -2.2130126953125, -2.1337890625, -2.0545654296875, -1.975341796875, -1.8961181640625, -1.81689453125, -1.7376708984375, -1.658447265625, -1.5792236328125, -1.5, -1.4207763671875, -1.341552734375, -1.2623291015625, -1.18310546875, -1.1038818359375, -1.024658203125, -0.9454345703125, -0.8662109375, -0.7869873046875, -0.707763671875, -0.6285400390625, -0.54931640625, -0.4700927734375, -0.390869140625, -0.3116455078125, -0.232421875, -0.1531982421875, -0.073974609375, 0.0052490234375, 0.08447265625, 0.1636962890625, 0.242919921875, 0.3221435546875, 0.4013671875, 0.4805908203125, 0.559814453125, 0.6390380859375, 0.71826171875, 0.7974853515625, 0.876708984375, 0.9559326171875, 1.03515625, 1.1143798828125, 1.193603515625, 1.2728271484375, 1.35205078125, 1.4312744140625, 1.510498046875, 1.5897216796875, 1.6689453125, 1.7481689453125, 1.827392578125, 1.9066162109375, 1.98583984375, 2.0650634765625, 2.144287109375, 2.2235107421875, 2.302734375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 9.0, 3.0, 9.0, 10.0, 11.0, 7.0, 9.0, 16.0, 17.0, 18.0, 29.0, 26.0, 37.0, 26.0, 32.0, 37.0, 47.0, 54.0, 54.0, 197.0, 1701.0, 210.0, 70.0, 46.0, 58.0, 37.0, 47.0, 38.0, 31.0, 22.0, 26.0, 27.0, 19.0, 12.0, 16.0, 12.0, 7.0, 4.0, 5.0, 5.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6171875, -6.376708984375, -6.13623046875, -5.895751953125, -5.6552734375, -5.414794921875, -5.17431640625, -4.933837890625, -4.693359375, -4.452880859375, -4.21240234375, -3.971923828125, -3.7314453125, -3.490966796875, -3.25048828125, -3.010009765625, -2.76953125, -2.529052734375, -2.28857421875, -2.048095703125, -1.8076171875, -1.567138671875, -1.32666015625, -1.086181640625, -0.845703125, -0.605224609375, -0.36474609375, -0.124267578125, 0.1162109375, 0.356689453125, 0.59716796875, 0.837646484375, 1.078125, 1.318603515625, 1.55908203125, 1.799560546875, 2.0400390625, 2.280517578125, 2.52099609375, 2.761474609375, 3.001953125, 3.242431640625, 3.48291015625, 3.723388671875, 3.9638671875, 4.204345703125, 4.44482421875, 4.685302734375, 4.92578125, 5.166259765625, 5.40673828125, 5.647216796875, 5.8876953125, 6.128173828125, 6.36865234375, 6.609130859375, 6.849609375, 7.090087890625, 7.33056640625, 7.571044921875, 7.8115234375, 8.052001953125, 8.29248046875, 8.532958984375, 8.7734375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 1.0, 3.0, 5.0, 3.0, 3.0, 11.0, 11.0, 24.0, 24.0, 31.0, 36.0, 61.0, 71.0, 105.0, 182.0, 345.0, 934.0, 4902.0, 431975.0, 2695044.0, 9714.0, 1206.0, 398.0, 220.0, 111.0, 77.0, 40.0, 38.0, 30.0, 23.0, 15.0, 16.0, 14.0, 11.0, 7.0, 9.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0703125, -14.60107421875, -14.1318359375, -13.66259765625, -13.193359375, -12.72412109375, -12.2548828125, -11.78564453125, -11.31640625, -10.84716796875, -10.3779296875, -9.90869140625, -9.439453125, -8.97021484375, -8.5009765625, -8.03173828125, -7.5625, -7.09326171875, -6.6240234375, -6.15478515625, -5.685546875, -5.21630859375, -4.7470703125, -4.27783203125, -3.80859375, -3.33935546875, -2.8701171875, -2.40087890625, -1.931640625, -1.46240234375, -0.9931640625, -0.52392578125, -0.0546875, 0.41455078125, 0.8837890625, 1.35302734375, 1.822265625, 2.29150390625, 2.7607421875, 3.22998046875, 3.69921875, 4.16845703125, 4.6376953125, 5.10693359375, 5.576171875, 6.04541015625, 6.5146484375, 6.98388671875, 7.453125, 7.92236328125, 8.3916015625, 8.86083984375, 9.330078125, 9.79931640625, 10.2685546875, 10.73779296875, 11.20703125, 11.67626953125, 12.1455078125, 12.61474609375, 13.083984375, 13.55322265625, 14.0224609375, 14.49169921875, 14.9609375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 61.0, 830.0, 123.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6708807945251465, -4.1117095947265625, -1.5525383949279785, 1.0066328048706055, 3.5658040046691895, 6.124975681304932, 8.684146881103516, 11.243316650390625, 13.802488327026367, 16.36166000366211, 18.92082977294922, 21.48000144958496, 24.039173126220703, 26.598344802856445, 29.157516479492188, 31.716686248779297, 34.27585983276367, 36.83502960205078, 39.394203186035156, 41.953372955322266, 44.512542724609375, 47.07171630859375, 49.63088607788086, 52.19005584716797, 54.749229431152344, 57.30839920043945, 59.86757278442383, 62.42674255371094, 64.98591613769531, 67.54508972167969, 70.10425567626953, 72.6634292602539, 75.22259521484375, 77.78176879882812, 80.34093475341797, 82.90010833740234, 85.45928192138672, 88.01844787597656, 90.57762145996094, 93.13679504394531, 95.69596862792969, 98.25514221191406, 100.8143081665039, 103.37348175048828, 105.93265533447266, 108.4918212890625, 111.05099487304688, 113.61016845703125, 116.1693344116211, 118.72850799560547, 121.28767395019531, 123.84684753417969, 126.40602111816406, 128.96519470214844, 131.5243682861328, 134.08352661132812, 136.6427001953125, 139.20187377929688, 141.76104736328125, 144.32022094726562, 146.87937927246094, 149.4385528564453, 151.9977264404297, 154.55690002441406, 157.11607360839844]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 10.0, 8.0, 11.0, 12.0, 10.0, 19.0, 15.0, 28.0, 33.0, 26.0, 35.0, 39.0, 43.0, 42.0, 41.0, 40.0, 41.0, 50.0, 38.0, 44.0, 41.0, 39.0, 46.0, 32.0, 37.0, 45.0, 37.0, 22.0, 20.0, 16.0, 19.0, 12.0, 6.0, 10.0, 4.0, 8.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.410625457763672, -24.621408462524414, -23.832191467285156, -23.0429744720459, -22.25375747680664, -21.464542388916016, -20.675325393676758, -19.8861083984375, -19.096891403198242, -18.307674407958984, -17.518457412719727, -16.72924041748047, -15.940024375915527, -15.15080738067627, -14.361591339111328, -13.57237434387207, -12.783157348632812, -11.993940353393555, -11.204723358154297, -10.415507316589355, -9.626290321350098, -8.83707332611084, -8.047857284545898, -7.258640289306641, -6.469423294067383, -5.680206298828125, -4.890989780426025, -4.101773262023926, -3.312556266784668, -2.5233395099639893, -1.7341227531433105, -0.9449062347412109, -0.15568923950195312, 0.6335275173187256, 1.4227442741394043, 2.211961030960083, 3.0011777877807617, 3.7903945446014404, 4.579611301422119, 5.368827819824219, 6.158044815063477, 6.947261810302734, 7.736478328704834, 8.525694847106934, 9.314911842346191, 10.10412883758545, 10.89334487915039, 11.682561874389648, 12.471778869628906, 13.260995864868164, 14.050212860107422, 14.839428901672363, 15.628645896911621, 16.417861938476562, 17.20707893371582, 17.996295928955078, 18.785512924194336, 19.574729919433594, 20.36394691467285, 21.15316390991211, 21.942378997802734, 22.731595993041992, 23.52081298828125, 24.310029983520508, 25.099246978759766]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 11.0, 4.0, 6.0, 10.0, 12.0, 14.0, 19.0, 20.0, 12.0, 14.0, 18.0, 23.0, 26.0, 27.0, 34.0, 33.0, 53.0, 34.0, 52.0, 47.0, 45.0, 43.0, 44.0, 47.0, 45.0, 35.0, 34.0, 56.0, 32.0, 24.0, 26.0, 17.0, 25.0, 13.0, 10.0, 5.0, 7.0, 7.0, 6.0, 11.0, 1.0, 0.0, 4.0, 2.0, 3.0], "bins": [-2.92578125, -2.8514556884765625, -2.777130126953125, -2.7028045654296875, -2.62847900390625, -2.5541534423828125, -2.479827880859375, -2.4055023193359375, -2.3311767578125, -2.2568511962890625, -2.182525634765625, -2.1082000732421875, -2.03387451171875, -1.9595489501953125, -1.885223388671875, -1.8108978271484375, -1.736572265625, -1.6622467041015625, -1.587921142578125, -1.5135955810546875, -1.43927001953125, -1.3649444580078125, -1.290618896484375, -1.2162933349609375, -1.1419677734375, -1.0676422119140625, -0.993316650390625, -0.9189910888671875, -0.84466552734375, -0.7703399658203125, -0.696014404296875, -0.6216888427734375, -0.54736328125, -0.4730377197265625, -0.398712158203125, -0.3243865966796875, -0.25006103515625, -0.1757354736328125, -0.101409912109375, -0.0270843505859375, 0.0472412109375, 0.1215667724609375, 0.195892333984375, 0.2702178955078125, 0.34454345703125, 0.4188690185546875, 0.493194580078125, 0.5675201416015625, 0.641845703125, 0.7161712646484375, 0.790496826171875, 0.8648223876953125, 0.93914794921875, 1.0134735107421875, 1.087799072265625, 1.1621246337890625, 1.2364501953125, 1.3107757568359375, 1.385101318359375, 1.4594268798828125, 1.53375244140625, 1.6080780029296875, 1.682403564453125, 1.7567291259765625, 1.8310546875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 8.0, 7.0, 8.0, 14.0, 21.0, 17.0, 36.0, 34.0, 33.0, 54.0, 83.0, 115.0, 227.0, 441.0, 951.0, 2538.0, 8113.0, 30121.0, 147084.0, 992768.0, 2233312.0, 645707.0, 100963.0, 21946.0, 6151.0, 1940.0, 753.0, 305.0, 142.0, 116.0, 74.0, 48.0, 37.0, 23.0, 20.0, 20.0, 13.0, 10.0, 8.0, 7.0, 6.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-5.25390625, -5.1094970703125, -4.965087890625, -4.8206787109375, -4.67626953125, -4.5318603515625, -4.387451171875, -4.2430419921875, -4.0986328125, -3.9542236328125, -3.809814453125, -3.6654052734375, -3.52099609375, -3.3765869140625, -3.232177734375, -3.0877685546875, -2.943359375, -2.7989501953125, -2.654541015625, -2.5101318359375, -2.36572265625, -2.2213134765625, -2.076904296875, -1.9324951171875, -1.7880859375, -1.6436767578125, -1.499267578125, -1.3548583984375, -1.21044921875, -1.0660400390625, -0.921630859375, -0.7772216796875, -0.6328125, -0.4884033203125, -0.343994140625, -0.1995849609375, -0.05517578125, 0.0892333984375, 0.233642578125, 0.3780517578125, 0.5224609375, 0.6668701171875, 0.811279296875, 0.9556884765625, 1.10009765625, 1.2445068359375, 1.388916015625, 1.5333251953125, 1.677734375, 1.8221435546875, 1.966552734375, 2.1109619140625, 2.25537109375, 2.3997802734375, 2.544189453125, 2.6885986328125, 2.8330078125, 2.9774169921875, 3.121826171875, 3.2662353515625, 3.41064453125, 3.5550537109375, 3.699462890625, 3.8438720703125, 3.98828125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 13.0, 31.0, 39.0, 94.0, 181.0, 323.0, 627.0, 974.0, 806.0, 464.0, 273.0, 117.0, 58.0, 32.0, 17.0, 12.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.453125, -16.04931640625, -15.6455078125, -15.24169921875, -14.837890625, -14.43408203125, -14.0302734375, -13.62646484375, -13.22265625, -12.81884765625, -12.4150390625, -12.01123046875, -11.607421875, -11.20361328125, -10.7998046875, -10.39599609375, -9.9921875, -9.58837890625, -9.1845703125, -8.78076171875, -8.376953125, -7.97314453125, -7.5693359375, -7.16552734375, -6.76171875, -6.35791015625, -5.9541015625, -5.55029296875, -5.146484375, -4.74267578125, -4.3388671875, -3.93505859375, -3.53125, -3.12744140625, -2.7236328125, -2.31982421875, -1.916015625, -1.51220703125, -1.1083984375, -0.70458984375, -0.30078125, 0.10302734375, 0.5068359375, 0.91064453125, 1.314453125, 1.71826171875, 2.1220703125, 2.52587890625, 2.9296875, 3.33349609375, 3.7373046875, 4.14111328125, 4.544921875, 4.94873046875, 5.3525390625, 5.75634765625, 6.16015625, 6.56396484375, 6.9677734375, 7.37158203125, 7.775390625, 8.17919921875, 8.5830078125, 8.98681640625, 9.390625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 6.0, 5.0, 10.0, 11.0, 26.0, 30.0, 70.0, 155.0, 293.0, 947.0, 24119.0, 4097448.0, 69170.0, 1297.0, 334.0, 154.0, 88.0, 57.0, 19.0, 19.0, 10.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.59375, -22.50048828125, -21.4072265625, -20.31396484375, -19.220703125, -18.12744140625, -17.0341796875, -15.94091796875, -14.84765625, -13.75439453125, -12.6611328125, -11.56787109375, -10.474609375, -9.38134765625, -8.2880859375, -7.19482421875, -6.1015625, -5.00830078125, -3.9150390625, -2.82177734375, -1.728515625, -0.63525390625, 0.4580078125, 1.55126953125, 2.64453125, 3.73779296875, 4.8310546875, 5.92431640625, 7.017578125, 8.11083984375, 9.2041015625, 10.29736328125, 11.390625, 12.48388671875, 13.5771484375, 14.67041015625, 15.763671875, 16.85693359375, 17.9501953125, 19.04345703125, 20.13671875, 21.22998046875, 22.3232421875, 23.41650390625, 24.509765625, 25.60302734375, 26.6962890625, 27.78955078125, 28.8828125, 29.97607421875, 31.0693359375, 32.16259765625, 33.255859375, 34.34912109375, 35.4423828125, 36.53564453125, 37.62890625, 38.72216796875, 39.8154296875, 40.90869140625, 42.001953125, 43.09521484375, 44.1884765625, 45.28173828125, 46.375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 8.0, 22.0, 62.0, 128.0, 199.0, 208.0, 201.0, 108.0, 46.0, 23.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.61354446411133, -51.95621871948242, -50.29888916015625, -48.641563415527344, -46.98423767089844, -45.326908111572266, -43.66958236694336, -42.01225280761719, -40.35492706298828, -38.697601318359375, -37.0402717590332, -35.3829460144043, -33.725616455078125, -32.06829071044922, -30.410964965820312, -28.753637313842773, -27.096309661865234, -25.438982009887695, -23.781654357910156, -22.12432861328125, -20.46700096130371, -18.809673309326172, -17.152347564697266, -15.495019912719727, -13.837692260742188, -12.180364608764648, -10.523037910461426, -8.865711212158203, -7.208383560180664, -5.551055908203125, -3.8937292098999023, -2.2364025115966797, -0.5790748596191406, 1.0782523155212402, 2.735579490661621, 4.392906665802002, 6.050233840942383, 7.707561492919922, 9.364888191223145, 11.022214889526367, 12.679542541503906, 14.336870193481445, 15.994196891784668, 17.65152359008789, 19.30885124206543, 20.96617889404297, 22.623504638671875, 24.280832290649414, 25.938159942626953, 27.595487594604492, 29.25281524658203, 30.910140991210938, 32.567466735839844, 34.224796295166016, 35.88212203979492, 37.539451599121094, 39.19677734375, 40.854103088378906, 42.51143264770508, 44.168758392333984, 45.826087951660156, 47.48341369628906, 49.14073944091797, 50.798065185546875, 52.45539474487305]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 11.0, 7.0, 10.0, 12.0, 13.0, 15.0, 15.0, 17.0, 25.0, 38.0, 34.0, 29.0, 40.0, 35.0, 45.0, 46.0, 35.0, 41.0, 39.0, 38.0, 46.0, 43.0, 39.0, 45.0, 30.0, 25.0, 29.0, 29.0, 41.0, 17.0, 21.0, 23.0, 13.0, 12.0, 14.0, 4.0, 4.0, 5.0, 4.0, 1.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.47956657409668, -21.828731536865234, -21.177898406982422, -20.527063369750977, -19.87622833251953, -19.22539520263672, -18.574560165405273, -17.923725128173828, -17.272891998291016, -16.62205696105957, -15.971222877502441, -15.320388793945312, -14.669554710388184, -14.018720626831055, -13.36788558959961, -12.71705150604248, -12.066216468811035, -11.415382385253906, -10.764547348022461, -10.113713264465332, -9.462879180908203, -8.812044143676758, -8.161210060119629, -7.5103759765625, -6.859541416168213, -6.208706855773926, -5.557872772216797, -4.90703821182251, -4.256203651428223, -3.6053695678710938, -2.9545350074768066, -2.3037009239196777, -1.6528663635253906, -1.0020320415496826, -0.35119760036468506, 0.2996368408203125, 0.9504711627960205, 1.6013054847717285, 2.2521400451660156, 2.9029741287231445, 3.5538086891174316, 4.204643249511719, 4.855477333068848, 5.506311893463135, 6.157146453857422, 6.807980537414551, 7.458815097808838, 8.109649658203125, 8.760483741760254, 9.411317825317383, 10.062152862548828, 10.712986946105957, 11.363821029663086, 12.014656066894531, 12.66549015045166, 13.316324234008789, 13.967159271240234, 14.617993354797363, 15.268828392028809, 15.919662475585938, 16.570497512817383, 17.221330642700195, 17.87216567993164, 18.522998809814453, 19.1738338470459]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 4.0, 6.0, 11.0, 13.0, 11.0, 16.0, 14.0, 12.0, 21.0, 16.0, 25.0, 30.0, 37.0, 36.0, 42.0, 54.0, 44.0, 45.0, 50.0, 50.0, 52.0, 43.0, 41.0, 47.0, 42.0, 42.0, 39.0, 23.0, 29.0, 24.0, 10.0, 18.0, 14.0, 7.0, 11.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-3.232421875, -3.1514434814453125, -3.070465087890625, -2.9894866943359375, -2.90850830078125, -2.8275299072265625, -2.746551513671875, -2.6655731201171875, -2.5845947265625, -2.5036163330078125, -2.422637939453125, -2.3416595458984375, -2.26068115234375, -2.1797027587890625, -2.098724365234375, -2.0177459716796875, -1.936767578125, -1.8557891845703125, -1.774810791015625, -1.6938323974609375, -1.61285400390625, -1.5318756103515625, -1.450897216796875, -1.3699188232421875, -1.2889404296875, -1.2079620361328125, -1.126983642578125, -1.0460052490234375, -0.96502685546875, -0.8840484619140625, -0.803070068359375, -0.7220916748046875, -0.64111328125, -0.5601348876953125, -0.479156494140625, -0.3981781005859375, -0.31719970703125, -0.2362213134765625, -0.155242919921875, -0.0742645263671875, 0.0067138671875, 0.0876922607421875, 0.168670654296875, 0.2496490478515625, 0.33062744140625, 0.4116058349609375, 0.492584228515625, 0.5735626220703125, 0.654541015625, 0.7355194091796875, 0.816497802734375, 0.8974761962890625, 0.97845458984375, 1.0594329833984375, 1.140411376953125, 1.2213897705078125, 1.3023681640625, 1.3833465576171875, 1.464324951171875, 1.5453033447265625, 1.62628173828125, 1.7072601318359375, 1.788238525390625, 1.8692169189453125, 1.9501953125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 7.0, 5.0, 10.0, 12.0, 14.0, 37.0, 56.0, 84.0, 147.0, 250.0, 483.0, 805.0, 1347.0, 2331.0, 3829.0, 6424.0, 10481.0, 17596.0, 30680.0, 56806.0, 118067.0, 316779.0, 261425.0, 102532.0, 49978.0, 27564.0, 16236.0, 9706.0, 5966.0, 3579.0, 2140.0, 1318.0, 761.0, 426.0, 265.0, 151.0, 85.0, 62.0, 30.0, 18.0, 22.0, 9.0, 10.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4462890625, -0.43085479736328125, -0.4154205322265625, -0.39998626708984375, -0.384552001953125, -0.36911773681640625, -0.3536834716796875, -0.33824920654296875, -0.32281494140625, -0.30738067626953125, -0.2919464111328125, -0.27651214599609375, -0.261077880859375, -0.24564361572265625, -0.2302093505859375, -0.21477508544921875, -0.1993408203125, -0.18390655517578125, -0.1684722900390625, -0.15303802490234375, -0.137603759765625, -0.12216949462890625, -0.1067352294921875, -0.09130096435546875, -0.07586669921875, -0.06043243408203125, -0.0449981689453125, -0.02956390380859375, -0.014129638671875, 0.00130462646484375, 0.0167388916015625, 0.03217315673828125, 0.047607421875, 0.06304168701171875, 0.0784759521484375, 0.09391021728515625, 0.109344482421875, 0.12477874755859375, 0.1402130126953125, 0.15564727783203125, 0.17108154296875, 0.18651580810546875, 0.2019500732421875, 0.21738433837890625, 0.232818603515625, 0.24825286865234375, 0.2636871337890625, 0.27912139892578125, 0.2945556640625, 0.30998992919921875, 0.3254241943359375, 0.34085845947265625, 0.356292724609375, 0.37172698974609375, 0.3871612548828125, 0.40259552001953125, 0.41802978515625, 0.43346405029296875, 0.4488983154296875, 0.46433258056640625, 0.479766845703125, 0.49520111083984375, 0.5106353759765625, 0.5260696411132812, 0.54150390625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 8.0, 5.0, 4.0, 14.0, 17.0, 15.0, 12.0, 10.0, 17.0, 17.0, 18.0, 18.0, 29.0, 25.0, 26.0, 34.0, 37.0, 35.0, 35.0, 38.0, 47.0, 1067.0, 38.0, 46.0, 37.0, 43.0, 33.0, 43.0, 33.0, 37.0, 26.0, 29.0, 16.0, 24.0, 16.0, 14.0, 10.0, 10.0, 12.0, 6.0, 6.0, 7.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.4453125, -1.4029998779296875, -1.360687255859375, -1.3183746337890625, -1.27606201171875, -1.2337493896484375, -1.191436767578125, -1.1491241455078125, -1.1068115234375, -1.0644989013671875, -1.022186279296875, -0.9798736572265625, -0.93756103515625, -0.8952484130859375, -0.852935791015625, -0.8106231689453125, -0.768310546875, -0.7259979248046875, -0.683685302734375, -0.6413726806640625, -0.59906005859375, -0.5567474365234375, -0.514434814453125, -0.4721221923828125, -0.4298095703125, -0.3874969482421875, -0.345184326171875, -0.3028717041015625, -0.26055908203125, -0.2182464599609375, -0.175933837890625, -0.1336212158203125, -0.09130859375, -0.0489959716796875, -0.006683349609375, 0.0356292724609375, 0.07794189453125, 0.1202545166015625, 0.162567138671875, 0.2048797607421875, 0.2471923828125, 0.2895050048828125, 0.331817626953125, 0.3741302490234375, 0.41644287109375, 0.4587554931640625, 0.501068115234375, 0.5433807373046875, 0.585693359375, 0.6280059814453125, 0.670318603515625, 0.7126312255859375, 0.75494384765625, 0.7972564697265625, 0.839569091796875, 0.8818817138671875, 0.9241943359375, 0.9665069580078125, 1.008819580078125, 1.0511322021484375, 1.09344482421875, 1.1357574462890625, 1.178070068359375, 1.2203826904296875, 1.2626953125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 20.0, 23.0, 35.0, 60.0, 70.0, 105.0, 140.0, 213.0, 272.0, 441.0, 660.0, 862.0, 1267.0, 1818.0, 2627.0, 3591.0, 5277.0, 7562.0, 10803.0, 15374.0, 22404.0, 34066.0, 53037.0, 87605.0, 167943.0, 1317842.0, 141310.0, 76666.0, 47566.0, 30733.0, 20426.0, 13736.0, 9531.0, 6697.0, 4802.0, 3395.0, 2456.0, 1754.0, 1214.0, 898.0, 591.0, 397.0, 284.0, 185.0, 123.0, 94.0, 44.0, 36.0, 24.0, 19.0, 7.0, 14.0, 7.0, 9.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2978515625, -0.288360595703125, -0.27886962890625, -0.269378662109375, -0.2598876953125, -0.250396728515625, -0.24090576171875, -0.231414794921875, -0.221923828125, -0.212432861328125, -0.20294189453125, -0.193450927734375, -0.1839599609375, -0.174468994140625, -0.16497802734375, -0.155487060546875, -0.14599609375, -0.136505126953125, -0.12701416015625, -0.117523193359375, -0.1080322265625, -0.098541259765625, -0.08905029296875, -0.079559326171875, -0.070068359375, -0.060577392578125, -0.05108642578125, -0.041595458984375, -0.0321044921875, -0.022613525390625, -0.01312255859375, -0.003631591796875, 0.005859375, 0.015350341796875, 0.02484130859375, 0.034332275390625, 0.0438232421875, 0.053314208984375, 0.06280517578125, 0.072296142578125, 0.081787109375, 0.091278076171875, 0.10076904296875, 0.110260009765625, 0.1197509765625, 0.129241943359375, 0.13873291015625, 0.148223876953125, 0.15771484375, 0.167205810546875, 0.17669677734375, 0.186187744140625, 0.1956787109375, 0.205169677734375, 0.21466064453125, 0.224151611328125, 0.233642578125, 0.243133544921875, 0.25262451171875, 0.262115478515625, 0.2716064453125, 0.281097412109375, 0.29058837890625, 0.300079345703125, 0.3095703125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 6.0, 4.0, 7.0, 12.0, 9.0, 14.0, 15.0, 24.0, 23.0, 29.0, 27.0, 40.0, 47.0, 60.0, 71.0, 85.0, 72.0, 69.0, 66.0, 65.0, 44.0, 41.0, 34.0, 33.0, 24.0, 16.0, 15.0, 9.0, 6.0, 5.0, 2.0, 4.0, 2.0, 7.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.855892181396484e-05, -7.606390863656998e-05, -7.356889545917511e-05, -7.107388228178024e-05, -6.857886910438538e-05, -6.608385592699051e-05, -6.358884274959564e-05, -6.109382957220078e-05, -5.859881639480591e-05, -5.610380321741104e-05, -5.3608790040016174e-05, -5.111377686262131e-05, -4.861876368522644e-05, -4.6123750507831573e-05, -4.3628737330436707e-05, -4.113372415304184e-05, -3.863871097564697e-05, -3.6143697798252106e-05, -3.364868462085724e-05, -3.115367144346237e-05, -2.8658658266067505e-05, -2.6163645088672638e-05, -2.366863191127777e-05, -2.1173618733882904e-05, -1.8678605556488037e-05, -1.618359237909317e-05, -1.3688579201698303e-05, -1.1193566024303436e-05, -8.69855284690857e-06, -6.203539669513702e-06, -3.7085264921188354e-06, -1.2135133147239685e-06, 1.2814998626708984e-06, 3.7765130400657654e-06, 6.271526217460632e-06, 8.7665393948555e-06, 1.1261552572250366e-05, 1.3756565749645233e-05, 1.62515789270401e-05, 1.8746592104434967e-05, 2.1241605281829834e-05, 2.37366184592247e-05, 2.6231631636619568e-05, 2.8726644814014435e-05, 3.12216579914093e-05, 3.371667116880417e-05, 3.6211684346199036e-05, 3.87066975235939e-05, 4.120171070098877e-05, 4.3696723878383636e-05, 4.6191737055778503e-05, 4.868675023317337e-05, 5.118176341056824e-05, 5.3676776587963104e-05, 5.617178976535797e-05, 5.866680294275284e-05, 6.11618161201477e-05, 6.365682929754257e-05, 6.615184247493744e-05, 6.86468556523323e-05, 7.114186882972717e-05, 7.363688200712204e-05, 7.61318951845169e-05, 7.862690836191177e-05, 8.112192153930664e-05]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 2.0, 3.0, 6.0, 7.0, 7.0, 7.0, 13.0, 13.0, 24.0, 25.0, 54.0, 64.0, 89.0, 119.0, 194.0, 315.0, 491.0, 1439.0, 476897.0, 565577.0, 1664.0, 505.0, 316.0, 218.0, 138.0, 93.0, 63.0, 40.0, 32.0, 23.0, 26.0, 21.0, 15.0, 15.0, 15.0, 3.0, 3.0, 2.0, 2.0, 1.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00157928466796875, -0.001531451940536499, -0.001483619213104248, -0.001435786485671997, -0.001387953758239746, -0.0013401210308074951, -0.0012922883033752441, -0.0012444555759429932, -0.0011966228485107422, -0.0011487901210784912, -0.0011009573936462402, -0.0010531246662139893, -0.0010052919387817383, -0.0009574592113494873, -0.0009096264839172363, -0.0008617937564849854, -0.0008139610290527344, -0.0007661283016204834, -0.0007182955741882324, -0.0006704628467559814, -0.0006226301193237305, -0.0005747973918914795, -0.0005269646644592285, -0.00047913193702697754, -0.00043129920959472656, -0.0003834664821624756, -0.0003356337547302246, -0.00028780102729797363, -0.00023996829986572266, -0.00019213557243347168, -0.0001443028450012207, -9.647011756896973e-05, -4.863739013671875e-05, -8.046627044677734e-07, 4.70280647277832e-05, 9.486079216003418e-05, 0.00014269351959228516, 0.00019052624702453613, 0.0002383589744567871, 0.0002861917018890381, 0.00033402442932128906, 0.00038185715675354004, 0.000429689884185791, 0.000477522611618042, 0.000525355339050293, 0.0005731880664825439, 0.0006210207939147949, 0.0006688535213470459, 0.0007166862487792969, 0.0007645189762115479, 0.0008123517036437988, 0.0008601844310760498, 0.0009080171585083008, 0.0009558498859405518, 0.0010036826133728027, 0.0010515153408050537, 0.0010993480682373047, 0.0011471807956695557, 0.0011950135231018066, 0.0012428462505340576, 0.0012906789779663086, 0.0013385117053985596, 0.0013863444328308105, 0.0014341771602630615, 0.0014820098876953125]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 35.0, 89.0, 200.0, 292.0, 227.0, 113.0, 41.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019078976765740663, -0.00018678136984817684, -0.00018277298659086227, -0.00017876458878163248, -0.0001747561909724027, -0.0001707477931631729, -0.0001667393953539431, -0.00016273101209662855, -0.00015872261428739876, -0.00015471421647816896, -0.0001507058332208544, -0.0001466974354116246, -0.00014268903760239482, -0.00013868063979316503, -0.00013467224198393524, -0.00013066385872662067, -0.00012665546091739088, -0.0001226470631081611, -0.00011863867257488891, -0.00011463028204161674, -0.00011062188423238695, -0.00010661348642315716, -0.00010260509588988498, -9.85967053566128e-05, -9.458830754738301e-05, -9.057990973815322e-05, -8.657151920488104e-05, -8.256312867160887e-05, -7.855473086237907e-05, -7.454633305314928e-05, -7.05379425198771e-05, -6.652955198660493e-05, -6.252114690141752e-05, -5.851275273016654e-05, -5.4504358558915555e-05, -5.049596438766457e-05, -4.648757021641359e-05, -4.24791760451626e-05, -3.847078187391162e-05, -3.4462387702660635e-05, -3.045399353140965e-05, -2.6445599360158667e-05, -2.2437205188907683e-05, -1.84288110176567e-05, -1.4420416846405715e-05, -1.041202267515473e-05, -6.403628503903747e-06, -2.3952343326527625e-06, 1.6131598385982215e-06, 5.621554009849206e-06, 9.62994818110019e-06, 1.3638342352351174e-05, 1.7646736523602158e-05, 2.1655130694853142e-05, 2.5663524866104126e-05, 2.967191903735511e-05, 3.3680313208606094e-05, 3.768870737985708e-05, 4.169710155110806e-05, 4.5705495722359046e-05, 4.971388989361003e-05, 5.3722284064861014e-05, 5.7730678236112e-05, 6.173907604534179e-05, 6.574746657861397e-05]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 2.0, 9.0, 5.0, 8.0, 6.0, 7.0, 3.0, 23.0, 14.0, 19.0, 17.0, 21.0, 27.0, 42.0, 37.0, 32.0, 46.0, 41.0, 51.0, 52.0, 43.0, 42.0, 58.0, 47.0, 42.0, 50.0, 42.0, 39.0, 29.0, 31.0, 24.0, 13.0, 11.0, 14.0, 14.0, 11.0, 8.0, 6.0, 3.0, 6.0, 1.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.999471664428711e-05, -3.8691796362400055e-05, -3.7388876080513e-05, -3.6085955798625946e-05, -3.478303551673889e-05, -3.348011523485184e-05, -3.217719495296478e-05, -3.087427467107773e-05, -2.9571354389190674e-05, -2.826843410730362e-05, -2.6965513825416565e-05, -2.566259354352951e-05, -2.4359673261642456e-05, -2.30567529797554e-05, -2.1753832697868347e-05, -2.0450912415981293e-05, -1.9147992134094238e-05, -1.7845071852207184e-05, -1.654215157032013e-05, -1.5239231288433075e-05, -1.393631100654602e-05, -1.2633390724658966e-05, -1.1330470442771912e-05, -1.0027550160884857e-05, -8.724629878997803e-06, -7.421709597110748e-06, -6.118789315223694e-06, -4.815869033336639e-06, -3.512948751449585e-06, -2.2100284695625305e-06, -9.071081876754761e-07, 3.9581209421157837e-07, 1.6987323760986328e-06, 3.0016526579856873e-06, 4.304572939872742e-06, 5.607493221759796e-06, 6.910413503646851e-06, 8.213333785533905e-06, 9.51625406742096e-06, 1.0819174349308014e-05, 1.2122094631195068e-05, 1.3425014913082123e-05, 1.4727935194969177e-05, 1.603085547685623e-05, 1.7333775758743286e-05, 1.863669604063034e-05, 1.9939616322517395e-05, 2.124253660440445e-05, 2.2545456886291504e-05, 2.384837716817856e-05, 2.5151297450065613e-05, 2.6454217731952667e-05, 2.775713801383972e-05, 2.9060058295726776e-05, 3.036297857761383e-05, 3.1665898859500885e-05, 3.296881914138794e-05, 3.4271739423274994e-05, 3.557465970516205e-05, 3.68775799870491e-05, 3.818050026893616e-05, 3.948342055082321e-05, 4.0786340832710266e-05, 4.208926111459732e-05, 4.3392181396484375e-05]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 4.0, 6.0, 11.0, 13.0, 11.0, 16.0, 14.0, 12.0, 21.0, 16.0, 25.0, 30.0, 37.0, 36.0, 42.0, 54.0, 44.0, 45.0, 50.0, 50.0, 52.0, 43.0, 41.0, 47.0, 42.0, 42.0, 39.0, 23.0, 29.0, 24.0, 10.0, 18.0, 14.0, 7.0, 11.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-3.232421875, -3.1514434814453125, -3.070465087890625, -2.9894866943359375, -2.90850830078125, -2.8275299072265625, -2.746551513671875, -2.6655731201171875, -2.5845947265625, -2.5036163330078125, -2.422637939453125, -2.3416595458984375, -2.26068115234375, -2.1797027587890625, -2.098724365234375, -2.0177459716796875, -1.936767578125, -1.8557891845703125, -1.774810791015625, -1.6938323974609375, -1.61285400390625, -1.5318756103515625, -1.450897216796875, -1.3699188232421875, -1.2889404296875, -1.2079620361328125, -1.126983642578125, -1.0460052490234375, -0.96502685546875, -0.8840484619140625, -0.803070068359375, -0.7220916748046875, -0.64111328125, -0.5601348876953125, -0.479156494140625, -0.3981781005859375, -0.31719970703125, -0.2362213134765625, -0.155242919921875, -0.0742645263671875, 0.0067138671875, 0.0876922607421875, 0.168670654296875, 0.2496490478515625, 0.33062744140625, 0.4116058349609375, 0.492584228515625, 0.5735626220703125, 0.654541015625, 0.7355194091796875, 0.816497802734375, 0.8974761962890625, 0.97845458984375, 1.0594329833984375, 1.140411376953125, 1.2213897705078125, 1.3023681640625, 1.3833465576171875, 1.464324951171875, 1.5453033447265625, 1.62628173828125, 1.7072601318359375, 1.788238525390625, 1.8692169189453125, 1.9501953125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 9.0, 14.0, 30.0, 33.0, 48.0, 80.0, 112.0, 169.0, 323.0, 552.0, 1048.0, 1983.0, 3668.0, 7344.0, 15553.0, 37299.0, 94567.0, 231560.0, 338505.0, 186482.0, 73900.0, 29711.0, 12659.0, 6001.0, 3053.0, 1611.0, 915.0, 484.0, 320.0, 187.0, 128.0, 70.0, 55.0, 34.0, 17.0, 15.0, 5.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.24609375, -2.1859893798828125, -2.125885009765625, -2.0657806396484375, -2.00567626953125, -1.9455718994140625, -1.885467529296875, -1.8253631591796875, -1.7652587890625, -1.7051544189453125, -1.645050048828125, -1.5849456787109375, -1.52484130859375, -1.4647369384765625, -1.404632568359375, -1.3445281982421875, -1.284423828125, -1.2243194580078125, -1.164215087890625, -1.1041107177734375, -1.04400634765625, -0.9839019775390625, -0.923797607421875, -0.8636932373046875, -0.8035888671875, -0.7434844970703125, -0.683380126953125, -0.6232757568359375, -0.56317138671875, -0.5030670166015625, -0.442962646484375, -0.3828582763671875, -0.32275390625, -0.2626495361328125, -0.202545166015625, -0.1424407958984375, -0.08233642578125, -0.0222320556640625, 0.037872314453125, 0.0979766845703125, 0.1580810546875, 0.2181854248046875, 0.278289794921875, 0.3383941650390625, 0.39849853515625, 0.4586029052734375, 0.518707275390625, 0.5788116455078125, 0.638916015625, 0.6990203857421875, 0.759124755859375, 0.8192291259765625, 0.87933349609375, 0.9394378662109375, 0.999542236328125, 1.0596466064453125, 1.1197509765625, 1.1798553466796875, 1.239959716796875, 1.3000640869140625, 1.36016845703125, 1.4202728271484375, 1.480377197265625, 1.5404815673828125, 1.6005859375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 7.0, 9.0, 13.0, 14.0, 12.0, 16.0, 20.0, 22.0, 37.0, 38.0, 50.0, 60.0, 48.0, 76.0, 154.0, 439.0, 1467.0, 126.0, 84.0, 74.0, 49.0, 33.0, 33.0, 30.0, 23.0, 26.0, 22.0, 17.0, 13.0, 13.0, 10.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3984375, -10.07373046875, -9.7490234375, -9.42431640625, -9.099609375, -8.77490234375, -8.4501953125, -8.12548828125, -7.80078125, -7.47607421875, -7.1513671875, -6.82666015625, -6.501953125, -6.17724609375, -5.8525390625, -5.52783203125, -5.203125, -4.87841796875, -4.5537109375, -4.22900390625, -3.904296875, -3.57958984375, -3.2548828125, -2.93017578125, -2.60546875, -2.28076171875, -1.9560546875, -1.63134765625, -1.306640625, -0.98193359375, -0.6572265625, -0.33251953125, -0.0078125, 0.31689453125, 0.6416015625, 0.96630859375, 1.291015625, 1.61572265625, 1.9404296875, 2.26513671875, 2.58984375, 2.91455078125, 3.2392578125, 3.56396484375, 3.888671875, 4.21337890625, 4.5380859375, 4.86279296875, 5.1875, 5.51220703125, 5.8369140625, 6.16162109375, 6.486328125, 6.81103515625, 7.1357421875, 7.46044921875, 7.78515625, 8.10986328125, 8.4345703125, 8.75927734375, 9.083984375, 9.40869140625, 9.7333984375, 10.05810546875, 10.3828125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 6.0, 14.0, 13.0, 20.0, 21.0, 21.0, 44.0, 45.0, 41.0, 73.0, 104.0, 187.0, 314.0, 759.0, 3352.0, 96768.0, 2997886.0, 42071.0, 2407.0, 666.0, 277.0, 195.0, 103.0, 68.0, 61.0, 33.0, 30.0, 26.0, 20.0, 13.0, 14.0, 14.0, 9.0, 6.0, 5.0, 6.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.4296875, -13.9552001953125, -13.480712890625, -13.0062255859375, -12.53173828125, -12.0572509765625, -11.582763671875, -11.1082763671875, -10.6337890625, -10.1593017578125, -9.684814453125, -9.2103271484375, -8.73583984375, -8.2613525390625, -7.786865234375, -7.3123779296875, -6.837890625, -6.3634033203125, -5.888916015625, -5.4144287109375, -4.93994140625, -4.4654541015625, -3.990966796875, -3.5164794921875, -3.0419921875, -2.5675048828125, -2.093017578125, -1.6185302734375, -1.14404296875, -0.6695556640625, -0.195068359375, 0.2794189453125, 0.75390625, 1.2283935546875, 1.702880859375, 2.1773681640625, 2.65185546875, 3.1263427734375, 3.600830078125, 4.0753173828125, 4.5498046875, 5.0242919921875, 5.498779296875, 5.9732666015625, 6.44775390625, 6.9222412109375, 7.396728515625, 7.8712158203125, 8.345703125, 8.8201904296875, 9.294677734375, 9.7691650390625, 10.24365234375, 10.7181396484375, 11.192626953125, 11.6671142578125, 12.1416015625, 12.6160888671875, 13.090576171875, 13.5650634765625, 14.03955078125, 14.5140380859375, 14.988525390625, 15.4630126953125, 15.9375]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 5.0, 15.0, 40.0, 71.0, 137.0, 185.0, 200.0, 168.0, 109.0, 51.0, 19.0, 9.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6231865882873535, -5.011821269989014, -4.400455474853516, -3.789090156555176, -3.177724599838257, -2.566359043121338, -1.954993724822998, -1.3436279296875, -0.7322626113891602, -0.12089711427688599, 0.4904683828353882, 1.1018338203430176, 1.7131993770599365, 2.3245649337768555, 2.9359302520751953, 3.5472960472106934, 4.158661365509033, 4.770026683807373, 5.381392478942871, 5.992757797241211, 6.604123115539551, 7.215488910675049, 7.826854228973389, 8.438220024108887, 9.049585342407227, 9.660950660705566, 10.272315979003906, 10.883682250976562, 11.495047569274902, 12.106412887573242, 12.717778205871582, 13.329143524169922, 13.940507888793945, 14.551873207092285, 15.163238525390625, 15.774604797363281, 16.385969161987305, 16.99733543395996, 17.608699798583984, 18.22006607055664, 18.831432342529297, 19.442798614501953, 20.054162979125977, 20.665529251098633, 21.276893615722656, 21.888259887695312, 22.49962615966797, 23.110990524291992, 23.722354888916016, 24.333721160888672, 24.945085525512695, 25.55645179748535, 26.167816162109375, 26.77918243408203, 27.390548706054688, 28.00191307067871, 28.613279342651367, 29.224645614624023, 29.836009979248047, 30.447376251220703, 31.058740615844727, 31.670106887817383, 32.281471252441406, 32.89283752441406, 33.50420379638672]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 5.0, 9.0, 7.0, 4.0, 4.0, 8.0, 12.0, 8.0, 14.0, 18.0, 31.0, 25.0, 21.0, 34.0, 25.0, 26.0, 30.0, 58.0, 47.0, 41.0, 38.0, 44.0, 49.0, 38.0, 37.0, 43.0, 49.0, 35.0, 33.0, 28.0, 24.0, 31.0, 14.0, 11.0, 18.0, 10.0, 16.0, 19.0, 10.0, 10.0, 3.0, 8.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.636640548706055, -28.737361907958984, -27.838083267211914, -26.938804626464844, -26.039527893066406, -25.140247344970703, -24.240970611572266, -23.341691970825195, -22.442413330078125, -21.543134689331055, -20.643856048583984, -19.744577407836914, -18.845298767089844, -17.946022033691406, -17.046743392944336, -16.147464752197266, -15.248186111450195, -14.348907470703125, -13.449628829956055, -12.5503511428833, -11.65107250213623, -10.75179386138916, -9.852516174316406, -8.953237533569336, -8.053958892822266, -7.154680252075195, -6.255402088165283, -5.356123924255371, -4.456845283508301, -3.5575666427612305, -2.6582884788513184, -1.7590103149414062, -0.8597335815429688, 0.03954482078552246, 0.9388232231140137, 1.8381016254425049, 2.737380027770996, 3.6366586685180664, 4.5359368324279785, 5.435214996337891, 6.334493637084961, 7.233772277832031, 8.133050918579102, 9.032328605651855, 9.931607246398926, 10.830885887145996, 11.73016357421875, 12.62944221496582, 13.52872085571289, 14.427999496459961, 15.327278137207031, 16.2265567779541, 17.125835418701172, 18.02511215209961, 18.92439079284668, 19.82366943359375, 20.72294807434082, 21.62222671508789, 22.52150535583496, 23.42078399658203, 24.32006072998047, 25.219341278076172, 26.11861801147461, 27.01789665222168, 27.91717529296875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 7.0, 4.0, 10.0, 10.0, 16.0, 9.0, 20.0, 15.0, 12.0, 20.0, 20.0, 23.0, 32.0, 33.0, 43.0, 35.0, 56.0, 47.0, 51.0, 50.0, 44.0, 58.0, 45.0, 44.0, 45.0, 42.0, 39.0, 35.0, 30.0, 20.0, 25.0, 16.0, 9.0, 9.0, 10.0, 12.0, 6.0, 4.0, 6.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.52734375, -3.440399169921875, -3.35345458984375, -3.266510009765625, -3.1795654296875, -3.092620849609375, -3.00567626953125, -2.918731689453125, -2.831787109375, -2.744842529296875, -2.65789794921875, -2.570953369140625, -2.4840087890625, -2.397064208984375, -2.31011962890625, -2.223175048828125, -2.13623046875, -2.049285888671875, -1.96234130859375, -1.875396728515625, -1.7884521484375, -1.701507568359375, -1.61456298828125, -1.527618408203125, -1.440673828125, -1.353729248046875, -1.26678466796875, -1.179840087890625, -1.0928955078125, -1.005950927734375, -0.91900634765625, -0.832061767578125, -0.7451171875, -0.658172607421875, -0.57122802734375, -0.484283447265625, -0.3973388671875, -0.310394287109375, -0.22344970703125, -0.136505126953125, -0.049560546875, 0.037384033203125, 0.12432861328125, 0.211273193359375, 0.2982177734375, 0.385162353515625, 0.47210693359375, 0.559051513671875, 0.64599609375, 0.732940673828125, 0.81988525390625, 0.906829833984375, 0.9937744140625, 1.080718994140625, 1.16766357421875, 1.254608154296875, 1.341552734375, 1.428497314453125, 1.51544189453125, 1.602386474609375, 1.6893310546875, 1.776275634765625, 1.86322021484375, 1.950164794921875, 2.037109375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 8.0, 8.0, 9.0, 10.0, 14.0, 10.0, 10.0, 21.0, 12.0, 27.0, 36.0, 56.0, 86.0, 115.0, 314.0, 794.0, 3004.0, 18718.0, 189584.0, 2281401.0, 1569903.0, 114078.0, 12595.0, 2273.0, 566.0, 239.0, 121.0, 73.0, 50.0, 39.0, 32.0, 13.0, 15.0, 10.0, 12.0, 8.0, 10.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.359375, -8.1387939453125, -7.918212890625, -7.6976318359375, -7.47705078125, -7.2564697265625, -7.035888671875, -6.8153076171875, -6.5947265625, -6.3741455078125, -6.153564453125, -5.9329833984375, -5.71240234375, -5.4918212890625, -5.271240234375, -5.0506591796875, -4.830078125, -4.6094970703125, -4.388916015625, -4.1683349609375, -3.94775390625, -3.7271728515625, -3.506591796875, -3.2860107421875, -3.0654296875, -2.8448486328125, -2.624267578125, -2.4036865234375, -2.18310546875, -1.9625244140625, -1.741943359375, -1.5213623046875, -1.30078125, -1.0802001953125, -0.859619140625, -0.6390380859375, -0.41845703125, -0.1978759765625, 0.022705078125, 0.2432861328125, 0.4638671875, 0.6844482421875, 0.905029296875, 1.1256103515625, 1.34619140625, 1.5667724609375, 1.787353515625, 2.0079345703125, 2.228515625, 2.4490966796875, 2.669677734375, 2.8902587890625, 3.11083984375, 3.3314208984375, 3.552001953125, 3.7725830078125, 3.9931640625, 4.2137451171875, 4.434326171875, 4.6549072265625, 4.87548828125, 5.0960693359375, 5.316650390625, 5.5372314453125, 5.7578125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 7.0, 7.0, 4.0, 13.0, 25.0, 28.0, 45.0, 81.0, 134.0, 216.0, 317.0, 462.0, 636.0, 633.0, 502.0, 347.0, 237.0, 149.0, 87.0, 60.0, 41.0, 17.0, 12.0, 5.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.890625, -6.6044921875, -6.318359375, -6.0322265625, -5.74609375, -5.4599609375, -5.173828125, -4.8876953125, -4.6015625, -4.3154296875, -4.029296875, -3.7431640625, -3.45703125, -3.1708984375, -2.884765625, -2.5986328125, -2.3125, -2.0263671875, -1.740234375, -1.4541015625, -1.16796875, -0.8818359375, -0.595703125, -0.3095703125, -0.0234375, 0.2626953125, 0.548828125, 0.8349609375, 1.12109375, 1.4072265625, 1.693359375, 1.9794921875, 2.265625, 2.5517578125, 2.837890625, 3.1240234375, 3.41015625, 3.6962890625, 3.982421875, 4.2685546875, 4.5546875, 4.8408203125, 5.126953125, 5.4130859375, 5.69921875, 5.9853515625, 6.271484375, 6.5576171875, 6.84375, 7.1298828125, 7.416015625, 7.7021484375, 7.98828125, 8.2744140625, 8.560546875, 8.8466796875, 9.1328125, 9.4189453125, 9.705078125, 9.9912109375, 10.27734375, 10.5634765625, 10.849609375, 11.1357421875, 11.421875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 10.0, 9.0, 19.0, 21.0, 28.0, 53.0, 71.0, 131.0, 205.0, 349.0, 800.0, 3643.0, 119067.0, 3885003.0, 178717.0, 4426.0, 821.0, 371.0, 178.0, 121.0, 72.0, 51.0, 43.0, 26.0, 17.0, 12.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.9375, -24.23583984375, -23.5341796875, -22.83251953125, -22.130859375, -21.42919921875, -20.7275390625, -20.02587890625, -19.32421875, -18.62255859375, -17.9208984375, -17.21923828125, -16.517578125, -15.81591796875, -15.1142578125, -14.41259765625, -13.7109375, -13.00927734375, -12.3076171875, -11.60595703125, -10.904296875, -10.20263671875, -9.5009765625, -8.79931640625, -8.09765625, -7.39599609375, -6.6943359375, -5.99267578125, -5.291015625, -4.58935546875, -3.8876953125, -3.18603515625, -2.484375, -1.78271484375, -1.0810546875, -0.37939453125, 0.322265625, 1.02392578125, 1.7255859375, 2.42724609375, 3.12890625, 3.83056640625, 4.5322265625, 5.23388671875, 5.935546875, 6.63720703125, 7.3388671875, 8.04052734375, 8.7421875, 9.44384765625, 10.1455078125, 10.84716796875, 11.548828125, 12.25048828125, 12.9521484375, 13.65380859375, 14.35546875, 15.05712890625, 15.7587890625, 16.46044921875, 17.162109375, 17.86376953125, 18.5654296875, 19.26708984375, 19.96875]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 50.0, 143.0, 312.0, 282.0, 162.0, 44.0, 14.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.97673034667969, -57.36958312988281, -54.76243591308594, -52.15528869628906, -49.54814529418945, -46.94099807739258, -44.3338508605957, -41.726707458496094, -39.11956024169922, -36.512413024902344, -33.90526580810547, -31.298120498657227, -28.690975189208984, -26.08382797241211, -23.476680755615234, -20.869535446166992, -18.262386322021484, -15.655240058898926, -13.048093795776367, -10.440946578979492, -7.833800315856934, -5.226654052734375, -2.6195068359375, -0.012361526489257812, 2.594785690307617, 5.201931953430176, 7.809078693389893, 10.41622543334961, 13.023371696472168, 15.630517959594727, 18.2376651763916, 20.844810485839844, 23.45195770263672, 26.059104919433594, 28.666250228881836, 31.27339744567871, 33.88054275512695, 36.48768997192383, 39.0948371887207, 41.70198059082031, 44.30912780761719, 46.91627502441406, 49.52342224121094, 52.13056945800781, 54.73771286010742, 57.3448600769043, 59.95200729370117, 62.55915069580078, 65.16630554199219, 67.77345275878906, 70.38059997558594, 72.98774719238281, 75.59489440917969, 78.20204162597656, 80.80918884277344, 83.41632843017578, 86.02347564697266, 88.63062286376953, 91.2377700805664, 93.84491729736328, 96.45206451416016, 99.0592041015625, 101.66635131835938, 104.27349853515625, 106.88064575195312]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 0.0, 4.0, 10.0, 11.0, 12.0, 19.0, 16.0, 11.0, 22.0, 17.0, 21.0, 19.0, 20.0, 39.0, 41.0, 43.0, 36.0, 36.0, 31.0, 39.0, 42.0, 36.0, 29.0, 33.0, 41.0, 30.0, 47.0, 34.0, 29.0, 23.0, 28.0, 29.0, 26.0, 21.0, 16.0, 15.0, 13.0, 10.0, 4.0, 10.0, 12.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-20.96520233154297, -20.3347225189209, -19.704240798950195, -19.073760986328125, -18.443281173706055, -17.812801361083984, -17.18231964111328, -16.55183982849121, -15.921359062194824, -15.290878295898438, -14.660398483276367, -14.02991771697998, -13.399436950683594, -12.768957138061523, -12.138476371765137, -11.50799560546875, -10.87751579284668, -10.247035026550293, -9.616555213928223, -8.986074447631836, -8.355594635009766, -7.725113868713379, -7.094633102416992, -6.464152812957764, -5.833672523498535, -5.203192234039307, -4.572711944580078, -3.9422311782836914, -3.311750888824463, -2.6812705993652344, -2.0507900714874268, -1.4203095436096191, -0.7898292541503906, -0.15934884548187256, 0.4711315631866455, 1.1016119718551636, 1.7320923805236816, 2.36257266998291, 2.9930531978607178, 3.6235337257385254, 4.254014015197754, 4.884494304656982, 5.514974594116211, 6.145455360412598, 6.775935649871826, 7.406415939331055, 8.036896705627441, 8.667377471923828, 9.297857284545898, 9.928338050842285, 10.558817863464355, 11.189298629760742, 11.819778442382812, 12.4502592086792, 13.080739974975586, 13.711219787597656, 14.341700553894043, 14.97218132019043, 15.6026611328125, 16.23314094543457, 16.863622665405273, 17.494102478027344, 18.124582290649414, 18.755064010620117, 19.385543823242188]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 9.0, 5.0, 10.0, 10.0, 17.0, 18.0, 13.0, 20.0, 26.0, 24.0, 32.0, 37.0, 37.0, 33.0, 53.0, 50.0, 55.0, 55.0, 51.0, 45.0, 55.0, 55.0, 41.0, 36.0, 33.0, 36.0, 18.0, 29.0, 24.0, 14.0, 15.0, 11.0, 15.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.546875, -3.4552001953125, -3.363525390625, -3.2718505859375, -3.18017578125, -3.0885009765625, -2.996826171875, -2.9051513671875, -2.8134765625, -2.7218017578125, -2.630126953125, -2.5384521484375, -2.44677734375, -2.3551025390625, -2.263427734375, -2.1717529296875, -2.080078125, -1.9884033203125, -1.896728515625, -1.8050537109375, -1.71337890625, -1.6217041015625, -1.530029296875, -1.4383544921875, -1.3466796875, -1.2550048828125, -1.163330078125, -1.0716552734375, -0.97998046875, -0.8883056640625, -0.796630859375, -0.7049560546875, -0.61328125, -0.5216064453125, -0.429931640625, -0.3382568359375, -0.24658203125, -0.1549072265625, -0.063232421875, 0.0284423828125, 0.1201171875, 0.2117919921875, 0.303466796875, 0.3951416015625, 0.48681640625, 0.5784912109375, 0.670166015625, 0.7618408203125, 0.853515625, 0.9451904296875, 1.036865234375, 1.1285400390625, 1.22021484375, 1.3118896484375, 1.403564453125, 1.4952392578125, 1.5869140625, 1.6785888671875, 1.770263671875, 1.8619384765625, 1.95361328125, 2.0452880859375, 2.136962890625, 2.2286376953125, 2.3203125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 5.0, 14.0, 17.0, 26.0, 41.0, 74.0, 101.0, 165.0, 290.0, 421.0, 763.0, 1257.0, 2105.0, 3448.0, 5817.0, 9934.0, 16766.0, 29955.0, 56664.0, 117734.0, 313142.0, 265863.0, 106161.0, 51585.0, 27820.0, 15837.0, 8979.0, 5376.0, 3265.0, 2004.0, 1127.0, 707.0, 436.0, 238.0, 148.0, 88.0, 58.0, 36.0, 24.0, 17.0, 14.0, 10.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5673828125, -0.5496139526367188, -0.5318450927734375, -0.5140762329101562, -0.496307373046875, -0.47853851318359375, -0.4607696533203125, -0.44300079345703125, -0.42523193359375, -0.40746307373046875, -0.3896942138671875, -0.37192535400390625, -0.354156494140625, -0.33638763427734375, -0.3186187744140625, -0.30084991455078125, -0.2830810546875, -0.26531219482421875, -0.2475433349609375, -0.22977447509765625, -0.212005615234375, -0.19423675537109375, -0.1764678955078125, -0.15869903564453125, -0.14093017578125, -0.12316131591796875, -0.1053924560546875, -0.08762359619140625, -0.069854736328125, -0.05208587646484375, -0.0343170166015625, -0.01654815673828125, 0.001220703125, 0.01898956298828125, 0.0367584228515625, 0.05452728271484375, 0.072296142578125, 0.09006500244140625, 0.1078338623046875, 0.12560272216796875, 0.14337158203125, 0.16114044189453125, 0.1789093017578125, 0.19667816162109375, 0.214447021484375, 0.23221588134765625, 0.2499847412109375, 0.26775360107421875, 0.2855224609375, 0.30329132080078125, 0.3210601806640625, 0.33882904052734375, 0.356597900390625, 0.37436676025390625, 0.3921356201171875, 0.40990447998046875, 0.42767333984375, 0.44544219970703125, 0.4632110595703125, 0.48097991943359375, 0.498748779296875, 0.5165176391601562, 0.5342864990234375, 0.5520553588867188, 0.56982421875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 8.0, 2.0, 2.0, 3.0, 10.0, 15.0, 9.0, 9.0, 15.0, 14.0, 24.0, 23.0, 26.0, 28.0, 19.0, 26.0, 31.0, 47.0, 37.0, 48.0, 43.0, 43.0, 1055.0, 44.0, 37.0, 32.0, 35.0, 43.0, 29.0, 38.0, 29.0, 30.0, 31.0, 20.0, 19.0, 18.0, 26.0, 15.0, 5.0, 9.0, 4.0, 6.0, 2.0, 10.0, 6.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.470703125, -1.4229278564453125, -1.375152587890625, -1.3273773193359375, -1.27960205078125, -1.2318267822265625, -1.184051513671875, -1.1362762451171875, -1.0885009765625, -1.0407257080078125, -0.992950439453125, -0.9451751708984375, -0.89739990234375, -0.8496246337890625, -0.801849365234375, -0.7540740966796875, -0.706298828125, -0.6585235595703125, -0.610748291015625, -0.5629730224609375, -0.51519775390625, -0.4674224853515625, -0.419647216796875, -0.3718719482421875, -0.3240966796875, -0.2763214111328125, -0.228546142578125, -0.1807708740234375, -0.13299560546875, -0.0852203369140625, -0.037445068359375, 0.0103302001953125, 0.05810546875, 0.1058807373046875, 0.153656005859375, 0.2014312744140625, 0.24920654296875, 0.2969818115234375, 0.344757080078125, 0.3925323486328125, 0.4403076171875, 0.4880828857421875, 0.535858154296875, 0.5836334228515625, 0.63140869140625, 0.6791839599609375, 0.726959228515625, 0.7747344970703125, 0.822509765625, 0.8702850341796875, 0.918060302734375, 0.9658355712890625, 1.01361083984375, 1.0613861083984375, 1.109161376953125, 1.1569366455078125, 1.2047119140625, 1.2524871826171875, 1.300262451171875, 1.3480377197265625, 1.39581298828125, 1.4435882568359375, 1.491363525390625, 1.5391387939453125, 1.5869140625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 2.0, 6.0, 19.0, 16.0, 20.0, 42.0, 61.0, 98.0, 119.0, 168.0, 271.0, 347.0, 498.0, 667.0, 980.0, 1314.0, 1971.0, 2782.0, 3946.0, 5708.0, 8182.0, 12009.0, 17587.0, 25895.0, 39375.0, 62290.0, 107691.0, 217972.0, 1280980.0, 114065.0, 65832.0, 41027.0, 26663.0, 17942.0, 12212.0, 8565.0, 5910.0, 4172.0, 2856.0, 2048.0, 1398.0, 1055.0, 743.0, 488.0, 331.0, 236.0, 192.0, 113.0, 90.0, 70.0, 40.0, 34.0, 18.0, 15.0, 7.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.34423828125, -0.33349609375, -0.32275390625, -0.31201171875, -0.30126953125, -0.29052734375, -0.27978515625, -0.26904296875, -0.25830078125, -0.24755859375, -0.23681640625, -0.22607421875, -0.21533203125, -0.20458984375, -0.19384765625, -0.18310546875, -0.17236328125, -0.16162109375, -0.15087890625, -0.14013671875, -0.12939453125, -0.11865234375, -0.10791015625, -0.09716796875, -0.08642578125, -0.07568359375, -0.06494140625, -0.05419921875, -0.04345703125, -0.03271484375, -0.02197265625, -0.01123046875, -0.00048828125, 0.01025390625, 0.02099609375, 0.03173828125, 0.04248046875, 0.05322265625, 0.06396484375, 0.07470703125, 0.08544921875, 0.09619140625, 0.10693359375, 0.11767578125, 0.12841796875, 0.13916015625, 0.14990234375, 0.16064453125, 0.17138671875, 0.18212890625, 0.19287109375, 0.20361328125, 0.21435546875, 0.22509765625, 0.23583984375, 0.24658203125, 0.25732421875, 0.26806640625, 0.27880859375, 0.28955078125, 0.30029296875, 0.31103515625, 0.32177734375, 0.33251953125, 0.34326171875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 11.0, 7.0, 5.0, 7.0, 4.0, 17.0, 14.0, 35.0, 37.0, 44.0, 53.0, 40.0, 56.0, 86.0, 93.0, 82.0, 69.0, 59.0, 58.0, 55.0, 32.0, 28.0, 23.0, 20.0, 10.0, 12.0, 10.0, 5.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012302398681640625, -0.0001193443313241005, -0.00011566467583179474, -0.00011198502033948898, -0.00010830536484718323, -0.00010462570935487747, -0.00010094605386257172, -9.726639837026596e-05, -9.35867428779602e-05, -8.990708738565445e-05, -8.62274318933487e-05, -8.254777640104294e-05, -7.886812090873718e-05, -7.518846541643143e-05, -7.150880992412567e-05, -6.782915443181992e-05, -6.414949893951416e-05, -6.0469843447208405e-05, -5.679018795490265e-05, -5.311053246259689e-05, -4.943087697029114e-05, -4.575122147798538e-05, -4.2071565985679626e-05, -3.839191049337387e-05, -3.4712255001068115e-05, -3.103259950876236e-05, -2.7352944016456604e-05, -2.367328852415085e-05, -1.9993633031845093e-05, -1.6313977539539337e-05, -1.2634322047233582e-05, -8.954666554927826e-06, -5.27501106262207e-06, -1.5953555703163147e-06, 2.084299921989441e-06, 5.7639554142951965e-06, 9.443610906600952e-06, 1.3123266398906708e-05, 1.6802921891212463e-05, 2.048257738351822e-05, 2.4162232875823975e-05, 2.784188836812973e-05, 3.1521543860435486e-05, 3.520119935274124e-05, 3.8880854845047e-05, 4.256051033735275e-05, 4.624016582965851e-05, 4.9919821321964264e-05, 5.359947681427002e-05, 5.7279132306575775e-05, 6.095878779888153e-05, 6.463844329118729e-05, 6.831809878349304e-05, 7.19977542757988e-05, 7.567740976810455e-05, 7.935706526041031e-05, 8.303672075271606e-05, 8.671637624502182e-05, 9.039603173732758e-05, 9.407568722963333e-05, 9.775534272193909e-05, 0.00010143499821424484, 0.0001051146537065506, 0.00010879430919885635, 0.00011247396469116211]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 7.0, 8.0, 16.0, 14.0, 25.0, 34.0, 51.0, 77.0, 98.0, 170.0, 268.0, 490.0, 1442.0, 883484.0, 160292.0, 955.0, 426.0, 237.0, 151.0, 112.0, 54.0, 35.0, 32.0, 20.0, 13.0, 9.0, 5.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0021686553955078125, -0.0020935535430908203, -0.002018451690673828, -0.001943349838256836, -0.0018682479858398438, -0.0017931461334228516, -0.0017180442810058594, -0.0016429424285888672, -0.001567840576171875, -0.0014927387237548828, -0.0014176368713378906, -0.0013425350189208984, -0.0012674331665039062, -0.001192331314086914, -0.0011172294616699219, -0.0010421276092529297, -0.0009670257568359375, -0.0008919239044189453, -0.0008168220520019531, -0.0007417201995849609, -0.0006666183471679688, -0.0005915164947509766, -0.0005164146423339844, -0.0004413127899169922, -0.0003662109375, -0.0002911090850830078, -0.00021600723266601562, -0.00014090538024902344, -6.580352783203125e-05, 9.298324584960938e-06, 8.440017700195312e-05, 0.0001595020294189453, 0.0002346038818359375, 0.0003097057342529297, 0.0003848075866699219, 0.00045990943908691406, 0.0005350112915039062, 0.0006101131439208984, 0.0006852149963378906, 0.0007603168487548828, 0.000835418701171875, 0.0009105205535888672, 0.0009856224060058594, 0.0010607242584228516, 0.0011358261108398438, 0.001210927963256836, 0.0012860298156738281, 0.0013611316680908203, 0.0014362335205078125, 0.0015113353729248047, 0.0015864372253417969, 0.001661539077758789, 0.0017366409301757812, 0.0018117427825927734, 0.0018868446350097656, 0.001961946487426758, 0.00203704833984375, 0.002112150192260742, 0.0021872520446777344, 0.0022623538970947266, 0.0023374557495117188, 0.002412557601928711, 0.002487659454345703, 0.0025627613067626953, 0.0026378631591796875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 10.0, 74.0, 178.0, 319.0, 252.0, 126.0, 42.0, 9.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002227829972980544, -0.00021745401318185031, -0.00021212502906564623, -0.00020679604494944215, -0.00020146706083323807, -0.00019613807671703398, -0.00019080910715274513, -0.00018548010848462582, -0.00018015113892033696, -0.00017482215480413288, -0.0001694931706879288, -0.0001641641865717247, -0.00015883520245552063, -0.00015350621833931655, -0.00014817723422311246, -0.0001428482646588236, -0.0001375192659907043, -0.00013219028187450022, -0.00012686129775829613, -0.00012153231364209205, -0.00011620332952588797, -0.00011087434540968388, -0.00010554536856943741, -0.00010021638445323333, -9.488740033702925e-05, -8.955841622082517e-05, -8.422943210462108e-05, -7.890045526437461e-05, -7.357147114817053e-05, -6.824248703196645e-05, -6.291350291576236e-05, -5.758451879955828e-05, -5.22555346833542e-05, -4.6926550567150116e-05, -4.159756645094603e-05, -3.626858597272076e-05, -3.0939601856516674e-05, -2.561061774031259e-05, -2.0281637262087315e-05, -1.4952653145883232e-05, -9.62366902967915e-06, -4.294685822969768e-06, 1.034297383739613e-06, 6.363279680954292e-06, 1.1692263797158375e-05, 1.702124791336246e-05, 2.2350228391587734e-05, 2.7679212507791817e-05, 3.30081966239959e-05, 3.833718074019998e-05, 4.3666164856404066e-05, 4.899514533462934e-05, 5.4324129450833425e-05, 5.965311356703751e-05, 6.498209404526278e-05, 7.031107816146687e-05, 7.564006227767095e-05, 8.096904639387503e-05, 8.629803051007912e-05, 9.162700735032558e-05, 9.695599146652967e-05, 0.00010228497558273375, 0.00010761395969893783, 0.00011294294381514192, 0.000118271927931346]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 7.0, 8.0, 8.0, 13.0, 9.0, 11.0, 13.0, 25.0, 17.0, 17.0, 24.0, 22.0, 30.0, 31.0, 42.0, 39.0, 50.0, 33.0, 39.0, 55.0, 39.0, 44.0, 49.0, 37.0, 29.0, 38.0, 34.0, 32.0, 26.0, 38.0, 31.0, 19.0, 11.0, 19.0, 15.0, 10.0, 12.0, 2.0, 6.0, 5.0, 5.0, 6.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.710124969482422e-05, -5.5429525673389435e-05, -5.375780165195465e-05, -5.208607763051987e-05, -5.041435360908508e-05, -4.87426295876503e-05, -4.7070905566215515e-05, -4.539918154478073e-05, -4.372745752334595e-05, -4.205573350191116e-05, -4.038400948047638e-05, -3.8712285459041595e-05, -3.704056143760681e-05, -3.536883741617203e-05, -3.3697113394737244e-05, -3.202538937330246e-05, -3.0353665351867676e-05, -2.8681941330432892e-05, -2.7010217308998108e-05, -2.5338493287563324e-05, -2.366676926612854e-05, -2.1995045244693756e-05, -2.0323321223258972e-05, -1.8651597201824188e-05, -1.6979873180389404e-05, -1.530814915895462e-05, -1.3636425137519836e-05, -1.1964701116085052e-05, -1.0292977094650269e-05, -8.621253073215485e-06, -6.949529051780701e-06, -5.277805030345917e-06, -3.606081008911133e-06, -1.934356987476349e-06, -2.6263296604156494e-07, 1.409091055393219e-06, 3.080815076828003e-06, 4.752539098262787e-06, 6.424263119697571e-06, 8.095987141132355e-06, 9.767711162567139e-06, 1.1439435184001923e-05, 1.3111159205436707e-05, 1.478288322687149e-05, 1.6454607248306274e-05, 1.812633126974106e-05, 1.9798055291175842e-05, 2.1469779312610626e-05, 2.314150333404541e-05, 2.4813227355480194e-05, 2.6484951376914978e-05, 2.8156675398349762e-05, 2.9828399419784546e-05, 3.150012344121933e-05, 3.3171847462654114e-05, 3.48435714840889e-05, 3.651529550552368e-05, 3.8187019526958466e-05, 3.985874354839325e-05, 4.1530467569828033e-05, 4.320219159126282e-05, 4.48739156126976e-05, 4.6545639634132385e-05, 4.821736365556717e-05, 4.988908767700195e-05]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 9.0, 5.0, 10.0, 10.0, 17.0, 18.0, 13.0, 20.0, 26.0, 24.0, 32.0, 37.0, 37.0, 33.0, 53.0, 50.0, 55.0, 55.0, 51.0, 45.0, 55.0, 55.0, 41.0, 36.0, 33.0, 36.0, 18.0, 29.0, 24.0, 14.0, 15.0, 11.0, 15.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.546875, -3.4552001953125, -3.363525390625, -3.2718505859375, -3.18017578125, -3.0885009765625, -2.996826171875, -2.9051513671875, -2.8134765625, -2.7218017578125, -2.630126953125, -2.5384521484375, -2.44677734375, -2.3551025390625, -2.263427734375, -2.1717529296875, -2.080078125, -1.9884033203125, -1.896728515625, -1.8050537109375, -1.71337890625, -1.6217041015625, -1.530029296875, -1.4383544921875, -1.3466796875, -1.2550048828125, -1.163330078125, -1.0716552734375, -0.97998046875, -0.8883056640625, -0.796630859375, -0.7049560546875, -0.61328125, -0.5216064453125, -0.429931640625, -0.3382568359375, -0.24658203125, -0.1549072265625, -0.063232421875, 0.0284423828125, 0.1201171875, 0.2117919921875, 0.303466796875, 0.3951416015625, 0.48681640625, 0.5784912109375, 0.670166015625, 0.7618408203125, 0.853515625, 0.9451904296875, 1.036865234375, 1.1285400390625, 1.22021484375, 1.3118896484375, 1.403564453125, 1.4952392578125, 1.5869140625, 1.6785888671875, 1.770263671875, 1.8619384765625, 1.95361328125, 2.0452880859375, 2.136962890625, 2.2286376953125, 2.3203125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 7.0, 14.0, 14.0, 16.0, 23.0, 26.0, 50.0, 64.0, 71.0, 168.0, 256.0, 415.0, 793.0, 1380.0, 2698.0, 5352.0, 11418.0, 29065.0, 97757.0, 481515.0, 308960.0, 68181.0, 21553.0, 9296.0, 4360.0, 2244.0, 1162.0, 629.0, 383.0, 210.0, 162.0, 99.0, 67.0, 44.0, 29.0, 32.0, 14.0, 9.0, 8.0, 6.0, 2.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2578125, -3.13653564453125, -3.0152587890625, -2.89398193359375, -2.772705078125, -2.65142822265625, -2.5301513671875, -2.40887451171875, -2.28759765625, -2.16632080078125, -2.0450439453125, -1.92376708984375, -1.802490234375, -1.68121337890625, -1.5599365234375, -1.43865966796875, -1.3173828125, -1.19610595703125, -1.0748291015625, -0.95355224609375, -0.832275390625, -0.71099853515625, -0.5897216796875, -0.46844482421875, -0.34716796875, -0.22589111328125, -0.1046142578125, 0.01666259765625, 0.137939453125, 0.25921630859375, 0.3804931640625, 0.50177001953125, 0.623046875, 0.74432373046875, 0.8656005859375, 0.98687744140625, 1.108154296875, 1.22943115234375, 1.3507080078125, 1.47198486328125, 1.59326171875, 1.71453857421875, 1.8358154296875, 1.95709228515625, 2.078369140625, 2.19964599609375, 2.3209228515625, 2.44219970703125, 2.5634765625, 2.68475341796875, 2.8060302734375, 2.92730712890625, 3.048583984375, 3.16986083984375, 3.2911376953125, 3.41241455078125, 3.53369140625, 3.65496826171875, 3.7762451171875, 3.89752197265625, 4.018798828125, 4.14007568359375, 4.2613525390625, 4.38262939453125, 4.50390625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 1.0, 5.0, 8.0, 10.0, 7.0, 11.0, 15.0, 24.0, 18.0, 35.0, 28.0, 38.0, 44.0, 47.0, 61.0, 63.0, 94.0, 201.0, 1590.0, 201.0, 91.0, 64.0, 64.0, 47.0, 50.0, 38.0, 35.0, 25.0, 20.0, 27.0, 13.0, 21.0, 7.0, 9.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.296875, -8.9923095703125, -8.687744140625, -8.3831787109375, -8.07861328125, -7.7740478515625, -7.469482421875, -7.1649169921875, -6.8603515625, -6.5557861328125, -6.251220703125, -5.9466552734375, -5.64208984375, -5.3375244140625, -5.032958984375, -4.7283935546875, -4.423828125, -4.1192626953125, -3.814697265625, -3.5101318359375, -3.20556640625, -2.9010009765625, -2.596435546875, -2.2918701171875, -1.9873046875, -1.6827392578125, -1.378173828125, -1.0736083984375, -0.76904296875, -0.4644775390625, -0.159912109375, 0.1446533203125, 0.44921875, 0.7537841796875, 1.058349609375, 1.3629150390625, 1.66748046875, 1.9720458984375, 2.276611328125, 2.5811767578125, 2.8857421875, 3.1903076171875, 3.494873046875, 3.7994384765625, 4.10400390625, 4.4085693359375, 4.713134765625, 5.0177001953125, 5.322265625, 5.6268310546875, 5.931396484375, 6.2359619140625, 6.54052734375, 6.8450927734375, 7.149658203125, 7.4542236328125, 7.7587890625, 8.0633544921875, 8.367919921875, 8.6724853515625, 8.97705078125, 9.2816162109375, 9.586181640625, 9.8907470703125, 10.1953125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 6.0, 2.0, 3.0, 13.0, 9.0, 6.0, 12.0, 27.0, 33.0, 41.0, 66.0, 90.0, 146.0, 268.0, 537.0, 2887.0, 386636.0, 2748022.0, 5382.0, 697.0, 288.0, 188.0, 111.0, 59.0, 46.0, 42.0, 17.0, 19.0, 12.0, 12.0, 6.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.890625, -29.01416015625, -28.1376953125, -27.26123046875, -26.384765625, -25.50830078125, -24.6318359375, -23.75537109375, -22.87890625, -22.00244140625, -21.1259765625, -20.24951171875, -19.373046875, -18.49658203125, -17.6201171875, -16.74365234375, -15.8671875, -14.99072265625, -14.1142578125, -13.23779296875, -12.361328125, -11.48486328125, -10.6083984375, -9.73193359375, -8.85546875, -7.97900390625, -7.1025390625, -6.22607421875, -5.349609375, -4.47314453125, -3.5966796875, -2.72021484375, -1.84375, -0.96728515625, -0.0908203125, 0.78564453125, 1.662109375, 2.53857421875, 3.4150390625, 4.29150390625, 5.16796875, 6.04443359375, 6.9208984375, 7.79736328125, 8.673828125, 9.55029296875, 10.4267578125, 11.30322265625, 12.1796875, 13.05615234375, 13.9326171875, 14.80908203125, 15.685546875, 16.56201171875, 17.4384765625, 18.31494140625, 19.19140625, 20.06787109375, 20.9443359375, 21.82080078125, 22.697265625, 23.57373046875, 24.4501953125, 25.32666015625, 26.203125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 6.0, 15.0, 23.0, 33.0, 50.0, 79.0, 98.0, 114.0, 141.0, 112.0, 92.0, 91.0, 53.0, 43.0, 25.0, 7.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.73713207244873, -9.322479248046875, -8.907827377319336, -8.49317455291748, -8.078522682189941, -7.663869857788086, -7.249217510223389, -6.834565162658691, -6.419912815093994, -6.005260467529297, -5.5906081199646, -5.175955772399902, -4.761302947998047, -4.346651077270508, -3.9319982528686523, -3.517345905303955, -3.102693557739258, -2.6880412101745605, -2.2733888626098633, -1.858736276626587, -1.4440839290618896, -1.0294315814971924, -0.614778995513916, -0.20012664794921875, 0.21452569961547852, 0.6291781067848206, 1.0438305139541626, 1.4584829807281494, 1.8731353282928467, 2.287787675857544, 2.7024402618408203, 3.1170926094055176, 3.5317459106445312, 3.9463982582092285, 4.361050605773926, 4.775703430175781, 5.19035530090332, 5.605008125305176, 6.019660472869873, 6.43431282043457, 6.848965167999268, 7.263617515563965, 7.678269863128662, 8.09292221069336, 8.507575035095215, 8.922226905822754, 9.33687973022461, 9.751531600952148, 10.166184425354004, 10.58083724975586, 10.995489120483398, 11.410141944885254, 11.824793815612793, 12.239446640014648, 12.654098510742188, 13.068751335144043, 13.483404159545898, 13.898056983947754, 14.312708854675293, 14.727361679077148, 15.142013549804688, 15.556666374206543, 15.971319198608398, 16.385971069335938, 16.800622940063477]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 7.0, 0.0, 3.0, 5.0, 3.0, 3.0, 9.0, 13.0, 10.0, 9.0, 16.0, 20.0, 16.0, 18.0, 25.0, 41.0, 31.0, 23.0, 27.0, 46.0, 34.0, 45.0, 56.0, 49.0, 42.0, 46.0, 42.0, 47.0, 36.0, 34.0, 36.0, 28.0, 28.0, 20.0, 23.0, 15.0, 20.0, 15.0, 14.0, 13.0, 11.0, 11.0, 8.0, 5.0, 5.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.16049575805664, -27.354175567626953, -26.5478572845459, -25.74153709411621, -24.935216903686523, -24.12889862060547, -23.32257843017578, -22.516258239746094, -21.709938049316406, -20.90361785888672, -20.097299575805664, -19.290979385375977, -18.48465919494629, -17.678340911865234, -16.872020721435547, -16.06570053100586, -15.259382247924805, -14.453063011169434, -13.646742820739746, -12.840423583984375, -12.034103393554688, -11.227784156799316, -10.421464920043945, -9.615144729614258, -8.808825492858887, -8.002506256103516, -7.196186065673828, -6.389866828918457, -5.583547115325928, -4.777227401733398, -3.9709081649780273, -3.164588451385498, -2.358266830444336, -1.5519472360610962, -0.7456276416778564, 0.06069183349609375, 0.867011547088623, 1.6733312606811523, 2.4796504974365234, 3.2859702110290527, 4.092289924621582, 4.898609638214111, 5.704929351806641, 6.511248588562012, 7.317568302154541, 8.12388801574707, 8.930207252502441, 9.736526489257812, 10.5428466796875, 11.349165916442871, 12.155486106872559, 12.96180534362793, 13.768125534057617, 14.574444770812988, 15.38076400756836, 16.187084197998047, 16.993404388427734, 17.799724578857422, 18.606042861938477, 19.412363052368164, 20.21868324279785, 21.025001525878906, 21.831321716308594, 22.63764190673828, 23.443960189819336]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 7.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 10.0, 8.0, 14.0, 14.0, 17.0, 19.0, 19.0, 19.0, 32.0, 28.0, 24.0, 37.0, 52.0, 44.0, 47.0, 49.0, 53.0, 42.0, 51.0, 40.0, 52.0, 47.0, 41.0, 34.0, 24.0, 35.0, 29.0, 18.0, 19.0, 18.0, 15.0, 9.0, 11.0, 7.0, 8.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.52734375, -3.4345703125, -3.341796875, -3.2490234375, -3.15625, -3.0634765625, -2.970703125, -2.8779296875, -2.78515625, -2.6923828125, -2.599609375, -2.5068359375, -2.4140625, -2.3212890625, -2.228515625, -2.1357421875, -2.04296875, -1.9501953125, -1.857421875, -1.7646484375, -1.671875, -1.5791015625, -1.486328125, -1.3935546875, -1.30078125, -1.2080078125, -1.115234375, -1.0224609375, -0.9296875, -0.8369140625, -0.744140625, -0.6513671875, -0.55859375, -0.4658203125, -0.373046875, -0.2802734375, -0.1875, -0.0947265625, -0.001953125, 0.0908203125, 0.18359375, 0.2763671875, 0.369140625, 0.4619140625, 0.5546875, 0.6474609375, 0.740234375, 0.8330078125, 0.92578125, 1.0185546875, 1.111328125, 1.2041015625, 1.296875, 1.3896484375, 1.482421875, 1.5751953125, 1.66796875, 1.7607421875, 1.853515625, 1.9462890625, 2.0390625, 2.1318359375, 2.224609375, 2.3173828125, 2.41015625]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 8.0, 4.0, 10.0, 13.0, 15.0, 22.0, 36.0, 39.0, 49.0, 75.0, 105.0, 138.0, 245.0, 378.0, 608.0, 1175.0, 2280.0, 5060.0, 11889.0, 31186.0, 91513.0, 300274.0, 880384.0, 1434242.0, 934082.0, 337108.0, 104542.0, 34983.0, 13094.0, 5404.0, 2450.0, 1202.0, 596.0, 332.0, 211.0, 143.0, 97.0, 89.0, 58.0, 43.0, 26.0, 16.0, 18.0, 10.0, 9.0, 10.0, 2.0, 6.0, 5.0, 1.0, 2.0], "bins": [-3.470703125, -3.375732421875, -3.28076171875, -3.185791015625, -3.0908203125, -2.995849609375, -2.90087890625, -2.805908203125, -2.7109375, -2.615966796875, -2.52099609375, -2.426025390625, -2.3310546875, -2.236083984375, -2.14111328125, -2.046142578125, -1.951171875, -1.856201171875, -1.76123046875, -1.666259765625, -1.5712890625, -1.476318359375, -1.38134765625, -1.286376953125, -1.19140625, -1.096435546875, -1.00146484375, -0.906494140625, -0.8115234375, -0.716552734375, -0.62158203125, -0.526611328125, -0.431640625, -0.336669921875, -0.24169921875, -0.146728515625, -0.0517578125, 0.043212890625, 0.13818359375, 0.233154296875, 0.328125, 0.423095703125, 0.51806640625, 0.613037109375, 0.7080078125, 0.802978515625, 0.89794921875, 0.992919921875, 1.087890625, 1.182861328125, 1.27783203125, 1.372802734375, 1.4677734375, 1.562744140625, 1.65771484375, 1.752685546875, 1.84765625, 1.942626953125, 2.03759765625, 2.132568359375, 2.2275390625, 2.322509765625, 2.41748046875, 2.512451171875, 2.607421875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 3.0, 5.0, 5.0, 7.0, 23.0, 32.0, 57.0, 72.0, 115.0, 186.0, 282.0, 388.0, 511.0, 633.0, 591.0, 381.0, 259.0, 179.0, 139.0, 81.0, 43.0, 33.0, 25.0, 8.0, 10.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.8203125, -10.53961181640625, -10.2589111328125, -9.97821044921875, -9.697509765625, -9.41680908203125, -9.1361083984375, -8.85540771484375, -8.57470703125, -8.29400634765625, -8.0133056640625, -7.73260498046875, -7.451904296875, -7.17120361328125, -6.8905029296875, -6.60980224609375, -6.3291015625, -6.04840087890625, -5.7677001953125, -5.48699951171875, -5.206298828125, -4.92559814453125, -4.6448974609375, -4.36419677734375, -4.08349609375, -3.80279541015625, -3.5220947265625, -3.24139404296875, -2.960693359375, -2.67999267578125, -2.3992919921875, -2.11859130859375, -1.837890625, -1.55718994140625, -1.2764892578125, -0.99578857421875, -0.715087890625, -0.43438720703125, -0.1536865234375, 0.12701416015625, 0.40771484375, 0.68841552734375, 0.9691162109375, 1.24981689453125, 1.530517578125, 1.81121826171875, 2.0919189453125, 2.37261962890625, 2.6533203125, 2.93402099609375, 3.2147216796875, 3.49542236328125, 3.776123046875, 4.05682373046875, 4.3375244140625, 4.61822509765625, 4.89892578125, 5.17962646484375, 5.4603271484375, 5.74102783203125, 6.021728515625, 6.30242919921875, 6.5831298828125, 6.86383056640625, 7.14453125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 9.0, 21.0, 16.0, 15.0, 36.0, 58.0, 86.0, 114.0, 191.0, 372.0, 827.0, 4837.0, 196554.0, 3784228.0, 200357.0, 4862.0, 803.0, 324.0, 187.0, 105.0, 79.0, 56.0, 40.0, 24.0, 20.0, 16.0, 16.0, 5.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-22.015625, -21.3955078125, -20.775390625, -20.1552734375, -19.53515625, -18.9150390625, -18.294921875, -17.6748046875, -17.0546875, -16.4345703125, -15.814453125, -15.1943359375, -14.57421875, -13.9541015625, -13.333984375, -12.7138671875, -12.09375, -11.4736328125, -10.853515625, -10.2333984375, -9.61328125, -8.9931640625, -8.373046875, -7.7529296875, -7.1328125, -6.5126953125, -5.892578125, -5.2724609375, -4.65234375, -4.0322265625, -3.412109375, -2.7919921875, -2.171875, -1.5517578125, -0.931640625, -0.3115234375, 0.30859375, 0.9287109375, 1.548828125, 2.1689453125, 2.7890625, 3.4091796875, 4.029296875, 4.6494140625, 5.26953125, 5.8896484375, 6.509765625, 7.1298828125, 7.75, 8.3701171875, 8.990234375, 9.6103515625, 10.23046875, 10.8505859375, 11.470703125, 12.0908203125, 12.7109375, 13.3310546875, 13.951171875, 14.5712890625, 15.19140625, 15.8115234375, 16.431640625, 17.0517578125, 17.671875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 18.0, 39.0, 90.0, 189.0, 238.0, 209.0, 130.0, 61.0, 22.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.017578125, -71.08941650390625, -69.16124725341797, -67.23308563232422, -65.30491638183594, -63.37675476074219, -61.44858932495117, -59.520423889160156, -57.59225845336914, -55.664093017578125, -53.73592758178711, -51.807762145996094, -49.879600524902344, -47.95143127441406, -46.02326965332031, -44.0951042175293, -42.16693878173828, -40.238773345947266, -38.31060791015625, -36.382442474365234, -34.45427703857422, -32.52611541748047, -30.597949981689453, -28.669784545898438, -26.741619110107422, -24.813453674316406, -22.88528823852539, -20.957124710083008, -19.028959274291992, -17.100793838500977, -15.172629356384277, -13.244464874267578, -11.316303253173828, -9.388137817382812, -7.459973335266113, -5.531808376312256, -3.6036434173583984, -1.6754779815673828, 0.2526865005493164, 2.1808509826660156, 4.109016418457031, 6.037181377410889, 7.965346336364746, 9.893510818481445, 11.821676254272461, 13.749841690063477, 15.678006172180176, 17.606170654296875, 19.53433609008789, 21.462501525878906, 23.390666961669922, 25.318830490112305, 27.24699592590332, 29.175161361694336, 31.10332489013672, 33.031490325927734, 34.95965576171875, 36.887821197509766, 38.81598663330078, 40.7441520690918, 42.67231750488281, 44.60047912597656, 46.52864456176758, 48.456809997558594, 50.38497543334961]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 5.0, 8.0, 6.0, 9.0, 11.0, 9.0, 14.0, 16.0, 21.0, 20.0, 18.0, 30.0, 26.0, 34.0, 40.0, 42.0, 51.0, 47.0, 38.0, 47.0, 47.0, 48.0, 61.0, 47.0, 25.0, 41.0, 35.0, 31.0, 27.0, 22.0, 21.0, 14.0, 17.0, 22.0, 12.0, 12.0, 8.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.206607818603516, -25.440139770507812, -24.67367172241211, -23.907203674316406, -23.140737533569336, -22.374269485473633, -21.60780143737793, -20.841333389282227, -20.074867248535156, -19.308399200439453, -18.54193115234375, -17.775463104248047, -17.008996963500977, -16.242528915405273, -15.47606086730957, -14.709592819213867, -13.943124771118164, -13.176656723022461, -12.410189628601074, -11.643721580505371, -10.877254486083984, -10.110786437988281, -9.344318389892578, -8.577850341796875, -7.811383247375488, -7.044915676116943, -6.278448104858398, -5.511980056762695, -4.74551248550415, -3.9790449142456055, -3.2125768661499023, -2.4461092948913574, -1.6796398162841797, -0.9131721258163452, -0.14670443534851074, 0.6197633743286133, 1.3862309455871582, 2.152698516845703, 2.9191665649414062, 3.685634136199951, 4.452101707458496, 5.218569278717041, 5.985036849975586, 6.751504898071289, 7.517972469329834, 8.284440040588379, 9.050908088684082, 9.817375183105469, 10.583843231201172, 11.350311279296875, 12.116778373718262, 12.883246421813965, 13.649713516235352, 14.416181564331055, 15.182649612426758, 15.949117660522461, 16.71558380126953, 17.482051849365234, 18.248519897460938, 19.01498794555664, 19.78145408630371, 20.547922134399414, 21.314390182495117, 22.08085823059082, 22.847326278686523]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 5.0, 3.0, 10.0, 12.0, 10.0, 13.0, 11.0, 23.0, 24.0, 24.0, 22.0, 28.0, 29.0, 33.0, 32.0, 41.0, 41.0, 49.0, 52.0, 51.0, 46.0, 47.0, 38.0, 47.0, 47.0, 36.0, 28.0, 27.0, 32.0, 20.0, 23.0, 18.0, 23.0, 15.0, 8.0, 7.0, 14.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.48828125, -3.39752197265625, -3.3067626953125, -3.21600341796875, -3.125244140625, -3.03448486328125, -2.9437255859375, -2.85296630859375, -2.76220703125, -2.67144775390625, -2.5806884765625, -2.48992919921875, -2.399169921875, -2.30841064453125, -2.2176513671875, -2.12689208984375, -2.0361328125, -1.94537353515625, -1.8546142578125, -1.76385498046875, -1.673095703125, -1.58233642578125, -1.4915771484375, -1.40081787109375, -1.31005859375, -1.21929931640625, -1.1285400390625, -1.03778076171875, -0.947021484375, -0.85626220703125, -0.7655029296875, -0.67474365234375, -0.583984375, -0.49322509765625, -0.4024658203125, -0.31170654296875, -0.220947265625, -0.13018798828125, -0.0394287109375, 0.05133056640625, 0.14208984375, 0.23284912109375, 0.3236083984375, 0.41436767578125, 0.505126953125, 0.59588623046875, 0.6866455078125, 0.77740478515625, 0.8681640625, 0.95892333984375, 1.0496826171875, 1.14044189453125, 1.231201171875, 1.32196044921875, 1.4127197265625, 1.50347900390625, 1.59423828125, 1.68499755859375, 1.7757568359375, 1.86651611328125, 1.957275390625, 2.04803466796875, 2.1387939453125, 2.22955322265625, 2.3203125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 12.0, 16.0, 35.0, 48.0, 85.0, 143.0, 185.0, 298.0, 511.0, 780.0, 1269.0, 2028.0, 3165.0, 5121.0, 8338.0, 13489.0, 22218.0, 37510.0, 67126.0, 134326.0, 323971.0, 209656.0, 93429.0, 50254.0, 29272.0, 17349.0, 10639.0, 6545.0, 4044.0, 2484.0, 1471.0, 984.0, 608.0, 420.0, 234.0, 171.0, 99.0, 63.0, 45.0, 34.0, 23.0, 14.0, 8.0, 10.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.464111328125, -0.4479713439941406, -0.43183135986328125, -0.4156913757324219, -0.3995513916015625, -0.3834114074707031, -0.36727142333984375, -0.3511314392089844, -0.334991455078125, -0.3188514709472656, -0.30271148681640625, -0.2865715026855469, -0.2704315185546875, -0.2542915344238281, -0.23815155029296875, -0.22201156616210938, -0.20587158203125, -0.18973159790039062, -0.17359161376953125, -0.15745162963867188, -0.1413116455078125, -0.12517166137695312, -0.10903167724609375, -0.09289169311523438, -0.076751708984375, -0.060611724853515625, -0.04447174072265625, -0.028331756591796875, -0.0121917724609375, 0.003948211669921875, 0.02008819580078125, 0.036228179931640625, 0.0523681640625, 0.06850814819335938, 0.08464813232421875, 0.10078811645507812, 0.1169281005859375, 0.13306808471679688, 0.14920806884765625, 0.16534805297851562, 0.181488037109375, 0.19762802124023438, 0.21376800537109375, 0.22990798950195312, 0.2460479736328125, 0.2621879577636719, 0.27832794189453125, 0.2944679260253906, 0.31060791015625, 0.3267478942871094, 0.34288787841796875, 0.3590278625488281, 0.3751678466796875, 0.3913078308105469, 0.40744781494140625, 0.4235877990722656, 0.439727783203125, 0.4558677673339844, 0.47200775146484375, 0.4881477355957031, 0.5042877197265625, 0.5204277038574219, 0.5365676879882812, 0.5527076721191406, 0.56884765625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 3.0, 7.0, 6.0, 7.0, 8.0, 11.0, 9.0, 14.0, 15.0, 25.0, 18.0, 26.0, 21.0, 26.0, 24.0, 33.0, 39.0, 40.0, 48.0, 30.0, 49.0, 1073.0, 40.0, 30.0, 58.0, 41.0, 33.0, 38.0, 33.0, 34.0, 30.0, 29.0, 20.0, 15.0, 20.0, 12.0, 13.0, 11.0, 5.0, 11.0, 9.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7998046875, -1.7458953857421875, -1.691986083984375, -1.6380767822265625, -1.58416748046875, -1.5302581787109375, -1.476348876953125, -1.4224395751953125, -1.3685302734375, -1.3146209716796875, -1.260711669921875, -1.2068023681640625, -1.15289306640625, -1.0989837646484375, -1.045074462890625, -0.9911651611328125, -0.937255859375, -0.8833465576171875, -0.829437255859375, -0.7755279541015625, -0.72161865234375, -0.6677093505859375, -0.613800048828125, -0.5598907470703125, -0.5059814453125, -0.4520721435546875, -0.398162841796875, -0.3442535400390625, -0.29034423828125, -0.2364349365234375, -0.182525634765625, -0.1286163330078125, -0.07470703125, -0.0207977294921875, 0.033111572265625, 0.0870208740234375, 0.14093017578125, 0.1948394775390625, 0.248748779296875, 0.3026580810546875, 0.3565673828125, 0.4104766845703125, 0.464385986328125, 0.5182952880859375, 0.57220458984375, 0.6261138916015625, 0.680023193359375, 0.7339324951171875, 0.787841796875, 0.8417510986328125, 0.895660400390625, 0.9495697021484375, 1.00347900390625, 1.0573883056640625, 1.111297607421875, 1.1652069091796875, 1.2191162109375, 1.2730255126953125, 1.326934814453125, 1.3808441162109375, 1.43475341796875, 1.4886627197265625, 1.542572021484375, 1.5964813232421875, 1.650390625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 13.0, 10.0, 18.0, 31.0, 44.0, 70.0, 92.0, 160.0, 214.0, 348.0, 488.0, 672.0, 1003.0, 1431.0, 1984.0, 2911.0, 4098.0, 5830.0, 8440.0, 12601.0, 18339.0, 27434.0, 42086.0, 69565.0, 128134.0, 1307992.0, 200803.0, 97701.0, 56548.0, 35408.0, 22665.0, 15471.0, 10498.0, 7310.0, 5170.0, 3462.0, 2530.0, 1663.0, 1157.0, 816.0, 571.0, 402.0, 282.0, 217.0, 128.0, 99.0, 69.0, 45.0, 37.0, 24.0, 21.0, 10.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0], "bins": [-0.385009765625, -0.37290191650390625, -0.3607940673828125, -0.34868621826171875, -0.336578369140625, -0.32447052001953125, -0.3123626708984375, -0.30025482177734375, -0.28814697265625, -0.27603912353515625, -0.2639312744140625, -0.25182342529296875, -0.239715576171875, -0.22760772705078125, -0.2154998779296875, -0.20339202880859375, -0.1912841796875, -0.17917633056640625, -0.1670684814453125, -0.15496063232421875, -0.142852783203125, -0.13074493408203125, -0.1186370849609375, -0.10652923583984375, -0.09442138671875, -0.08231353759765625, -0.0702056884765625, -0.05809783935546875, -0.045989990234375, -0.03388214111328125, -0.0217742919921875, -0.00966644287109375, 0.00244140625, 0.01454925537109375, 0.0266571044921875, 0.03876495361328125, 0.050872802734375, 0.06298065185546875, 0.0750885009765625, 0.08719635009765625, 0.09930419921875, 0.11141204833984375, 0.1235198974609375, 0.13562774658203125, 0.147735595703125, 0.15984344482421875, 0.1719512939453125, 0.18405914306640625, 0.1961669921875, 0.20827484130859375, 0.2203826904296875, 0.23249053955078125, 0.244598388671875, 0.25670623779296875, 0.2688140869140625, 0.28092193603515625, 0.29302978515625, 0.30513763427734375, 0.3172454833984375, 0.32935333251953125, 0.341461181640625, 0.35356903076171875, 0.3656768798828125, 0.37778472900390625, 0.389892578125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 0.0, 1.0, 5.0, 6.0, 7.0, 9.0, 9.0, 18.0, 13.0, 20.0, 13.0, 26.0, 24.0, 43.0, 35.0, 47.0, 52.0, 61.0, 65.0, 62.0, 67.0, 59.0, 51.0, 50.0, 45.0, 35.0, 24.0, 36.0, 21.0, 13.0, 18.0, 22.0, 9.0, 5.0, 7.0, 4.0, 3.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.00011789798736572266, -0.00011467467993497849, -0.00011145137250423431, -0.00010822806507349014, -0.00010500475764274597, -0.0001017814502120018, -9.855814278125763e-05, -9.533483535051346e-05, -9.211152791976929e-05, -8.888822048902512e-05, -8.566491305828094e-05, -8.244160562753677e-05, -7.92182981967926e-05, -7.599499076604843e-05, -7.277168333530426e-05, -6.954837590456009e-05, -6.632506847381592e-05, -6.310176104307175e-05, -5.9878453612327576e-05, -5.6655146181583405e-05, -5.3431838750839233e-05, -5.020853132009506e-05, -4.698522388935089e-05, -4.376191645860672e-05, -4.053860902786255e-05, -3.731530159711838e-05, -3.4091994166374207e-05, -3.0868686735630035e-05, -2.7645379304885864e-05, -2.4422071874141693e-05, -2.1198764443397522e-05, -1.797545701265335e-05, -1.475214958190918e-05, -1.1528842151165009e-05, -8.305534720420837e-06, -5.082227289676666e-06, -1.8589198589324951e-06, 1.364387571811676e-06, 4.587695002555847e-06, 7.811002433300018e-06, 1.103430986404419e-05, 1.425761729478836e-05, 1.7480924725532532e-05, 2.0704232156276703e-05, 2.3927539587020874e-05, 2.7150847017765045e-05, 3.0374154448509216e-05, 3.359746187925339e-05, 3.682076930999756e-05, 4.004407674074173e-05, 4.32673841714859e-05, 4.649069160223007e-05, 4.971399903297424e-05, 5.2937306463718414e-05, 5.6160613894462585e-05, 5.9383921325206757e-05, 6.260722875595093e-05, 6.58305361866951e-05, 6.905384361743927e-05, 7.227715104818344e-05, 7.550045847892761e-05, 7.872376590967178e-05, 8.194707334041595e-05, 8.517038077116013e-05, 8.83936882019043e-05]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 5.0, 5.0, 8.0, 7.0, 17.0, 15.0, 20.0, 37.0, 34.0, 60.0, 105.0, 113.0, 189.0, 292.0, 561.0, 1497.0, 598272.0, 444482.0, 1393.0, 553.0, 304.0, 168.0, 129.0, 82.0, 55.0, 38.0, 25.0, 25.0, 12.0, 16.0, 5.0, 8.0, 4.0, 2.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019092559814453125, -0.0018410086631774902, -0.001772761344909668, -0.0017045140266418457, -0.0016362667083740234, -0.0015680193901062012, -0.001499772071838379, -0.0014315247535705566, -0.0013632774353027344, -0.0012950301170349121, -0.0012267827987670898, -0.0011585354804992676, -0.0010902881622314453, -0.001022040843963623, -0.0009537935256958008, -0.0008855462074279785, -0.0008172988891601562, -0.000749051570892334, -0.0006808042526245117, -0.0006125569343566895, -0.0005443096160888672, -0.0004760622978210449, -0.00040781497955322266, -0.0003395676612854004, -0.0002713203430175781, -0.00020307302474975586, -0.0001348257064819336, -6.657838821411133e-05, 1.6689300537109375e-06, 6.99162483215332e-05, 0.00013816356658935547, 0.00020641088485717773, 0.000274658203125, 0.00034290552139282227, 0.00041115283966064453, 0.0004794001579284668, 0.0005476474761962891, 0.0006158947944641113, 0.0006841421127319336, 0.0007523894309997559, 0.0008206367492675781, 0.0008888840675354004, 0.0009571313858032227, 0.001025378704071045, 0.0010936260223388672, 0.0011618733406066895, 0.0012301206588745117, 0.001298367977142334, 0.0013666152954101562, 0.0014348626136779785, 0.0015031099319458008, 0.001571357250213623, 0.0016396045684814453, 0.0017078518867492676, 0.0017760992050170898, 0.0018443465232849121, 0.0019125938415527344, 0.0019808411598205566, 0.002049088478088379, 0.002117335796356201, 0.0021855831146240234, 0.0022538304328918457, 0.002322077751159668, 0.0023903250694274902, 0.0024585723876953125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 57.0, 291.0, 433.0, 206.0, 21.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021717695926781744, -0.00020923932606820017, -0.0002013016928685829, -0.00019336407422088087, -0.0001854264410212636, -0.00017748880782164633, -0.00016955117462202907, -0.0001616135414224118, -0.00015367590822279453, -0.00014573827502317727, -0.00013780064182356, -0.00012986300862394273, -0.0001219253899762407, -0.00011398775677662343, -0.00010605012357700616, -9.81124903773889e-05, -9.017487172968686e-05, -8.223723853006959e-05, -7.429961260640994e-05, -6.636197940679267e-05, -5.842434984515421e-05, -5.048672028351575e-05, -4.2549087083898485e-05, -3.4611457522260025e-05, -2.6673827960621566e-05, -1.8736198398983106e-05, -1.0798567018355243e-05, -2.86093563772738e-06, 5.07669392391108e-06, 1.301432348554954e-05, 2.0951956685166806e-05, 2.8889586246805266e-05, 3.6827230360358953e-05, 4.476485992199741e-05, 5.270248948363587e-05, 6.064012268325314e-05, 6.857774860691279e-05, 7.651538180653006e-05, 8.445301500614733e-05, 9.239064820576459e-05, 0.00010032827412942424, 0.00010826590732904151, 0.00011620353325270116, 0.00012414116645231843, 0.0001320787996519357, 0.00014001643285155296, 0.00014795406605117023, 0.00015589168469887227, 0.00016382931789848953, 0.0001717669510981068, 0.00017970458429772407, 0.0001876422029454261, 0.00019557983614504337, 0.00020351746934466064, 0.0002114551025442779, 0.00021939273574389517, 0.00022733036894351244, 0.0002352680021431297, 0.00024320563534274697, 0.00025114326854236424, 0.0002590809017419815, 0.0002670185058377683, 0.00027495616814121604, 0.00028289377223700285, 0.0002908314054366201]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 7.0, 5.0, 5.0, 5.0, 10.0, 11.0, 9.0, 14.0, 14.0, 16.0, 16.0, 27.0, 29.0, 24.0, 40.0, 33.0, 39.0, 43.0, 40.0, 40.0, 36.0, 28.0, 41.0, 40.0, 38.0, 34.0, 39.0, 37.0, 36.0, 43.0, 22.0, 21.0, 22.0, 18.0, 20.0, 17.0, 14.0, 18.0, 10.0, 9.0, 8.0, 4.0, 11.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.881620407104492e-05, -4.726182669401169e-05, -4.5707449316978455e-05, -4.415307193994522e-05, -4.259869456291199e-05, -4.1044317185878754e-05, -3.948993980884552e-05, -3.7935562431812286e-05, -3.638118505477905e-05, -3.482680767774582e-05, -3.3272430300712585e-05, -3.171805292367935e-05, -3.0163675546646118e-05, -2.8609298169612885e-05, -2.705492079257965e-05, -2.5500543415546417e-05, -2.3946166038513184e-05, -2.239178866147995e-05, -2.0837411284446716e-05, -1.9283033907413483e-05, -1.772865653038025e-05, -1.6174279153347015e-05, -1.4619901776313782e-05, -1.3065524399280548e-05, -1.1511147022247314e-05, -9.95676964521408e-06, -8.402392268180847e-06, -6.8480148911476135e-06, -5.29363751411438e-06, -3.7392601370811462e-06, -2.1848827600479126e-06, -6.30505383014679e-07, 9.238719940185547e-07, 2.4782493710517883e-06, 4.032626748085022e-06, 5.587004125118256e-06, 7.141381502151489e-06, 8.695758879184723e-06, 1.0250136256217957e-05, 1.180451363325119e-05, 1.3358891010284424e-05, 1.4913268387317657e-05, 1.646764576435089e-05, 1.8022023141384125e-05, 1.957640051841736e-05, 2.1130777895450592e-05, 2.2685155272483826e-05, 2.423953264951706e-05, 2.5793910026550293e-05, 2.7348287403583527e-05, 2.890266478061676e-05, 3.0457042157649994e-05, 3.201141953468323e-05, 3.356579691171646e-05, 3.5120174288749695e-05, 3.667455166578293e-05, 3.822892904281616e-05, 3.9783306419849396e-05, 4.133768379688263e-05, 4.289206117391586e-05, 4.44464385509491e-05, 4.600081592798233e-05, 4.7555193305015564e-05, 4.91095706820488e-05, 5.066394805908203e-05]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 5.0, 3.0, 10.0, 12.0, 10.0, 13.0, 11.0, 23.0, 24.0, 24.0, 22.0, 28.0, 29.0, 33.0, 32.0, 41.0, 41.0, 49.0, 52.0, 51.0, 46.0, 47.0, 38.0, 47.0, 47.0, 36.0, 28.0, 27.0, 32.0, 20.0, 23.0, 18.0, 23.0, 15.0, 8.0, 7.0, 14.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.48828125, -3.39752197265625, -3.3067626953125, -3.21600341796875, -3.125244140625, -3.03448486328125, -2.9437255859375, -2.85296630859375, -2.76220703125, -2.67144775390625, -2.5806884765625, -2.48992919921875, -2.399169921875, -2.30841064453125, -2.2176513671875, -2.12689208984375, -2.0361328125, -1.94537353515625, -1.8546142578125, -1.76385498046875, -1.673095703125, -1.58233642578125, -1.4915771484375, -1.40081787109375, -1.31005859375, -1.21929931640625, -1.1285400390625, -1.03778076171875, -0.947021484375, -0.85626220703125, -0.7655029296875, -0.67474365234375, -0.583984375, -0.49322509765625, -0.4024658203125, -0.31170654296875, -0.220947265625, -0.13018798828125, -0.0394287109375, 0.05133056640625, 0.14208984375, 0.23284912109375, 0.3236083984375, 0.41436767578125, 0.505126953125, 0.59588623046875, 0.6866455078125, 0.77740478515625, 0.8681640625, 0.95892333984375, 1.0496826171875, 1.14044189453125, 1.231201171875, 1.32196044921875, 1.4127197265625, 1.50347900390625, 1.59423828125, 1.68499755859375, 1.7757568359375, 1.86651611328125, 1.957275390625, 2.04803466796875, 2.1387939453125, 2.22955322265625, 2.3203125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 6.0, 5.0, 2.0, 7.0, 9.0, 17.0, 16.0, 32.0, 44.0, 78.0, 118.0, 175.0, 283.0, 464.0, 795.0, 1479.0, 2761.0, 5428.0, 11499.0, 26069.0, 68385.0, 210360.0, 418787.0, 192132.0, 62959.0, 24601.0, 10866.0, 5210.0, 2657.0, 1359.0, 772.0, 486.0, 234.0, 154.0, 99.0, 76.0, 46.0, 25.0, 18.0, 9.0, 11.0, 11.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0], "bins": [-3.697265625, -3.60113525390625, -3.5050048828125, -3.40887451171875, -3.312744140625, -3.21661376953125, -3.1204833984375, -3.02435302734375, -2.92822265625, -2.83209228515625, -2.7359619140625, -2.63983154296875, -2.543701171875, -2.44757080078125, -2.3514404296875, -2.25531005859375, -2.1591796875, -2.06304931640625, -1.9669189453125, -1.87078857421875, -1.774658203125, -1.67852783203125, -1.5823974609375, -1.48626708984375, -1.39013671875, -1.29400634765625, -1.1978759765625, -1.10174560546875, -1.005615234375, -0.90948486328125, -0.8133544921875, -0.71722412109375, -0.62109375, -0.52496337890625, -0.4288330078125, -0.33270263671875, -0.236572265625, -0.14044189453125, -0.0443115234375, 0.05181884765625, 0.14794921875, 0.24407958984375, 0.3402099609375, 0.43634033203125, 0.532470703125, 0.62860107421875, 0.7247314453125, 0.82086181640625, 0.9169921875, 1.01312255859375, 1.1092529296875, 1.20538330078125, 1.301513671875, 1.39764404296875, 1.4937744140625, 1.58990478515625, 1.68603515625, 1.78216552734375, 1.8782958984375, 1.97442626953125, 2.070556640625, 2.16668701171875, 2.2628173828125, 2.35894775390625, 2.455078125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 5.0, 3.0, 8.0, 6.0, 7.0, 7.0, 16.0, 17.0, 8.0, 23.0, 23.0, 20.0, 25.0, 37.0, 41.0, 43.0, 43.0, 53.0, 96.0, 205.0, 1506.0, 291.0, 115.0, 70.0, 50.0, 47.0, 45.0, 26.0, 31.0, 28.0, 23.0, 17.0, 23.0, 22.0, 19.0, 14.0, 5.0, 10.0, 4.0, 4.0, 3.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0], "bins": [-12.53125, -12.198974609375, -11.86669921875, -11.534423828125, -11.2021484375, -10.869873046875, -10.53759765625, -10.205322265625, -9.873046875, -9.540771484375, -9.20849609375, -8.876220703125, -8.5439453125, -8.211669921875, -7.87939453125, -7.547119140625, -7.21484375, -6.882568359375, -6.55029296875, -6.218017578125, -5.8857421875, -5.553466796875, -5.22119140625, -4.888916015625, -4.556640625, -4.224365234375, -3.89208984375, -3.559814453125, -3.2275390625, -2.895263671875, -2.56298828125, -2.230712890625, -1.8984375, -1.566162109375, -1.23388671875, -0.901611328125, -0.5693359375, -0.237060546875, 0.09521484375, 0.427490234375, 0.759765625, 1.092041015625, 1.42431640625, 1.756591796875, 2.0888671875, 2.421142578125, 2.75341796875, 3.085693359375, 3.41796875, 3.750244140625, 4.08251953125, 4.414794921875, 4.7470703125, 5.079345703125, 5.41162109375, 5.743896484375, 6.076171875, 6.408447265625, 6.74072265625, 7.072998046875, 7.4052734375, 7.737548828125, 8.06982421875, 8.402099609375, 8.734375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 8.0, 4.0, 4.0, 9.0, 6.0, 28.0, 20.0, 41.0, 40.0, 59.0, 85.0, 104.0, 173.0, 301.0, 630.0, 3625.0, 2420970.0, 715503.0, 2713.0, 543.0, 281.0, 184.0, 97.0, 67.0, 48.0, 42.0, 36.0, 26.0, 11.0, 8.0, 11.0, 5.0, 4.0, 5.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.03125, -32.0859375, -31.140625, -30.1953125, -29.25, -28.3046875, -27.359375, -26.4140625, -25.46875, -24.5234375, -23.578125, -22.6328125, -21.6875, -20.7421875, -19.796875, -18.8515625, -17.90625, -16.9609375, -16.015625, -15.0703125, -14.125, -13.1796875, -12.234375, -11.2890625, -10.34375, -9.3984375, -8.453125, -7.5078125, -6.5625, -5.6171875, -4.671875, -3.7265625, -2.78125, -1.8359375, -0.890625, 0.0546875, 1.0, 1.9453125, 2.890625, 3.8359375, 4.78125, 5.7265625, 6.671875, 7.6171875, 8.5625, 9.5078125, 10.453125, 11.3984375, 12.34375, 13.2890625, 14.234375, 15.1796875, 16.125, 17.0703125, 18.015625, 18.9609375, 19.90625, 20.8515625, 21.796875, 22.7421875, 23.6875, 24.6328125, 25.578125, 26.5234375, 27.46875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 4.0, 178.0, 732.0, 100.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.644240379333496, -12.759722709655762, -9.875204086303711, -6.990686416625977, -4.106168746948242, -1.2216510772705078, 1.662867546081543, 4.547385215759277, 7.431902885437012, 10.316420555114746, 13.200939178466797, 16.08545684814453, 18.969974517822266, 21.8544921875, 24.739009857177734, 27.62352752685547, 30.508045196533203, 33.39256286621094, 36.27708053588867, 39.161598205566406, 42.04611587524414, 44.930633544921875, 47.815155029296875, 50.699668884277344, 53.584190368652344, 56.46870803833008, 59.35322570800781, 62.23774337768555, 65.12226104736328, 68.00678253173828, 70.89129638671875, 73.77581787109375, 76.66033172607422, 79.54485321044922, 82.42936706542969, 85.31388854980469, 88.19840240478516, 91.08292388916016, 93.96743774414062, 96.85195922851562, 99.7364730834961, 102.6209945678711, 105.50550842285156, 108.39002990722656, 111.27454376220703, 114.15906524658203, 117.0435791015625, 119.9281005859375, 122.8126220703125, 125.6971435546875, 128.5816650390625, 131.46617126464844, 134.35069274902344, 137.23521423339844, 140.11973571777344, 143.00424194335938, 145.88876342773438, 148.77328491210938, 151.65780639648438, 154.5423126220703, 157.4268341064453, 160.3113555908203, 163.1958770751953, 166.08038330078125, 168.96490478515625]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 9.0, 10.0, 6.0, 9.0, 13.0, 10.0, 24.0, 24.0, 27.0, 22.0, 36.0, 29.0, 34.0, 38.0, 40.0, 37.0, 38.0, 39.0, 41.0, 44.0, 42.0, 50.0, 38.0, 45.0, 37.0, 27.0, 32.0, 34.0, 19.0, 14.0, 26.0, 25.0, 15.0, 12.0, 16.0, 9.0, 7.0, 4.0, 4.0, 6.0, 5.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.087427139282227, -26.29973602294922, -25.51204490661621, -24.724353790283203, -23.936662673950195, -23.148971557617188, -22.36128044128418, -21.573589324951172, -20.785898208618164, -19.998207092285156, -19.21051597595215, -18.42282485961914, -17.635133743286133, -16.847442626953125, -16.059751510620117, -15.27206039428711, -14.484368324279785, -13.696677207946777, -12.90898609161377, -12.121294975280762, -11.333603858947754, -10.545912742614746, -9.758220672607422, -8.970529556274414, -8.182838439941406, -7.395147323608398, -6.607456207275391, -5.819765090942383, -5.032073974609375, -4.244382858276367, -3.456691265106201, -2.6690001487731934, -1.8813095092773438, -1.093618392944336, -0.3059271574020386, 0.4817640781402588, 1.2694551944732666, 2.0571463108062744, 2.8448376655578613, 3.632528781890869, 4.420219898223877, 5.207911014556885, 5.995602130889893, 6.783293724060059, 7.570984840393066, 8.358675956726074, 9.146367073059082, 9.93405818939209, 10.721749305725098, 11.509440422058105, 12.297131538391113, 13.084822654724121, 13.872513771057129, 14.660204887390137, 15.447896957397461, 16.23558807373047, 17.023279190063477, 17.810970306396484, 18.598661422729492, 19.3863525390625, 20.174043655395508, 20.961734771728516, 21.749425888061523, 22.53711700439453, 23.32480812072754]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 9.0, 2.0, 9.0, 9.0, 13.0, 10.0, 18.0, 18.0, 20.0, 26.0, 29.0, 32.0, 37.0, 33.0, 38.0, 37.0, 52.0, 49.0, 39.0, 50.0, 48.0, 49.0, 43.0, 47.0, 30.0, 36.0, 28.0, 31.0, 22.0, 26.0, 22.0, 20.0, 14.0, 14.0, 11.0, 8.0, 12.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.72265625, -3.62689208984375, -3.5311279296875, -3.43536376953125, -3.339599609375, -3.24383544921875, -3.1480712890625, -3.05230712890625, -2.95654296875, -2.86077880859375, -2.7650146484375, -2.66925048828125, -2.573486328125, -2.47772216796875, -2.3819580078125, -2.28619384765625, -2.1904296875, -2.09466552734375, -1.9989013671875, -1.90313720703125, -1.807373046875, -1.71160888671875, -1.6158447265625, -1.52008056640625, -1.42431640625, -1.32855224609375, -1.2327880859375, -1.13702392578125, -1.041259765625, -0.94549560546875, -0.8497314453125, -0.75396728515625, -0.658203125, -0.56243896484375, -0.4666748046875, -0.37091064453125, -0.275146484375, -0.17938232421875, -0.0836181640625, 0.01214599609375, 0.10791015625, 0.20367431640625, 0.2994384765625, 0.39520263671875, 0.490966796875, 0.58673095703125, 0.6824951171875, 0.77825927734375, 0.8740234375, 0.96978759765625, 1.0655517578125, 1.16131591796875, 1.257080078125, 1.35284423828125, 1.4486083984375, 1.54437255859375, 1.64013671875, 1.73590087890625, 1.8316650390625, 1.92742919921875, 2.023193359375, 2.11895751953125, 2.2147216796875, 2.31048583984375, 2.40625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 7.0, 5.0, 4.0, 7.0, 11.0, 10.0, 10.0, 24.0, 19.0, 21.0, 34.0, 43.0, 49.0, 48.0, 65.0, 78.0, 132.0, 214.0, 558.0, 3366.0, 114100.0, 3649984.0, 417365.0, 6543.0, 741.0, 221.0, 151.0, 85.0, 71.0, 60.0, 41.0, 42.0, 25.0, 32.0, 28.0, 28.0, 12.0, 17.0, 4.0, 11.0, 7.0, 6.0, 1.0, 2.0, 0.0, 2.0, 3.0], "bins": [-16.578125, -16.14892578125, -15.7197265625, -15.29052734375, -14.861328125, -14.43212890625, -14.0029296875, -13.57373046875, -13.14453125, -12.71533203125, -12.2861328125, -11.85693359375, -11.427734375, -10.99853515625, -10.5693359375, -10.14013671875, -9.7109375, -9.28173828125, -8.8525390625, -8.42333984375, -7.994140625, -7.56494140625, -7.1357421875, -6.70654296875, -6.27734375, -5.84814453125, -5.4189453125, -4.98974609375, -4.560546875, -4.13134765625, -3.7021484375, -3.27294921875, -2.84375, -2.41455078125, -1.9853515625, -1.55615234375, -1.126953125, -0.69775390625, -0.2685546875, 0.16064453125, 0.58984375, 1.01904296875, 1.4482421875, 1.87744140625, 2.306640625, 2.73583984375, 3.1650390625, 3.59423828125, 4.0234375, 4.45263671875, 4.8818359375, 5.31103515625, 5.740234375, 6.16943359375, 6.5986328125, 7.02783203125, 7.45703125, 7.88623046875, 8.3154296875, 8.74462890625, 9.173828125, 9.60302734375, 10.0322265625, 10.46142578125, 10.890625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 8.0, 11.0, 21.0, 23.0, 50.0, 84.0, 111.0, 198.0, 324.0, 463.0, 681.0, 668.0, 518.0, 347.0, 208.0, 134.0, 90.0, 63.0, 22.0, 30.0, 11.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.3507080078125, -10.037353515625, -9.7239990234375, -9.41064453125, -9.0972900390625, -8.783935546875, -8.4705810546875, -8.1572265625, -7.8438720703125, -7.530517578125, -7.2171630859375, -6.90380859375, -6.5904541015625, -6.277099609375, -5.9637451171875, -5.650390625, -5.3370361328125, -5.023681640625, -4.7103271484375, -4.39697265625, -4.0836181640625, -3.770263671875, -3.4569091796875, -3.1435546875, -2.8302001953125, -2.516845703125, -2.2034912109375, -1.89013671875, -1.5767822265625, -1.263427734375, -0.9500732421875, -0.63671875, -0.3233642578125, -0.010009765625, 0.3033447265625, 0.61669921875, 0.9300537109375, 1.243408203125, 1.5567626953125, 1.8701171875, 2.1834716796875, 2.496826171875, 2.8101806640625, 3.12353515625, 3.4368896484375, 3.750244140625, 4.0635986328125, 4.376953125, 4.6903076171875, 5.003662109375, 5.3170166015625, 5.63037109375, 5.9437255859375, 6.257080078125, 6.5704345703125, 6.8837890625, 7.1971435546875, 7.510498046875, 7.8238525390625, 8.13720703125, 8.4505615234375, 8.763916015625, 9.0772705078125, 9.390625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 15.0, 14.0, 33.0, 54.0, 83.0, 149.0, 210.0, 329.0, 901.0, 6439.0, 2433339.0, 1746017.0, 4995.0, 822.0, 324.0, 222.0, 131.0, 75.0, 42.0, 36.0, 15.0, 12.0, 8.0, 4.0, 1.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.21875, -24.28369140625, -23.3486328125, -22.41357421875, -21.478515625, -20.54345703125, -19.6083984375, -18.67333984375, -17.73828125, -16.80322265625, -15.8681640625, -14.93310546875, -13.998046875, -13.06298828125, -12.1279296875, -11.19287109375, -10.2578125, -9.32275390625, -8.3876953125, -7.45263671875, -6.517578125, -5.58251953125, -4.6474609375, -3.71240234375, -2.77734375, -1.84228515625, -0.9072265625, 0.02783203125, 0.962890625, 1.89794921875, 2.8330078125, 3.76806640625, 4.703125, 5.63818359375, 6.5732421875, 7.50830078125, 8.443359375, 9.37841796875, 10.3134765625, 11.24853515625, 12.18359375, 13.11865234375, 14.0537109375, 14.98876953125, 15.923828125, 16.85888671875, 17.7939453125, 18.72900390625, 19.6640625, 20.59912109375, 21.5341796875, 22.46923828125, 23.404296875, 24.33935546875, 25.2744140625, 26.20947265625, 27.14453125, 28.07958984375, 29.0146484375, 29.94970703125, 30.884765625, 31.81982421875, 32.7548828125, 33.68994140625, 34.625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 19.0, 81.0, 217.0, 317.0, 255.0, 92.0, 25.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.065269470214844, -15.283468246459961, -12.501667976379395, -9.719867706298828, -6.938066482543945, -4.1562652587890625, -1.3744659423828125, 1.4073352813720703, 4.189136505126953, 6.970937252044678, 9.752737998962402, 12.534538269042969, 15.316339492797852, 18.098140716552734, 20.879940032958984, 23.661741256713867, 26.44354248046875, 29.225343704223633, 32.007144927978516, 34.788944244384766, 37.57074737548828, 40.35254669189453, 43.13434600830078, 45.91614532470703, 48.69794845581055, 51.4797477722168, 54.26155090332031, 57.04335021972656, 59.82514953613281, 62.60695266723633, 65.38874816894531, 68.1705551147461, 70.95234680175781, 73.73414611816406, 76.51594543457031, 79.29774475097656, 82.07955169677734, 84.8613510131836, 87.64315032958984, 90.4249496459961, 93.20675659179688, 95.98855590820312, 98.77035522460938, 101.55215454101562, 104.3339614868164, 107.11576080322266, 109.8975601196289, 112.67935943603516, 115.4611587524414, 118.24295806884766, 121.0247573852539, 123.80656433105469, 126.58836364746094, 129.3701629638672, 132.15196228027344, 134.9337615966797, 137.71556091308594, 140.4973602294922, 143.27915954589844, 146.0609588623047, 148.84275817871094, 151.62457275390625, 154.4063720703125, 157.18817138671875, 159.969970703125]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 7.0, 2.0, 2.0, 7.0, 10.0, 10.0, 7.0, 12.0, 20.0, 16.0, 15.0, 18.0, 18.0, 15.0, 27.0, 25.0, 37.0, 22.0, 31.0, 38.0, 30.0, 36.0, 40.0, 26.0, 43.0, 50.0, 47.0, 31.0, 43.0, 33.0, 33.0, 29.0, 21.0, 34.0, 18.0, 19.0, 16.0, 16.0, 19.0, 11.0, 12.0, 8.0, 8.0, 10.0, 10.0, 6.0, 4.0, 2.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.316221237182617, -17.724740982055664, -17.13326072692871, -16.541780471801758, -15.950300216674805, -15.358819961547852, -14.767340660095215, -14.175860404968262, -13.584380149841309, -12.992899894714355, -12.401419639587402, -11.80993938446045, -11.218460083007812, -10.62697982788086, -10.035499572753906, -9.444019317626953, -8.8525390625, -8.261058807373047, -7.669578552246094, -7.078098773956299, -6.486618518829346, -5.895138263702393, -5.303658485412598, -4.7121782302856445, -4.120697975158691, -3.5292177200317383, -2.9377377033233643, -2.3462576866149902, -1.754777431488037, -1.163297176361084, -0.57181715965271, 0.019662857055664062, 0.61114501953125, 1.2026251554489136, 1.7941052913665771, 2.385585308074951, 2.9770655632019043, 3.5685458183288574, 4.160025596618652, 4.7515058517456055, 5.342986106872559, 5.934466361999512, 6.525946617126465, 7.11742639541626, 7.708906650543213, 8.300386428833008, 8.891866683959961, 9.483346939086914, 10.074827194213867, 10.66630744934082, 11.257787704467773, 11.849267959594727, 12.44074821472168, 13.032228469848633, 13.62370777130127, 14.215188026428223, 14.806668281555176, 15.398148536682129, 15.989628791809082, 16.58110809326172, 17.172588348388672, 17.764068603515625, 18.355548858642578, 18.94702911376953, 19.538509368896484]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 8.0, 7.0, 5.0, 15.0, 10.0, 14.0, 10.0, 14.0, 19.0, 22.0, 22.0, 28.0, 33.0, 48.0, 43.0, 47.0, 46.0, 34.0, 47.0, 47.0, 50.0, 45.0, 53.0, 45.0, 33.0, 31.0, 26.0, 30.0, 25.0, 34.0, 18.0, 17.0, 22.0, 21.0, 12.0, 6.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.9296875, -3.831787109375, -3.73388671875, -3.635986328125, -3.5380859375, -3.440185546875, -3.34228515625, -3.244384765625, -3.146484375, -3.048583984375, -2.95068359375, -2.852783203125, -2.7548828125, -2.656982421875, -2.55908203125, -2.461181640625, -2.36328125, -2.265380859375, -2.16748046875, -2.069580078125, -1.9716796875, -1.873779296875, -1.77587890625, -1.677978515625, -1.580078125, -1.482177734375, -1.38427734375, -1.286376953125, -1.1884765625, -1.090576171875, -0.99267578125, -0.894775390625, -0.796875, -0.698974609375, -0.60107421875, -0.503173828125, -0.4052734375, -0.307373046875, -0.20947265625, -0.111572265625, -0.013671875, 0.084228515625, 0.18212890625, 0.280029296875, 0.3779296875, 0.475830078125, 0.57373046875, 0.671630859375, 0.76953125, 0.867431640625, 0.96533203125, 1.063232421875, 1.1611328125, 1.259033203125, 1.35693359375, 1.454833984375, 1.552734375, 1.650634765625, 1.74853515625, 1.846435546875, 1.9443359375, 2.042236328125, 2.14013671875, 2.238037109375, 2.3359375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 7.0, 17.0, 22.0, 33.0, 40.0, 66.0, 113.0, 196.0, 349.0, 598.0, 1173.0, 2159.0, 3912.0, 7220.0, 13312.0, 25795.0, 52789.0, 120005.0, 330069.0, 286200.0, 106489.0, 47495.0, 23536.0, 12517.0, 6712.0, 3496.0, 1859.0, 1000.0, 587.0, 316.0, 184.0, 114.0, 61.0, 36.0, 30.0, 10.0, 14.0, 11.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.75927734375, -0.7369003295898438, -0.7145233154296875, -0.6921463012695312, -0.669769287109375, -0.6473922729492188, -0.6250152587890625, -0.6026382446289062, -0.58026123046875, -0.5578842163085938, -0.5355072021484375, -0.5131301879882812, -0.490753173828125, -0.46837615966796875, -0.4459991455078125, -0.42362213134765625, -0.4012451171875, -0.37886810302734375, -0.3564910888671875, -0.33411407470703125, -0.311737060546875, -0.28936004638671875, -0.2669830322265625, -0.24460601806640625, -0.22222900390625, -0.19985198974609375, -0.1774749755859375, -0.15509796142578125, -0.132720947265625, -0.11034393310546875, -0.0879669189453125, -0.06558990478515625, -0.043212890625, -0.02083587646484375, 0.0015411376953125, 0.02391815185546875, 0.046295166015625, 0.06867218017578125, 0.0910491943359375, 0.11342620849609375, 0.13580322265625, 0.15818023681640625, 0.1805572509765625, 0.20293426513671875, 0.225311279296875, 0.24768829345703125, 0.2700653076171875, 0.29244232177734375, 0.3148193359375, 0.33719635009765625, 0.3595733642578125, 0.38195037841796875, 0.404327392578125, 0.42670440673828125, 0.4490814208984375, 0.47145843505859375, 0.49383544921875, 0.5162124633789062, 0.5385894775390625, 0.5609664916992188, 0.583343505859375, 0.6057205200195312, 0.6280975341796875, 0.6504745483398438, 0.6728515625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 4.0, 6.0, 10.0, 14.0, 11.0, 12.0, 14.0, 15.0, 30.0, 30.0, 27.0, 31.0, 34.0, 31.0, 40.0, 35.0, 31.0, 40.0, 41.0, 44.0, 1060.0, 38.0, 34.0, 29.0, 45.0, 49.0, 34.0, 13.0, 31.0, 22.0, 16.0, 29.0, 17.0, 23.0, 14.0, 10.0, 9.0, 7.0, 13.0, 8.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.8388671875, -1.7852935791015625, -1.731719970703125, -1.6781463623046875, -1.62457275390625, -1.5709991455078125, -1.517425537109375, -1.4638519287109375, -1.4102783203125, -1.3567047119140625, -1.303131103515625, -1.2495574951171875, -1.19598388671875, -1.1424102783203125, -1.088836669921875, -1.0352630615234375, -0.981689453125, -0.9281158447265625, -0.874542236328125, -0.8209686279296875, -0.76739501953125, -0.7138214111328125, -0.660247802734375, -0.6066741943359375, -0.5531005859375, -0.4995269775390625, -0.445953369140625, -0.3923797607421875, -0.33880615234375, -0.2852325439453125, -0.231658935546875, -0.1780853271484375, -0.12451171875, -0.0709381103515625, -0.017364501953125, 0.0362091064453125, 0.08978271484375, 0.1433563232421875, 0.196929931640625, 0.2505035400390625, 0.3040771484375, 0.3576507568359375, 0.411224365234375, 0.4647979736328125, 0.51837158203125, 0.5719451904296875, 0.625518798828125, 0.6790924072265625, 0.732666015625, 0.7862396240234375, 0.839813232421875, 0.8933868408203125, 0.94696044921875, 1.0005340576171875, 1.054107666015625, 1.1076812744140625, 1.1612548828125, 1.2148284912109375, 1.268402099609375, 1.3219757080078125, 1.37554931640625, 1.4291229248046875, 1.482696533203125, 1.5362701416015625, 1.58984375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 5.0, 7.0, 8.0, 13.0, 21.0, 27.0, 51.0, 87.0, 126.0, 160.0, 243.0, 343.0, 512.0, 741.0, 1018.0, 1533.0, 2162.0, 3028.0, 4493.0, 6457.0, 9237.0, 13545.0, 19938.0, 29827.0, 46058.0, 73770.0, 132589.0, 1305608.0, 181939.0, 94788.0, 56250.0, 35796.0, 24133.0, 16305.0, 11381.0, 7612.0, 5325.0, 3647.0, 2476.0, 1807.0, 1238.0, 819.0, 614.0, 415.0, 308.0, 195.0, 141.0, 100.0, 67.0, 55.0, 43.0, 37.0, 18.0, 12.0, 10.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.3896484375, -0.3773651123046875, -0.365081787109375, -0.3527984619140625, -0.34051513671875, -0.3282318115234375, -0.315948486328125, -0.3036651611328125, -0.2913818359375, -0.2790985107421875, -0.266815185546875, -0.2545318603515625, -0.24224853515625, -0.2299652099609375, -0.217681884765625, -0.2053985595703125, -0.193115234375, -0.1808319091796875, -0.168548583984375, -0.1562652587890625, -0.14398193359375, -0.1316986083984375, -0.119415283203125, -0.1071319580078125, -0.0948486328125, -0.0825653076171875, -0.070281982421875, -0.0579986572265625, -0.04571533203125, -0.0334320068359375, -0.021148681640625, -0.0088653564453125, 0.00341796875, 0.0157012939453125, 0.027984619140625, 0.0402679443359375, 0.05255126953125, 0.0648345947265625, 0.077117919921875, 0.0894012451171875, 0.1016845703125, 0.1139678955078125, 0.126251220703125, 0.1385345458984375, 0.15081787109375, 0.1631011962890625, 0.175384521484375, 0.1876678466796875, 0.199951171875, 0.2122344970703125, 0.224517822265625, 0.2368011474609375, 0.24908447265625, 0.2613677978515625, 0.273651123046875, 0.2859344482421875, 0.2982177734375, 0.3105010986328125, 0.322784423828125, 0.3350677490234375, 0.34735107421875, 0.3596343994140625, 0.371917724609375, 0.3842010498046875, 0.396484375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 11.0, 7.0, 12.0, 9.0, 13.0, 7.0, 24.0, 36.0, 41.0, 53.0, 77.0, 66.0, 84.0, 96.0, 79.0, 73.0, 71.0, 49.0, 44.0, 36.0, 23.0, 14.0, 13.0, 11.0, 8.0, 6.0, 7.0, 7.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010526180267333984, -0.00010079145431518555, -9.632110595703125e-05, -9.185075759887695e-05, -8.738040924072266e-05, -8.291006088256836e-05, -7.843971252441406e-05, -7.396936416625977e-05, -6.949901580810547e-05, -6.502866744995117e-05, -6.0558319091796875e-05, -5.608797073364258e-05, -5.161762237548828e-05, -4.7147274017333984e-05, -4.267692565917969e-05, -3.820657730102539e-05, -3.3736228942871094e-05, -2.9265880584716797e-05, -2.47955322265625e-05, -2.0325183868408203e-05, -1.5854835510253906e-05, -1.138448715209961e-05, -6.9141387939453125e-06, -2.4437904357910156e-06, 2.0265579223632812e-06, 6.496906280517578e-06, 1.0967254638671875e-05, 1.5437602996826172e-05, 1.990795135498047e-05, 2.4378299713134766e-05, 2.8848648071289062e-05, 3.331899642944336e-05, 3.7789344787597656e-05, 4.225969314575195e-05, 4.673004150390625e-05, 5.120038986206055e-05, 5.5670738220214844e-05, 6.014108657836914e-05, 6.461143493652344e-05, 6.908178329467773e-05, 7.355213165283203e-05, 7.802248001098633e-05, 8.249282836914062e-05, 8.696317672729492e-05, 9.143352508544922e-05, 9.590387344360352e-05, 0.00010037422180175781, 0.00010484457015991211, 0.0001093149185180664, 0.0001137852668762207, 0.000118255615234375, 0.0001227259635925293, 0.0001271963119506836, 0.0001316666603088379, 0.0001361370086669922, 0.00014060735702514648, 0.00014507770538330078, 0.00014954805374145508, 0.00015401840209960938, 0.00015848875045776367, 0.00016295909881591797, 0.00016742944717407227, 0.00017189979553222656, 0.00017637014389038086, 0.00018084049224853516]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 7.0, 2.0, 4.0, 6.0, 6.0, 3.0, 11.0, 8.0, 10.0, 24.0, 30.0, 34.0, 48.0, 65.0, 103.0, 176.0, 338.0, 573.0, 2753.0, 996935.0, 45371.0, 971.0, 397.0, 234.0, 144.0, 99.0, 55.0, 36.0, 27.0, 17.0, 12.0, 13.0, 7.0, 14.0, 4.0, 5.0, 6.0, 2.0, 1.0, 0.0, 5.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.003032684326171875, -0.0029523074626922607, -0.0028719305992126465, -0.0027915537357330322, -0.002711176872253418, -0.0026308000087738037, -0.0025504231452941895, -0.002470046281814575, -0.002389669418334961, -0.0023092925548553467, -0.0022289156913757324, -0.002148538827896118, -0.002068161964416504, -0.0019877851009368896, -0.0019074082374572754, -0.0018270313739776611, -0.0017466545104980469, -0.0016662776470184326, -0.0015859007835388184, -0.001505523920059204, -0.0014251470565795898, -0.0013447701930999756, -0.0012643933296203613, -0.001184016466140747, -0.0011036396026611328, -0.0010232627391815186, -0.0009428858757019043, -0.00086250901222229, -0.0007821321487426758, -0.0007017552852630615, -0.0006213784217834473, -0.000541001558303833, -0.00046062469482421875, -0.0003802478313446045, -0.00029987096786499023, -0.00021949410438537598, -0.00013911724090576172, -5.874037742614746e-05, 2.1636486053466797e-05, 0.00010201334953308105, 0.0001823902130126953, 0.00026276707649230957, 0.00034314393997192383, 0.0004235208034515381, 0.0005038976669311523, 0.0005842745304107666, 0.0006646513938903809, 0.0007450282573699951, 0.0008254051208496094, 0.0009057819843292236, 0.0009861588478088379, 0.0010665357112884521, 0.0011469125747680664, 0.0012272894382476807, 0.001307666301727295, 0.0013880431652069092, 0.0014684200286865234, 0.0015487968921661377, 0.001629173755645752, 0.0017095506191253662, 0.0017899274826049805, 0.0018703043460845947, 0.001950681209564209, 0.0020310580730438232, 0.0021114349365234375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 10.0, 48.0, 143.0, 282.0, 263.0, 176.0, 68.0, 12.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.282000246457756e-05, -8.704788342583925e-05, -8.127576438710093e-05, -7.550364534836262e-05, -6.973153358558193e-05, -6.395941454684362e-05, -5.818729550810531e-05, -5.2415180107345805e-05, -4.6643061068607494e-05, -4.0870942029869184e-05, -3.509882662910968e-05, -2.932670759037137e-05, -2.3554590370622464e-05, -1.7782473150873557e-05, -1.2010354112135246e-05, -6.238238711375743e-06, -4.661196726374328e-07, 5.305998001858825e-06, 1.1078115676355083e-05, 1.685023380559869e-05, 2.2622351025347598e-05, 2.8394468245096505e-05, 3.4166587283834815e-05, 3.993870268459432e-05, 4.571082172333263e-05, 5.148294076207094e-05, 5.725505616283044e-05, 6.302717520156875e-05, 6.879929424030706e-05, 7.457140600308776e-05, 8.034352504182607e-05, 8.611564408056438e-05, 9.188776311930269e-05, 9.7659882158041e-05, 0.00010343200119677931, 0.00010920412023551762, 0.00011497623199829832, 0.00012074835103703663, 0.00012652046279981732, 0.00013229258183855563, 0.00013806470087729394, 0.00014383681991603225, 0.00014960893895477057, 0.00015538105799350888, 0.00016115317703224719, 0.00016692528151907027, 0.0001726974151097238, 0.0001784695195965469, 0.00018424165318720043, 0.00019001377222593874, 0.00019578589126467705, 0.00020155801030341536, 0.00020733012934215367, 0.00021310223382897675, 0.0002188743674196303, 0.00022464647190645337, 0.00023041859094519168, 0.00023619070998393, 0.0002419628290226683, 0.0002477349480614066, 0.0002535070525482297, 0.00025927918613888323, 0.0002650512906257063, 0.00027082342421635985, 0.00027659552870318294]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 2.0, 10.0, 13.0, 11.0, 16.0, 16.0, 15.0, 15.0, 26.0, 24.0, 32.0, 27.0, 33.0, 38.0, 35.0, 37.0, 42.0, 53.0, 42.0, 38.0, 44.0, 34.0, 43.0, 34.0, 41.0, 35.0, 34.0, 38.0, 25.0, 28.0, 18.0, 19.0, 13.0, 9.0, 11.0, 9.0, 8.0, 6.0, 6.0, 7.0, 0.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.252527236938477e-05, -6.053224205970764e-05, -5.853921175003052e-05, -5.6546181440353394e-05, -5.455315113067627e-05, -5.2560120820999146e-05, -5.056709051132202e-05, -4.85740602016449e-05, -4.6581029891967773e-05, -4.458799958229065e-05, -4.2594969272613525e-05, -4.06019389629364e-05, -3.860890865325928e-05, -3.661587834358215e-05, -3.462284803390503e-05, -3.2629817724227905e-05, -3.063678741455078e-05, -2.8643757104873657e-05, -2.6650726795196533e-05, -2.465769648551941e-05, -2.2664666175842285e-05, -2.067163586616516e-05, -1.8678605556488037e-05, -1.6685575246810913e-05, -1.4692544937133789e-05, -1.2699514627456665e-05, -1.0706484317779541e-05, -8.713454008102417e-06, -6.720423698425293e-06, -4.727393388748169e-06, -2.734363079071045e-06, -7.413327693939209e-07, 1.2516975402832031e-06, 3.244727849960327e-06, 5.237758159637451e-06, 7.230788469314575e-06, 9.2238187789917e-06, 1.1216849088668823e-05, 1.3209879398345947e-05, 1.5202909708023071e-05, 1.7195940017700195e-05, 1.918897032737732e-05, 2.1182000637054443e-05, 2.3175030946731567e-05, 2.516806125640869e-05, 2.7161091566085815e-05, 2.915412187576294e-05, 3.1147152185440063e-05, 3.314018249511719e-05, 3.513321280479431e-05, 3.7126243114471436e-05, 3.911927342414856e-05, 4.1112303733825684e-05, 4.310533404350281e-05, 4.509836435317993e-05, 4.7091394662857056e-05, 4.908442497253418e-05, 5.1077455282211304e-05, 5.307048559188843e-05, 5.506351590156555e-05, 5.7056546211242676e-05, 5.90495765209198e-05, 6.104260683059692e-05, 6.303563714027405e-05, 6.502866744995117e-05]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 8.0, 7.0, 5.0, 15.0, 10.0, 14.0, 10.0, 14.0, 19.0, 22.0, 22.0, 28.0, 33.0, 48.0, 43.0, 47.0, 46.0, 34.0, 47.0, 47.0, 50.0, 45.0, 53.0, 45.0, 33.0, 31.0, 26.0, 30.0, 25.0, 34.0, 18.0, 17.0, 22.0, 21.0, 12.0, 6.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.9296875, -3.831787109375, -3.73388671875, -3.635986328125, -3.5380859375, -3.440185546875, -3.34228515625, -3.244384765625, -3.146484375, -3.048583984375, -2.95068359375, -2.852783203125, -2.7548828125, -2.656982421875, -2.55908203125, -2.461181640625, -2.36328125, -2.265380859375, -2.16748046875, -2.069580078125, -1.9716796875, -1.873779296875, -1.77587890625, -1.677978515625, -1.580078125, -1.482177734375, -1.38427734375, -1.286376953125, -1.1884765625, -1.090576171875, -0.99267578125, -0.894775390625, -0.796875, -0.698974609375, -0.60107421875, -0.503173828125, -0.4052734375, -0.307373046875, -0.20947265625, -0.111572265625, -0.013671875, 0.084228515625, 0.18212890625, 0.280029296875, 0.3779296875, 0.475830078125, 0.57373046875, 0.671630859375, 0.76953125, 0.867431640625, 0.96533203125, 1.063232421875, 1.1611328125, 1.259033203125, 1.35693359375, 1.454833984375, 1.552734375, 1.650634765625, 1.74853515625, 1.846435546875, 1.9443359375, 2.042236328125, 2.14013671875, 2.238037109375, 2.3359375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 12.0, 15.0, 19.0, 19.0, 36.0, 57.0, 77.0, 157.0, 247.0, 469.0, 861.0, 1831.0, 3604.0, 7369.0, 14911.0, 31104.0, 67229.0, 163699.0, 383447.0, 215767.0, 83685.0, 37819.0, 18380.0, 8952.0, 4323.0, 2157.0, 1074.0, 504.0, 279.0, 168.0, 86.0, 55.0, 39.0, 33.0, 24.0, 11.0, 6.0, 10.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.234375, -2.150482177734375, -2.06658935546875, -1.982696533203125, -1.8988037109375, -1.814910888671875, -1.73101806640625, -1.647125244140625, -1.563232421875, -1.479339599609375, -1.39544677734375, -1.311553955078125, -1.2276611328125, -1.143768310546875, -1.05987548828125, -0.975982666015625, -0.89208984375, -0.808197021484375, -0.72430419921875, -0.640411376953125, -0.5565185546875, -0.472625732421875, -0.38873291015625, -0.304840087890625, -0.220947265625, -0.137054443359375, -0.05316162109375, 0.030731201171875, 0.1146240234375, 0.198516845703125, 0.28240966796875, 0.366302490234375, 0.4501953125, 0.534088134765625, 0.61798095703125, 0.701873779296875, 0.7857666015625, 0.869659423828125, 0.95355224609375, 1.037445068359375, 1.121337890625, 1.205230712890625, 1.28912353515625, 1.373016357421875, 1.4569091796875, 1.540802001953125, 1.62469482421875, 1.708587646484375, 1.79248046875, 1.876373291015625, 1.96026611328125, 2.044158935546875, 2.1280517578125, 2.211944580078125, 2.29583740234375, 2.379730224609375, 2.463623046875, 2.547515869140625, 2.63140869140625, 2.715301513671875, 2.7991943359375, 2.883087158203125, 2.96697998046875, 3.050872802734375, 3.134765625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 7.0, 5.0, 12.0, 4.0, 7.0, 19.0, 17.0, 28.0, 31.0, 45.0, 39.0, 52.0, 52.0, 56.0, 74.0, 184.0, 1578.0, 280.0, 105.0, 56.0, 52.0, 47.0, 45.0, 29.0, 48.0, 30.0, 22.0, 19.0, 16.0, 21.0, 11.0, 6.0, 16.0, 5.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.9296875, -12.5455322265625, -12.161376953125, -11.7772216796875, -11.39306640625, -11.0089111328125, -10.624755859375, -10.2406005859375, -9.8564453125, -9.4722900390625, -9.088134765625, -8.7039794921875, -8.31982421875, -7.9356689453125, -7.551513671875, -7.1673583984375, -6.783203125, -6.3990478515625, -6.014892578125, -5.6307373046875, -5.24658203125, -4.8624267578125, -4.478271484375, -4.0941162109375, -3.7099609375, -3.3258056640625, -2.941650390625, -2.5574951171875, -2.17333984375, -1.7891845703125, -1.405029296875, -1.0208740234375, -0.63671875, -0.2525634765625, 0.131591796875, 0.5157470703125, 0.89990234375, 1.2840576171875, 1.668212890625, 2.0523681640625, 2.4365234375, 2.8206787109375, 3.204833984375, 3.5889892578125, 3.97314453125, 4.3572998046875, 4.741455078125, 5.1256103515625, 5.509765625, 5.8939208984375, 6.278076171875, 6.6622314453125, 7.04638671875, 7.4305419921875, 7.814697265625, 8.1988525390625, 8.5830078125, 8.9671630859375, 9.351318359375, 9.7354736328125, 10.11962890625, 10.5037841796875, 10.887939453125, 11.2720947265625, 11.65625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 7.0, 14.0, 18.0, 27.0, 52.0, 64.0, 93.0, 156.0, 327.0, 758.0, 19809.0, 3120747.0, 2531.0, 491.0, 230.0, 117.0, 71.0, 55.0, 37.0, 28.0, 17.0, 12.0, 9.0, 9.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.03125, -61.34228515625, -59.6533203125, -57.96435546875, -56.275390625, -54.58642578125, -52.8974609375, -51.20849609375, -49.51953125, -47.83056640625, -46.1416015625, -44.45263671875, -42.763671875, -41.07470703125, -39.3857421875, -37.69677734375, -36.0078125, -34.31884765625, -32.6298828125, -30.94091796875, -29.251953125, -27.56298828125, -25.8740234375, -24.18505859375, -22.49609375, -20.80712890625, -19.1181640625, -17.42919921875, -15.740234375, -14.05126953125, -12.3623046875, -10.67333984375, -8.984375, -7.29541015625, -5.6064453125, -3.91748046875, -2.228515625, -0.53955078125, 1.1494140625, 2.83837890625, 4.52734375, 6.21630859375, 7.9052734375, 9.59423828125, 11.283203125, 12.97216796875, 14.6611328125, 16.35009765625, 18.0390625, 19.72802734375, 21.4169921875, 23.10595703125, 24.794921875, 26.48388671875, 28.1728515625, 29.86181640625, 31.55078125, 33.23974609375, 34.9287109375, 36.61767578125, 38.306640625, 39.99560546875, 41.6845703125, 43.37353515625, 45.0625]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [725.0, 293.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.27552604675293, 0.7519025802612305, 10.77933120727539, 20.806760787963867, 30.83418846130371, 40.86161804199219, 50.88904571533203, 60.916473388671875, 70.94390106201172, 80.97132873535156, 90.9987564086914, 101.02618408203125, 111.05361938476562, 121.08103942871094, 131.1084747314453, 141.13589477539062, 151.163330078125, 161.19076538085938, 171.2181854248047, 181.24562072753906, 191.27304077148438, 201.30047607421875, 211.32791137695312, 221.35533142089844, 231.3827667236328, 241.4102020263672, 251.4376220703125, 261.4650573730469, 271.49249267578125, 281.5198974609375, 291.5473327636719, 301.57476806640625, 311.6022033691406, 321.629638671875, 331.6570739746094, 341.6844787597656, 351.7119140625, 361.7393493652344, 371.76678466796875, 381.794189453125, 391.8216247558594, 401.84906005859375, 411.8764953613281, 421.9039001464844, 431.93133544921875, 441.9587707519531, 451.9862060546875, 462.01361083984375, 472.04107666015625, 482.0685119628906, 492.095947265625, 502.12335205078125, 512.1508178710938, 522.17822265625, 532.2056274414062, 542.2330932617188, 552.260498046875, 562.2879028320312, 572.3153686523438, 582.3427734375, 592.3702392578125, 602.3976440429688, 612.425048828125, 622.4525146484375, 632.4799194335938]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 3.0, 6.0, 8.0, 12.0, 14.0, 6.0, 15.0, 9.0, 16.0, 15.0, 23.0, 23.0, 32.0, 26.0, 33.0, 37.0, 39.0, 42.0, 49.0, 42.0, 33.0, 30.0, 53.0, 32.0, 39.0, 39.0, 39.0, 43.0, 27.0, 30.0, 23.0, 33.0, 26.0, 17.0, 14.0, 16.0, 12.0, 9.0, 10.0, 8.0, 8.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-38.100563049316406, -37.094482421875, -36.088401794433594, -35.08232116699219, -34.07624053955078, -33.070159912109375, -32.06407928466797, -31.05799674987793, -30.05191421508789, -29.045833587646484, -28.039752960205078, -27.033672332763672, -26.027589797973633, -25.021509170532227, -24.01542854309082, -23.009347915649414, -22.003267288208008, -20.9971866607666, -19.991106033325195, -18.985023498535156, -17.97894287109375, -16.972862243652344, -15.966781616210938, -14.960700988769531, -13.954619407653809, -12.948538780212402, -11.94245719909668, -10.936376571655273, -9.930295944213867, -8.924214363098145, -7.918133735656738, -6.912052631378174, -5.905971527099609, -4.899890422821045, -3.8938095569610596, -2.887728691101074, -1.8816475868225098, -0.8755664825439453, 0.13051414489746094, 1.1365952491760254, 2.14267635345459, 3.1487574577331543, 4.154838562011719, 5.160919189453125, 6.1670002937316895, 7.173081398010254, 8.17916202545166, 9.185243606567383, 10.191324234008789, 11.197404861450195, 12.203486442565918, 13.209567070007324, 14.215648651123047, 15.221729278564453, 16.22780990600586, 17.233890533447266, 18.239971160888672, 19.246051788330078, 20.252132415771484, 21.25821304321289, 22.26429557800293, 23.270376205444336, 24.276456832885742, 25.28253746032715, 26.288619995117188]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 6.0, 9.0, 3.0, 18.0, 10.0, 13.0, 11.0, 14.0, 19.0, 23.0, 24.0, 28.0, 35.0, 43.0, 48.0, 50.0, 46.0, 46.0, 36.0, 47.0, 41.0, 44.0, 44.0, 41.0, 37.0, 39.0, 29.0, 27.0, 25.0, 29.0, 26.0, 23.0, 16.0, 15.0, 13.0, 12.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0, -3.892120361328125, -3.78424072265625, -3.676361083984375, -3.5684814453125, -3.460601806640625, -3.35272216796875, -3.244842529296875, -3.136962890625, -3.029083251953125, -2.92120361328125, -2.813323974609375, -2.7054443359375, -2.597564697265625, -2.48968505859375, -2.381805419921875, -2.27392578125, -2.166046142578125, -2.05816650390625, -1.950286865234375, -1.8424072265625, -1.734527587890625, -1.62664794921875, -1.518768310546875, -1.410888671875, -1.303009033203125, -1.19512939453125, -1.087249755859375, -0.9793701171875, -0.871490478515625, -0.76361083984375, -0.655731201171875, -0.5478515625, -0.439971923828125, -0.33209228515625, -0.224212646484375, -0.1163330078125, -0.008453369140625, 0.09942626953125, 0.207305908203125, 0.315185546875, 0.423065185546875, 0.53094482421875, 0.638824462890625, 0.7467041015625, 0.854583740234375, 0.96246337890625, 1.070343017578125, 1.17822265625, 1.286102294921875, 1.39398193359375, 1.501861572265625, 1.6097412109375, 1.717620849609375, 1.82550048828125, 1.933380126953125, 2.041259765625, 2.149139404296875, 2.25701904296875, 2.364898681640625, 2.4727783203125, 2.580657958984375, 2.68853759765625, 2.796417236328125, 2.904296875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 3.0, 5.0, 2.0, 10.0, 12.0, 9.0, 9.0, 15.0, 12.0, 18.0, 28.0, 26.0, 48.0, 56.0, 93.0, 164.0, 271.0, 424.0, 868.0, 2014.0, 6708.0, 29587.0, 165876.0, 919522.0, 1908192.0, 932550.0, 185288.0, 31737.0, 6888.0, 1962.0, 771.0, 402.0, 242.0, 128.0, 98.0, 61.0, 33.0, 31.0, 28.0, 19.0, 16.0, 13.0, 18.0, 4.0, 8.0, 7.0, 4.0, 5.0, 4.0, 0.0, 4.0], "bins": [-5.8203125, -5.6651611328125, -5.510009765625, -5.3548583984375, -5.19970703125, -5.0445556640625, -4.889404296875, -4.7342529296875, -4.5791015625, -4.4239501953125, -4.268798828125, -4.1136474609375, -3.95849609375, -3.8033447265625, -3.648193359375, -3.4930419921875, -3.337890625, -3.1827392578125, -3.027587890625, -2.8724365234375, -2.71728515625, -2.5621337890625, -2.406982421875, -2.2518310546875, -2.0966796875, -1.9415283203125, -1.786376953125, -1.6312255859375, -1.47607421875, -1.3209228515625, -1.165771484375, -1.0106201171875, -0.85546875, -0.7003173828125, -0.545166015625, -0.3900146484375, -0.23486328125, -0.0797119140625, 0.075439453125, 0.2305908203125, 0.3857421875, 0.5408935546875, 0.696044921875, 0.8511962890625, 1.00634765625, 1.1614990234375, 1.316650390625, 1.4718017578125, 1.626953125, 1.7821044921875, 1.937255859375, 2.0924072265625, 2.24755859375, 2.4027099609375, 2.557861328125, 2.7130126953125, 2.8681640625, 3.0233154296875, 3.178466796875, 3.3336181640625, 3.48876953125, 3.6439208984375, 3.799072265625, 3.9542236328125, 4.109375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 9.0, 19.0, 40.0, 56.0, 91.0, 124.0, 218.0, 313.0, 504.0, 637.0, 647.0, 485.0, 337.0, 228.0, 127.0, 97.0, 64.0, 34.0, 24.0, 10.0, 10.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3359375, -8.002197265625, -7.66845703125, -7.334716796875, -7.0009765625, -6.667236328125, -6.33349609375, -5.999755859375, -5.666015625, -5.332275390625, -4.99853515625, -4.664794921875, -4.3310546875, -3.997314453125, -3.66357421875, -3.329833984375, -2.99609375, -2.662353515625, -2.32861328125, -1.994873046875, -1.6611328125, -1.327392578125, -0.99365234375, -0.659912109375, -0.326171875, 0.007568359375, 0.34130859375, 0.675048828125, 1.0087890625, 1.342529296875, 1.67626953125, 2.010009765625, 2.34375, 2.677490234375, 3.01123046875, 3.344970703125, 3.6787109375, 4.012451171875, 4.34619140625, 4.679931640625, 5.013671875, 5.347412109375, 5.68115234375, 6.014892578125, 6.3486328125, 6.682373046875, 7.01611328125, 7.349853515625, 7.68359375, 8.017333984375, 8.35107421875, 8.684814453125, 9.0185546875, 9.352294921875, 9.68603515625, 10.019775390625, 10.353515625, 10.687255859375, 11.02099609375, 11.354736328125, 11.6884765625, 12.022216796875, 12.35595703125, 12.689697265625, 13.0234375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 9.0, 10.0, 13.0, 28.0, 25.0, 45.0, 50.0, 70.0, 115.0, 166.0, 245.0, 350.0, 689.0, 2849.0, 89844.0, 3610989.0, 478946.0, 7464.0, 1033.0, 481.0, 287.0, 165.0, 123.0, 88.0, 59.0, 49.0, 28.0, 21.0, 9.0, 9.0, 7.0, 8.0, 5.0, 0.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-25.046875, -24.4156494140625, -23.784423828125, -23.1531982421875, -22.52197265625, -21.8907470703125, -21.259521484375, -20.6282958984375, -19.9970703125, -19.3658447265625, -18.734619140625, -18.1033935546875, -17.47216796875, -16.8409423828125, -16.209716796875, -15.5784912109375, -14.947265625, -14.3160400390625, -13.684814453125, -13.0535888671875, -12.42236328125, -11.7911376953125, -11.159912109375, -10.5286865234375, -9.8974609375, -9.2662353515625, -8.635009765625, -8.0037841796875, -7.37255859375, -6.7413330078125, -6.110107421875, -5.4788818359375, -4.84765625, -4.2164306640625, -3.585205078125, -2.9539794921875, -2.32275390625, -1.6915283203125, -1.060302734375, -0.4290771484375, 0.2021484375, 0.8333740234375, 1.464599609375, 2.0958251953125, 2.72705078125, 3.3582763671875, 3.989501953125, 4.6207275390625, 5.251953125, 5.8831787109375, 6.514404296875, 7.1456298828125, 7.77685546875, 8.4080810546875, 9.039306640625, 9.6705322265625, 10.3017578125, 10.9329833984375, 11.564208984375, 12.1954345703125, 12.82666015625, 13.4578857421875, 14.089111328125, 14.7203369140625, 15.3515625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 10.0, 66.0, 197.0, 318.0, 278.0, 108.0, 33.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.41168975830078, -69.58451080322266, -66.75733184814453, -63.93014907836914, -61.102970123291016, -58.275787353515625, -55.4486083984375, -52.621429443359375, -49.79425048828125, -46.967071533203125, -44.139888763427734, -41.31270980834961, -38.485530853271484, -35.658348083496094, -32.83116912841797, -30.003990173339844, -27.176807403564453, -24.349626541137695, -21.52244758605957, -18.695266723632812, -15.868086814880371, -13.04090690612793, -10.213726043701172, -7.386547088623047, -4.559366226196289, -1.7321860790252686, 1.094994068145752, 3.9221744537353516, 6.749354362487793, 9.576534271240234, 12.403715133666992, 15.230894088745117, 18.058074951171875, 20.885255813598633, 23.712434768676758, 26.539615631103516, 29.36679458618164, 32.19397735595703, 35.021156311035156, 37.84833526611328, 40.675514221191406, 43.50269317626953, 46.32987594604492, 49.15705490112305, 51.98423385620117, 54.81141662597656, 57.63859558105469, 60.46577453613281, 63.2929573059082, 66.1201400756836, 68.94731903076172, 71.77449798583984, 74.60167694091797, 77.4288558959961, 80.25604248046875, 83.08322143554688, 85.910400390625, 88.73757934570312, 91.56475830078125, 94.39193725585938, 97.21912384033203, 100.04630279541016, 102.87348175048828, 105.7006607055664, 108.52783966064453]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 1.0, 3.0, 5.0, 8.0, 5.0, 4.0, 8.0, 17.0, 21.0, 11.0, 18.0, 19.0, 30.0, 26.0, 23.0, 21.0, 34.0, 27.0, 32.0, 36.0, 42.0, 31.0, 34.0, 36.0, 39.0, 38.0, 50.0, 48.0, 30.0, 24.0, 24.0, 33.0, 16.0, 26.0, 21.0, 28.0, 26.0, 16.0, 10.0, 14.0, 12.0, 5.0, 9.0, 13.0, 7.0, 1.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0], "bins": [-22.092737197875977, -21.41645622253418, -20.74017333984375, -20.063892364501953, -19.387609481811523, -18.711328506469727, -18.035045623779297, -17.3587646484375, -16.682483673095703, -16.006202697753906, -15.329919815063477, -14.65363883972168, -13.97735595703125, -13.301074981689453, -12.62479305267334, -11.948511123657227, -11.272228240966797, -10.595946311950684, -9.91966438293457, -9.243383407592773, -8.567100524902344, -7.890819072723389, -7.214537620544434, -6.53825569152832, -5.861973762512207, -5.185691833496094, -4.5094099044799805, -3.8331284523010254, -3.156846523284912, -2.480564594268799, -1.8042831420898438, -1.1280012130737305, -0.4517173767089844, 0.22456443309783936, 0.9008462429046631, 1.5771279335021973, 2.2534098625183105, 2.929691791534424, 3.605973243713379, 4.282255172729492, 4.9585371017456055, 5.634819030761719, 6.311100959777832, 6.987382411956787, 7.6636643409729, 8.339946746826172, 9.016227722167969, 9.692509651184082, 10.368791580200195, 11.045073509216309, 11.721355438232422, 12.397636413574219, 13.073919296264648, 13.750200271606445, 14.426482200622559, 15.102764129638672, 15.779046058654785, 16.4553279876709, 17.131608963012695, 17.807891845703125, 18.484172821044922, 19.16045570373535, 19.83673667907715, 20.513019561767578, 21.189300537109375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 4.0, 4.0, 4.0, 6.0, 5.0, 9.0, 12.0, 14.0, 14.0, 21.0, 15.0, 27.0, 24.0, 34.0, 22.0, 33.0, 39.0, 45.0, 39.0, 47.0, 50.0, 48.0, 50.0, 41.0, 31.0, 61.0, 37.0, 36.0, 35.0, 28.0, 24.0, 35.0, 26.0, 20.0, 12.0, 15.0, 8.0, 8.0, 7.0, 3.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.00390625, -3.896942138671875, -3.78997802734375, -3.683013916015625, -3.5760498046875, -3.469085693359375, -3.36212158203125, -3.255157470703125, -3.148193359375, -3.041229248046875, -2.93426513671875, -2.827301025390625, -2.7203369140625, -2.613372802734375, -2.50640869140625, -2.399444580078125, -2.29248046875, -2.185516357421875, -2.07855224609375, -1.971588134765625, -1.8646240234375, -1.757659912109375, -1.65069580078125, -1.543731689453125, -1.436767578125, -1.329803466796875, -1.22283935546875, -1.115875244140625, -1.0089111328125, -0.901947021484375, -0.79498291015625, -0.688018798828125, -0.5810546875, -0.474090576171875, -0.36712646484375, -0.260162353515625, -0.1531982421875, -0.046234130859375, 0.06072998046875, 0.167694091796875, 0.274658203125, 0.381622314453125, 0.48858642578125, 0.595550537109375, 0.7025146484375, 0.809478759765625, 0.91644287109375, 1.023406982421875, 1.13037109375, 1.237335205078125, 1.34429931640625, 1.451263427734375, 1.5582275390625, 1.665191650390625, 1.77215576171875, 1.879119873046875, 1.986083984375, 2.093048095703125, 2.20001220703125, 2.306976318359375, 2.4139404296875, 2.520904541015625, 2.62786865234375, 2.734832763671875, 2.841796875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 8.0, 10.0, 23.0, 32.0, 30.0, 42.0, 91.0, 123.0, 165.0, 240.0, 348.0, 542.0, 793.0, 1244.0, 1866.0, 2963.0, 4587.0, 7052.0, 10931.0, 17860.0, 28486.0, 47724.0, 86013.0, 174728.0, 314658.0, 153931.0, 77851.0, 44371.0, 26491.0, 16290.0, 10296.0, 6503.0, 4280.0, 2723.0, 1759.0, 1137.0, 810.0, 538.0, 332.0, 238.0, 154.0, 95.0, 64.0, 49.0, 31.0, 21.0, 8.0, 5.0, 9.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.5859375, -0.5684051513671875, -0.550872802734375, -0.5333404541015625, -0.51580810546875, -0.4982757568359375, -0.480743408203125, -0.4632110595703125, -0.4456787109375, -0.4281463623046875, -0.410614013671875, -0.3930816650390625, -0.37554931640625, -0.3580169677734375, -0.340484619140625, -0.3229522705078125, -0.305419921875, -0.2878875732421875, -0.270355224609375, -0.2528228759765625, -0.23529052734375, -0.2177581787109375, -0.200225830078125, -0.1826934814453125, -0.1651611328125, -0.1476287841796875, -0.130096435546875, -0.1125640869140625, -0.09503173828125, -0.0774993896484375, -0.059967041015625, -0.0424346923828125, -0.02490234375, -0.0073699951171875, 0.010162353515625, 0.0276947021484375, 0.04522705078125, 0.0627593994140625, 0.080291748046875, 0.0978240966796875, 0.1153564453125, 0.1328887939453125, 0.150421142578125, 0.1679534912109375, 0.18548583984375, 0.2030181884765625, 0.220550537109375, 0.2380828857421875, 0.255615234375, 0.2731475830078125, 0.290679931640625, 0.3082122802734375, 0.32574462890625, 0.3432769775390625, 0.360809326171875, 0.3783416748046875, 0.3958740234375, 0.4134063720703125, 0.430938720703125, 0.4484710693359375, 0.46600341796875, 0.4835357666015625, 0.501068115234375, 0.5186004638671875, 0.5361328125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 12.0, 6.0, 9.0, 10.0, 9.0, 13.0, 9.0, 14.0, 26.0, 26.0, 15.0, 29.0, 25.0, 36.0, 24.0, 37.0, 42.0, 42.0, 40.0, 1057.0, 46.0, 42.0, 40.0, 34.0, 34.0, 41.0, 46.0, 38.0, 21.0, 34.0, 25.0, 22.0, 26.0, 14.0, 12.0, 12.0, 10.0, 6.0, 8.0, 6.0, 7.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.0078125, -1.946502685546875, -1.88519287109375, -1.823883056640625, -1.7625732421875, -1.701263427734375, -1.63995361328125, -1.578643798828125, -1.517333984375, -1.456024169921875, -1.39471435546875, -1.333404541015625, -1.2720947265625, -1.210784912109375, -1.14947509765625, -1.088165283203125, -1.02685546875, -0.965545654296875, -0.90423583984375, -0.842926025390625, -0.7816162109375, -0.720306396484375, -0.65899658203125, -0.597686767578125, -0.536376953125, -0.475067138671875, -0.41375732421875, -0.352447509765625, -0.2911376953125, -0.229827880859375, -0.16851806640625, -0.107208251953125, -0.0458984375, 0.015411376953125, 0.07672119140625, 0.138031005859375, 0.1993408203125, 0.260650634765625, 0.32196044921875, 0.383270263671875, 0.444580078125, 0.505889892578125, 0.56719970703125, 0.628509521484375, 0.6898193359375, 0.751129150390625, 0.81243896484375, 0.873748779296875, 0.93505859375, 0.996368408203125, 1.05767822265625, 1.118988037109375, 1.1802978515625, 1.241607666015625, 1.30291748046875, 1.364227294921875, 1.425537109375, 1.486846923828125, 1.54815673828125, 1.609466552734375, 1.6707763671875, 1.732086181640625, 1.79339599609375, 1.854705810546875, 1.916015625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 7.0, 14.0, 12.0, 20.0, 23.0, 43.0, 60.0, 91.0, 136.0, 186.0, 264.0, 366.0, 512.0, 684.0, 991.0, 1339.0, 1912.0, 2622.0, 3713.0, 5144.0, 7206.0, 10272.0, 14764.0, 21578.0, 31931.0, 48479.0, 78792.0, 141772.0, 1304729.0, 165472.0, 88323.0, 53985.0, 34884.0, 23131.0, 15901.0, 10951.0, 7489.0, 5463.0, 3944.0, 2739.0, 1970.0, 1441.0, 1039.0, 788.0, 541.0, 418.0, 283.0, 204.0, 152.0, 98.0, 83.0, 51.0, 54.0, 31.0, 23.0, 7.0, 7.0, 9.0, 2.0, 0.0, 1.0], "bins": [-0.42041015625, -0.40711212158203125, -0.3938140869140625, -0.38051605224609375, -0.367218017578125, -0.35391998291015625, -0.3406219482421875, -0.32732391357421875, -0.31402587890625, -0.30072784423828125, -0.2874298095703125, -0.27413177490234375, -0.260833740234375, -0.24753570556640625, -0.2342376708984375, -0.22093963623046875, -0.2076416015625, -0.19434356689453125, -0.1810455322265625, -0.16774749755859375, -0.154449462890625, -0.14115142822265625, -0.1278533935546875, -0.11455535888671875, -0.10125732421875, -0.08795928955078125, -0.0746612548828125, -0.06136322021484375, -0.048065185546875, -0.03476715087890625, -0.0214691162109375, -0.00817108154296875, 0.005126953125, 0.01842498779296875, 0.0317230224609375, 0.04502105712890625, 0.058319091796875, 0.07161712646484375, 0.0849151611328125, 0.09821319580078125, 0.11151123046875, 0.12480926513671875, 0.1381072998046875, 0.15140533447265625, 0.164703369140625, 0.17800140380859375, 0.1912994384765625, 0.20459747314453125, 0.2178955078125, 0.23119354248046875, 0.2444915771484375, 0.25778961181640625, 0.271087646484375, 0.28438568115234375, 0.2976837158203125, 0.31098175048828125, 0.32427978515625, 0.33757781982421875, 0.3508758544921875, 0.36417388916015625, 0.377471923828125, 0.39076995849609375, 0.4040679931640625, 0.41736602783203125, 0.4306640625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 7.0, 8.0, 3.0, 9.0, 4.0, 10.0, 11.0, 10.0, 20.0, 14.0, 23.0, 29.0, 37.0, 44.0, 45.0, 40.0, 53.0, 59.0, 54.0, 66.0, 59.0, 60.0, 48.0, 49.0, 40.0, 30.0, 31.0, 15.0, 19.0, 18.0, 27.0, 5.0, 11.0, 12.0, 8.0, 3.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.620189666748047e-05, -9.30512323975563e-05, -8.990056812763214e-05, -8.674990385770798e-05, -8.359923958778381e-05, -8.044857531785965e-05, -7.729791104793549e-05, -7.414724677801132e-05, -7.099658250808716e-05, -6.7845918238163e-05, -6.469525396823883e-05, -6.154458969831467e-05, -5.83939254283905e-05, -5.524326115846634e-05, -5.2092596888542175e-05, -4.894193261861801e-05, -4.579126834869385e-05, -4.2640604078769684e-05, -3.948993980884552e-05, -3.6339275538921356e-05, -3.318861126899719e-05, -3.003794699907303e-05, -2.6887282729148865e-05, -2.37366184592247e-05, -2.0585954189300537e-05, -1.7435289919376373e-05, -1.428462564945221e-05, -1.1133961379528046e-05, -7.983297109603882e-06, -4.832632839679718e-06, -1.6819685697555542e-06, 1.4686957001686096e-06, 4.6193599700927734e-06, 7.770024240016937e-06, 1.0920688509941101e-05, 1.4071352779865265e-05, 1.722201704978943e-05, 2.0372681319713593e-05, 2.3523345589637756e-05, 2.667400985956192e-05, 2.9824674129486084e-05, 3.297533839941025e-05, 3.612600266933441e-05, 3.9276666939258575e-05, 4.242733120918274e-05, 4.55779954791069e-05, 4.872865974903107e-05, 5.187932401895523e-05, 5.5029988288879395e-05, 5.818065255880356e-05, 6.133131682872772e-05, 6.448198109865189e-05, 6.763264536857605e-05, 7.078330963850021e-05, 7.393397390842438e-05, 7.708463817834854e-05, 8.02353024482727e-05, 8.338596671819687e-05, 8.653663098812103e-05, 8.96872952580452e-05, 9.283795952796936e-05, 9.598862379789352e-05, 9.913928806781769e-05, 0.00010228995233774185, 0.00010544061660766602]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 5.0, 6.0, 11.0, 3.0, 10.0, 16.0, 19.0, 14.0, 25.0, 49.0, 41.0, 64.0, 107.0, 148.0, 267.0, 469.0, 1124.0, 61887.0, 977988.0, 4480.0, 708.0, 382.0, 230.0, 134.0, 106.0, 56.0, 43.0, 33.0, 29.0, 19.0, 10.0, 17.0, 14.0, 8.0, 3.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002185821533203125, -0.0021201670169830322, -0.0020545125007629395, -0.0019888579845428467, -0.001923203468322754, -0.0018575489521026611, -0.0017918944358825684, -0.0017262399196624756, -0.0016605854034423828, -0.00159493088722229, -0.0015292763710021973, -0.0014636218547821045, -0.0013979673385620117, -0.001332312822341919, -0.0012666583061218262, -0.0012010037899017334, -0.0011353492736816406, -0.0010696947574615479, -0.001004040241241455, -0.0009383857250213623, -0.0008727312088012695, -0.0008070766925811768, -0.000741422176361084, -0.0006757676601409912, -0.0006101131439208984, -0.0005444586277008057, -0.0004788041114807129, -0.0004131495952606201, -0.00034749507904052734, -0.00028184056282043457, -0.0002161860466003418, -0.00015053153038024902, -8.487701416015625e-05, -1.9222497940063477e-05, 4.64320182800293e-05, 0.00011208653450012207, 0.00017774105072021484, 0.00024339556694030762, 0.0003090500831604004, 0.00037470459938049316, 0.00044035911560058594, 0.0005060136318206787, 0.0005716681480407715, 0.0006373226642608643, 0.000702977180480957, 0.0007686316967010498, 0.0008342862129211426, 0.0008999407291412354, 0.0009655952453613281, 0.001031249761581421, 0.0010969042778015137, 0.0011625587940216064, 0.0012282133102416992, 0.001293867826461792, 0.0013595223426818848, 0.0014251768589019775, 0.0014908313751220703, 0.001556485891342163, 0.0016221404075622559, 0.0016877949237823486, 0.0017534494400024414, 0.0018191039562225342, 0.001884758472442627, 0.0019504129886627197, 0.0020160675048828125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 39.0, 96.0, 225.0, 269.0, 214.0, 111.0, 30.0, 10.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001448805705877021, -0.00013960935757495463, -0.00013433814456220716, -0.0001290669315494597, -0.00012379571853671223, -0.00011852450552396476, -0.00011325328523525968, -0.00010798207222251222, -0.00010271085920976475, -9.743964619701728e-05, -9.216843318426982e-05, -8.689721289556473e-05, -8.162599988281727e-05, -7.63547868700698e-05, -7.108357385732234e-05, -6.581236084457487e-05, -6.05411478318274e-05, -5.5269934819079936e-05, -4.999872180633247e-05, -4.4727505155606195e-05, -3.945629214285873e-05, -3.418507913011126e-05, -2.891386247938499e-05, -2.3642649466637522e-05, -1.8371436453890055e-05, -1.3100222531647887e-05, -7.829008609405719e-06, -2.5577937776688486e-06, 2.713419235078618e-06, 7.984632247826084e-06, 1.3255848898552358e-05, 1.8527061911299825e-05, 2.379828947596252e-05, 2.9069502488709986e-05, 3.434071550145745e-05, 3.9611932152183726e-05, 4.488314516493119e-05, 5.015435817767866e-05, 5.542557482840493e-05, 6.06967878411524e-05, 6.596800085389987e-05, 7.123921386664733e-05, 7.65104268793948e-05, 8.178164716809988e-05, 8.705286018084735e-05, 9.232407319359481e-05, 9.759528620634228e-05, 0.00010286649921908975, 0.00010813771223183721, 0.00011340892524458468, 0.00011868013825733215, 0.0001239513512700796, 0.00012922256428282708, 0.00013449377729557455, 0.00013976500486023724, 0.00014503620332106948, 0.00015030743088573217, 0.00015557864389847964, 0.0001608498569112271, 0.00016612106992397457, 0.00017139228293672204, 0.0001766634959494695, 0.00018193470896221697, 0.00018720593652687967, 0.0001924771349877119]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 5.0, 7.0, 11.0, 14.0, 15.0, 24.0, 30.0, 23.0, 26.0, 22.0, 28.0, 33.0, 38.0, 46.0, 39.0, 45.0, 48.0, 59.0, 40.0, 53.0, 44.0, 42.0, 50.0, 34.0, 29.0, 25.0, 30.0, 27.0, 20.0, 16.0, 14.0, 13.0, 8.0, 12.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9664249420166016e-05, -5.783233791589737e-05, -5.600042641162872e-05, -5.416851490736008e-05, -5.233660340309143e-05, -5.0504691898822784e-05, -4.867278039455414e-05, -4.684086889028549e-05, -4.5008957386016846e-05, -4.31770458817482e-05, -4.134513437747955e-05, -3.951322287321091e-05, -3.768131136894226e-05, -3.5849399864673615e-05, -3.401748836040497e-05, -3.218557685613632e-05, -3.0353665351867676e-05, -2.852175384759903e-05, -2.6689842343330383e-05, -2.4857930839061737e-05, -2.302601933479309e-05, -2.1194107830524445e-05, -1.93621963262558e-05, -1.7530284821987152e-05, -1.5698373317718506e-05, -1.386646181344986e-05, -1.2034550309181213e-05, -1.0202638804912567e-05, -8.370727300643921e-06, -6.538815796375275e-06, -4.706904292106628e-06, -2.874992787837982e-06, -1.043081283569336e-06, 7.888302206993103e-07, 2.6207417249679565e-06, 4.452653229236603e-06, 6.284564733505249e-06, 8.116476237773895e-06, 9.948387742042542e-06, 1.1780299246311188e-05, 1.3612210750579834e-05, 1.544412225484848e-05, 1.7276033759117126e-05, 1.9107945263385773e-05, 2.093985676765442e-05, 2.2771768271923065e-05, 2.460367977619171e-05, 2.6435591280460358e-05, 2.8267502784729004e-05, 3.009941428899765e-05, 3.1931325793266296e-05, 3.376323729753494e-05, 3.559514880180359e-05, 3.7427060306072235e-05, 3.925897181034088e-05, 4.109088331460953e-05, 4.2922794818878174e-05, 4.475470632314682e-05, 4.6586617827415466e-05, 4.841852933168411e-05, 5.025044083595276e-05, 5.2082352340221405e-05, 5.391426384449005e-05, 5.57461753487587e-05, 5.7578086853027344e-05]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 4.0, 4.0, 4.0, 6.0, 5.0, 9.0, 12.0, 14.0, 14.0, 21.0, 15.0, 27.0, 24.0, 34.0, 22.0, 32.0, 40.0, 45.0, 39.0, 47.0, 50.0, 48.0, 50.0, 41.0, 31.0, 61.0, 37.0, 36.0, 35.0, 28.0, 24.0, 35.0, 26.0, 20.0, 12.0, 15.0, 8.0, 8.0, 7.0, 3.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.00390625, -3.896942138671875, -3.78997802734375, -3.683013916015625, -3.5760498046875, -3.469085693359375, -3.36212158203125, -3.255157470703125, -3.148193359375, -3.041229248046875, -2.93426513671875, -2.827301025390625, -2.7203369140625, -2.613372802734375, -2.50640869140625, -2.399444580078125, -2.29248046875, -2.185516357421875, -2.07855224609375, -1.971588134765625, -1.8646240234375, -1.757659912109375, -1.65069580078125, -1.543731689453125, -1.436767578125, -1.329803466796875, -1.22283935546875, -1.115875244140625, -1.0089111328125, -0.901947021484375, -0.79498291015625, -0.688018798828125, -0.5810546875, -0.474090576171875, -0.36712646484375, -0.260162353515625, -0.1531982421875, -0.046234130859375, 0.06072998046875, 0.167694091796875, 0.274658203125, 0.381622314453125, 0.48858642578125, 0.595550537109375, 0.7025146484375, 0.809478759765625, 0.91644287109375, 1.023406982421875, 1.13037109375, 1.237335205078125, 1.34429931640625, 1.451263427734375, 1.5582275390625, 1.665191650390625, 1.77215576171875, 1.879119873046875, 1.986083984375, 2.093048095703125, 2.20001220703125, 2.306976318359375, 2.4139404296875, 2.520904541015625, 2.62786865234375, 2.734832763671875, 2.841796875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 3.0, 8.0, 6.0, 16.0, 18.0, 30.0, 45.0, 66.0, 89.0, 114.0, 157.0, 235.0, 346.0, 605.0, 949.0, 1706.0, 3073.0, 5700.0, 11007.0, 20918.0, 40590.0, 76829.0, 147774.0, 255466.0, 225896.0, 122654.0, 63646.0, 33139.0, 17450.0, 8958.0, 4799.0, 2557.0, 1406.0, 809.0, 511.0, 315.0, 214.0, 142.0, 104.0, 58.0, 50.0, 41.0, 13.0, 14.0, 16.0, 4.0, 9.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.599609375, -2.520477294921875, -2.44134521484375, -2.362213134765625, -2.2830810546875, -2.203948974609375, -2.12481689453125, -2.045684814453125, -1.966552734375, -1.887420654296875, -1.80828857421875, -1.729156494140625, -1.6500244140625, -1.570892333984375, -1.49176025390625, -1.412628173828125, -1.33349609375, -1.254364013671875, -1.17523193359375, -1.096099853515625, -1.0169677734375, -0.937835693359375, -0.85870361328125, -0.779571533203125, -0.700439453125, -0.621307373046875, -0.54217529296875, -0.463043212890625, -0.3839111328125, -0.304779052734375, -0.22564697265625, -0.146514892578125, -0.0673828125, 0.011749267578125, 0.09088134765625, 0.170013427734375, 0.2491455078125, 0.328277587890625, 0.40740966796875, 0.486541748046875, 0.565673828125, 0.644805908203125, 0.72393798828125, 0.803070068359375, 0.8822021484375, 0.961334228515625, 1.04046630859375, 1.119598388671875, 1.19873046875, 1.277862548828125, 1.35699462890625, 1.436126708984375, 1.5152587890625, 1.594390869140625, 1.67352294921875, 1.752655029296875, 1.831787109375, 1.910919189453125, 1.99005126953125, 2.069183349609375, 2.1483154296875, 2.227447509765625, 2.30657958984375, 2.385711669921875, 2.46484375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 2.0, 5.0, 5.0, 13.0, 13.0, 21.0, 23.0, 33.0, 23.0, 51.0, 43.0, 53.0, 67.0, 104.0, 170.0, 1520.0, 345.0, 132.0, 71.0, 59.0, 57.0, 37.0, 36.0, 30.0, 35.0, 20.0, 16.0, 15.0, 11.0, 7.0, 9.0, 3.0, 10.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-19.484375, -18.9698486328125, -18.455322265625, -17.9407958984375, -17.42626953125, -16.9117431640625, -16.397216796875, -15.8826904296875, -15.3681640625, -14.8536376953125, -14.339111328125, -13.8245849609375, -13.31005859375, -12.7955322265625, -12.281005859375, -11.7664794921875, -11.251953125, -10.7374267578125, -10.222900390625, -9.7083740234375, -9.19384765625, -8.6793212890625, -8.164794921875, -7.6502685546875, -7.1357421875, -6.6212158203125, -6.106689453125, -5.5921630859375, -5.07763671875, -4.5631103515625, -4.048583984375, -3.5340576171875, -3.01953125, -2.5050048828125, -1.990478515625, -1.4759521484375, -0.96142578125, -0.4468994140625, 0.067626953125, 0.5821533203125, 1.0966796875, 1.6112060546875, 2.125732421875, 2.6402587890625, 3.15478515625, 3.6693115234375, 4.183837890625, 4.6983642578125, 5.212890625, 5.7274169921875, 6.241943359375, 6.7564697265625, 7.27099609375, 7.7855224609375, 8.300048828125, 8.8145751953125, 9.3291015625, 9.8436279296875, 10.358154296875, 10.8726806640625, 11.38720703125, 11.9017333984375, 12.416259765625, 12.9307861328125, 13.4453125]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 2.0, 6.0, 7.0, 12.0, 16.0, 17.0, 19.0, 19.0, 39.0, 51.0, 74.0, 101.0, 135.0, 192.0, 303.0, 579.0, 2800.0, 2409730.0, 728039.0, 2071.0, 541.0, 316.0, 179.0, 101.0, 93.0, 72.0, 50.0, 39.0, 29.0, 15.0, 8.0, 11.0, 6.0, 8.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.78125, -38.49560546875, -37.2099609375, -35.92431640625, -34.638671875, -33.35302734375, -32.0673828125, -30.78173828125, -29.49609375, -28.21044921875, -26.9248046875, -25.63916015625, -24.353515625, -23.06787109375, -21.7822265625, -20.49658203125, -19.2109375, -17.92529296875, -16.6396484375, -15.35400390625, -14.068359375, -12.78271484375, -11.4970703125, -10.21142578125, -8.92578125, -7.64013671875, -6.3544921875, -5.06884765625, -3.783203125, -2.49755859375, -1.2119140625, 0.07373046875, 1.359375, 2.64501953125, 3.9306640625, 5.21630859375, 6.501953125, 7.78759765625, 9.0732421875, 10.35888671875, 11.64453125, 12.93017578125, 14.2158203125, 15.50146484375, 16.787109375, 18.07275390625, 19.3583984375, 20.64404296875, 21.9296875, 23.21533203125, 24.5009765625, 25.78662109375, 27.072265625, 28.35791015625, 29.6435546875, 30.92919921875, 32.21484375, 33.50048828125, 34.7861328125, 36.07177734375, 37.357421875, 38.64306640625, 39.9287109375, 41.21435546875, 42.5]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 12.0, 660.0, 344.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.052346229553223, -9.838336944580078, -4.62432861328125, 0.5896806716918945, 5.803689002990723, 11.01769733428955, 16.231708526611328, 21.445716857910156, 26.659725189208984, 31.873733520507812, 37.08774185180664, 42.30175018310547, 47.51576232910156, 52.729766845703125, 57.94377899169922, 63.15778732299805, 68.37179565429688, 73.58580780029297, 78.79981231689453, 84.01382446289062, 89.22782897949219, 94.44184112548828, 99.65585327148438, 104.86985778808594, 110.0838623046875, 115.2978744506836, 120.51187896728516, 125.72589111328125, 130.9398956298828, 136.15390014648438, 141.367919921875, 146.58192443847656, 151.7959442138672, 157.00994873046875, 162.22396850585938, 167.43797302246094, 172.6519775390625, 177.86598205566406, 183.0800018310547, 188.29400634765625, 193.5080108642578, 198.72201538085938, 203.93603515625, 209.15003967285156, 214.36404418945312, 219.5780487060547, 224.7920684814453, 230.00607299804688, 235.2200927734375, 240.43409729003906, 245.6481170654297, 250.86212158203125, 256.0761413574219, 261.2901306152344, 266.504150390625, 271.7181396484375, 276.9321594238281, 282.14617919921875, 287.36016845703125, 292.5741882324219, 297.7882080078125, 303.002197265625, 308.2162170410156, 313.43023681640625, 318.64422607421875]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 7.0, 3.0, 1.0, 9.0, 8.0, 4.0, 14.0, 12.0, 11.0, 22.0, 12.0, 20.0, 13.0, 20.0, 23.0, 33.0, 34.0, 33.0, 30.0, 31.0, 28.0, 38.0, 43.0, 28.0, 31.0, 42.0, 50.0, 33.0, 31.0, 39.0, 28.0, 34.0, 29.0, 23.0, 27.0, 19.0, 18.0, 17.0, 13.0, 10.0, 11.0, 21.0, 10.0, 6.0, 7.0, 8.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-26.892616271972656, -26.06068229675293, -25.228750228881836, -24.39681625366211, -23.564882278442383, -22.732948303222656, -21.901016235351562, -21.069082260131836, -20.23714828491211, -19.405214309692383, -18.57328224182129, -17.741348266601562, -16.909414291381836, -16.07748031616211, -15.245548248291016, -14.413614273071289, -13.581681251525879, -12.749748229980469, -11.917814254760742, -11.085881233215332, -10.253947257995605, -9.422014236450195, -8.590080261230469, -7.758147239685059, -6.92621374130249, -6.094280242919922, -5.2623467445373535, -4.430413246154785, -3.598479986190796, -2.7665467262268066, -1.9346132278442383, -1.10267972946167, -0.27074623107910156, 0.561187207698822, 1.3931206464767456, 2.2250540256500244, 3.0569875240325928, 3.888920783996582, 4.72085428237915, 5.552787780761719, 6.384721279144287, 7.2166547775268555, 8.048587799072266, 8.880521774291992, 9.712454795837402, 10.544387817382812, 11.376321792602539, 12.208255767822266, 13.040188789367676, 13.872121810913086, 14.704055786132812, 15.535988807678223, 16.367921829223633, 17.19985580444336, 18.031789779663086, 18.863723754882812, 19.695655822753906, 20.527589797973633, 21.359521865844727, 22.191455841064453, 23.02338981628418, 23.855323791503906, 24.687255859375, 25.519189834594727, 26.351123809814453]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 7.0, 4.0, 8.0, 7.0, 11.0, 14.0, 16.0, 13.0, 20.0, 12.0, 30.0, 28.0, 35.0, 37.0, 39.0, 34.0, 46.0, 42.0, 41.0, 55.0, 50.0, 50.0, 39.0, 31.0, 37.0, 37.0, 38.0, 31.0, 24.0, 19.0, 28.0, 23.0, 11.0, 22.0, 18.0, 9.0, 11.0, 6.0, 7.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.955078125, -3.84149169921875, -3.7279052734375, -3.61431884765625, -3.500732421875, -3.38714599609375, -3.2735595703125, -3.15997314453125, -3.04638671875, -2.93280029296875, -2.8192138671875, -2.70562744140625, -2.592041015625, -2.47845458984375, -2.3648681640625, -2.25128173828125, -2.1376953125, -2.02410888671875, -1.9105224609375, -1.79693603515625, -1.683349609375, -1.56976318359375, -1.4561767578125, -1.34259033203125, -1.22900390625, -1.11541748046875, -1.0018310546875, -0.88824462890625, -0.774658203125, -0.66107177734375, -0.5474853515625, -0.43389892578125, -0.3203125, -0.20672607421875, -0.0931396484375, 0.02044677734375, 0.134033203125, 0.24761962890625, 0.3612060546875, 0.47479248046875, 0.58837890625, 0.70196533203125, 0.8155517578125, 0.92913818359375, 1.042724609375, 1.15631103515625, 1.2698974609375, 1.38348388671875, 1.4970703125, 1.61065673828125, 1.7242431640625, 1.83782958984375, 1.951416015625, 2.06500244140625, 2.1785888671875, 2.29217529296875, 2.40576171875, 2.51934814453125, 2.6329345703125, 2.74652099609375, 2.860107421875, 2.97369384765625, 3.0872802734375, 3.20086669921875, 3.314453125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 6.0, 5.0, 2.0, 5.0, 8.0, 11.0, 8.0, 17.0, 17.0, 14.0, 19.0, 16.0, 25.0, 30.0, 39.0, 53.0, 79.0, 167.0, 342.0, 1341.0, 11334.0, 493605.0, 3344308.0, 332975.0, 8046.0, 1031.0, 307.0, 123.0, 78.0, 38.0, 33.0, 27.0, 17.0, 27.0, 26.0, 20.0, 21.0, 14.0, 13.0, 14.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.6328125, -12.255126953125, -11.87744140625, -11.499755859375, -11.1220703125, -10.744384765625, -10.36669921875, -9.989013671875, -9.611328125, -9.233642578125, -8.85595703125, -8.478271484375, -8.1005859375, -7.722900390625, -7.34521484375, -6.967529296875, -6.58984375, -6.212158203125, -5.83447265625, -5.456787109375, -5.0791015625, -4.701416015625, -4.32373046875, -3.946044921875, -3.568359375, -3.190673828125, -2.81298828125, -2.435302734375, -2.0576171875, -1.679931640625, -1.30224609375, -0.924560546875, -0.546875, -0.169189453125, 0.20849609375, 0.586181640625, 0.9638671875, 1.341552734375, 1.71923828125, 2.096923828125, 2.474609375, 2.852294921875, 3.22998046875, 3.607666015625, 3.9853515625, 4.363037109375, 4.74072265625, 5.118408203125, 5.49609375, 5.873779296875, 6.25146484375, 6.629150390625, 7.0068359375, 7.384521484375, 7.76220703125, 8.139892578125, 8.517578125, 8.895263671875, 9.27294921875, 9.650634765625, 10.0283203125, 10.406005859375, 10.78369140625, 11.161376953125, 11.5390625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 8.0, 9.0, 18.0, 26.0, 25.0, 47.0, 57.0, 68.0, 116.0, 173.0, 236.0, 315.0, 384.0, 476.0, 467.0, 398.0, 356.0, 239.0, 189.0, 112.0, 92.0, 75.0, 50.0, 42.0, 31.0, 18.0, 10.0, 6.0, 8.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.84765625, -6.60382080078125, -6.3599853515625, -6.11614990234375, -5.872314453125, -5.62847900390625, -5.3846435546875, -5.14080810546875, -4.89697265625, -4.65313720703125, -4.4093017578125, -4.16546630859375, -3.921630859375, -3.67779541015625, -3.4339599609375, -3.19012451171875, -2.9462890625, -2.70245361328125, -2.4586181640625, -2.21478271484375, -1.970947265625, -1.72711181640625, -1.4832763671875, -1.23944091796875, -0.99560546875, -0.75177001953125, -0.5079345703125, -0.26409912109375, -0.020263671875, 0.22357177734375, 0.4674072265625, 0.71124267578125, 0.955078125, 1.19891357421875, 1.4427490234375, 1.68658447265625, 1.930419921875, 2.17425537109375, 2.4180908203125, 2.66192626953125, 2.90576171875, 3.14959716796875, 3.3934326171875, 3.63726806640625, 3.881103515625, 4.12493896484375, 4.3687744140625, 4.61260986328125, 4.8564453125, 5.10028076171875, 5.3441162109375, 5.58795166015625, 5.831787109375, 6.07562255859375, 6.3194580078125, 6.56329345703125, 6.80712890625, 7.05096435546875, 7.2947998046875, 7.53863525390625, 7.782470703125, 8.02630615234375, 8.2701416015625, 8.51397705078125, 8.7578125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 10.0, 7.0, 11.0, 15.0, 21.0, 20.0, 33.0, 44.0, 63.0, 90.0, 97.0, 131.0, 155.0, 271.0, 441.0, 926.0, 6117.0, 230831.0, 3673553.0, 272325.0, 6704.0, 1010.0, 456.0, 253.0, 168.0, 136.0, 94.0, 67.0, 46.0, 43.0, 27.0, 31.0, 21.0, 16.0, 11.0, 7.0, 7.0, 9.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.484375, -18.903076171875, -18.32177734375, -17.740478515625, -17.1591796875, -16.577880859375, -15.99658203125, -15.415283203125, -14.833984375, -14.252685546875, -13.67138671875, -13.090087890625, -12.5087890625, -11.927490234375, -11.34619140625, -10.764892578125, -10.18359375, -9.602294921875, -9.02099609375, -8.439697265625, -7.8583984375, -7.277099609375, -6.69580078125, -6.114501953125, -5.533203125, -4.951904296875, -4.37060546875, -3.789306640625, -3.2080078125, -2.626708984375, -2.04541015625, -1.464111328125, -0.8828125, -0.301513671875, 0.27978515625, 0.861083984375, 1.4423828125, 2.023681640625, 2.60498046875, 3.186279296875, 3.767578125, 4.348876953125, 4.93017578125, 5.511474609375, 6.0927734375, 6.674072265625, 7.25537109375, 7.836669921875, 8.41796875, 8.999267578125, 9.58056640625, 10.161865234375, 10.7431640625, 11.324462890625, 11.90576171875, 12.487060546875, 13.068359375, 13.649658203125, 14.23095703125, 14.812255859375, 15.3935546875, 15.974853515625, 16.55615234375, 17.137451171875, 17.71875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 16.0, 66.0, 167.0, 278.0, 277.0, 141.0, 49.0, 12.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.045875549316406, -29.544979095458984, -27.04408073425293, -24.543182373046875, -22.042285919189453, -19.54138946533203, -17.040491104125977, -14.539592742919922, -12.0386962890625, -9.537798881530762, -7.036901473999023, -4.536004066467285, -2.035106658935547, 0.4657907485961914, 2.9666881561279297, 5.467586517333984, 7.968482971191406, 10.469380378723145, 12.970277786254883, 15.471175193786621, 17.97207260131836, 20.47296905517578, 22.973867416381836, 25.47476577758789, 27.975662231445312, 30.476558685302734, 32.977455139160156, 35.478355407714844, 37.979251861572266, 40.48014831542969, 42.981048583984375, 45.4819450378418, 47.98283386230469, 50.48373031616211, 52.98462677001953, 55.48552703857422, 57.98642349243164, 60.48731994628906, 62.98822021484375, 65.48912048339844, 67.9900131225586, 70.49091339111328, 72.99180603027344, 75.49270629882812, 77.99360656738281, 80.49449920654297, 82.99539947509766, 85.49629211425781, 87.9971923828125, 90.49809265136719, 92.99898529052734, 95.49988555908203, 98.00077819824219, 100.50167846679688, 103.00257873535156, 105.50347900390625, 108.0043716430664, 110.5052719116211, 113.00616455078125, 115.50706481933594, 118.00796508789062, 120.50885772705078, 123.00975799560547, 125.51065063476562, 128.0115509033203]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 2.0, 9.0, 14.0, 11.0, 11.0, 19.0, 13.0, 24.0, 20.0, 22.0, 30.0, 24.0, 35.0, 29.0, 41.0, 30.0, 30.0, 32.0, 45.0, 49.0, 43.0, 42.0, 40.0, 35.0, 31.0, 35.0, 18.0, 24.0, 33.0, 27.0, 31.0, 19.0, 23.0, 15.0, 17.0, 8.0, 19.0, 9.0, 12.0, 7.0, 3.0, 2.0, 9.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.791484832763672, -20.0788631439209, -19.366241455078125, -18.65361976623535, -17.940998077392578, -17.228376388549805, -16.51575469970703, -15.803133964538574, -15.0905122756958, -14.377890586853027, -13.665268898010254, -12.952648162841797, -12.240026473999023, -11.52740478515625, -10.814783096313477, -10.102161407470703, -9.38953971862793, -8.676918029785156, -7.964296340942383, -7.251675128936768, -6.539053440093994, -5.826431751251221, -5.1138105392456055, -4.401188850402832, -3.6885671615600586, -2.975945472717285, -2.263324022293091, -1.5507025718688965, -0.838080883026123, -0.1254591941833496, 0.5871620178222656, 1.299783706665039, 2.0124073028564453, 2.7250289916992188, 3.437650442123413, 4.150271892547607, 4.862893581390381, 5.575515270233154, 6.2881364822387695, 7.000758171081543, 7.713379859924316, 8.42600154876709, 9.138623237609863, 9.85124397277832, 10.563865661621094, 11.276487350463867, 11.98910903930664, 12.701730728149414, 13.414352416992188, 14.126974105834961, 14.839595794677734, 15.552217483520508, 16.26483917236328, 16.977460861206055, 17.690082550048828, 18.40270233154297, 19.115325927734375, 19.82794761657715, 20.540569305419922, 21.253190994262695, 21.96581268310547, 22.678434371948242, 23.391056060791016, 24.103675842285156, 24.81629753112793]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 9.0, 5.0, 12.0, 8.0, 19.0, 18.0, 23.0, 27.0, 22.0, 30.0, 34.0, 29.0, 38.0, 44.0, 49.0, 49.0, 33.0, 42.0, 53.0, 44.0, 50.0, 37.0, 44.0, 26.0, 37.0, 27.0, 24.0, 34.0, 20.0, 25.0, 14.0, 15.0, 11.0, 10.0, 8.0, 6.0, 8.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.591796875, -3.47906494140625, -3.3663330078125, -3.25360107421875, -3.140869140625, -3.02813720703125, -2.9154052734375, -2.80267333984375, -2.68994140625, -2.57720947265625, -2.4644775390625, -2.35174560546875, -2.239013671875, -2.12628173828125, -2.0135498046875, -1.90081787109375, -1.7880859375, -1.67535400390625, -1.5626220703125, -1.44989013671875, -1.337158203125, -1.22442626953125, -1.1116943359375, -0.99896240234375, -0.88623046875, -0.77349853515625, -0.6607666015625, -0.54803466796875, -0.435302734375, -0.32257080078125, -0.2098388671875, -0.09710693359375, 0.015625, 0.12835693359375, 0.2410888671875, 0.35382080078125, 0.466552734375, 0.57928466796875, 0.6920166015625, 0.80474853515625, 0.91748046875, 1.03021240234375, 1.1429443359375, 1.25567626953125, 1.368408203125, 1.48114013671875, 1.5938720703125, 1.70660400390625, 1.8193359375, 1.93206787109375, 2.0447998046875, 2.15753173828125, 2.270263671875, 2.38299560546875, 2.4957275390625, 2.60845947265625, 2.72119140625, 2.83392333984375, 2.9466552734375, 3.05938720703125, 3.172119140625, 3.28485107421875, 3.3975830078125, 3.51031494140625, 3.623046875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 7.0, 2.0, 13.0, 18.0, 21.0, 37.0, 41.0, 68.0, 99.0, 155.0, 228.0, 328.0, 484.0, 685.0, 1046.0, 1520.0, 2301.0, 3405.0, 5078.0, 7474.0, 11643.0, 17644.0, 27880.0, 44875.0, 77510.0, 151498.0, 291996.0, 177524.0, 87259.0, 50113.0, 30731.0, 19319.0, 12444.0, 8348.0, 5438.0, 3704.0, 2450.0, 1670.0, 1156.0, 739.0, 512.0, 340.0, 240.0, 184.0, 112.0, 81.0, 41.0, 31.0, 20.0, 20.0, 15.0, 11.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.56103515625, -0.5427017211914062, -0.5243682861328125, -0.5060348510742188, -0.487701416015625, -0.46936798095703125, -0.4510345458984375, -0.43270111083984375, -0.41436767578125, -0.39603424072265625, -0.3777008056640625, -0.35936737060546875, -0.341033935546875, -0.32270050048828125, -0.3043670654296875, -0.28603363037109375, -0.2677001953125, -0.24936676025390625, -0.2310333251953125, -0.21269989013671875, -0.194366455078125, -0.17603302001953125, -0.1576995849609375, -0.13936614990234375, -0.12103271484375, -0.10269927978515625, -0.0843658447265625, -0.06603240966796875, -0.047698974609375, -0.02936553955078125, -0.0110321044921875, 0.00730133056640625, 0.025634765625, 0.04396820068359375, 0.0623016357421875, 0.08063507080078125, 0.098968505859375, 0.11730194091796875, 0.1356353759765625, 0.15396881103515625, 0.17230224609375, 0.19063568115234375, 0.2089691162109375, 0.22730255126953125, 0.245635986328125, 0.26396942138671875, 0.2823028564453125, 0.30063629150390625, 0.3189697265625, 0.33730316162109375, 0.3556365966796875, 0.37397003173828125, 0.392303466796875, 0.41063690185546875, 0.4289703369140625, 0.44730377197265625, 0.46563720703125, 0.48397064208984375, 0.5023040771484375, 0.5206375122070312, 0.538970947265625, 0.5573043823242188, 0.5756378173828125, 0.5939712524414062, 0.6123046875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 4.0, 7.0, 10.0, 7.0, 10.0, 14.0, 19.0, 16.0, 24.0, 22.0, 27.0, 33.0, 28.0, 31.0, 27.0, 34.0, 45.0, 37.0, 38.0, 35.0, 1071.0, 53.0, 35.0, 35.0, 32.0, 37.0, 40.0, 22.0, 44.0, 25.0, 27.0, 19.0, 22.0, 16.0, 24.0, 12.0, 8.0, 7.0, 5.0, 8.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9580078125, -1.8905792236328125, -1.823150634765625, -1.7557220458984375, -1.68829345703125, -1.6208648681640625, -1.553436279296875, -1.4860076904296875, -1.4185791015625, -1.3511505126953125, -1.283721923828125, -1.2162933349609375, -1.14886474609375, -1.0814361572265625, -1.014007568359375, -0.9465789794921875, -0.879150390625, -0.8117218017578125, -0.744293212890625, -0.6768646240234375, -0.60943603515625, -0.5420074462890625, -0.474578857421875, -0.4071502685546875, -0.3397216796875, -0.2722930908203125, -0.204864501953125, -0.1374359130859375, -0.07000732421875, -0.0025787353515625, 0.064849853515625, 0.1322784423828125, 0.19970703125, 0.2671356201171875, 0.334564208984375, 0.4019927978515625, 0.46942138671875, 0.5368499755859375, 0.604278564453125, 0.6717071533203125, 0.7391357421875, 0.8065643310546875, 0.873992919921875, 0.9414215087890625, 1.00885009765625, 1.0762786865234375, 1.143707275390625, 1.2111358642578125, 1.278564453125, 1.3459930419921875, 1.413421630859375, 1.4808502197265625, 1.54827880859375, 1.6157073974609375, 1.683135986328125, 1.7505645751953125, 1.8179931640625, 1.8854217529296875, 1.952850341796875, 2.0202789306640625, 2.08770751953125, 2.1551361083984375, 2.222564697265625, 2.2899932861328125, 2.357421875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 10.0, 8.0, 18.0, 19.0, 32.0, 36.0, 60.0, 88.0, 153.0, 208.0, 296.0, 439.0, 598.0, 921.0, 1348.0, 2080.0, 3006.0, 4395.0, 6460.0, 9573.0, 14339.0, 21239.0, 32352.0, 49679.0, 81903.0, 156438.0, 1326280.0, 156362.0, 81740.0, 49621.0, 32315.0, 21433.0, 14119.0, 9565.0, 6470.0, 4300.0, 2940.0, 1967.0, 1348.0, 966.0, 674.0, 418.0, 299.0, 206.0, 135.0, 95.0, 65.0, 47.0, 25.0, 22.0, 12.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.50537109375, -0.4898223876953125, -0.474273681640625, -0.4587249755859375, -0.44317626953125, -0.4276275634765625, -0.412078857421875, -0.3965301513671875, -0.3809814453125, -0.3654327392578125, -0.349884033203125, -0.3343353271484375, -0.31878662109375, -0.3032379150390625, -0.287689208984375, -0.2721405029296875, -0.256591796875, -0.2410430908203125, -0.225494384765625, -0.2099456787109375, -0.19439697265625, -0.1788482666015625, -0.163299560546875, -0.1477508544921875, -0.1322021484375, -0.1166534423828125, -0.101104736328125, -0.0855560302734375, -0.07000732421875, -0.0544586181640625, -0.038909912109375, -0.0233612060546875, -0.0078125, 0.0077362060546875, 0.023284912109375, 0.0388336181640625, 0.05438232421875, 0.0699310302734375, 0.085479736328125, 0.1010284423828125, 0.1165771484375, 0.1321258544921875, 0.147674560546875, 0.1632232666015625, 0.17877197265625, 0.1943206787109375, 0.209869384765625, 0.2254180908203125, 0.240966796875, 0.2565155029296875, 0.272064208984375, 0.2876129150390625, 0.30316162109375, 0.3187103271484375, 0.334259033203125, 0.3498077392578125, 0.3653564453125, 0.3809051513671875, 0.396453857421875, 0.4120025634765625, 0.42755126953125, 0.4430999755859375, 0.458648681640625, 0.4741973876953125, 0.48974609375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 7.0, 5.0, 10.0, 10.0, 11.0, 15.0, 21.0, 24.0, 31.0, 39.0, 60.0, 69.0, 75.0, 70.0, 88.0, 74.0, 86.0, 60.0, 55.0, 42.0, 29.0, 39.0, 17.0, 19.0, 14.0, 8.0, 6.0, 11.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001627206802368164, -0.0001574549823999405, -0.00015218928456306458, -0.00014692358672618866, -0.00014165788888931274, -0.00013639219105243683, -0.0001311264932155609, -0.000125860795378685, -0.00012059509754180908, -0.00011532939970493317, -0.00011006370186805725, -0.00010479800403118134, -9.953230619430542e-05, -9.42666083574295e-05, -8.900091052055359e-05, -8.373521268367767e-05, -7.846951484680176e-05, -7.320381700992584e-05, -6.793811917304993e-05, -6.267242133617401e-05, -5.7406723499298096e-05, -5.214102566242218e-05, -4.6875327825546265e-05, -4.160962998867035e-05, -3.6343932151794434e-05, -3.107823431491852e-05, -2.5812536478042603e-05, -2.0546838641166687e-05, -1.528114080429077e-05, -1.0015442967414856e-05, -4.7497451305389404e-06, 5.159527063369751e-07, 5.781650543212891e-06, 1.1047348380088806e-05, 1.631304621696472e-05, 2.1578744053840637e-05, 2.6844441890716553e-05, 3.211013972759247e-05, 3.7375837564468384e-05, 4.26415354013443e-05, 4.7907233238220215e-05, 5.317293107509613e-05, 5.8438628911972046e-05, 6.370432674884796e-05, 6.897002458572388e-05, 7.423572242259979e-05, 7.950142025947571e-05, 8.476711809635162e-05, 9.003281593322754e-05, 9.529851377010345e-05, 0.00010056421160697937, 0.00010582990944385529, 0.0001110956072807312, 0.00011636130511760712, 0.00012162700295448303, 0.00012689270079135895, 0.00013215839862823486, 0.00013742409646511078, 0.0001426897943019867, 0.0001479554921388626, 0.00015322118997573853, 0.00015848688781261444, 0.00016375258564949036, 0.00016901828348636627, 0.0001742839813232422]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 8.0, 9.0, 16.0, 22.0, 35.0, 50.0, 54.0, 89.0, 153.0, 262.0, 713.0, 7543.0, 1035717.0, 2586.0, 586.0, 268.0, 130.0, 88.0, 61.0, 43.0, 28.0, 34.0, 15.0, 8.0, 11.0, 9.0, 5.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0037899017333984375, -0.0036764442920684814, -0.0035629868507385254, -0.0034495294094085693, -0.0033360719680786133, -0.0032226145267486572, -0.003109157085418701, -0.002995699644088745, -0.002882242202758789, -0.002768784761428833, -0.002655327320098877, -0.002541869878768921, -0.002428412437438965, -0.002314954996109009, -0.0022014975547790527, -0.0020880401134490967, -0.0019745826721191406, -0.0018611252307891846, -0.0017476677894592285, -0.0016342103481292725, -0.0015207529067993164, -0.0014072954654693604, -0.0012938380241394043, -0.0011803805828094482, -0.0010669231414794922, -0.0009534657001495361, -0.0008400082588195801, -0.000726550817489624, -0.000613093376159668, -0.0004996359348297119, -0.00038617849349975586, -0.0002727210521697998, -0.00015926361083984375, -4.5806169509887695e-05, 6.765127182006836e-05, 0.00018110871315002441, 0.00029456615447998047, 0.0004080235958099365, 0.0005214810371398926, 0.0006349384784698486, 0.0007483959197998047, 0.0008618533611297607, 0.0009753108024597168, 0.0010887682437896729, 0.001202225685119629, 0.001315683126449585, 0.001429140567779541, 0.001542598009109497, 0.0016560554504394531, 0.0017695128917694092, 0.0018829703330993652, 0.0019964277744293213, 0.0021098852157592773, 0.0022233426570892334, 0.0023368000984191895, 0.0024502575397491455, 0.0025637149810791016, 0.0026771724224090576, 0.0027906298637390137, 0.0029040873050689697, 0.0030175447463989258, 0.003131002187728882, 0.003244459629058838, 0.003357917070388794, 0.00347137451171875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 22.0, 99.0, 228.0, 302.0, 239.0, 99.0, 15.0, 10.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.797560202656314e-05, -3.105178984696977e-05, -2.41279776673764e-05, -1.7204167306772433e-05, -1.0280355127179064e-05, -3.356544766575098e-06, 3.5672674130182713e-06, 1.049107959261164e-05, 1.741489177220501e-05, 2.433870395179838e-05, 3.126251613139175e-05, 3.818632831098512e-05, 4.511013685259968e-05, 5.203394903219305e-05, 5.895776121178642e-05, 6.588156975340098e-05, 7.280538557097316e-05, 7.972919411258772e-05, 8.66530099301599e-05, 9.357681847177446e-05, 0.00010050063428934664, 0.0001074244428309612, 0.00011434825137257576, 0.00012127206719014794, 0.0001281958830077201, 0.0001351196988252923, 0.00014204350009094924, 0.00014896731590852141, 0.0001558911317260936, 0.00016281494754366577, 0.00016973874880932271, 0.0001766625646268949, 0.00018358636589255184, 0.00019051018171012402, 0.00019743398297578096, 0.00020435779879335314, 0.00021128161461092532, 0.00021820541587658226, 0.00022512923169415444, 0.00023205304751172662, 0.0002389768633292988, 0.00024590067914687097, 0.0002528244804125279, 0.0002597483107820153, 0.00026667211204767227, 0.0002735959133133292, 0.0002805197436828166, 0.00028744354494847357, 0.0002943673462141305, 0.00030129114747978747, 0.0003082149778492749, 0.0003151387791149318, 0.00032206258038058877, 0.0003289864107500762, 0.0003359102120157331, 0.00034283404238522053, 0.0003497578436508775, 0.0003566816449165344, 0.00036360547528602183, 0.0003705292765516788, 0.0003774530778173357, 0.00038437690818682313, 0.0003913007094524801, 0.000398224510718137, 0.00040514834108762443]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 8.0, 7.0, 7.0, 12.0, 7.0, 16.0, 10.0, 6.0, 13.0, 15.0, 17.0, 26.0, 21.0, 27.0, 45.0, 43.0, 34.0, 40.0, 42.0, 42.0, 33.0, 51.0, 32.0, 41.0, 22.0, 44.0, 39.0, 39.0, 35.0, 35.0, 32.0, 28.0, 20.0, 23.0, 20.0, 12.0, 10.0, 14.0, 10.0, 6.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.257129669189453e-05, -5.047023296356201e-05, -4.836916923522949e-05, -4.626810550689697e-05, -4.416704177856445e-05, -4.2065978050231934e-05, -3.9964914321899414e-05, -3.7863850593566895e-05, -3.5762786865234375e-05, -3.3661723136901855e-05, -3.1560659408569336e-05, -2.9459595680236816e-05, -2.7358531951904297e-05, -2.5257468223571777e-05, -2.3156404495239258e-05, -2.1055340766906738e-05, -1.895427703857422e-05, -1.68532133102417e-05, -1.475214958190918e-05, -1.265108585357666e-05, -1.055002212524414e-05, -8.448958396911621e-06, -6.3478946685791016e-06, -4.246830940246582e-06, -2.1457672119140625e-06, -4.470348358154297e-08, 2.0563602447509766e-06, 4.157423973083496e-06, 6.258487701416016e-06, 8.359551429748535e-06, 1.0460615158081055e-05, 1.2561678886413574e-05, 1.4662742614746094e-05, 1.6763806343078613e-05, 1.8864870071411133e-05, 2.0965933799743652e-05, 2.3066997528076172e-05, 2.516806125640869e-05, 2.726912498474121e-05, 2.937018871307373e-05, 3.147125244140625e-05, 3.357231616973877e-05, 3.567337989807129e-05, 3.777444362640381e-05, 3.987550735473633e-05, 4.197657108306885e-05, 4.407763481140137e-05, 4.617869853973389e-05, 4.8279762268066406e-05, 5.0380825996398926e-05, 5.2481889724731445e-05, 5.4582953453063965e-05, 5.6684017181396484e-05, 5.8785080909729004e-05, 6.0886144638061523e-05, 6.298720836639404e-05, 6.508827209472656e-05, 6.718933582305908e-05, 6.92903995513916e-05, 7.139146327972412e-05, 7.349252700805664e-05, 7.559359073638916e-05, 7.769465446472168e-05, 7.97957181930542e-05, 8.189678192138672e-05]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 9.0, 5.0, 12.0, 8.0, 19.0, 18.0, 23.0, 27.0, 22.0, 30.0, 34.0, 29.0, 38.0, 44.0, 49.0, 49.0, 33.0, 42.0, 53.0, 44.0, 50.0, 37.0, 44.0, 26.0, 37.0, 27.0, 24.0, 34.0, 20.0, 25.0, 14.0, 15.0, 11.0, 10.0, 8.0, 6.0, 8.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.591796875, -3.47906494140625, -3.3663330078125, -3.25360107421875, -3.140869140625, -3.02813720703125, -2.9154052734375, -2.80267333984375, -2.68994140625, -2.57720947265625, -2.4644775390625, -2.35174560546875, -2.239013671875, -2.12628173828125, -2.0135498046875, -1.90081787109375, -1.7880859375, -1.67535400390625, -1.5626220703125, -1.44989013671875, -1.337158203125, -1.22442626953125, -1.1116943359375, -0.99896240234375, -0.88623046875, -0.77349853515625, -0.6607666015625, -0.54803466796875, -0.435302734375, -0.32257080078125, -0.2098388671875, -0.09710693359375, 0.015625, 0.12835693359375, 0.2410888671875, 0.35382080078125, 0.466552734375, 0.57928466796875, 0.6920166015625, 0.80474853515625, 0.91748046875, 1.03021240234375, 1.1429443359375, 1.25567626953125, 1.368408203125, 1.48114013671875, 1.5938720703125, 1.70660400390625, 1.8193359375, 1.93206787109375, 2.0447998046875, 2.15753173828125, 2.270263671875, 2.38299560546875, 2.4957275390625, 2.60845947265625, 2.72119140625, 2.83392333984375, 2.9466552734375, 3.05938720703125, 3.172119140625, 3.28485107421875, 3.3975830078125, 3.51031494140625, 3.623046875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 9.0, 13.0, 16.0, 32.0, 41.0, 56.0, 89.0, 136.0, 217.0, 379.0, 672.0, 1432.0, 3494.0, 9328.0, 25098.0, 66703.0, 179319.0, 394431.0, 230284.0, 84595.0, 32163.0, 11969.0, 4402.0, 1778.0, 822.0, 409.0, 239.0, 149.0, 93.0, 59.0, 44.0, 33.0, 14.0, 13.0, 7.0, 7.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.5, -3.373291015625, -3.24658203125, -3.119873046875, -2.9931640625, -2.866455078125, -2.73974609375, -2.613037109375, -2.486328125, -2.359619140625, -2.23291015625, -2.106201171875, -1.9794921875, -1.852783203125, -1.72607421875, -1.599365234375, -1.47265625, -1.345947265625, -1.21923828125, -1.092529296875, -0.9658203125, -0.839111328125, -0.71240234375, -0.585693359375, -0.458984375, -0.332275390625, -0.20556640625, -0.078857421875, 0.0478515625, 0.174560546875, 0.30126953125, 0.427978515625, 0.5546875, 0.681396484375, 0.80810546875, 0.934814453125, 1.0615234375, 1.188232421875, 1.31494140625, 1.441650390625, 1.568359375, 1.695068359375, 1.82177734375, 1.948486328125, 2.0751953125, 2.201904296875, 2.32861328125, 2.455322265625, 2.58203125, 2.708740234375, 2.83544921875, 2.962158203125, 3.0888671875, 3.215576171875, 3.34228515625, 3.468994140625, 3.595703125, 3.722412109375, 3.84912109375, 3.975830078125, 4.1025390625, 4.229248046875, 4.35595703125, 4.482666015625, 4.609375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 3.0, 7.0, 8.0, 11.0, 13.0, 12.0, 21.0, 20.0, 28.0, 39.0, 32.0, 45.0, 47.0, 57.0, 103.0, 273.0, 1613.0, 222.0, 88.0, 70.0, 49.0, 44.0, 47.0, 39.0, 38.0, 26.0, 20.0, 15.0, 11.0, 10.0, 10.0, 6.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.0, -13.5408935546875, -13.081787109375, -12.6226806640625, -12.16357421875, -11.7044677734375, -11.245361328125, -10.7862548828125, -10.3271484375, -9.8680419921875, -9.408935546875, -8.9498291015625, -8.49072265625, -8.0316162109375, -7.572509765625, -7.1134033203125, -6.654296875, -6.1951904296875, -5.736083984375, -5.2769775390625, -4.81787109375, -4.3587646484375, -3.899658203125, -3.4405517578125, -2.9814453125, -2.5223388671875, -2.063232421875, -1.6041259765625, -1.14501953125, -0.6859130859375, -0.226806640625, 0.2322998046875, 0.69140625, 1.1505126953125, 1.609619140625, 2.0687255859375, 2.52783203125, 2.9869384765625, 3.446044921875, 3.9051513671875, 4.3642578125, 4.8233642578125, 5.282470703125, 5.7415771484375, 6.20068359375, 6.6597900390625, 7.118896484375, 7.5780029296875, 8.037109375, 8.4962158203125, 8.955322265625, 9.4144287109375, 9.87353515625, 10.3326416015625, 10.791748046875, 11.2508544921875, 11.7099609375, 12.1690673828125, 12.628173828125, 13.0872802734375, 13.54638671875, 14.0054931640625, 14.464599609375, 14.9237060546875, 15.3828125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 3.0, 8.0, 10.0, 14.0, 23.0, 22.0, 39.0, 41.0, 70.0, 94.0, 138.0, 210.0, 462.0, 1612.0, 2845950.0, 294976.0, 1109.0, 362.0, 173.0, 111.0, 71.0, 59.0, 42.0, 31.0, 17.0, 13.0, 13.0, 13.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.6875, -51.0859375, -49.484375, -47.8828125, -46.28125, -44.6796875, -43.078125, -41.4765625, -39.875, -38.2734375, -36.671875, -35.0703125, -33.46875, -31.8671875, -30.265625, -28.6640625, -27.0625, -25.4609375, -23.859375, -22.2578125, -20.65625, -19.0546875, -17.453125, -15.8515625, -14.25, -12.6484375, -11.046875, -9.4453125, -7.84375, -6.2421875, -4.640625, -3.0390625, -1.4375, 0.1640625, 1.765625, 3.3671875, 4.96875, 6.5703125, 8.171875, 9.7734375, 11.375, 12.9765625, 14.578125, 16.1796875, 17.78125, 19.3828125, 20.984375, 22.5859375, 24.1875, 25.7890625, 27.390625, 28.9921875, 30.59375, 32.1953125, 33.796875, 35.3984375, 37.0, 38.6015625, 40.203125, 41.8046875, 43.40625, 45.0078125, 46.609375, 48.2109375, 49.8125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [242.0, 773.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.701264381408691, -1.5497503280639648, 5.601763725280762, 12.753277778625488, 19.90479278564453, 27.056304931640625, 34.207820892333984, 41.359336853027344, 48.51084899902344, 55.66236114501953, 62.81387710571289, 69.96539306640625, 77.11690521240234, 84.26841735839844, 91.41993713378906, 98.57144927978516, 105.72296142578125, 112.87447357177734, 120.02598571777344, 127.17750549316406, 134.32901000976562, 141.48052978515625, 148.63204956054688, 155.7835693359375, 162.93507385253906, 170.0865936279297, 177.23809814453125, 184.38961791992188, 191.5411376953125, 198.69264221191406, 205.8441619873047, 212.99566650390625, 220.14718627929688, 227.2987060546875, 234.45021057128906, 241.6017303466797, 248.75323486328125, 255.90475463867188, 263.0562744140625, 270.2077941894531, 277.35931396484375, 284.5108337402344, 291.662353515625, 298.8138427734375, 305.9653625488281, 313.11688232421875, 320.2684020996094, 327.419921875, 334.5714111328125, 341.7229309082031, 348.87445068359375, 356.02593994140625, 363.1774597167969, 370.3289794921875, 377.4804992675781, 384.63201904296875, 391.78350830078125, 398.9350280761719, 406.0865478515625, 413.238037109375, 420.3895568847656, 427.54107666015625, 434.6925964355469, 441.8441162109375, 448.9956359863281]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 8.0, 11.0, 5.0, 14.0, 14.0, 15.0, 21.0, 27.0, 21.0, 28.0, 22.0, 32.0, 37.0, 26.0, 41.0, 50.0, 41.0, 53.0, 33.0, 43.0, 37.0, 34.0, 26.0, 34.0, 43.0, 40.0, 41.0, 30.0, 28.0, 19.0, 19.0, 14.0, 11.0, 16.0, 17.0, 12.0, 10.0, 12.0, 5.0, 3.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.32056427001953, -38.190773010253906, -37.06098175048828, -35.93118667602539, -34.801395416259766, -33.67160415649414, -32.541812896728516, -31.41202163696289, -30.282228469848633, -29.152437210083008, -28.02264404296875, -26.892852783203125, -25.7630615234375, -24.633268356323242, -23.503477096557617, -22.37368392944336, -21.243892669677734, -20.11410140991211, -18.98430824279785, -17.854516983032227, -16.72472381591797, -15.594932556152344, -14.465141296386719, -13.335349082946777, -12.205556869506836, -11.075764656066895, -9.945972442626953, -8.816181182861328, -7.686388969421387, -6.556596755981445, -5.426805019378662, -4.297013282775879, -3.167217254638672, -2.0374252796173096, -0.9076333045959473, 0.22215867042541504, 1.3519506454467773, 2.4817428588867188, 3.611534595489502, 4.741326332092285, 5.871118545532227, 7.000910758972168, 8.13070297241211, 9.260494232177734, 10.390286445617676, 11.520078659057617, 12.649869918823242, 13.779662132263184, 14.909454345703125, 16.03924560546875, 17.169038772583008, 18.298830032348633, 19.42862319946289, 20.558414459228516, 21.68820571899414, 22.817996978759766, 23.947790145874023, 25.07758140563965, 26.207374572753906, 27.33716583251953, 28.466957092285156, 29.596750259399414, 30.72654151916504, 31.856334686279297, 32.98612594604492]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 6.0, 4.0, 7.0, 4.0, 9.0, 15.0, 13.0, 21.0, 16.0, 21.0, 21.0, 21.0, 32.0, 41.0, 44.0, 43.0, 43.0, 35.0, 35.0, 43.0, 48.0, 39.0, 47.0, 30.0, 49.0, 39.0, 36.0, 35.0, 31.0, 33.0, 28.0, 16.0, 14.0, 12.0, 17.0, 14.0, 7.0, 6.0, 11.0, 6.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.125, -3.998046875, -3.87109375, -3.744140625, -3.6171875, -3.490234375, -3.36328125, -3.236328125, -3.109375, -2.982421875, -2.85546875, -2.728515625, -2.6015625, -2.474609375, -2.34765625, -2.220703125, -2.09375, -1.966796875, -1.83984375, -1.712890625, -1.5859375, -1.458984375, -1.33203125, -1.205078125, -1.078125, -0.951171875, -0.82421875, -0.697265625, -0.5703125, -0.443359375, -0.31640625, -0.189453125, -0.0625, 0.064453125, 0.19140625, 0.318359375, 0.4453125, 0.572265625, 0.69921875, 0.826171875, 0.953125, 1.080078125, 1.20703125, 1.333984375, 1.4609375, 1.587890625, 1.71484375, 1.841796875, 1.96875, 2.095703125, 2.22265625, 2.349609375, 2.4765625, 2.603515625, 2.73046875, 2.857421875, 2.984375, 3.111328125, 3.23828125, 3.365234375, 3.4921875, 3.619140625, 3.74609375, 3.873046875, 4.0]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 11.0, 9.0, 10.0, 15.0, 18.0, 15.0, 22.0, 25.0, 18.0, 33.0, 48.0, 48.0, 76.0, 131.0, 381.0, 1410.0, 11417.0, 523601.0, 3307037.0, 340126.0, 7977.0, 1084.0, 301.0, 131.0, 58.0, 51.0, 31.0, 26.0, 20.0, 26.0, 23.0, 13.0, 13.0, 17.0, 8.0, 3.0, 10.0, 5.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.125, -12.720458984375, -12.31591796875, -11.911376953125, -11.5068359375, -11.102294921875, -10.69775390625, -10.293212890625, -9.888671875, -9.484130859375, -9.07958984375, -8.675048828125, -8.2705078125, -7.865966796875, -7.46142578125, -7.056884765625, -6.65234375, -6.247802734375, -5.84326171875, -5.438720703125, -5.0341796875, -4.629638671875, -4.22509765625, -3.820556640625, -3.416015625, -3.011474609375, -2.60693359375, -2.202392578125, -1.7978515625, -1.393310546875, -0.98876953125, -0.584228515625, -0.1796875, 0.224853515625, 0.62939453125, 1.033935546875, 1.4384765625, 1.843017578125, 2.24755859375, 2.652099609375, 3.056640625, 3.461181640625, 3.86572265625, 4.270263671875, 4.6748046875, 5.079345703125, 5.48388671875, 5.888427734375, 6.29296875, 6.697509765625, 7.10205078125, 7.506591796875, 7.9111328125, 8.315673828125, 8.72021484375, 9.124755859375, 9.529296875, 9.933837890625, 10.33837890625, 10.742919921875, 11.1474609375, 11.552001953125, 11.95654296875, 12.361083984375, 12.765625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 10.0, 7.0, 6.0, 12.0, 22.0, 42.0, 62.0, 83.0, 130.0, 198.0, 286.0, 365.0, 538.0, 559.0, 515.0, 372.0, 266.0, 202.0, 123.0, 78.0, 70.0, 36.0, 35.0, 16.0, 11.0, 10.0, 5.0, 6.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.71875, -8.4124755859375, -8.106201171875, -7.7999267578125, -7.49365234375, -7.1873779296875, -6.881103515625, -6.5748291015625, -6.2685546875, -5.9622802734375, -5.656005859375, -5.3497314453125, -5.04345703125, -4.7371826171875, -4.430908203125, -4.1246337890625, -3.818359375, -3.5120849609375, -3.205810546875, -2.8995361328125, -2.59326171875, -2.2869873046875, -1.980712890625, -1.6744384765625, -1.3681640625, -1.0618896484375, -0.755615234375, -0.4493408203125, -0.14306640625, 0.1632080078125, 0.469482421875, 0.7757568359375, 1.08203125, 1.3883056640625, 1.694580078125, 2.0008544921875, 2.30712890625, 2.6134033203125, 2.919677734375, 3.2259521484375, 3.5322265625, 3.8385009765625, 4.144775390625, 4.4510498046875, 4.75732421875, 5.0635986328125, 5.369873046875, 5.6761474609375, 5.982421875, 6.2886962890625, 6.594970703125, 6.9012451171875, 7.20751953125, 7.5137939453125, 7.820068359375, 8.1263427734375, 8.4326171875, 8.7388916015625, 9.045166015625, 9.3514404296875, 9.65771484375, 9.9639892578125, 10.270263671875, 10.5765380859375, 10.8828125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 6.0, 6.0, 14.0, 21.0, 16.0, 37.0, 58.0, 90.0, 114.0, 162.0, 273.0, 385.0, 777.0, 9814.0, 3827696.0, 351404.0, 1916.0, 515.0, 302.0, 200.0, 169.0, 104.0, 67.0, 46.0, 27.0, 17.0, 15.0, 9.0, 12.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-38.59375, -37.5146484375, -36.435546875, -35.3564453125, -34.27734375, -33.1982421875, -32.119140625, -31.0400390625, -29.9609375, -28.8818359375, -27.802734375, -26.7236328125, -25.64453125, -24.5654296875, -23.486328125, -22.4072265625, -21.328125, -20.2490234375, -19.169921875, -18.0908203125, -17.01171875, -15.9326171875, -14.853515625, -13.7744140625, -12.6953125, -11.6162109375, -10.537109375, -9.4580078125, -8.37890625, -7.2998046875, -6.220703125, -5.1416015625, -4.0625, -2.9833984375, -1.904296875, -0.8251953125, 0.25390625, 1.3330078125, 2.412109375, 3.4912109375, 4.5703125, 5.6494140625, 6.728515625, 7.8076171875, 8.88671875, 9.9658203125, 11.044921875, 12.1240234375, 13.203125, 14.2822265625, 15.361328125, 16.4404296875, 17.51953125, 18.5986328125, 19.677734375, 20.7568359375, 21.8359375, 22.9150390625, 23.994140625, 25.0732421875, 26.15234375, 27.2314453125, 28.310546875, 29.3896484375, 30.46875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0, 232.0, 594.0, 172.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.4194793701172, -152.83926391601562, -147.25904846191406, -141.6788330078125, -136.09861755371094, -130.51840209960938, -124.93819427490234, -119.35797882080078, -113.77776336669922, -108.19754791259766, -102.6173324584961, -97.03712463378906, -91.4569091796875, -85.87669372558594, -80.29647827148438, -74.71626281738281, -69.13604736328125, -63.55583190917969, -57.975616455078125, -52.39540481567383, -46.815189361572266, -41.2349739074707, -35.654762268066406, -30.074546813964844, -24.49433135986328, -18.91411590576172, -13.333902359008789, -7.753688812255859, -2.173473358154297, 3.4067420959472656, 8.986953735351562, 14.567169189453125, 20.147369384765625, 25.727584838867188, 31.307798385620117, 36.88801193237305, 42.46822738647461, 48.04844284057617, 53.62865447998047, 59.20886993408203, 64.7890853881836, 70.36930084228516, 75.94951629638672, 81.52972412109375, 87.10993957519531, 92.69015502929688, 98.27037048339844, 103.8505859375, 109.43080139160156, 115.01101684570312, 120.59123229980469, 126.17144775390625, 131.7516632080078, 137.33187866210938, 142.91207885742188, 148.4923095703125, 154.072509765625, 159.65272521972656, 165.23294067382812, 170.8131561279297, 176.39337158203125, 181.9735870361328, 187.55380249023438, 193.13400268554688, 198.7142333984375]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 5.0, 7.0, 12.0, 8.0, 9.0, 16.0, 13.0, 17.0, 18.0, 26.0, 24.0, 26.0, 30.0, 27.0, 41.0, 40.0, 36.0, 39.0, 37.0, 45.0, 50.0, 47.0, 38.0, 37.0, 42.0, 40.0, 34.0, 27.0, 28.0, 25.0, 23.0, 23.0, 23.0, 10.0, 11.0, 15.0, 10.0, 14.0, 5.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.617599487304688, -24.805749893188477, -23.993900299072266, -23.182048797607422, -22.37019920349121, -21.558349609375, -20.74650001525879, -19.934650421142578, -19.122798919677734, -18.310949325561523, -17.499099731445312, -16.68724822998047, -15.875398635864258, -15.063549041748047, -14.251699447631836, -13.439849853515625, -12.628000259399414, -11.816150665283203, -11.004300117492676, -10.192450523376465, -9.380599975585938, -8.568750381469727, -7.756900787353516, -6.9450507164001465, -6.133200645446777, -5.321350574493408, -4.509500503540039, -3.697650909423828, -2.885800838470459, -2.07395076751709, -1.262101173400879, -0.45025110244750977, 0.3616008758544922, 1.1734508275985718, 1.9853007793426514, 2.7971506118774414, 3.6090006828308105, 4.42085075378418, 5.232700347900391, 6.04455041885376, 6.856400489807129, 7.668250560760498, 8.480100631713867, 9.291950225830078, 10.103799819946289, 10.915650367736816, 11.727499961853027, 12.539350509643555, 13.351200103759766, 14.163049697875977, 14.974900245666504, 15.786749839782715, 16.598600387573242, 17.410449981689453, 18.222299575805664, 19.034149169921875, 19.84600067138672, 20.65785026550293, 21.46969985961914, 22.281551361083984, 23.093400955200195, 23.905250549316406, 24.717100143432617, 25.528949737548828, 26.34079933166504]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 6.0, 5.0, 4.0, 9.0, 7.0, 5.0, 18.0, 10.0, 15.0, 23.0, 23.0, 23.0, 24.0, 30.0, 29.0, 33.0, 38.0, 46.0, 40.0, 30.0, 54.0, 46.0, 43.0, 38.0, 45.0, 43.0, 33.0, 37.0, 39.0, 38.0, 26.0, 19.0, 9.0, 16.0, 21.0, 15.0, 11.0, 8.0, 14.0, 12.0, 4.0, 5.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8984375, -3.78204345703125, -3.6656494140625, -3.54925537109375, -3.432861328125, -3.31646728515625, -3.2000732421875, -3.08367919921875, -2.96728515625, -2.85089111328125, -2.7344970703125, -2.61810302734375, -2.501708984375, -2.38531494140625, -2.2689208984375, -2.15252685546875, -2.0361328125, -1.91973876953125, -1.8033447265625, -1.68695068359375, -1.570556640625, -1.45416259765625, -1.3377685546875, -1.22137451171875, -1.10498046875, -0.98858642578125, -0.8721923828125, -0.75579833984375, -0.639404296875, -0.52301025390625, -0.4066162109375, -0.29022216796875, -0.173828125, -0.05743408203125, 0.0589599609375, 0.17535400390625, 0.291748046875, 0.40814208984375, 0.5245361328125, 0.64093017578125, 0.75732421875, 0.87371826171875, 0.9901123046875, 1.10650634765625, 1.222900390625, 1.33929443359375, 1.4556884765625, 1.57208251953125, 1.6884765625, 1.80487060546875, 1.9212646484375, 2.03765869140625, 2.154052734375, 2.27044677734375, 2.3868408203125, 2.50323486328125, 2.61962890625, 2.73602294921875, 2.8524169921875, 2.96881103515625, 3.085205078125, 3.20159912109375, 3.3179931640625, 3.43438720703125, 3.55078125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 11.0, 11.0, 22.0, 31.0, 36.0, 54.0, 74.0, 113.0, 163.0, 230.0, 352.0, 511.0, 711.0, 992.0, 1471.0, 2058.0, 3092.0, 4357.0, 6194.0, 9273.0, 13450.0, 20537.0, 31857.0, 51407.0, 89186.0, 176059.0, 283937.0, 144756.0, 76359.0, 45400.0, 28111.0, 18476.0, 12333.0, 8357.0, 5685.0, 3894.0, 2703.0, 1873.0, 1284.0, 922.0, 686.0, 468.0, 345.0, 220.0, 149.0, 114.0, 78.0, 46.0, 42.0, 31.0, 7.0, 14.0, 8.0, 4.0, 0.0, 2.0, 1.0], "bins": [-0.6064453125, -0.5882720947265625, -0.570098876953125, -0.5519256591796875, -0.53375244140625, -0.5155792236328125, -0.497406005859375, -0.4792327880859375, -0.4610595703125, -0.4428863525390625, -0.424713134765625, -0.4065399169921875, -0.38836669921875, -0.3701934814453125, -0.352020263671875, -0.3338470458984375, -0.315673828125, -0.2975006103515625, -0.279327392578125, -0.2611541748046875, -0.24298095703125, -0.2248077392578125, -0.206634521484375, -0.1884613037109375, -0.1702880859375, -0.1521148681640625, -0.133941650390625, -0.1157684326171875, -0.09759521484375, -0.0794219970703125, -0.061248779296875, -0.0430755615234375, -0.02490234375, -0.0067291259765625, 0.011444091796875, 0.0296173095703125, 0.04779052734375, 0.0659637451171875, 0.084136962890625, 0.1023101806640625, 0.1204833984375, 0.1386566162109375, 0.156829833984375, 0.1750030517578125, 0.19317626953125, 0.2113494873046875, 0.229522705078125, 0.2476959228515625, 0.265869140625, 0.2840423583984375, 0.302215576171875, 0.3203887939453125, 0.33856201171875, 0.3567352294921875, 0.374908447265625, 0.3930816650390625, 0.4112548828125, 0.4294281005859375, 0.447601318359375, 0.4657745361328125, 0.48394775390625, 0.5021209716796875, 0.520294189453125, 0.5384674072265625, 0.556640625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 8.0, 9.0, 8.0, 13.0, 6.0, 15.0, 12.0, 24.0, 16.0, 19.0, 17.0, 28.0, 22.0, 39.0, 25.0, 28.0, 34.0, 43.0, 41.0, 38.0, 1061.0, 36.0, 40.0, 46.0, 31.0, 44.0, 35.0, 26.0, 42.0, 38.0, 22.0, 21.0, 18.0, 21.0, 15.0, 21.0, 9.0, 10.0, 13.0, 11.0, 2.0, 6.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.158203125, -2.088470458984375, -2.01873779296875, -1.949005126953125, -1.8792724609375, -1.809539794921875, -1.73980712890625, -1.670074462890625, -1.600341796875, -1.530609130859375, -1.46087646484375, -1.391143798828125, -1.3214111328125, -1.251678466796875, -1.18194580078125, -1.112213134765625, -1.04248046875, -0.972747802734375, -0.90301513671875, -0.833282470703125, -0.7635498046875, -0.693817138671875, -0.62408447265625, -0.554351806640625, -0.484619140625, -0.414886474609375, -0.34515380859375, -0.275421142578125, -0.2056884765625, -0.135955810546875, -0.06622314453125, 0.003509521484375, 0.0732421875, 0.142974853515625, 0.21270751953125, 0.282440185546875, 0.3521728515625, 0.421905517578125, 0.49163818359375, 0.561370849609375, 0.631103515625, 0.700836181640625, 0.77056884765625, 0.840301513671875, 0.9100341796875, 0.979766845703125, 1.04949951171875, 1.119232177734375, 1.18896484375, 1.258697509765625, 1.32843017578125, 1.398162841796875, 1.4678955078125, 1.537628173828125, 1.60736083984375, 1.677093505859375, 1.746826171875, 1.816558837890625, 1.88629150390625, 1.956024169921875, 2.0257568359375, 2.095489501953125, 2.16522216796875, 2.234954833984375, 2.3046875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 14.0, 11.0, 10.0, 22.0, 28.0, 49.0, 57.0, 99.0, 122.0, 168.0, 248.0, 354.0, 539.0, 728.0, 1063.0, 1507.0, 2031.0, 2870.0, 4194.0, 5664.0, 8085.0, 11297.0, 16352.0, 23637.0, 34971.0, 53150.0, 87596.0, 163476.0, 1304221.0, 142133.0, 77933.0, 48841.0, 32228.0, 21839.0, 14966.0, 10609.0, 7468.0, 5277.0, 3740.0, 2751.0, 1903.0, 1414.0, 997.0, 704.0, 522.0, 362.0, 264.0, 184.0, 139.0, 89.0, 72.0, 41.0, 32.0, 33.0, 13.0, 10.0, 6.0, 2.0, 5.0, 3.0], "bins": [-0.494384765625, -0.4791259765625, -0.4638671875, -0.4486083984375, -0.433349609375, -0.4180908203125, -0.40283203125, -0.3875732421875, -0.372314453125, -0.3570556640625, -0.341796875, -0.3265380859375, -0.311279296875, -0.2960205078125, -0.28076171875, -0.2655029296875, -0.250244140625, -0.2349853515625, -0.2197265625, -0.2044677734375, -0.189208984375, -0.1739501953125, -0.15869140625, -0.1434326171875, -0.128173828125, -0.1129150390625, -0.09765625, -0.0823974609375, -0.067138671875, -0.0518798828125, -0.03662109375, -0.0213623046875, -0.006103515625, 0.0091552734375, 0.0244140625, 0.0396728515625, 0.054931640625, 0.0701904296875, 0.08544921875, 0.1007080078125, 0.115966796875, 0.1312255859375, 0.146484375, 0.1617431640625, 0.177001953125, 0.1922607421875, 0.20751953125, 0.2227783203125, 0.238037109375, 0.2532958984375, 0.2685546875, 0.2838134765625, 0.299072265625, 0.3143310546875, 0.32958984375, 0.3448486328125, 0.360107421875, 0.3753662109375, 0.390625, 0.4058837890625, 0.421142578125, 0.4364013671875, 0.45166015625, 0.4669189453125, 0.482177734375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 6.0, 6.0, 6.0, 5.0, 5.0, 7.0, 8.0, 16.0, 17.0, 23.0, 46.0, 32.0, 43.0, 49.0, 51.0, 63.0, 60.0, 80.0, 62.0, 59.0, 63.0, 53.0, 50.0, 38.0, 28.0, 29.0, 23.0, 20.0, 12.0, 8.0, 10.0, 5.0, 4.0, 1.0, 3.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00012958049774169922, -0.00012500397861003876, -0.0001204274594783783, -0.00011585094034671783, -0.00011127442121505737, -0.00010669790208339691, -0.00010212138295173645, -9.754486382007599e-05, -9.296834468841553e-05, -8.839182555675507e-05, -8.38153064250946e-05, -7.923878729343414e-05, -7.466226816177368e-05, -7.008574903011322e-05, -6.550922989845276e-05, -6.09327107667923e-05, -5.6356191635131836e-05, -5.1779672503471375e-05, -4.720315337181091e-05, -4.262663424015045e-05, -3.805011510848999e-05, -3.347359597682953e-05, -2.8897076845169067e-05, -2.4320557713508606e-05, -1.9744038581848145e-05, -1.5167519450187683e-05, -1.0591000318527222e-05, -6.01448118686676e-06, -1.4379620552062988e-06, 3.1385570764541626e-06, 7.715076208114624e-06, 1.2291595339775085e-05, 1.6868114471435547e-05, 2.1444633603096008e-05, 2.602115273475647e-05, 3.059767186641693e-05, 3.517419099807739e-05, 3.9750710129737854e-05, 4.4327229261398315e-05, 4.890374839305878e-05, 5.348026752471924e-05, 5.80567866563797e-05, 6.263330578804016e-05, 6.720982491970062e-05, 7.178634405136108e-05, 7.636286318302155e-05, 8.093938231468201e-05, 8.551590144634247e-05, 9.009242057800293e-05, 9.466893970966339e-05, 9.924545884132385e-05, 0.00010382197797298431, 0.00010839849710464478, 0.00011297501623630524, 0.0001175515353679657, 0.00012212805449962616, 0.00012670457363128662, 0.00013128109276294708, 0.00013585761189460754, 0.000140434131026268, 0.00014501065015792847, 0.00014958716928958893, 0.0001541636884212494, 0.00015874020755290985, 0.0001633167266845703]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 3.0, 8.0, 16.0, 16.0, 27.0, 26.0, 32.0, 41.0, 70.0, 99.0, 131.0, 217.0, 368.0, 1119.0, 209194.0, 834384.0, 1637.0, 467.0, 229.0, 120.0, 86.0, 56.0, 58.0, 32.0, 24.0, 18.0, 16.0, 12.0, 4.0, 8.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0035247802734375, -0.00342714786529541, -0.0033295154571533203, -0.0032318830490112305, -0.0031342506408691406, -0.0030366182327270508, -0.002938985824584961, -0.002841353416442871, -0.0027437210083007812, -0.0026460886001586914, -0.0025484561920166016, -0.0024508237838745117, -0.002353191375732422, -0.002255558967590332, -0.002157926559448242, -0.0020602941513061523, -0.0019626617431640625, -0.0018650293350219727, -0.0017673969268798828, -0.001669764518737793, -0.0015721321105957031, -0.0014744997024536133, -0.0013768672943115234, -0.0012792348861694336, -0.0011816024780273438, -0.001083970069885254, -0.000986337661743164, -0.0008887052536010742, -0.0007910728454589844, -0.0006934404373168945, -0.0005958080291748047, -0.0004981756210327148, -0.000400543212890625, -0.00030291080474853516, -0.0002052783966064453, -0.00010764598846435547, -1.0013580322265625e-05, 8.761882781982422e-05, 0.00018525123596191406, 0.0002828836441040039, 0.00038051605224609375, 0.0004781484603881836, 0.0005757808685302734, 0.0006734132766723633, 0.0007710456848144531, 0.000868678092956543, 0.0009663105010986328, 0.0010639429092407227, 0.0011615753173828125, 0.0012592077255249023, 0.0013568401336669922, 0.001454472541809082, 0.0015521049499511719, 0.0016497373580932617, 0.0017473697662353516, 0.0018450021743774414, 0.0019426345825195312, 0.002040266990661621, 0.002137899398803711, 0.0022355318069458008, 0.0023331642150878906, 0.0024307966232299805, 0.0025284290313720703, 0.00262606143951416, 0.00272369384765625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 10.0, 38.0, 159.0, 275.0, 277.0, 157.0, 70.0, 16.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016755824617575854, -0.00016060580674093217, -0.0001536533673061058, -0.00014670092787127942, -0.00013974847388453782, -0.00013279603444971144, -0.00012584359501488507, -0.0001188911555800587, -0.00011193871614523232, -0.00010498627671040595, -9.803383727557957e-05, -9.108139056479558e-05, -8.412895112996921e-05, -7.717651169514284e-05, -7.022406498435885e-05, -6.327162554953247e-05, -5.63191861147061e-05, -4.9366746679879725e-05, -4.2414303607074544e-05, -3.546186053426936e-05, -2.850942109944299e-05, -2.1556981664616615e-05, -1.4604538591811433e-05, -7.652095519006252e-06, -6.996560841798782e-07, 6.252785169635899e-06, 1.3205226423451677e-05, 2.0157667677267455e-05, 2.7110108931083232e-05, 3.4062548365909606e-05, 4.101499143871479e-05, 4.796743451151997e-05, 5.491988849826157e-05, 6.187232793308794e-05, 6.882476736791432e-05, 7.577721407869831e-05, 8.272965351352468e-05, 8.968209294835106e-05, 9.663453965913504e-05, 0.00010358697909396142, 0.00011053941852878779, 0.00011749185796361417, 0.00012444429739844054, 0.00013139673683326691, 0.00013834919082000852, 0.0001453016302548349, 0.00015225406968966126, 0.00015920650912448764, 0.000166158948559314, 0.0001731113879941404, 0.00018006382742896676, 0.00018701626686379313, 0.0001939687062986195, 0.00020092114573344588, 0.00020787359972018749, 0.00021482603915501386, 0.00022177847858984023, 0.0002287309180246666, 0.00023568335745949298, 0.00024263579689431936, 0.00024958825088106096, 0.00025654069031588733, 0.0002634931297507137, 0.0002704455691855401, 0.00027739800862036645]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 3.0, 6.0, 4.0, 6.0, 3.0, 10.0, 7.0, 18.0, 14.0, 12.0, 19.0, 38.0, 17.0, 25.0, 24.0, 33.0, 39.0, 48.0, 32.0, 38.0, 31.0, 37.0, 50.0, 47.0, 40.0, 36.0, 32.0, 29.0, 31.0, 33.0, 25.0, 28.0, 26.0, 19.0, 17.0, 22.0, 12.0, 9.0, 18.0, 13.0, 7.0, 8.0, 3.0, 8.0, 5.0, 11.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.538629531860352e-05, -6.334111094474792e-05, -6.129592657089233e-05, -5.925074219703674e-05, -5.720555782318115e-05, -5.516037344932556e-05, -5.311518907546997e-05, -5.107000470161438e-05, -4.902482032775879e-05, -4.69796359539032e-05, -4.493445158004761e-05, -4.2889267206192017e-05, -4.0844082832336426e-05, -3.8798898458480835e-05, -3.6753714084625244e-05, -3.470852971076965e-05, -3.266334533691406e-05, -3.061816096305847e-05, -2.857297658920288e-05, -2.652779221534729e-05, -2.44826078414917e-05, -2.243742346763611e-05, -2.0392239093780518e-05, -1.8347054719924927e-05, -1.6301870346069336e-05, -1.4256685972213745e-05, -1.2211501598358154e-05, -1.0166317224502563e-05, -8.121132850646973e-06, -6.075948476791382e-06, -4.030764102935791e-06, -1.9855797290802e-06, 5.960464477539063e-08, 2.1047890186309814e-06, 4.149973392486572e-06, 6.195157766342163e-06, 8.240342140197754e-06, 1.0285526514053345e-05, 1.2330710887908936e-05, 1.4375895261764526e-05, 1.6421079635620117e-05, 1.8466264009475708e-05, 2.05114483833313e-05, 2.255663275718689e-05, 2.460181713104248e-05, 2.664700150489807e-05, 2.8692185878753662e-05, 3.073737025260925e-05, 3.2782554626464844e-05, 3.4827739000320435e-05, 3.6872923374176025e-05, 3.8918107748031616e-05, 4.096329212188721e-05, 4.30084764957428e-05, 4.505366086959839e-05, 4.709884524345398e-05, 4.914402961730957e-05, 5.118921399116516e-05, 5.323439836502075e-05, 5.527958273887634e-05, 5.7324767112731934e-05, 5.9369951486587524e-05, 6.141513586044312e-05, 6.34603202342987e-05, 6.55055046081543e-05]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 6.0, 5.0, 4.0, 9.0, 7.0, 5.0, 18.0, 10.0, 15.0, 23.0, 23.0, 23.0, 24.0, 30.0, 29.0, 33.0, 38.0, 46.0, 40.0, 30.0, 54.0, 46.0, 43.0, 38.0, 45.0, 43.0, 33.0, 37.0, 39.0, 38.0, 26.0, 19.0, 9.0, 16.0, 21.0, 15.0, 11.0, 8.0, 14.0, 12.0, 4.0, 5.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8984375, -3.78204345703125, -3.6656494140625, -3.54925537109375, -3.432861328125, -3.31646728515625, -3.2000732421875, -3.08367919921875, -2.96728515625, -2.85089111328125, -2.7344970703125, -2.61810302734375, -2.501708984375, -2.38531494140625, -2.2689208984375, -2.15252685546875, -2.0361328125, -1.91973876953125, -1.8033447265625, -1.68695068359375, -1.570556640625, -1.45416259765625, -1.3377685546875, -1.22137451171875, -1.10498046875, -0.98858642578125, -0.8721923828125, -0.75579833984375, -0.639404296875, -0.52301025390625, -0.4066162109375, -0.29022216796875, -0.173828125, -0.05743408203125, 0.0589599609375, 0.17535400390625, 0.291748046875, 0.40814208984375, 0.5245361328125, 0.64093017578125, 0.75732421875, 0.87371826171875, 0.9901123046875, 1.10650634765625, 1.222900390625, 1.33929443359375, 1.4556884765625, 1.57208251953125, 1.6884765625, 1.80487060546875, 1.9212646484375, 2.03765869140625, 2.154052734375, 2.27044677734375, 2.3868408203125, 2.50323486328125, 2.61962890625, 2.73602294921875, 2.8524169921875, 2.96881103515625, 3.085205078125, 3.20159912109375, 3.3179931640625, 3.43438720703125, 3.55078125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 8.0, 17.0, 10.0, 20.0, 25.0, 37.0, 55.0, 57.0, 89.0, 121.0, 197.0, 308.0, 460.0, 873.0, 1687.0, 3702.0, 8564.0, 20025.0, 48135.0, 115888.0, 271075.0, 327819.0, 144160.0, 60278.0, 25085.0, 10444.0, 4628.0, 2077.0, 1074.0, 581.0, 334.0, 213.0, 130.0, 119.0, 70.0, 55.0, 43.0, 33.0, 25.0, 7.0, 13.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.68359375, -3.568939208984375, -3.45428466796875, -3.339630126953125, -3.2249755859375, -3.110321044921875, -2.99566650390625, -2.881011962890625, -2.766357421875, -2.651702880859375, -2.53704833984375, -2.422393798828125, -2.3077392578125, -2.193084716796875, -2.07843017578125, -1.963775634765625, -1.84912109375, -1.734466552734375, -1.61981201171875, -1.505157470703125, -1.3905029296875, -1.275848388671875, -1.16119384765625, -1.046539306640625, -0.931884765625, -0.817230224609375, -0.70257568359375, -0.587921142578125, -0.4732666015625, -0.358612060546875, -0.24395751953125, -0.129302978515625, -0.0146484375, 0.100006103515625, 0.21466064453125, 0.329315185546875, 0.4439697265625, 0.558624267578125, 0.67327880859375, 0.787933349609375, 0.902587890625, 1.017242431640625, 1.13189697265625, 1.246551513671875, 1.3612060546875, 1.475860595703125, 1.59051513671875, 1.705169677734375, 1.81982421875, 1.934478759765625, 2.04913330078125, 2.163787841796875, 2.2784423828125, 2.393096923828125, 2.50775146484375, 2.622406005859375, 2.737060546875, 2.851715087890625, 2.96636962890625, 3.081024169921875, 3.1956787109375, 3.310333251953125, 3.42498779296875, 3.539642333984375, 3.654296875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 10.0, 6.0, 2.0, 7.0, 14.0, 12.0, 13.0, 13.0, 24.0, 27.0, 28.0, 36.0, 41.0, 39.0, 56.0, 58.0, 60.0, 121.0, 279.0, 1507.0, 210.0, 83.0, 64.0, 50.0, 45.0, 38.0, 30.0, 24.0, 28.0, 21.0, 23.0, 18.0, 17.0, 7.0, 6.0, 7.0, 10.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.796875, -12.3604736328125, -11.924072265625, -11.4876708984375, -11.05126953125, -10.6148681640625, -10.178466796875, -9.7420654296875, -9.3056640625, -8.8692626953125, -8.432861328125, -7.9964599609375, -7.56005859375, -7.1236572265625, -6.687255859375, -6.2508544921875, -5.814453125, -5.3780517578125, -4.941650390625, -4.5052490234375, -4.06884765625, -3.6324462890625, -3.196044921875, -2.7596435546875, -2.3232421875, -1.8868408203125, -1.450439453125, -1.0140380859375, -0.57763671875, -0.1412353515625, 0.295166015625, 0.7315673828125, 1.16796875, 1.6043701171875, 2.040771484375, 2.4771728515625, 2.91357421875, 3.3499755859375, 3.786376953125, 4.2227783203125, 4.6591796875, 5.0955810546875, 5.531982421875, 5.9683837890625, 6.40478515625, 6.8411865234375, 7.277587890625, 7.7139892578125, 8.150390625, 8.5867919921875, 9.023193359375, 9.4595947265625, 9.89599609375, 10.3323974609375, 10.768798828125, 11.2052001953125, 11.6416015625, 12.0780029296875, 12.514404296875, 12.9508056640625, 13.38720703125, 13.8236083984375, 14.260009765625, 14.6964111328125, 15.1328125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 2.0, 8.0, 11.0, 11.0, 10.0, 11.0, 11.0, 15.0, 20.0, 25.0, 58.0, 64.0, 107.0, 188.0, 311.0, 653.0, 6130.0, 3131795.0, 4728.0, 625.0, 341.0, 178.0, 109.0, 74.0, 57.0, 38.0, 39.0, 15.0, 21.0, 6.0, 12.0, 5.0, 7.0, 3.0, 3.0, 7.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.1875, -64.1494140625, -62.111328125, -60.0732421875, -58.03515625, -55.9970703125, -53.958984375, -51.9208984375, -49.8828125, -47.8447265625, -45.806640625, -43.7685546875, -41.73046875, -39.6923828125, -37.654296875, -35.6162109375, -33.578125, -31.5400390625, -29.501953125, -27.4638671875, -25.42578125, -23.3876953125, -21.349609375, -19.3115234375, -17.2734375, -15.2353515625, -13.197265625, -11.1591796875, -9.12109375, -7.0830078125, -5.044921875, -3.0068359375, -0.96875, 1.0693359375, 3.107421875, 5.1455078125, 7.18359375, 9.2216796875, 11.259765625, 13.2978515625, 15.3359375, 17.3740234375, 19.412109375, 21.4501953125, 23.48828125, 25.5263671875, 27.564453125, 29.6025390625, 31.640625, 33.6787109375, 35.716796875, 37.7548828125, 39.79296875, 41.8310546875, 43.869140625, 45.9072265625, 47.9453125, 49.9833984375, 52.021484375, 54.0595703125, 56.09765625, 58.1357421875, 60.173828125, 62.2119140625, 64.25]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 16.0, 110.0, 511.0, 338.0, 38.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.560304641723633, -17.05166244506836, -14.543020248413086, -12.034379005432129, -9.525736808776855, -7.017094612121582, -4.508453369140625, -1.9998111724853516, 0.5088310241699219, 3.017472982406616, 5.5261149406433105, 8.034756660461426, 10.5433988571167, 13.052041053771973, 15.56068229675293, 18.069324493408203, 20.577966690063477, 23.08660888671875, 25.595251083374023, 28.103893280029297, 30.612533569335938, 33.121177673339844, 35.629817962646484, 38.138458251953125, 40.64710235595703, 43.15574264526367, 45.66438674926758, 48.17302703857422, 50.681671142578125, 53.190311431884766, 55.698951721191406, 58.20759582519531, 60.71623992919922, 63.22488021850586, 65.7335205078125, 68.2421646118164, 70.75080871582031, 73.25945281982422, 75.7680892944336, 78.2767333984375, 80.7853775024414, 83.29402160644531, 85.80265808105469, 88.3113021850586, 90.8199462890625, 93.3285903930664, 95.83722686767578, 98.34587097167969, 100.85450744628906, 103.36315155029297, 105.87178802490234, 108.38043212890625, 110.88907623291016, 113.39772033691406, 115.90635681152344, 118.41500091552734, 120.92364501953125, 123.43228912353516, 125.94092559814453, 128.44956970214844, 130.9582061767578, 133.46685791015625, 135.97549438476562, 138.484130859375, 140.99278259277344]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 1.0, 5.0, 3.0, 12.0, 8.0, 8.0, 16.0, 15.0, 14.0, 10.0, 14.0, 23.0, 20.0, 18.0, 25.0, 18.0, 28.0, 37.0, 41.0, 38.0, 38.0, 35.0, 40.0, 29.0, 32.0, 33.0, 37.0, 28.0, 32.0, 29.0, 26.0, 40.0, 25.0, 28.0, 27.0, 30.0, 25.0, 23.0, 11.0, 13.0, 8.0, 13.0, 12.0, 7.0, 4.0, 4.0, 5.0, 8.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0], "bins": [-32.69915771484375, -31.740915298461914, -30.782670974731445, -29.82442855834961, -28.86618423461914, -27.907941818237305, -26.94969940185547, -25.991455078125, -25.033212661743164, -24.074970245361328, -23.11672592163086, -22.158483505249023, -21.200241088867188, -20.24199676513672, -19.283754348754883, -18.325511932373047, -17.367267608642578, -16.409025192260742, -15.450780868530273, -14.492538452148438, -13.534295082092285, -12.576051712036133, -11.617809295654297, -10.659565925598145, -9.701322555541992, -8.74307918548584, -7.784836292266846, -6.826593399047852, -5.868350028991699, -4.910106658935547, -3.9518637657165527, -2.9936208724975586, -2.0353755950927734, -1.0771324634552002, -0.11888933181762695, 0.8393537998199463, 1.7975969314575195, 2.755840301513672, 3.714083194732666, 4.67232608795166, 5.6305694580078125, 6.588812828063965, 7.547055721282959, 8.505298614501953, 9.463541984558105, 10.421785354614258, 11.380027770996094, 12.338271141052246, 13.296514511108398, 14.25475788116455, 15.213001251220703, 16.17124366760254, 17.129486083984375, 18.087730407714844, 19.04597282409668, 20.004215240478516, 20.962459564208984, 21.92070198059082, 22.87894630432129, 23.837188720703125, 24.795433044433594, 25.75367546081543, 26.711917877197266, 27.670162200927734, 28.62840461730957]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 3.0, 11.0, 10.0, 16.0, 7.0, 8.0, 11.0, 17.0, 16.0, 18.0, 25.0, 22.0, 28.0, 29.0, 41.0, 37.0, 35.0, 52.0, 41.0, 34.0, 44.0, 40.0, 42.0, 51.0, 40.0, 30.0, 38.0, 34.0, 29.0, 36.0, 21.0, 16.0, 18.0, 16.0, 15.0, 13.0, 15.0, 6.0, 8.0, 4.0, 11.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 4.0], "bins": [-4.75390625, -4.62432861328125, -4.4947509765625, -4.36517333984375, -4.235595703125, -4.10601806640625, -3.9764404296875, -3.84686279296875, -3.71728515625, -3.58770751953125, -3.4581298828125, -3.32855224609375, -3.198974609375, -3.06939697265625, -2.9398193359375, -2.81024169921875, -2.6806640625, -2.55108642578125, -2.4215087890625, -2.29193115234375, -2.162353515625, -2.03277587890625, -1.9031982421875, -1.77362060546875, -1.64404296875, -1.51446533203125, -1.3848876953125, -1.25531005859375, -1.125732421875, -0.99615478515625, -0.8665771484375, -0.73699951171875, -0.607421875, -0.47784423828125, -0.3482666015625, -0.21868896484375, -0.089111328125, 0.04046630859375, 0.1700439453125, 0.29962158203125, 0.42919921875, 0.55877685546875, 0.6883544921875, 0.81793212890625, 0.947509765625, 1.07708740234375, 1.2066650390625, 1.33624267578125, 1.4658203125, 1.59539794921875, 1.7249755859375, 1.85455322265625, 1.984130859375, 2.11370849609375, 2.2432861328125, 2.37286376953125, 2.50244140625, 2.63201904296875, 2.7615966796875, 2.89117431640625, 3.020751953125, 3.15032958984375, 3.2799072265625, 3.40948486328125, 3.5390625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 5.0, 1.0, 8.0, 8.0, 11.0, 7.0, 15.0, 12.0, 11.0, 20.0, 21.0, 24.0, 37.0, 59.0, 77.0, 106.0, 167.0, 285.0, 676.0, 2834.0, 33418.0, 785883.0, 2789221.0, 553822.0, 23917.0, 2219.0, 581.0, 283.0, 162.0, 99.0, 64.0, 58.0, 34.0, 33.0, 21.0, 15.0, 12.0, 9.0, 10.0, 10.0, 5.0, 9.0, 6.0, 5.0, 5.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.0, -10.6895751953125, -10.379150390625, -10.0687255859375, -9.75830078125, -9.4478759765625, -9.137451171875, -8.8270263671875, -8.5166015625, -8.2061767578125, -7.895751953125, -7.5853271484375, -7.27490234375, -6.9644775390625, -6.654052734375, -6.3436279296875, -6.033203125, -5.7227783203125, -5.412353515625, -5.1019287109375, -4.79150390625, -4.4810791015625, -4.170654296875, -3.8602294921875, -3.5498046875, -3.2393798828125, -2.928955078125, -2.6185302734375, -2.30810546875, -1.9976806640625, -1.687255859375, -1.3768310546875, -1.06640625, -0.7559814453125, -0.445556640625, -0.1351318359375, 0.17529296875, 0.4857177734375, 0.796142578125, 1.1065673828125, 1.4169921875, 1.7274169921875, 2.037841796875, 2.3482666015625, 2.65869140625, 2.9691162109375, 3.279541015625, 3.5899658203125, 3.900390625, 4.2108154296875, 4.521240234375, 4.8316650390625, 5.14208984375, 5.4525146484375, 5.762939453125, 6.0733642578125, 6.3837890625, 6.6942138671875, 7.004638671875, 7.3150634765625, 7.62548828125, 7.9359130859375, 8.246337890625, 8.5567626953125, 8.8671875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 7.0, 9.0, 6.0, 17.0, 17.0, 26.0, 20.0, 43.0, 50.0, 74.0, 98.0, 125.0, 148.0, 230.0, 317.0, 371.0, 411.0, 443.0, 401.0, 326.0, 245.0, 185.0, 135.0, 93.0, 60.0, 53.0, 36.0, 37.0, 29.0, 15.0, 8.0, 14.0, 10.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.65625, -7.41644287109375, -7.1766357421875, -6.93682861328125, -6.697021484375, -6.45721435546875, -6.2174072265625, -5.97760009765625, -5.73779296875, -5.49798583984375, -5.2581787109375, -5.01837158203125, -4.778564453125, -4.53875732421875, -4.2989501953125, -4.05914306640625, -3.8193359375, -3.57952880859375, -3.3397216796875, -3.09991455078125, -2.860107421875, -2.62030029296875, -2.3804931640625, -2.14068603515625, -1.90087890625, -1.66107177734375, -1.4212646484375, -1.18145751953125, -0.941650390625, -0.70184326171875, -0.4620361328125, -0.22222900390625, 0.017578125, 0.25738525390625, 0.4971923828125, 0.73699951171875, 0.976806640625, 1.21661376953125, 1.4564208984375, 1.69622802734375, 1.93603515625, 2.17584228515625, 2.4156494140625, 2.65545654296875, 2.895263671875, 3.13507080078125, 3.3748779296875, 3.61468505859375, 3.8544921875, 4.09429931640625, 4.3341064453125, 4.57391357421875, 4.813720703125, 5.05352783203125, 5.2933349609375, 5.53314208984375, 5.77294921875, 6.01275634765625, 6.2525634765625, 6.49237060546875, 6.732177734375, 6.97198486328125, 7.2117919921875, 7.45159912109375, 7.69140625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 4.0, 4.0, 4.0, 10.0, 14.0, 18.0, 17.0, 27.0, 39.0, 52.0, 66.0, 78.0, 92.0, 146.0, 190.0, 259.0, 388.0, 556.0, 2700.0, 316918.0, 3824235.0, 45760.0, 1124.0, 464.0, 277.0, 175.0, 154.0, 118.0, 114.0, 73.0, 53.0, 41.0, 24.0, 27.0, 20.0, 14.0, 8.0, 10.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.21875, -25.40771484375, -24.5966796875, -23.78564453125, -22.974609375, -22.16357421875, -21.3525390625, -20.54150390625, -19.73046875, -18.91943359375, -18.1083984375, -17.29736328125, -16.486328125, -15.67529296875, -14.8642578125, -14.05322265625, -13.2421875, -12.43115234375, -11.6201171875, -10.80908203125, -9.998046875, -9.18701171875, -8.3759765625, -7.56494140625, -6.75390625, -5.94287109375, -5.1318359375, -4.32080078125, -3.509765625, -2.69873046875, -1.8876953125, -1.07666015625, -0.265625, 0.54541015625, 1.3564453125, 2.16748046875, 2.978515625, 3.78955078125, 4.6005859375, 5.41162109375, 6.22265625, 7.03369140625, 7.8447265625, 8.65576171875, 9.466796875, 10.27783203125, 11.0888671875, 11.89990234375, 12.7109375, 13.52197265625, 14.3330078125, 15.14404296875, 15.955078125, 16.76611328125, 17.5771484375, 18.38818359375, 19.19921875, 20.01025390625, 20.8212890625, 21.63232421875, 22.443359375, 23.25439453125, 24.0654296875, 24.87646484375, 25.6875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 52.0, 185.0, 376.0, 286.0, 93.0, 12.0, 2.0, 1.0, 0.0, 1.0], "bins": [-181.3253936767578, -178.1287078857422, -174.93203735351562, -171.7353515625, -168.53868103027344, -165.3419952392578, -162.14532470703125, -158.94863891601562, -155.751953125, -152.55526733398438, -149.3585968017578, -146.1619110107422, -142.96524047851562, -139.7685546875, -136.57186889648438, -133.3751983642578, -130.17852783203125, -126.98184967041016, -123.78517150878906, -120.58848571777344, -117.39180755615234, -114.19512939453125, -110.99845123291016, -107.80177307128906, -104.60508728027344, -101.40840911865234, -98.21173095703125, -95.01504516601562, -91.81836700439453, -88.62168884277344, -85.42501068115234, -82.22833251953125, -79.03164672851562, -75.83496856689453, -72.63829040527344, -69.44160461425781, -66.24492645263672, -63.048248291015625, -59.85157012939453, -56.65489196777344, -53.458213806152344, -50.26153564453125, -47.06485366821289, -43.8681755065918, -40.6714973449707, -37.474815368652344, -34.27813720703125, -31.081459045410156, -27.88477897644043, -24.688098907470703, -21.49142074584961, -18.294740676879883, -15.098061561584473, -11.901382446289062, -8.704702377319336, -5.508024215698242, -2.3113441467285156, 0.8853352069854736, 4.082014560699463, 7.278694152832031, 10.475373268127441, 13.672052383422852, 16.868732452392578, 20.065410614013672, 23.2620906829834]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 5.0, 12.0, 6.0, 13.0, 13.0, 20.0, 18.0, 24.0, 26.0, 30.0, 37.0, 27.0, 47.0, 36.0, 36.0, 37.0, 41.0, 40.0, 42.0, 44.0, 42.0, 42.0, 42.0, 31.0, 39.0, 38.0, 29.0, 27.0, 25.0, 18.0, 22.0, 14.0, 18.0, 16.0, 8.0, 7.0, 8.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.400285720825195, -26.552488327026367, -25.704692840576172, -24.856895446777344, -24.009098052978516, -23.161300659179688, -22.313505172729492, -21.465707778930664, -20.61791229248047, -19.77011489868164, -18.922319412231445, -18.074522018432617, -17.22672462463379, -16.378929138183594, -15.531131744384766, -14.683334350585938, -13.83553695678711, -12.987740516662598, -12.13994312286377, -11.292146682739258, -10.44434928894043, -9.596552848815918, -8.748756408691406, -7.900959491729736, -7.053162574768066, -6.2053656578063965, -5.357568740844727, -4.509772300720215, -3.661975383758545, -2.814178466796875, -1.9663820266723633, -1.1185851097106934, -0.2707862854003906, 0.5770105123519897, 1.4248073101043701, 2.272603988647461, 3.120400905609131, 3.968197822570801, 4.8159942626953125, 5.663791179656982, 6.511588096618652, 7.359385013580322, 8.207181930541992, 9.054978370666504, 9.902774810791016, 10.750572204589844, 11.598368644714355, 12.446165084838867, 13.293962478637695, 14.141758918762207, 14.989556312561035, 15.837352752685547, 16.685150146484375, 17.532947540283203, 18.3807430267334, 19.228540420532227, 20.076335906982422, 20.92413330078125, 21.771928787231445, 22.619726181030273, 23.4675235748291, 24.315319061279297, 25.163116455078125, 26.010913848876953, 26.85871124267578]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 0.0, 5.0, 5.0, 8.0, 9.0, 12.0, 12.0, 13.0, 16.0, 21.0, 17.0, 26.0, 20.0, 30.0, 26.0, 29.0, 30.0, 34.0, 41.0, 32.0, 30.0, 55.0, 39.0, 45.0, 36.0, 38.0, 32.0, 41.0, 35.0, 41.0, 32.0, 25.0, 23.0, 19.0, 23.0, 18.0, 15.0, 8.0, 8.0, 13.0, 9.0, 7.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.623046875, -3.507965087890625, -3.39288330078125, -3.277801513671875, -3.1627197265625, -3.047637939453125, -2.93255615234375, -2.817474365234375, -2.702392578125, -2.587310791015625, -2.47222900390625, -2.357147216796875, -2.2420654296875, -2.126983642578125, -2.01190185546875, -1.896820068359375, -1.78173828125, -1.666656494140625, -1.55157470703125, -1.436492919921875, -1.3214111328125, -1.206329345703125, -1.09124755859375, -0.976165771484375, -0.861083984375, -0.746002197265625, -0.63092041015625, -0.515838623046875, -0.4007568359375, -0.285675048828125, -0.17059326171875, -0.055511474609375, 0.0595703125, 0.174652099609375, 0.28973388671875, 0.404815673828125, 0.5198974609375, 0.634979248046875, 0.75006103515625, 0.865142822265625, 0.980224609375, 1.095306396484375, 1.21038818359375, 1.325469970703125, 1.4405517578125, 1.555633544921875, 1.67071533203125, 1.785797119140625, 1.90087890625, 2.015960693359375, 2.13104248046875, 2.246124267578125, 2.3612060546875, 2.476287841796875, 2.59136962890625, 2.706451416015625, 2.821533203125, 2.936614990234375, 3.05169677734375, 3.166778564453125, 3.2818603515625, 3.396942138671875, 3.51202392578125, 3.627105712890625, 3.7421875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 9.0, 13.0, 22.0, 25.0, 43.0, 67.0, 98.0, 129.0, 188.0, 274.0, 402.0, 578.0, 834.0, 1165.0, 1766.0, 2577.0, 3796.0, 5471.0, 8384.0, 12478.0, 19027.0, 29713.0, 47320.0, 78849.0, 146605.0, 282241.0, 170482.0, 89136.0, 52020.0, 32468.0, 20932.0, 13398.0, 9145.0, 5962.0, 3992.0, 2753.0, 1932.0, 1370.0, 925.0, 577.0, 424.0, 326.0, 185.0, 132.0, 125.0, 68.0, 54.0, 23.0, 18.0, 20.0, 11.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.62060546875, -0.6015701293945312, -0.5825347900390625, -0.5634994506835938, -0.544464111328125, -0.5254287719726562, -0.5063934326171875, -0.48735809326171875, -0.46832275390625, -0.44928741455078125, -0.4302520751953125, -0.41121673583984375, -0.392181396484375, -0.37314605712890625, -0.3541107177734375, -0.33507537841796875, -0.3160400390625, -0.29700469970703125, -0.2779693603515625, -0.25893402099609375, -0.239898681640625, -0.22086334228515625, -0.2018280029296875, -0.18279266357421875, -0.16375732421875, -0.14472198486328125, -0.1256866455078125, -0.10665130615234375, -0.087615966796875, -0.06858062744140625, -0.0495452880859375, -0.03050994873046875, -0.011474609375, 0.00756072998046875, 0.0265960693359375, 0.04563140869140625, 0.064666748046875, 0.08370208740234375, 0.1027374267578125, 0.12177276611328125, 0.14080810546875, 0.15984344482421875, 0.1788787841796875, 0.19791412353515625, 0.216949462890625, 0.23598480224609375, 0.2550201416015625, 0.27405548095703125, 0.2930908203125, 0.31212615966796875, 0.3311614990234375, 0.35019683837890625, 0.369232177734375, 0.38826751708984375, 0.4073028564453125, 0.42633819580078125, 0.44537353515625, 0.46440887451171875, 0.4834442138671875, 0.5024795532226562, 0.521514892578125, 0.5405502319335938, 0.5595855712890625, 0.5786209106445312, 0.59765625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 5.0, 6.0, 11.0, 6.0, 16.0, 12.0, 19.0, 21.0, 23.0, 25.0, 24.0, 29.0, 22.0, 28.0, 33.0, 22.0, 42.0, 39.0, 43.0, 1069.0, 45.0, 28.0, 40.0, 36.0, 48.0, 37.0, 37.0, 34.0, 36.0, 32.0, 18.0, 22.0, 23.0, 19.0, 17.0, 8.0, 14.0, 6.0, 5.0, 6.0, 3.0, 5.0, 9.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.42578125, -2.3487548828125, -2.271728515625, -2.1947021484375, -2.11767578125, -2.0406494140625, -1.963623046875, -1.8865966796875, -1.8095703125, -1.7325439453125, -1.655517578125, -1.5784912109375, -1.50146484375, -1.4244384765625, -1.347412109375, -1.2703857421875, -1.193359375, -1.1163330078125, -1.039306640625, -0.9622802734375, -0.88525390625, -0.8082275390625, -0.731201171875, -0.6541748046875, -0.5771484375, -0.5001220703125, -0.423095703125, -0.3460693359375, -0.26904296875, -0.1920166015625, -0.114990234375, -0.0379638671875, 0.0390625, 0.1160888671875, 0.193115234375, 0.2701416015625, 0.34716796875, 0.4241943359375, 0.501220703125, 0.5782470703125, 0.6552734375, 0.7322998046875, 0.809326171875, 0.8863525390625, 0.96337890625, 1.0404052734375, 1.117431640625, 1.1944580078125, 1.271484375, 1.3485107421875, 1.425537109375, 1.5025634765625, 1.57958984375, 1.6566162109375, 1.733642578125, 1.8106689453125, 1.8876953125, 1.9647216796875, 2.041748046875, 2.1187744140625, 2.19580078125, 2.2728271484375, 2.349853515625, 2.4268798828125, 2.50390625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 5.0, 6.0, 8.0, 13.0, 26.0, 47.0, 60.0, 81.0, 124.0, 189.0, 232.0, 306.0, 477.0, 653.0, 944.0, 1371.0, 2014.0, 2689.0, 3915.0, 5623.0, 8057.0, 11734.0, 16563.0, 24304.0, 35424.0, 53516.0, 86596.0, 163923.0, 1307802.0, 140440.0, 77334.0, 48535.0, 32141.0, 21961.0, 15181.0, 10528.0, 7489.0, 5188.0, 3615.0, 2512.0, 1774.0, 1189.0, 783.0, 591.0, 390.0, 268.0, 176.0, 128.0, 61.0, 58.0, 36.0, 15.0, 14.0, 13.0, 11.0, 4.0, 2.0, 3.0, 0.0, 3.0], "bins": [-0.5380859375, -0.5214767456054688, -0.5048675537109375, -0.48825836181640625, -0.471649169921875, -0.45503997802734375, -0.4384307861328125, -0.42182159423828125, -0.40521240234375, -0.38860321044921875, -0.3719940185546875, -0.35538482666015625, -0.338775634765625, -0.32216644287109375, -0.3055572509765625, -0.28894805908203125, -0.2723388671875, -0.25572967529296875, -0.2391204833984375, -0.22251129150390625, -0.205902099609375, -0.18929290771484375, -0.1726837158203125, -0.15607452392578125, -0.13946533203125, -0.12285614013671875, -0.1062469482421875, -0.08963775634765625, -0.073028564453125, -0.05641937255859375, -0.0398101806640625, -0.02320098876953125, -0.006591796875, 0.01001739501953125, 0.0266265869140625, 0.04323577880859375, 0.059844970703125, 0.07645416259765625, 0.0930633544921875, 0.10967254638671875, 0.12628173828125, 0.14289093017578125, 0.1595001220703125, 0.17610931396484375, 0.192718505859375, 0.20932769775390625, 0.2259368896484375, 0.24254608154296875, 0.2591552734375, 0.27576446533203125, 0.2923736572265625, 0.30898284912109375, 0.325592041015625, 0.34220123291015625, 0.3588104248046875, 0.37541961669921875, 0.39202880859375, 0.40863800048828125, 0.4252471923828125, 0.44185638427734375, 0.458465576171875, 0.47507476806640625, 0.4916839599609375, 0.5082931518554688, 0.52490234375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 9.0, 5.0, 7.0, 12.0, 18.0, 17.0, 18.0, 24.0, 28.0, 28.0, 39.0, 35.0, 63.0, 68.0, 68.0, 71.0, 70.0, 65.0, 68.0, 55.0, 38.0, 34.0, 42.0, 27.0, 28.0, 11.0, 5.0, 9.0, 9.0, 8.0, 7.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001456737518310547, -0.00014094635844230652, -0.00013621896505355835, -0.00013149157166481018, -0.000126764178276062, -0.00012203678488731384, -0.00011730939149856567, -0.0001125819981098175, -0.00010785460472106934, -0.00010312721133232117, -9.8399817943573e-05, -9.367242455482483e-05, -8.894503116607666e-05, -8.421763777732849e-05, -7.949024438858032e-05, -7.476285099983215e-05, -7.003545761108398e-05, -6.530806422233582e-05, -6.0580670833587646e-05, -5.585327744483948e-05, -5.112588405609131e-05, -4.639849066734314e-05, -4.167109727859497e-05, -3.69437038898468e-05, -3.221631050109863e-05, -2.7488917112350464e-05, -2.2761523723602295e-05, -1.8034130334854126e-05, -1.3306736946105957e-05, -8.579343557357788e-06, -3.851950168609619e-06, 8.754432201385498e-07, 5.602836608886719e-06, 1.0330229997634888e-05, 1.5057623386383057e-05, 1.9785016775131226e-05, 2.4512410163879395e-05, 2.9239803552627563e-05, 3.396719694137573e-05, 3.86945903301239e-05, 4.342198371887207e-05, 4.814937710762024e-05, 5.287677049636841e-05, 5.760416388511658e-05, 6.233155727386475e-05, 6.705895066261292e-05, 7.178634405136108e-05, 7.651373744010925e-05, 8.124113082885742e-05, 8.596852421760559e-05, 9.069591760635376e-05, 9.542331099510193e-05, 0.0001001507043838501, 0.00010487809777259827, 0.00010960549116134644, 0.0001143328845500946, 0.00011906027793884277, 0.00012378767132759094, 0.0001285150647163391, 0.00013324245810508728, 0.00013796985149383545, 0.00014269724488258362, 0.0001474246382713318, 0.00015215203166007996, 0.00015687942504882812]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 5.0, 5.0, 16.0, 11.0, 16.0, 24.0, 36.0, 50.0, 70.0, 80.0, 119.0, 237.0, 511.0, 2830.0, 1034999.0, 8152.0, 605.0, 266.0, 155.0, 75.0, 58.0, 53.0, 38.0, 27.0, 24.0, 18.0, 13.0, 18.0, 9.0, 6.0, 5.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003475189208984375, -0.003368556499481201, -0.0032619237899780273, -0.0031552910804748535, -0.0030486583709716797, -0.002942025661468506, -0.002835392951965332, -0.002728760242462158, -0.0026221275329589844, -0.0025154948234558105, -0.0024088621139526367, -0.002302229404449463, -0.002195596694946289, -0.0020889639854431152, -0.0019823312759399414, -0.0018756985664367676, -0.0017690658569335938, -0.00166243314743042, -0.001555800437927246, -0.0014491677284240723, -0.0013425350189208984, -0.0012359023094177246, -0.0011292695999145508, -0.001022636890411377, -0.0009160041809082031, -0.0008093714714050293, -0.0007027387619018555, -0.0005961060523986816, -0.0004894733428955078, -0.000382840633392334, -0.00027620792388916016, -0.00016957521438598633, -6.29425048828125e-05, 4.369020462036133e-05, 0.00015032291412353516, 0.000256955623626709, 0.0003635883331298828, 0.00047022104263305664, 0.0005768537521362305, 0.0006834864616394043, 0.0007901191711425781, 0.000896751880645752, 0.0010033845901489258, 0.0011100172996520996, 0.0012166500091552734, 0.0013232827186584473, 0.001429915428161621, 0.001536548137664795, 0.0016431808471679688, 0.0017498135566711426, 0.0018564462661743164, 0.0019630789756774902, 0.002069711685180664, 0.002176344394683838, 0.0022829771041870117, 0.0023896098136901855, 0.0024962425231933594, 0.002602875232696533, 0.002709507942199707, 0.002816140651702881, 0.0029227733612060547, 0.0030294060707092285, 0.0031360387802124023, 0.003242671489715576, 0.00334930419921875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 64.0, 330.0, 447.0, 145.0, 23.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005411451566033065, -0.0005305749364197254, -0.0005200047162361443, -0.0005094344960525632, -0.0004988642176613212, -0.00048829399747774, -0.00047772377729415894, -0.0004671535571105778, -0.0004565833369269967, -0.0004460131167434156, -0.000435442867456004, -0.0004248726472724229, -0.0004143024270888418, -0.0004037321778014302, -0.0003931619576178491, -0.000382591737434268, -0.00037202148814685643, -0.0003614512679632753, -0.00035088101867586374, -0.00034031079849228263, -0.0003297405783087015, -0.0003191703581251204, -0.00030860010883770883, -0.0002980298886541277, -0.00028745963936671615, -0.00027688941918313503, -0.00026631916989572346, -0.00025574894971214235, -0.00024517872952856123, -0.0002346084947930649, -0.00022403826005756855, -0.00021346803987398744, -0.00020289779058657587, -0.00019232755585107952, -0.0001817573356674984, -0.00017118710093200207, -0.00016061688074842095, -0.0001500466460129246, -0.00013947641127742827, -0.00012890619109384716, -0.00011833595635835081, -0.00010776572889881209, -9.719550143927336e-05, -8.662526670377702e-05, -7.605503924423829e-05, -6.548481178469956e-05, -5.491457704920322e-05, -4.434434958966449e-05, -3.377412213012576e-05, -2.320389285159763e-05, -1.2633663573069498e-05, -2.063432475551963e-06, 8.506794983986765e-06, 1.9077022443525493e-05, 2.9647257179021835e-05, 4.021748463856056e-05, 5.078771209809929e-05, 6.135793955763802e-05, 7.192816701717675e-05, 8.249840175267309e-05, 9.306862921221182e-05, 0.00010363885667175055, 0.00011420909140724689, 0.00012477932614274323, 0.00013534954632632434]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 5.0, 5.0, 4.0, 12.0, 9.0, 8.0, 13.0, 25.0, 20.0, 16.0, 30.0, 45.0, 33.0, 27.0, 31.0, 47.0, 42.0, 47.0, 48.0, 43.0, 43.0, 51.0, 53.0, 48.0, 39.0, 32.0, 37.0, 27.0, 35.0, 32.0, 17.0, 15.0, 14.0, 10.0, 16.0, 14.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.338689804077148e-05, -8.092913776636124e-05, -7.847137749195099e-05, -7.601361721754074e-05, -7.355585694313049e-05, -7.109809666872025e-05, -6.864033639431e-05, -6.618257611989975e-05, -6.37248158454895e-05, -6.126705557107925e-05, -5.8809295296669006e-05, -5.635153502225876e-05, -5.389377474784851e-05, -5.143601447343826e-05, -4.8978254199028015e-05, -4.652049392461777e-05, -4.406273365020752e-05, -4.160497337579727e-05, -3.9147213101387024e-05, -3.6689452826976776e-05, -3.423169255256653e-05, -3.177393227815628e-05, -2.9316172003746033e-05, -2.6858411729335785e-05, -2.4400651454925537e-05, -2.194289118051529e-05, -1.948513090610504e-05, -1.7027370631694794e-05, -1.4569610357284546e-05, -1.2111850082874298e-05, -9.65408980846405e-06, -7.1963295340538025e-06, -4.738569259643555e-06, -2.280808985233307e-06, 1.7695128917694092e-07, 2.6347115635871887e-06, 5.0924718379974365e-06, 7.550232112407684e-06, 1.0007992386817932e-05, 1.246575266122818e-05, 1.4923512935638428e-05, 1.7381273210048676e-05, 1.9839033484458923e-05, 2.229679375886917e-05, 2.475455403327942e-05, 2.7212314307689667e-05, 2.9670074582099915e-05, 3.212783485651016e-05, 3.458559513092041e-05, 3.704335540533066e-05, 3.9501115679740906e-05, 4.1958875954151154e-05, 4.44166362285614e-05, 4.687439650297165e-05, 4.93321567773819e-05, 5.1789917051792145e-05, 5.424767732620239e-05, 5.670543760061264e-05, 5.916319787502289e-05, 6.162095814943314e-05, 6.407871842384338e-05, 6.653647869825363e-05, 6.899423897266388e-05, 7.145199924707413e-05, 7.390975952148438e-05]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 0.0, 5.0, 5.0, 8.0, 9.0, 12.0, 12.0, 13.0, 16.0, 21.0, 17.0, 26.0, 20.0, 30.0, 26.0, 29.0, 30.0, 34.0, 41.0, 32.0, 30.0, 55.0, 39.0, 45.0, 36.0, 38.0, 32.0, 41.0, 35.0, 41.0, 32.0, 25.0, 23.0, 19.0, 23.0, 18.0, 15.0, 8.0, 8.0, 13.0, 9.0, 7.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.623046875, -3.507965087890625, -3.39288330078125, -3.277801513671875, -3.1627197265625, -3.047637939453125, -2.93255615234375, -2.817474365234375, -2.702392578125, -2.587310791015625, -2.47222900390625, -2.357147216796875, -2.2420654296875, -2.126983642578125, -2.01190185546875, -1.896820068359375, -1.78173828125, -1.666656494140625, -1.55157470703125, -1.436492919921875, -1.3214111328125, -1.206329345703125, -1.09124755859375, -0.976165771484375, -0.861083984375, -0.746002197265625, -0.63092041015625, -0.515838623046875, -0.4007568359375, -0.285675048828125, -0.17059326171875, -0.055511474609375, 0.0595703125, 0.174652099609375, 0.28973388671875, 0.404815673828125, 0.5198974609375, 0.634979248046875, 0.75006103515625, 0.865142822265625, 0.980224609375, 1.095306396484375, 1.21038818359375, 1.325469970703125, 1.4405517578125, 1.555633544921875, 1.67071533203125, 1.785797119140625, 1.90087890625, 2.015960693359375, 2.13104248046875, 2.246124267578125, 2.3612060546875, 2.476287841796875, 2.59136962890625, 2.706451416015625, 2.821533203125, 2.936614990234375, 3.05169677734375, 3.166778564453125, 3.2818603515625, 3.396942138671875, 3.51202392578125, 3.627105712890625, 3.7421875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 5.0, 5.0, 3.0, 10.0, 11.0, 16.0, 24.0, 21.0, 34.0, 40.0, 44.0, 90.0, 117.0, 176.0, 231.0, 372.0, 676.0, 1407.0, 2775.0, 6289.0, 14848.0, 34883.0, 84010.0, 196458.0, 371859.0, 191496.0, 81830.0, 34303.0, 14367.0, 6225.0, 2749.0, 1333.0, 702.0, 374.0, 220.0, 145.0, 102.0, 77.0, 57.0, 42.0, 25.0, 23.0, 22.0, 11.0, 13.0, 12.0, 6.0, 4.0, 6.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.5234375, -3.411529541015625, -3.29962158203125, -3.187713623046875, -3.0758056640625, -2.963897705078125, -2.85198974609375, -2.740081787109375, -2.628173828125, -2.516265869140625, -2.40435791015625, -2.292449951171875, -2.1805419921875, -2.068634033203125, -1.95672607421875, -1.844818115234375, -1.73291015625, -1.621002197265625, -1.50909423828125, -1.397186279296875, -1.2852783203125, -1.173370361328125, -1.06146240234375, -0.949554443359375, -0.837646484375, -0.725738525390625, -0.61383056640625, -0.501922607421875, -0.3900146484375, -0.278106689453125, -0.16619873046875, -0.054290771484375, 0.0576171875, 0.169525146484375, 0.28143310546875, 0.393341064453125, 0.5052490234375, 0.617156982421875, 0.72906494140625, 0.840972900390625, 0.952880859375, 1.064788818359375, 1.17669677734375, 1.288604736328125, 1.4005126953125, 1.512420654296875, 1.62432861328125, 1.736236572265625, 1.84814453125, 1.960052490234375, 2.07196044921875, 2.183868408203125, 2.2957763671875, 2.407684326171875, 2.51959228515625, 2.631500244140625, 2.743408203125, 2.855316162109375, 2.96722412109375, 3.079132080078125, 3.1910400390625, 3.302947998046875, 3.41485595703125, 3.526763916015625, 3.638671875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 8.0, 5.0, 14.0, 15.0, 15.0, 16.0, 15.0, 13.0, 22.0, 26.0, 18.0, 27.0, 35.0, 33.0, 40.0, 35.0, 54.0, 90.0, 174.0, 1505.0, 344.0, 124.0, 73.0, 48.0, 45.0, 34.0, 34.0, 17.0, 27.0, 23.0, 21.0, 18.0, 15.0, 14.0, 15.0, 13.0, 7.0, 4.0, 2.0, 5.0, 1.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8359375, -11.3946533203125, -10.953369140625, -10.5120849609375, -10.07080078125, -9.6295166015625, -9.188232421875, -8.7469482421875, -8.3056640625, -7.8643798828125, -7.423095703125, -6.9818115234375, -6.54052734375, -6.0992431640625, -5.657958984375, -5.2166748046875, -4.775390625, -4.3341064453125, -3.892822265625, -3.4515380859375, -3.01025390625, -2.5689697265625, -2.127685546875, -1.6864013671875, -1.2451171875, -0.8038330078125, -0.362548828125, 0.0787353515625, 0.52001953125, 0.9613037109375, 1.402587890625, 1.8438720703125, 2.28515625, 2.7264404296875, 3.167724609375, 3.6090087890625, 4.05029296875, 4.4915771484375, 4.932861328125, 5.3741455078125, 5.8154296875, 6.2567138671875, 6.697998046875, 7.1392822265625, 7.58056640625, 8.0218505859375, 8.463134765625, 8.9044189453125, 9.345703125, 9.7869873046875, 10.228271484375, 10.6695556640625, 11.11083984375, 11.5521240234375, 11.993408203125, 12.4346923828125, 12.8759765625, 13.3172607421875, 13.758544921875, 14.1998291015625, 14.64111328125, 15.0823974609375, 15.523681640625, 15.9649658203125, 16.40625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 1.0, 6.0, 3.0, 5.0, 7.0, 9.0, 9.0, 23.0, 32.0, 25.0, 71.0, 102.0, 161.0, 331.0, 790.0, 15921.0, 3124723.0, 2358.0, 476.0, 226.0, 141.0, 95.0, 69.0, 39.0, 29.0, 15.0, 8.0, 10.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.375, -68.9365234375, -66.498046875, -64.0595703125, -61.62109375, -59.1826171875, -56.744140625, -54.3056640625, -51.8671875, -49.4287109375, -46.990234375, -44.5517578125, -42.11328125, -39.6748046875, -37.236328125, -34.7978515625, -32.359375, -29.9208984375, -27.482421875, -25.0439453125, -22.60546875, -20.1669921875, -17.728515625, -15.2900390625, -12.8515625, -10.4130859375, -7.974609375, -5.5361328125, -3.09765625, -0.6591796875, 1.779296875, 4.2177734375, 6.65625, 9.0947265625, 11.533203125, 13.9716796875, 16.41015625, 18.8486328125, 21.287109375, 23.7255859375, 26.1640625, 28.6025390625, 31.041015625, 33.4794921875, 35.91796875, 38.3564453125, 40.794921875, 43.2333984375, 45.671875, 48.1103515625, 50.548828125, 52.9873046875, 55.42578125, 57.8642578125, 60.302734375, 62.7412109375, 65.1796875, 67.6181640625, 70.056640625, 72.4951171875, 74.93359375, 77.3720703125, 79.810546875, 82.2490234375, 84.6875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 713.0, 301.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.10687255859375, -18.36716079711914, -13.627450942993164, -8.887740135192871, -4.148029327392578, 0.5916824340820312, 5.331392288208008, 10.071102142333984, 14.810813903808594, 19.550525665283203, 24.29023551940918, 29.029945373535156, 33.769657135009766, 38.509368896484375, 43.24907684326172, 47.98878860473633, 52.72850036621094, 57.46821212768555, 62.207923889160156, 66.9476318359375, 71.68734741210938, 76.42705535888672, 81.16676330566406, 85.90647888183594, 90.64618682861328, 95.38589477539062, 100.1256103515625, 104.86531829833984, 109.60502624511719, 114.34474182128906, 119.0844497680664, 123.82415771484375, 128.56387329101562, 133.3035888671875, 138.0432891845703, 142.7830047607422, 147.52272033691406, 152.26242065429688, 157.00213623046875, 161.74185180664062, 166.4815673828125, 171.22128295898438, 175.9609832763672, 180.70069885253906, 185.44041442871094, 190.18011474609375, 194.91983032226562, 199.6595458984375, 204.3992462158203, 209.1389617919922, 213.878662109375, 218.61837768554688, 223.35809326171875, 228.09780883789062, 232.83750915527344, 237.5772247314453, 242.31692504882812, 247.056640625, 251.7963409423828, 256.53607177734375, 261.2757568359375, 266.0154724121094, 270.75518798828125, 275.4949035644531, 280.234619140625]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 9.0, 2.0, 5.0, 10.0, 13.0, 12.0, 14.0, 16.0, 15.0, 19.0, 14.0, 21.0, 24.0, 26.0, 42.0, 43.0, 30.0, 36.0, 43.0, 38.0, 35.0, 44.0, 56.0, 50.0, 37.0, 30.0, 41.0, 31.0, 28.0, 29.0, 30.0, 31.0, 20.0, 22.0, 22.0, 18.0, 10.0, 8.0, 8.0, 8.0, 5.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.92547607421875, -33.87828063964844, -32.831085205078125, -31.78388786315918, -30.736690521240234, -29.689495086669922, -28.64229965209961, -27.595104217529297, -26.54790687561035, -25.50071144104004, -24.453514099121094, -23.40631866455078, -22.35912322998047, -21.311925888061523, -20.26473045349121, -19.217533111572266, -18.170337677001953, -17.12314224243164, -16.075944900512695, -15.028749465942383, -13.981553077697754, -12.934356689453125, -11.887161254882812, -10.839964866638184, -9.792768478393555, -8.745572090148926, -7.698376178741455, -6.651180267333984, -5.6039838790893555, -4.556787490844727, -3.509591579437256, -2.462395668029785, -1.4151992797851562, -0.36800312995910645, 0.6791930198669434, 1.7263891696929932, 2.773585319519043, 3.820781707763672, 4.867977619171143, 5.915173530578613, 6.962369918823242, 8.009566307067871, 9.0567626953125, 10.103958129882812, 11.151154518127441, 12.19835090637207, 13.245546340942383, 14.292742729187012, 15.33993911743164, 16.387134552001953, 17.4343318939209, 18.48152732849121, 19.528724670410156, 20.57592010498047, 21.62311553955078, 22.670310974121094, 23.71750831604004, 24.76470375061035, 25.811901092529297, 26.85909652709961, 27.906291961669922, 28.953489303588867, 30.00068473815918, 31.047882080078125, 32.09507751464844]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 5.0, 12.0, 10.0, 9.0, 20.0, 17.0, 20.0, 17.0, 18.0, 31.0, 38.0, 23.0, 28.0, 38.0, 48.0, 41.0, 37.0, 37.0, 34.0, 43.0, 46.0, 51.0, 45.0, 43.0, 23.0, 46.0, 39.0, 27.0, 16.0, 20.0, 24.0, 9.0, 15.0, 8.0, 11.0, 12.0, 5.0, 8.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.234375, -4.1005859375, -3.966796875, -3.8330078125, -3.69921875, -3.5654296875, -3.431640625, -3.2978515625, -3.1640625, -3.0302734375, -2.896484375, -2.7626953125, -2.62890625, -2.4951171875, -2.361328125, -2.2275390625, -2.09375, -1.9599609375, -1.826171875, -1.6923828125, -1.55859375, -1.4248046875, -1.291015625, -1.1572265625, -1.0234375, -0.8896484375, -0.755859375, -0.6220703125, -0.48828125, -0.3544921875, -0.220703125, -0.0869140625, 0.046875, 0.1806640625, 0.314453125, 0.4482421875, 0.58203125, 0.7158203125, 0.849609375, 0.9833984375, 1.1171875, 1.2509765625, 1.384765625, 1.5185546875, 1.65234375, 1.7861328125, 1.919921875, 2.0537109375, 2.1875, 2.3212890625, 2.455078125, 2.5888671875, 2.72265625, 2.8564453125, 2.990234375, 3.1240234375, 3.2578125, 3.3916015625, 3.525390625, 3.6591796875, 3.79296875, 3.9267578125, 4.060546875, 4.1943359375, 4.328125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 5.0, 2.0, 8.0, 9.0, 12.0, 20.0, 16.0, 18.0, 35.0, 25.0, 39.0, 43.0, 37.0, 57.0, 59.0, 90.0, 127.0, 147.0, 336.0, 791.0, 3354.0, 37166.0, 707376.0, 2696852.0, 704982.0, 37445.0, 3324.0, 850.0, 318.0, 155.0, 109.0, 88.0, 68.0, 53.0, 35.0, 44.0, 27.0, 31.0, 25.0, 24.0, 19.0, 9.0, 16.0, 12.0, 2.0, 8.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.453369140625, -8.15673828125, -7.860107421875, -7.5634765625, -7.266845703125, -6.97021484375, -6.673583984375, -6.376953125, -6.080322265625, -5.78369140625, -5.487060546875, -5.1904296875, -4.893798828125, -4.59716796875, -4.300537109375, -4.00390625, -3.707275390625, -3.41064453125, -3.114013671875, -2.8173828125, -2.520751953125, -2.22412109375, -1.927490234375, -1.630859375, -1.334228515625, -1.03759765625, -0.740966796875, -0.4443359375, -0.147705078125, 0.14892578125, 0.445556640625, 0.7421875, 1.038818359375, 1.33544921875, 1.632080078125, 1.9287109375, 2.225341796875, 2.52197265625, 2.818603515625, 3.115234375, 3.411865234375, 3.70849609375, 4.005126953125, 4.3017578125, 4.598388671875, 4.89501953125, 5.191650390625, 5.48828125, 5.784912109375, 6.08154296875, 6.378173828125, 6.6748046875, 6.971435546875, 7.26806640625, 7.564697265625, 7.861328125, 8.157958984375, 8.45458984375, 8.751220703125, 9.0478515625, 9.344482421875, 9.64111328125, 9.937744140625, 10.234375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 6.0, 9.0, 11.0, 12.0, 19.0, 28.0, 41.0, 45.0, 64.0, 133.0, 221.0, 258.0, 389.0, 493.0, 552.0, 527.0, 410.0, 238.0, 177.0, 121.0, 93.0, 66.0, 49.0, 23.0, 33.0, 17.0, 13.0, 10.0, 6.0, 5.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.15234375, -6.86016845703125, -6.5679931640625, -6.27581787109375, -5.983642578125, -5.69146728515625, -5.3992919921875, -5.10711669921875, -4.81494140625, -4.52276611328125, -4.2305908203125, -3.93841552734375, -3.646240234375, -3.35406494140625, -3.0618896484375, -2.76971435546875, -2.4775390625, -2.18536376953125, -1.8931884765625, -1.60101318359375, -1.308837890625, -1.01666259765625, -0.7244873046875, -0.43231201171875, -0.14013671875, 0.15203857421875, 0.4442138671875, 0.73638916015625, 1.028564453125, 1.32073974609375, 1.6129150390625, 1.90509033203125, 2.197265625, 2.48944091796875, 2.7816162109375, 3.07379150390625, 3.365966796875, 3.65814208984375, 3.9503173828125, 4.24249267578125, 4.53466796875, 4.82684326171875, 5.1190185546875, 5.41119384765625, 5.703369140625, 5.99554443359375, 6.2877197265625, 6.57989501953125, 6.8720703125, 7.16424560546875, 7.4564208984375, 7.74859619140625, 8.040771484375, 8.33294677734375, 8.6251220703125, 8.91729736328125, 9.20947265625, 9.50164794921875, 9.7938232421875, 10.08599853515625, 10.378173828125, 10.67034912109375, 10.9625244140625, 11.25469970703125, 11.546875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 4.0, 10.0, 11.0, 15.0, 22.0, 20.0, 32.0, 51.0, 89.0, 120.0, 160.0, 263.0, 347.0, 628.0, 8948.0, 4134414.0, 47178.0, 758.0, 363.0, 308.0, 187.0, 122.0, 58.0, 57.0, 32.0, 23.0, 17.0, 14.0, 9.0, 12.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.03125, -52.6669921875, -51.302734375, -49.9384765625, -48.57421875, -47.2099609375, -45.845703125, -44.4814453125, -43.1171875, -41.7529296875, -40.388671875, -39.0244140625, -37.66015625, -36.2958984375, -34.931640625, -33.5673828125, -32.203125, -30.8388671875, -29.474609375, -28.1103515625, -26.74609375, -25.3818359375, -24.017578125, -22.6533203125, -21.2890625, -19.9248046875, -18.560546875, -17.1962890625, -15.83203125, -14.4677734375, -13.103515625, -11.7392578125, -10.375, -9.0107421875, -7.646484375, -6.2822265625, -4.91796875, -3.5537109375, -2.189453125, -0.8251953125, 0.5390625, 1.9033203125, 3.267578125, 4.6318359375, 5.99609375, 7.3603515625, 8.724609375, 10.0888671875, 11.453125, 12.8173828125, 14.181640625, 15.5458984375, 16.91015625, 18.2744140625, 19.638671875, 21.0029296875, 22.3671875, 23.7314453125, 25.095703125, 26.4599609375, 27.82421875, 29.1884765625, 30.552734375, 31.9169921875, 33.28125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 20.0, 575.0, 409.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.62611389160156, -94.29499816894531, -86.96387481689453, -79.63275909423828, -72.3016357421875, -64.97052001953125, -57.639404296875, -50.308284759521484, -42.97716522216797, -35.64604568481445, -28.31492805480957, -20.983810424804688, -13.652690887451172, -6.321571350097656, 1.0095443725585938, 8.34066390991211, 15.671783447265625, 23.00290298461914, 30.334020614624023, 37.665138244628906, 44.99625778198242, 52.32737731933594, 59.65849304199219, 66.98960876464844, 74.32073211669922, 81.65184783935547, 88.98297119140625, 96.3140869140625, 103.64520263671875, 110.97632598876953, 118.30744171142578, 125.63856506347656, 132.96969604492188, 140.30081176757812, 147.63192749023438, 154.96304321289062, 162.29417419433594, 169.6252899169922, 176.95640563964844, 184.2875213623047, 191.61865234375, 198.94976806640625, 206.2808837890625, 213.61199951171875, 220.94313049316406, 228.2742462158203, 235.60536193847656, 242.9364776611328, 250.26759338378906, 257.5987243652344, 264.9298400878906, 272.2609558105469, 279.5920715332031, 286.9231872558594, 294.2543029785156, 301.5854187011719, 308.9165344238281, 316.2476501464844, 323.5787658691406, 330.9098815917969, 338.2409973144531, 345.5721435546875, 352.90325927734375, 360.234375, 367.56549072265625]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 9.0, 5.0, 9.0, 19.0, 11.0, 26.0, 20.0, 34.0, 32.0, 46.0, 41.0, 46.0, 46.0, 67.0, 58.0, 49.0, 43.0, 55.0, 43.0, 49.0, 35.0, 43.0, 41.0, 26.0, 31.0, 24.0, 23.0, 14.0, 17.0, 9.0, 10.0, 10.0, 4.0, 6.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-36.49530792236328, -35.49312210083008, -34.49094009399414, -33.48875427246094, -32.486568450927734, -31.484384536743164, -30.482200622558594, -29.48001480102539, -28.477828979492188, -27.475645065307617, -26.473459243774414, -25.471275329589844, -24.46908950805664, -23.46690559387207, -22.4647216796875, -21.462535858154297, -20.460351943969727, -19.458168029785156, -18.455982208251953, -17.453798294067383, -16.45161247253418, -15.44942855834961, -14.447243690490723, -13.445058822631836, -12.44287395477295, -11.440689086914062, -10.438504219055176, -9.436319351196289, -8.434135437011719, -7.431950092315674, -6.429765701293945, -5.427580833435059, -4.425397872924805, -3.423213005065918, -2.4210283756256104, -1.4188437461853027, -0.416658878326416, 0.5855259895324707, 1.5877103805541992, 2.589895248413086, 3.5920801162719727, 4.594264984130859, 5.596449851989746, 6.598634243011475, 7.600819110870361, 8.603004455566406, 9.605188369750977, 10.607373237609863, 11.60955810546875, 12.611742973327637, 13.613927841186523, 14.616111755371094, 15.618297576904297, 16.620481491088867, 17.622665405273438, 18.62485122680664, 19.627037048339844, 20.629220962524414, 21.631406784057617, 22.633590698242188, 23.63577651977539, 24.63796043395996, 25.64014434814453, 26.642330169677734, 27.644514083862305]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 4.0, 6.0, 7.0, 8.0, 10.0, 11.0, 19.0, 18.0, 24.0, 26.0, 21.0, 30.0, 28.0, 29.0, 36.0, 27.0, 46.0, 27.0, 39.0, 47.0, 26.0, 49.0, 49.0, 29.0, 37.0, 29.0, 38.0, 32.0, 33.0, 32.0, 17.0, 18.0, 21.0, 15.0, 18.0, 14.0, 14.0, 16.0, 6.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.37890625, -3.265045166015625, -3.15118408203125, -3.037322998046875, -2.9234619140625, -2.809600830078125, -2.69573974609375, -2.581878662109375, -2.468017578125, -2.354156494140625, -2.24029541015625, -2.126434326171875, -2.0125732421875, -1.898712158203125, -1.78485107421875, -1.670989990234375, -1.55712890625, -1.443267822265625, -1.32940673828125, -1.215545654296875, -1.1016845703125, -0.987823486328125, -0.87396240234375, -0.760101318359375, -0.646240234375, -0.532379150390625, -0.41851806640625, -0.304656982421875, -0.1907958984375, -0.076934814453125, 0.03692626953125, 0.150787353515625, 0.2646484375, 0.378509521484375, 0.49237060546875, 0.606231689453125, 0.7200927734375, 0.833953857421875, 0.94781494140625, 1.061676025390625, 1.175537109375, 1.289398193359375, 1.40325927734375, 1.517120361328125, 1.6309814453125, 1.744842529296875, 1.85870361328125, 1.972564697265625, 2.08642578125, 2.200286865234375, 2.31414794921875, 2.428009033203125, 2.5418701171875, 2.655731201171875, 2.76959228515625, 2.883453369140625, 2.997314453125, 3.111175537109375, 3.22503662109375, 3.338897705078125, 3.4527587890625, 3.566619873046875, 3.68048095703125, 3.794342041015625, 3.908203125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 2.0, 5.0, 11.0, 17.0, 31.0, 31.0, 48.0, 83.0, 109.0, 162.0, 276.0, 369.0, 533.0, 753.0, 1158.0, 1675.0, 2504.0, 3786.0, 5457.0, 8135.0, 12154.0, 18980.0, 29231.0, 47959.0, 81060.0, 155117.0, 296223.0, 161728.0, 84145.0, 49041.0, 29948.0, 19412.0, 12772.0, 8241.0, 5558.0, 3798.0, 2645.0, 1752.0, 1146.0, 810.0, 550.0, 372.0, 243.0, 195.0, 110.0, 66.0, 44.0, 39.0, 32.0, 17.0, 12.0, 6.0, 9.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.58642578125, -0.5665664672851562, -0.5467071533203125, -0.5268478393554688, -0.506988525390625, -0.48712921142578125, -0.4672698974609375, -0.44741058349609375, -0.42755126953125, -0.40769195556640625, -0.3878326416015625, -0.36797332763671875, -0.348114013671875, -0.32825469970703125, -0.3083953857421875, -0.28853607177734375, -0.2686767578125, -0.24881744384765625, -0.2289581298828125, -0.20909881591796875, -0.189239501953125, -0.16938018798828125, -0.1495208740234375, -0.12966156005859375, -0.10980224609375, -0.08994293212890625, -0.0700836181640625, -0.05022430419921875, -0.030364990234375, -0.01050567626953125, 0.0093536376953125, 0.02921295166015625, 0.049072265625, 0.06893157958984375, 0.0887908935546875, 0.10865020751953125, 0.128509521484375, 0.14836883544921875, 0.1682281494140625, 0.18808746337890625, 0.20794677734375, 0.22780609130859375, 0.2476654052734375, 0.26752471923828125, 0.287384033203125, 0.30724334716796875, 0.3271026611328125, 0.34696197509765625, 0.3668212890625, 0.38668060302734375, 0.4065399169921875, 0.42639923095703125, 0.446258544921875, 0.46611785888671875, 0.4859771728515625, 0.5058364868164062, 0.52569580078125, 0.5455551147460938, 0.5654144287109375, 0.5852737426757812, 0.605133056640625, 0.6249923706054688, 0.6448516845703125, 0.6647109985351562, 0.6845703125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 6.0, 9.0, 7.0, 6.0, 12.0, 20.0, 15.0, 6.0, 16.0, 21.0, 16.0, 23.0, 24.0, 37.0, 22.0, 23.0, 32.0, 31.0, 41.0, 33.0, 41.0, 43.0, 1066.0, 38.0, 34.0, 37.0, 32.0, 36.0, 29.0, 21.0, 24.0, 26.0, 24.0, 16.0, 23.0, 21.0, 20.0, 18.0, 15.0, 9.0, 11.0, 8.0, 7.0, 9.0, 8.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.1015625, -2.034393310546875, -1.96722412109375, -1.900054931640625, -1.8328857421875, -1.765716552734375, -1.69854736328125, -1.631378173828125, -1.564208984375, -1.497039794921875, -1.42987060546875, -1.362701416015625, -1.2955322265625, -1.228363037109375, -1.16119384765625, -1.094024658203125, -1.02685546875, -0.959686279296875, -0.89251708984375, -0.825347900390625, -0.7581787109375, -0.691009521484375, -0.62384033203125, -0.556671142578125, -0.489501953125, -0.422332763671875, -0.35516357421875, -0.287994384765625, -0.2208251953125, -0.153656005859375, -0.08648681640625, -0.019317626953125, 0.0478515625, 0.115020751953125, 0.18218994140625, 0.249359130859375, 0.3165283203125, 0.383697509765625, 0.45086669921875, 0.518035888671875, 0.585205078125, 0.652374267578125, 0.71954345703125, 0.786712646484375, 0.8538818359375, 0.921051025390625, 0.98822021484375, 1.055389404296875, 1.12255859375, 1.189727783203125, 1.25689697265625, 1.324066162109375, 1.3912353515625, 1.458404541015625, 1.52557373046875, 1.592742919921875, 1.659912109375, 1.727081298828125, 1.79425048828125, 1.861419677734375, 1.9285888671875, 1.995758056640625, 2.06292724609375, 2.130096435546875, 2.197265625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 6.0, 5.0, 15.0, 28.0, 28.0, 48.0, 72.0, 96.0, 136.0, 164.0, 274.0, 380.0, 523.0, 765.0, 1030.0, 1468.0, 1982.0, 2885.0, 3905.0, 5385.0, 7296.0, 9876.0, 13859.0, 19375.0, 27337.0, 39882.0, 60306.0, 101560.0, 193780.0, 1272268.0, 116650.0, 67647.0, 43591.0, 29465.0, 20959.0, 15085.0, 10752.0, 7885.0, 5673.0, 4097.0, 3000.0, 2170.0, 1589.0, 1124.0, 805.0, 582.0, 425.0, 284.0, 205.0, 158.0, 90.0, 57.0, 33.0, 31.0, 21.0, 10.0, 7.0, 3.0, 7.0, 1.0, 3.0], "bins": [-0.47607421875, -0.46125030517578125, -0.4464263916015625, -0.43160247802734375, -0.416778564453125, -0.40195465087890625, -0.3871307373046875, -0.37230682373046875, -0.35748291015625, -0.34265899658203125, -0.3278350830078125, -0.31301116943359375, -0.298187255859375, -0.28336334228515625, -0.2685394287109375, -0.25371551513671875, -0.2388916015625, -0.22406768798828125, -0.2092437744140625, -0.19441986083984375, -0.179595947265625, -0.16477203369140625, -0.1499481201171875, -0.13512420654296875, -0.12030029296875, -0.10547637939453125, -0.0906524658203125, -0.07582855224609375, -0.061004638671875, -0.04618072509765625, -0.0313568115234375, -0.01653289794921875, -0.001708984375, 0.01311492919921875, 0.0279388427734375, 0.04276275634765625, 0.057586669921875, 0.07241058349609375, 0.0872344970703125, 0.10205841064453125, 0.11688232421875, 0.13170623779296875, 0.1465301513671875, 0.16135406494140625, 0.176177978515625, 0.19100189208984375, 0.2058258056640625, 0.22064971923828125, 0.2354736328125, 0.25029754638671875, 0.2651214599609375, 0.27994537353515625, 0.294769287109375, 0.30959320068359375, 0.3244171142578125, 0.33924102783203125, 0.35406494140625, 0.36888885498046875, 0.3837127685546875, 0.39853668212890625, 0.413360595703125, 0.42818450927734375, 0.4430084228515625, 0.45783233642578125, 0.47265625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 6.0, 7.0, 4.0, 8.0, 8.0, 16.0, 13.0, 26.0, 27.0, 26.0, 29.0, 41.0, 43.0, 42.0, 39.0, 47.0, 51.0, 51.0, 55.0, 53.0, 42.0, 57.0, 46.0, 28.0, 32.0, 30.0, 22.0, 26.0, 22.0, 21.0, 17.0, 9.0, 12.0, 7.0, 6.0, 7.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.00011676549911499023, -0.0001131836324930191, -0.00010960176587104797, -0.00010601989924907684, -0.00010243803262710571, -9.885616600513458e-05, -9.527429938316345e-05, -9.169243276119232e-05, -8.811056613922119e-05, -8.452869951725006e-05, -8.094683289527893e-05, -7.73649662733078e-05, -7.378309965133667e-05, -7.020123302936554e-05, -6.661936640739441e-05, -6.303749978542328e-05, -5.945563316345215e-05, -5.587376654148102e-05, -5.229189991950989e-05, -4.871003329753876e-05, -4.512816667556763e-05, -4.1546300053596497e-05, -3.7964433431625366e-05, -3.4382566809654236e-05, -3.0800700187683105e-05, -2.7218833565711975e-05, -2.3636966943740845e-05, -2.0055100321769714e-05, -1.6473233699798584e-05, -1.2891367077827454e-05, -9.309500455856323e-06, -5.727633833885193e-06, -2.1457672119140625e-06, 1.4360994100570679e-06, 5.017966032028198e-06, 8.599832653999329e-06, 1.2181699275970459e-05, 1.576356589794159e-05, 1.934543251991272e-05, 2.292729914188385e-05, 2.650916576385498e-05, 3.009103238582611e-05, 3.367289900779724e-05, 3.725476562976837e-05, 4.08366322517395e-05, 4.441849887371063e-05, 4.800036549568176e-05, 5.158223211765289e-05, 5.5164098739624023e-05, 5.8745965361595154e-05, 6.232783198356628e-05, 6.590969860553741e-05, 6.949156522750854e-05, 7.307343184947968e-05, 7.66552984714508e-05, 8.023716509342194e-05, 8.381903171539307e-05, 8.74008983373642e-05, 9.098276495933533e-05, 9.456463158130646e-05, 9.814649820327759e-05, 0.00010172836482524872, 0.00010531023144721985, 0.00010889209806919098, 0.00011247396469116211]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 4.0, 4.0, 2.0, 4.0, 7.0, 7.0, 14.0, 17.0, 13.0, 26.0, 29.0, 31.0, 45.0, 71.0, 77.0, 103.0, 150.0, 325.0, 742.0, 12242.0, 1026697.0, 6245.0, 711.0, 318.0, 150.0, 120.0, 89.0, 71.0, 57.0, 47.0, 33.0, 30.0, 12.0, 16.0, 10.0, 10.0, 6.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0026607513427734375, -0.0025761425495147705, -0.0024915337562561035, -0.0024069249629974365, -0.0023223161697387695, -0.0022377073764801025, -0.0021530985832214355, -0.0020684897899627686, -0.0019838809967041016, -0.0018992722034454346, -0.0018146634101867676, -0.0017300546169281006, -0.0016454458236694336, -0.0015608370304107666, -0.0014762282371520996, -0.0013916194438934326, -0.0013070106506347656, -0.0012224018573760986, -0.0011377930641174316, -0.0010531842708587646, -0.0009685754776000977, -0.0008839666843414307, -0.0007993578910827637, -0.0007147490978240967, -0.0006301403045654297, -0.0005455315113067627, -0.0004609227180480957, -0.0003763139247894287, -0.0002917051315307617, -0.00020709633827209473, -0.00012248754501342773, -3.787875175476074e-05, 4.673004150390625e-05, 0.00013133883476257324, 0.00021594762802124023, 0.0003005564212799072, 0.0003851652145385742, 0.0004697740077972412, 0.0005543828010559082, 0.0006389915943145752, 0.0007236003875732422, 0.0008082091808319092, 0.0008928179740905762, 0.0009774267673492432, 0.0010620355606079102, 0.0011466443538665771, 0.0012312531471252441, 0.0013158619403839111, 0.0014004707336425781, 0.0014850795269012451, 0.0015696883201599121, 0.001654297113418579, 0.001738905906677246, 0.001823514699935913, 0.00190812349319458, 0.001992732286453247, 0.002077341079711914, 0.002161949872970581, 0.002246558666229248, 0.002331167459487915, 0.002415776252746582, 0.002500385046005249, 0.002584993839263916, 0.002669602632522583, 0.00275421142578125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 30.0, 144.0, 372.0, 365.0, 93.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016670180775690824, -0.00015681717195548117, -0.00014693252160213888, -0.0001370478858007118, -0.00012716324999928474, -0.00011727860692190006, -0.00010739396384451538, -9.750932804308832e-05, -8.762468496570364e-05, -7.774004188831896e-05, -6.785540608689189e-05, -5.797076300950721e-05, -4.8086123570101336e-05, -3.820148413069546e-05, -2.8316841053310782e-05, -1.8432205251883715e-05, -8.547562174499035e-06, 1.3370781744015403e-06, 1.1221718523302115e-05, 2.1106359781697392e-05, 3.0990999221103266e-05, 4.087563866050914e-05, 5.076028173789382e-05, 6.0644917539320886e-05, 7.052956061670557e-05, 8.041420369409025e-05, 9.029883949551731e-05, 0.000100183482572902, 0.00011006812565028667, 0.00011995276145171374, 0.0001298373972531408, 0.0001397220476064831, 0.00014960666885599494, 0.000159491304657422, 0.0001693759550107643, 0.00017926059081219137, 0.00018914522661361843, 0.0001990298624150455, 0.0002089145127683878, 0.00021879914856981486, 0.00022868378437124193, 0.000238568420172669, 0.00024845305597409606, 0.00025833770632743835, 0.00026822235668078065, 0.0002781069779302925, 0.0002879916282836348, 0.0002978762495331466, 0.0003077608998864889, 0.0003176455502398312, 0.00032753017148934305, 0.00033741482184268534, 0.00034729947219602764, 0.0003571840934455395, 0.00036706874379888177, 0.00037695339415222406, 0.00038683804450556636, 0.00039672269485890865, 0.0004066073161084205, 0.0004164919664617628, 0.0004263766168151051, 0.0004362612380646169, 0.0004461458884179592, 0.0004560305387713015, 0.00046591516002081335]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 5.0, 5.0, 9.0, 6.0, 10.0, 9.0, 18.0, 17.0, 19.0, 20.0, 20.0, 30.0, 24.0, 31.0, 26.0, 22.0, 34.0, 40.0, 36.0, 48.0, 30.0, 48.0, 30.0, 33.0, 37.0, 36.0, 34.0, 37.0, 40.0, 31.0, 31.0, 22.0, 24.0, 26.0, 18.0, 12.0, 15.0, 15.0, 6.0, 5.0, 12.0, 6.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0], "bins": [-6.645917892456055e-05, -6.452761590480804e-05, -6.259605288505554e-05, -6.066448986530304e-05, -5.873292684555054e-05, -5.6801363825798035e-05, -5.486980080604553e-05, -5.293823778629303e-05, -5.100667476654053e-05, -4.9075111746788025e-05, -4.714354872703552e-05, -4.521198570728302e-05, -4.328042268753052e-05, -4.1348859667778015e-05, -3.941729664802551e-05, -3.748573362827301e-05, -3.555417060852051e-05, -3.3622607588768005e-05, -3.16910445690155e-05, -2.9759481549263e-05, -2.7827918529510498e-05, -2.5896355509757996e-05, -2.3964792490005493e-05, -2.203322947025299e-05, -2.0101666450500488e-05, -1.8170103430747986e-05, -1.6238540410995483e-05, -1.4306977391242981e-05, -1.2375414371490479e-05, -1.0443851351737976e-05, -8.512288331985474e-06, -6.580725312232971e-06, -4.649162292480469e-06, -2.7175992727279663e-06, -7.860362529754639e-07, 1.1455267667770386e-06, 3.077089786529541e-06, 5.0086528062820435e-06, 6.940215826034546e-06, 8.871778845787048e-06, 1.080334186553955e-05, 1.2734904885292053e-05, 1.4666467905044556e-05, 1.6598030924797058e-05, 1.852959394454956e-05, 2.0461156964302063e-05, 2.2392719984054565e-05, 2.4324283003807068e-05, 2.625584602355957e-05, 2.8187409043312073e-05, 3.0118972063064575e-05, 3.205053508281708e-05, 3.398209810256958e-05, 3.591366112232208e-05, 3.7845224142074585e-05, 3.977678716182709e-05, 4.170835018157959e-05, 4.363991320133209e-05, 4.5571476221084595e-05, 4.75030392408371e-05, 4.94346022605896e-05, 5.13661652803421e-05, 5.3297728300094604e-05, 5.522929131984711e-05, 5.716085433959961e-05]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 4.0, 6.0, 7.0, 8.0, 10.0, 11.0, 19.0, 18.0, 24.0, 26.0, 21.0, 30.0, 28.0, 29.0, 36.0, 27.0, 46.0, 27.0, 39.0, 47.0, 26.0, 49.0, 49.0, 29.0, 37.0, 29.0, 38.0, 32.0, 33.0, 32.0, 17.0, 18.0, 21.0, 15.0, 18.0, 14.0, 14.0, 16.0, 6.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.37890625, -3.265045166015625, -3.15118408203125, -3.037322998046875, -2.9234619140625, -2.809600830078125, -2.69573974609375, -2.581878662109375, -2.468017578125, -2.354156494140625, -2.24029541015625, -2.126434326171875, -2.0125732421875, -1.898712158203125, -1.78485107421875, -1.670989990234375, -1.55712890625, -1.443267822265625, -1.32940673828125, -1.215545654296875, -1.1016845703125, -0.987823486328125, -0.87396240234375, -0.760101318359375, -0.646240234375, -0.532379150390625, -0.41851806640625, -0.304656982421875, -0.1907958984375, -0.076934814453125, 0.03692626953125, 0.150787353515625, 0.2646484375, 0.378509521484375, 0.49237060546875, 0.606231689453125, 0.7200927734375, 0.833953857421875, 0.94781494140625, 1.061676025390625, 1.175537109375, 1.289398193359375, 1.40325927734375, 1.517120361328125, 1.6309814453125, 1.744842529296875, 1.85870361328125, 1.972564697265625, 2.08642578125, 2.200286865234375, 2.31414794921875, 2.428009033203125, 2.5418701171875, 2.655731201171875, 2.76959228515625, 2.883453369140625, 2.997314453125, 3.111175537109375, 3.22503662109375, 3.338897705078125, 3.4527587890625, 3.566619873046875, 3.68048095703125, 3.794342041015625, 3.908203125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 5.0, 1.0, 6.0, 5.0, 8.0, 12.0, 8.0, 20.0, 12.0, 19.0, 39.0, 52.0, 100.0, 133.0, 274.0, 571.0, 1250.0, 2726.0, 5896.0, 13356.0, 29905.0, 75337.0, 222431.0, 411629.0, 177090.0, 61705.0, 25081.0, 11375.0, 5113.0, 2294.0, 1043.0, 496.0, 231.0, 123.0, 54.0, 39.0, 34.0, 12.0, 24.0, 9.0, 8.0, 9.0, 4.0, 8.0, 5.0, 4.0, 6.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.7421875, -3.61907958984375, -3.4959716796875, -3.37286376953125, -3.249755859375, -3.12664794921875, -3.0035400390625, -2.88043212890625, -2.75732421875, -2.63421630859375, -2.5111083984375, -2.38800048828125, -2.264892578125, -2.14178466796875, -2.0186767578125, -1.89556884765625, -1.7724609375, -1.64935302734375, -1.5262451171875, -1.40313720703125, -1.280029296875, -1.15692138671875, -1.0338134765625, -0.91070556640625, -0.78759765625, -0.66448974609375, -0.5413818359375, -0.41827392578125, -0.295166015625, -0.17205810546875, -0.0489501953125, 0.07415771484375, 0.197265625, 0.32037353515625, 0.4434814453125, 0.56658935546875, 0.689697265625, 0.81280517578125, 0.9359130859375, 1.05902099609375, 1.18212890625, 1.30523681640625, 1.4283447265625, 1.55145263671875, 1.674560546875, 1.79766845703125, 1.9207763671875, 2.04388427734375, 2.1669921875, 2.29010009765625, 2.4132080078125, 2.53631591796875, 2.659423828125, 2.78253173828125, 2.9056396484375, 3.02874755859375, 3.15185546875, 3.27496337890625, 3.3980712890625, 3.52117919921875, 3.644287109375, 3.76739501953125, 3.8905029296875, 4.01361083984375, 4.13671875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 7.0, 3.0, 8.0, 11.0, 9.0, 10.0, 16.0, 15.0, 16.0, 22.0, 23.0, 32.0, 40.0, 31.0, 37.0, 37.0, 63.0, 101.0, 251.0, 1590.0, 243.0, 95.0, 51.0, 51.0, 42.0, 36.0, 36.0, 33.0, 29.0, 24.0, 22.0, 18.0, 15.0, 10.0, 10.0, 4.0, 2.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-18.015625, -17.521728515625, -17.02783203125, -16.533935546875, -16.0400390625, -15.546142578125, -15.05224609375, -14.558349609375, -14.064453125, -13.570556640625, -13.07666015625, -12.582763671875, -12.0888671875, -11.594970703125, -11.10107421875, -10.607177734375, -10.11328125, -9.619384765625, -9.12548828125, -8.631591796875, -8.1376953125, -7.643798828125, -7.14990234375, -6.656005859375, -6.162109375, -5.668212890625, -5.17431640625, -4.680419921875, -4.1865234375, -3.692626953125, -3.19873046875, -2.704833984375, -2.2109375, -1.717041015625, -1.22314453125, -0.729248046875, -0.2353515625, 0.258544921875, 0.75244140625, 1.246337890625, 1.740234375, 2.234130859375, 2.72802734375, 3.221923828125, 3.7158203125, 4.209716796875, 4.70361328125, 5.197509765625, 5.69140625, 6.185302734375, 6.67919921875, 7.173095703125, 7.6669921875, 8.160888671875, 8.65478515625, 9.148681640625, 9.642578125, 10.136474609375, 10.63037109375, 11.124267578125, 11.6181640625, 12.112060546875, 12.60595703125, 13.099853515625, 13.59375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 12.0, 6.0, 7.0, 17.0, 26.0, 22.0, 33.0, 49.0, 58.0, 73.0, 94.0, 141.0, 170.0, 259.0, 468.0, 1238.0, 119226.0, 3017997.0, 4016.0, 618.0, 327.0, 242.0, 146.0, 99.0, 69.0, 54.0, 48.0, 30.0, 26.0, 28.0, 19.0, 19.0, 9.0, 13.0, 8.0, 2.0, 1.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-38.65625, -37.41796875, -36.1796875, -34.94140625, -33.703125, -32.46484375, -31.2265625, -29.98828125, -28.75, -27.51171875, -26.2734375, -25.03515625, -23.796875, -22.55859375, -21.3203125, -20.08203125, -18.84375, -17.60546875, -16.3671875, -15.12890625, -13.890625, -12.65234375, -11.4140625, -10.17578125, -8.9375, -7.69921875, -6.4609375, -5.22265625, -3.984375, -2.74609375, -1.5078125, -0.26953125, 0.96875, 2.20703125, 3.4453125, 4.68359375, 5.921875, 7.16015625, 8.3984375, 9.63671875, 10.875, 12.11328125, 13.3515625, 14.58984375, 15.828125, 17.06640625, 18.3046875, 19.54296875, 20.78125, 22.01953125, 23.2578125, 24.49609375, 25.734375, 26.97265625, 28.2109375, 29.44921875, 30.6875, 31.92578125, 33.1640625, 34.40234375, 35.640625, 36.87890625, 38.1171875, 39.35546875, 40.59375]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 207.0, 796.0, 14.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.495949745178223, -5.851185321807861, -1.2064208984375, 3.4383440017700195, 8.083107948303223, 12.727871894836426, 17.372638702392578, 22.01740264892578, 26.662166595458984, 31.306930541992188, 35.95169448852539, 40.596458435058594, 45.24122619628906, 49.885986328125, 54.53075408935547, 59.17551803588867, 63.820281982421875, 68.46504974365234, 73.10980987548828, 77.75457763671875, 82.39933776855469, 87.04410552978516, 91.68887329101562, 96.33363342285156, 100.9783935546875, 105.62316131591797, 110.2679214477539, 114.91268920898438, 119.55744934082031, 124.20221710205078, 128.84698486328125, 133.4917449951172, 138.1365203857422, 142.78128051757812, 147.42605590820312, 152.07081604003906, 156.715576171875, 161.36033630371094, 166.00511169433594, 170.64987182617188, 175.2946319580078, 179.93939208984375, 184.58416748046875, 189.2289276123047, 193.87368774414062, 198.51844787597656, 203.16322326660156, 207.8079833984375, 212.4527587890625, 217.09751892089844, 221.74229431152344, 226.38705444335938, 231.0318145751953, 235.67657470703125, 240.32135009765625, 244.9661102294922, 249.61087036132812, 254.25563049316406, 258.900390625, 263.545166015625, 268.18994140625, 272.8346862792969, 277.4794616699219, 282.12420654296875, 286.76898193359375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 4.0, 19.0, 14.0, 11.0, 16.0, 20.0, 22.0, 29.0, 26.0, 34.0, 30.0, 29.0, 34.0, 38.0, 44.0, 55.0, 37.0, 36.0, 43.0, 50.0, 35.0, 45.0, 40.0, 38.0, 36.0, 31.0, 19.0, 26.0, 31.0, 12.0, 16.0, 13.0, 16.0, 12.0, 5.0, 5.0, 6.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.09455490112305, -34.94756317138672, -33.800575256347656, -32.65358352661133, -31.506591796875, -30.359601974487305, -29.21261215209961, -28.06562042236328, -26.918630599975586, -25.77164077758789, -24.624649047851562, -23.477659225463867, -22.330669403076172, -21.183677673339844, -20.03668785095215, -18.889698028564453, -17.742706298828125, -16.59571647644043, -15.448724746704102, -14.301734924316406, -13.154744148254395, -12.007753372192383, -10.860763549804688, -9.713772773742676, -8.566781997680664, -7.419791221618652, -6.272800922393799, -5.125810623168945, -3.9788198471069336, -2.831829071044922, -1.6848387718200684, -0.5378484725952148, 0.6091384887695312, 1.7561290264129639, 2.9031195640563965, 4.05010986328125, 5.197100639343262, 6.344091415405273, 7.491081714630127, 8.63807201385498, 9.785062789916992, 10.932053565979004, 12.079044342041016, 13.226034164428711, 14.373024940490723, 15.520015716552734, 16.66700553894043, 17.813995361328125, 18.960987091064453, 20.10797691345215, 21.254968643188477, 22.401958465576172, 23.5489501953125, 24.695940017700195, 25.84292984008789, 26.98992156982422, 28.136911392211914, 29.28390121459961, 30.430892944335938, 31.577882766723633, 32.72487258911133, 33.871864318847656, 35.018856048583984, 36.16584396362305, 37.312835693359375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 5.0, 2.0, 11.0, 7.0, 8.0, 12.0, 11.0, 20.0, 26.0, 29.0, 30.0, 18.0, 25.0, 37.0, 40.0, 26.0, 36.0, 33.0, 41.0, 29.0, 49.0, 42.0, 45.0, 53.0, 28.0, 36.0, 36.0, 30.0, 27.0, 20.0, 31.0, 25.0, 19.0, 22.0, 19.0, 9.0, 6.0, 12.0, 19.0, 7.0, 2.0, 7.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-4.0078125, -3.8782958984375, -3.748779296875, -3.6192626953125, -3.48974609375, -3.3602294921875, -3.230712890625, -3.1011962890625, -2.9716796875, -2.8421630859375, -2.712646484375, -2.5831298828125, -2.45361328125, -2.3240966796875, -2.194580078125, -2.0650634765625, -1.935546875, -1.8060302734375, -1.676513671875, -1.5469970703125, -1.41748046875, -1.2879638671875, -1.158447265625, -1.0289306640625, -0.8994140625, -0.7698974609375, -0.640380859375, -0.5108642578125, -0.38134765625, -0.2518310546875, -0.122314453125, 0.0072021484375, 0.13671875, 0.2662353515625, 0.395751953125, 0.5252685546875, 0.65478515625, 0.7843017578125, 0.913818359375, 1.0433349609375, 1.1728515625, 1.3023681640625, 1.431884765625, 1.5614013671875, 1.69091796875, 1.8204345703125, 1.949951171875, 2.0794677734375, 2.208984375, 2.3385009765625, 2.468017578125, 2.5975341796875, 2.72705078125, 2.8565673828125, 2.986083984375, 3.1156005859375, 3.2451171875, 3.3746337890625, 3.504150390625, 3.6336669921875, 3.76318359375, 3.8927001953125, 4.022216796875, 4.1517333984375, 4.28125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 4.0, 1.0, 3.0, 6.0, 7.0, 7.0, 12.0, 13.0, 15.0, 17.0, 24.0, 35.0, 39.0, 50.0, 67.0, 68.0, 105.0, 136.0, 288.0, 701.0, 2876.0, 53232.0, 1794337.0, 2254488.0, 82113.0, 3835.0, 835.0, 321.0, 163.0, 103.0, 74.0, 61.0, 56.0, 39.0, 28.0, 23.0, 19.0, 13.0, 16.0, 12.0, 19.0, 5.0, 6.0, 2.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0], "bins": [-13.078125, -12.6824951171875, -12.286865234375, -11.8912353515625, -11.49560546875, -11.0999755859375, -10.704345703125, -10.3087158203125, -9.9130859375, -9.5174560546875, -9.121826171875, -8.7261962890625, -8.33056640625, -7.9349365234375, -7.539306640625, -7.1436767578125, -6.748046875, -6.3524169921875, -5.956787109375, -5.5611572265625, -5.16552734375, -4.7698974609375, -4.374267578125, -3.9786376953125, -3.5830078125, -3.1873779296875, -2.791748046875, -2.3961181640625, -2.00048828125, -1.6048583984375, -1.209228515625, -0.8135986328125, -0.41796875, -0.0223388671875, 0.373291015625, 0.7689208984375, 1.16455078125, 1.5601806640625, 1.955810546875, 2.3514404296875, 2.7470703125, 3.1427001953125, 3.538330078125, 3.9339599609375, 4.32958984375, 4.7252197265625, 5.120849609375, 5.5164794921875, 5.912109375, 6.3077392578125, 6.703369140625, 7.0989990234375, 7.49462890625, 7.8902587890625, 8.285888671875, 8.6815185546875, 9.0771484375, 9.4727783203125, 9.868408203125, 10.2640380859375, 10.65966796875, 11.0552978515625, 11.450927734375, 11.8465576171875, 12.2421875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 8.0, 14.0, 6.0, 29.0, 30.0, 65.0, 86.0, 117.0, 224.0, 364.0, 488.0, 636.0, 648.0, 467.0, 320.0, 200.0, 118.0, 87.0, 49.0, 40.0, 25.0, 16.0, 11.0, 7.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-14.59375, -14.2535400390625, -13.913330078125, -13.5731201171875, -13.23291015625, -12.8927001953125, -12.552490234375, -12.2122802734375, -11.8720703125, -11.5318603515625, -11.191650390625, -10.8514404296875, -10.51123046875, -10.1710205078125, -9.830810546875, -9.4906005859375, -9.150390625, -8.8101806640625, -8.469970703125, -8.1297607421875, -7.78955078125, -7.4493408203125, -7.109130859375, -6.7689208984375, -6.4287109375, -6.0885009765625, -5.748291015625, -5.4080810546875, -5.06787109375, -4.7276611328125, -4.387451171875, -4.0472412109375, -3.70703125, -3.3668212890625, -3.026611328125, -2.6864013671875, -2.34619140625, -2.0059814453125, -1.665771484375, -1.3255615234375, -0.9853515625, -0.6451416015625, -0.304931640625, 0.0352783203125, 0.37548828125, 0.7156982421875, 1.055908203125, 1.3961181640625, 1.736328125, 2.0765380859375, 2.416748046875, 2.7569580078125, 3.09716796875, 3.4373779296875, 3.777587890625, 4.1177978515625, 4.4580078125, 4.7982177734375, 5.138427734375, 5.4786376953125, 5.81884765625, 6.1590576171875, 6.499267578125, 6.8394775390625, 7.1796875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 8.0, 4.0, 8.0, 13.0, 20.0, 42.0, 54.0, 76.0, 115.0, 152.0, 311.0, 433.0, 965.0, 170339.0, 4017374.0, 2785.0, 613.0, 384.0, 197.0, 132.0, 100.0, 61.0, 32.0, 16.0, 14.0, 16.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.25, -28.7548828125, -27.259765625, -25.7646484375, -24.26953125, -22.7744140625, -21.279296875, -19.7841796875, -18.2890625, -16.7939453125, -15.298828125, -13.8037109375, -12.30859375, -10.8134765625, -9.318359375, -7.8232421875, -6.328125, -4.8330078125, -3.337890625, -1.8427734375, -0.34765625, 1.1474609375, 2.642578125, 4.1376953125, 5.6328125, 7.1279296875, 8.623046875, 10.1181640625, 11.61328125, 13.1083984375, 14.603515625, 16.0986328125, 17.59375, 19.0888671875, 20.583984375, 22.0791015625, 23.57421875, 25.0693359375, 26.564453125, 28.0595703125, 29.5546875, 31.0498046875, 32.544921875, 34.0400390625, 35.53515625, 37.0302734375, 38.525390625, 40.0205078125, 41.515625, 43.0107421875, 44.505859375, 46.0009765625, 47.49609375, 48.9912109375, 50.486328125, 51.9814453125, 53.4765625, 54.9716796875, 56.466796875, 57.9619140625, 59.45703125, 60.9521484375, 62.447265625, 63.9423828125, 65.4375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 32.0, 303.0, 481.0, 182.0, 14.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.25506591796875, -140.28289794921875, -136.31072998046875, -132.33856201171875, -128.36639404296875, -124.39422607421875, -120.42206573486328, -116.44989776611328, -112.47772979736328, -108.50556182861328, -104.53339385986328, -100.56122589111328, -96.58906555175781, -92.61689758300781, -88.64472961425781, -84.67256164550781, -80.70039367675781, -76.72822570800781, -72.75605773925781, -68.78388977050781, -64.81172180175781, -60.83955764770508, -56.867393493652344, -52.895225524902344, -48.923057556152344, -44.950889587402344, -40.978721618652344, -37.00655746459961, -33.03438949584961, -29.06222152709961, -25.090055465698242, -21.117889404296875, -17.145729064941406, -13.173562049865723, -9.201395034790039, -5.2292280197143555, -1.2570610046386719, 2.715106964111328, 6.687273025512695, 10.659439086914062, 14.631607055664062, 18.603775024414062, 22.57594108581543, 26.548107147216797, 30.520275115966797, 34.4924430847168, 38.46460723876953, 42.43677520751953, 46.40894317626953, 50.38111114501953, 54.35327911376953, 58.325443267822266, 62.297611236572266, 66.269775390625, 70.241943359375, 74.214111328125, 78.186279296875, 82.158447265625, 86.130615234375, 90.102783203125, 94.074951171875, 98.047119140625, 102.01927947998047, 105.99144744873047, 109.96361541748047]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 7.0, 6.0, 15.0, 12.0, 18.0, 26.0, 25.0, 28.0, 34.0, 31.0, 37.0, 44.0, 48.0, 53.0, 53.0, 44.0, 53.0, 52.0, 45.0, 46.0, 46.0, 29.0, 33.0, 34.0, 31.0, 23.0, 26.0, 20.0, 14.0, 14.0, 12.0, 11.0, 4.0, 4.0, 6.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.145313262939453, -24.26028060913086, -23.375246047973633, -22.49021339416504, -21.605178833007812, -20.72014617919922, -19.835113525390625, -18.95008087158203, -18.065046310424805, -17.18001365661621, -16.294979095458984, -15.40994644165039, -14.52491283416748, -13.63987922668457, -12.754846572875977, -11.869812965393066, -10.984779357910156, -10.099745750427246, -9.214712142944336, -8.329679489135742, -7.444645881652832, -6.559612274169922, -5.67457914352417, -4.789546012878418, -3.904512405395508, -3.0194790363311768, -2.1344456672668457, -1.2494122982025146, -0.3643789291381836, 0.5206546783447266, 1.4056878089904785, 2.2907209396362305, 3.1757545471191406, 4.060788154602051, 4.945821285247803, 5.830854415893555, 6.715888023376465, 7.600921630859375, 8.485954284667969, 9.370987892150879, 10.256021499633789, 11.1410551071167, 12.02608871459961, 12.911121368408203, 13.796154975891113, 14.681188583374023, 15.566221237182617, 16.451255798339844, 17.336288452148438, 18.22132110595703, 19.106355667114258, 19.99138832092285, 20.876422882080078, 21.761455535888672, 22.646488189697266, 23.53152084350586, 24.416555404663086, 25.30158805847168, 26.186622619628906, 27.0716552734375, 27.956687927246094, 28.84172248840332, 29.726755142211914, 30.61178970336914, 31.496822357177734]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 1.0, 2.0, 6.0, 9.0, 5.0, 13.0, 9.0, 8.0, 14.0, 19.0, 27.0, 24.0, 27.0, 33.0, 17.0, 34.0, 34.0, 30.0, 37.0, 28.0, 43.0, 54.0, 27.0, 39.0, 39.0, 39.0, 37.0, 40.0, 26.0, 31.0, 21.0, 30.0, 23.0, 21.0, 21.0, 25.0, 12.0, 16.0, 21.0, 8.0, 15.0, 12.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.609375, -3.4932861328125, -3.377197265625, -3.2611083984375, -3.14501953125, -3.0289306640625, -2.912841796875, -2.7967529296875, -2.6806640625, -2.5645751953125, -2.448486328125, -2.3323974609375, -2.21630859375, -2.1002197265625, -1.984130859375, -1.8680419921875, -1.751953125, -1.6358642578125, -1.519775390625, -1.4036865234375, -1.28759765625, -1.1715087890625, -1.055419921875, -0.9393310546875, -0.8232421875, -0.7071533203125, -0.591064453125, -0.4749755859375, -0.35888671875, -0.2427978515625, -0.126708984375, -0.0106201171875, 0.10546875, 0.2215576171875, 0.337646484375, 0.4537353515625, 0.56982421875, 0.6859130859375, 0.802001953125, 0.9180908203125, 1.0341796875, 1.1502685546875, 1.266357421875, 1.3824462890625, 1.49853515625, 1.6146240234375, 1.730712890625, 1.8468017578125, 1.962890625, 2.0789794921875, 2.195068359375, 2.3111572265625, 2.42724609375, 2.5433349609375, 2.659423828125, 2.7755126953125, 2.8916015625, 3.0076904296875, 3.123779296875, 3.2398681640625, 3.35595703125, 3.4720458984375, 3.588134765625, 3.7042236328125, 3.8203125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 11.0, 13.0, 11.0, 8.0, 22.0, 42.0, 56.0, 96.0, 115.0, 200.0, 287.0, 440.0, 656.0, 1028.0, 1582.0, 2501.0, 3961.0, 6218.0, 9851.0, 15990.0, 25709.0, 42736.0, 75367.0, 145311.0, 302290.0, 189327.0, 92738.0, 51379.0, 30403.0, 18373.0, 11559.0, 7348.0, 4567.0, 2996.0, 1805.0, 1195.0, 778.0, 527.0, 370.0, 211.0, 148.0, 110.0, 64.0, 51.0, 30.0, 13.0, 16.0, 15.0, 10.0, 12.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.70166015625, -0.67950439453125, -0.6573486328125, -0.63519287109375, -0.613037109375, -0.59088134765625, -0.5687255859375, -0.54656982421875, -0.5244140625, -0.50225830078125, -0.4801025390625, -0.45794677734375, -0.435791015625, -0.41363525390625, -0.3914794921875, -0.36932373046875, -0.34716796875, -0.32501220703125, -0.3028564453125, -0.28070068359375, -0.258544921875, -0.23638916015625, -0.2142333984375, -0.19207763671875, -0.169921875, -0.14776611328125, -0.1256103515625, -0.10345458984375, -0.081298828125, -0.05914306640625, -0.0369873046875, -0.01483154296875, 0.00732421875, 0.02947998046875, 0.0516357421875, 0.07379150390625, 0.095947265625, 0.11810302734375, 0.1402587890625, 0.16241455078125, 0.1845703125, 0.20672607421875, 0.2288818359375, 0.25103759765625, 0.273193359375, 0.29534912109375, 0.3175048828125, 0.33966064453125, 0.36181640625, 0.38397216796875, 0.4061279296875, 0.42828369140625, 0.450439453125, 0.47259521484375, 0.4947509765625, 0.51690673828125, 0.5390625, 0.56121826171875, 0.5833740234375, 0.60552978515625, 0.627685546875, 0.64984130859375, 0.6719970703125, 0.69415283203125, 0.71630859375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 8.0, 10.0, 11.0, 11.0, 7.0, 14.0, 17.0, 16.0, 20.0, 24.0, 32.0, 27.0, 41.0, 34.0, 29.0, 31.0, 40.0, 45.0, 52.0, 1063.0, 42.0, 33.0, 54.0, 33.0, 24.0, 36.0, 40.0, 31.0, 32.0, 30.0, 29.0, 16.0, 13.0, 16.0, 12.0, 20.0, 12.0, 6.0, 3.0, 6.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.658203125, -2.574371337890625, -2.49053955078125, -2.406707763671875, -2.3228759765625, -2.239044189453125, -2.15521240234375, -2.071380615234375, -1.987548828125, -1.903717041015625, -1.81988525390625, -1.736053466796875, -1.6522216796875, -1.568389892578125, -1.48455810546875, -1.400726318359375, -1.31689453125, -1.233062744140625, -1.14923095703125, -1.065399169921875, -0.9815673828125, -0.897735595703125, -0.81390380859375, -0.730072021484375, -0.646240234375, -0.562408447265625, -0.47857666015625, -0.394744873046875, -0.3109130859375, -0.227081298828125, -0.14324951171875, -0.059417724609375, 0.0244140625, 0.108245849609375, 0.19207763671875, 0.275909423828125, 0.3597412109375, 0.443572998046875, 0.52740478515625, 0.611236572265625, 0.695068359375, 0.778900146484375, 0.86273193359375, 0.946563720703125, 1.0303955078125, 1.114227294921875, 1.19805908203125, 1.281890869140625, 1.36572265625, 1.449554443359375, 1.53338623046875, 1.617218017578125, 1.7010498046875, 1.784881591796875, 1.86871337890625, 1.952545166015625, 2.036376953125, 2.120208740234375, 2.20404052734375, 2.287872314453125, 2.3717041015625, 2.455535888671875, 2.53936767578125, 2.623199462890625, 2.70703125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 7.0, 8.0, 15.0, 19.0, 33.0, 38.0, 75.0, 81.0, 93.0, 125.0, 174.0, 228.0, 298.0, 480.0, 674.0, 931.0, 1338.0, 1886.0, 2751.0, 3921.0, 5811.0, 8560.0, 12294.0, 18036.0, 26877.0, 40322.0, 63808.0, 110094.0, 1283007.0, 224052.0, 107180.0, 61217.0, 39751.0, 26644.0, 17700.0, 12065.0, 8044.0, 5598.0, 3882.0, 2649.0, 1814.0, 1304.0, 939.0, 686.0, 502.0, 324.0, 241.0, 183.0, 100.0, 68.0, 61.0, 32.0, 33.0, 27.0, 23.0, 13.0, 14.0, 4.0, 5.0, 0.0, 4.0], "bins": [-0.587890625, -0.5695037841796875, -0.551116943359375, -0.5327301025390625, -0.51434326171875, -0.4959564208984375, -0.477569580078125, -0.4591827392578125, -0.4407958984375, -0.4224090576171875, -0.404022216796875, -0.3856353759765625, -0.36724853515625, -0.3488616943359375, -0.330474853515625, -0.3120880126953125, -0.293701171875, -0.2753143310546875, -0.256927490234375, -0.2385406494140625, -0.22015380859375, -0.2017669677734375, -0.183380126953125, -0.1649932861328125, -0.1466064453125, -0.1282196044921875, -0.109832763671875, -0.0914459228515625, -0.07305908203125, -0.0546722412109375, -0.036285400390625, -0.0178985595703125, 0.00048828125, 0.0188751220703125, 0.037261962890625, 0.0556488037109375, 0.07403564453125, 0.0924224853515625, 0.110809326171875, 0.1291961669921875, 0.1475830078125, 0.1659698486328125, 0.184356689453125, 0.2027435302734375, 0.22113037109375, 0.2395172119140625, 0.257904052734375, 0.2762908935546875, 0.294677734375, 0.3130645751953125, 0.331451416015625, 0.3498382568359375, 0.36822509765625, 0.3866119384765625, 0.404998779296875, 0.4233856201171875, 0.4417724609375, 0.4601593017578125, 0.478546142578125, 0.4969329833984375, 0.51531982421875, 0.5337066650390625, 0.552093505859375, 0.5704803466796875, 0.5888671875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 3.0, 10.0, 7.0, 10.0, 12.0, 27.0, 24.0, 28.0, 35.0, 36.0, 44.0, 50.0, 56.0, 60.0, 68.0, 67.0, 65.0, 62.0, 61.0, 48.0, 33.0, 39.0, 20.0, 28.0, 24.0, 13.0, 7.0, 6.0, 8.0, 8.0, 9.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0001659393310546875, -0.00016099214553833008, -0.00015604496002197266, -0.00015109777450561523, -0.0001461505889892578, -0.0001412034034729004, -0.00013625621795654297, -0.00013130903244018555, -0.00012636184692382812, -0.0001214146614074707, -0.00011646747589111328, -0.00011152029037475586, -0.00010657310485839844, -0.00010162591934204102, -9.66787338256836e-05, -9.173154830932617e-05, -8.678436279296875e-05, -8.183717727661133e-05, -7.68899917602539e-05, -7.194280624389648e-05, -6.699562072753906e-05, -6.204843521118164e-05, -5.710124969482422e-05, -5.21540641784668e-05, -4.7206878662109375e-05, -4.225969314575195e-05, -3.731250762939453e-05, -3.236532211303711e-05, -2.7418136596679688e-05, -2.2470951080322266e-05, -1.7523765563964844e-05, -1.2576580047607422e-05, -7.62939453125e-06, -2.682209014892578e-06, 2.2649765014648438e-06, 7.212162017822266e-06, 1.2159347534179688e-05, 1.710653305053711e-05, 2.205371856689453e-05, 2.7000904083251953e-05, 3.1948089599609375e-05, 3.68952751159668e-05, 4.184246063232422e-05, 4.678964614868164e-05, 5.173683166503906e-05, 5.6684017181396484e-05, 6.16312026977539e-05, 6.657838821411133e-05, 7.152557373046875e-05, 7.647275924682617e-05, 8.14199447631836e-05, 8.636713027954102e-05, 9.131431579589844e-05, 9.626150131225586e-05, 0.00010120868682861328, 0.0001061558723449707, 0.00011110305786132812, 0.00011605024337768555, 0.00012099742889404297, 0.0001259446144104004, 0.0001308917999267578, 0.00013583898544311523, 0.00014078617095947266, 0.00014573335647583008, 0.0001506805419921875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 3.0, 3.0, 12.0, 12.0, 8.0, 10.0, 17.0, 33.0, 38.0, 43.0, 64.0, 75.0, 122.0, 215.0, 535.0, 2852.0, 1038074.0, 5030.0, 594.0, 269.0, 126.0, 100.0, 83.0, 47.0, 36.0, 29.0, 29.0, 22.0, 9.0, 11.0, 9.0, 7.0, 5.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00345611572265625, -0.0033429861068725586, -0.003229856491088867, -0.0031167268753051758, -0.0030035972595214844, -0.002890467643737793, -0.0027773380279541016, -0.00266420841217041, -0.0025510787963867188, -0.0024379491806030273, -0.002324819564819336, -0.0022116899490356445, -0.002098560333251953, -0.0019854307174682617, -0.0018723011016845703, -0.001759171485900879, -0.0016460418701171875, -0.001532912254333496, -0.0014197826385498047, -0.0013066530227661133, -0.0011935234069824219, -0.0010803937911987305, -0.0009672641754150391, -0.0008541345596313477, -0.0007410049438476562, -0.0006278753280639648, -0.0005147457122802734, -0.00040161609649658203, -0.0002884864807128906, -0.00017535686492919922, -6.222724914550781e-05, 5.0902366638183594e-05, 0.000164031982421875, 0.0002771615982055664, 0.0003902912139892578, 0.0005034208297729492, 0.0006165504455566406, 0.000729680061340332, 0.0008428096771240234, 0.0009559392929077148, 0.0010690689086914062, 0.0011821985244750977, 0.001295328140258789, 0.0014084577560424805, 0.0015215873718261719, 0.0016347169876098633, 0.0017478466033935547, 0.001860976219177246, 0.0019741058349609375, 0.002087235450744629, 0.0022003650665283203, 0.0023134946823120117, 0.002426624298095703, 0.0025397539138793945, 0.002652883529663086, 0.0027660131454467773, 0.0028791427612304688, 0.00299227237701416, 0.0031054019927978516, 0.003218531608581543, 0.0033316612243652344, 0.0034447908401489258, 0.003557920455932617, 0.0036710500717163086, 0.0037841796875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 8.0, 19.0, 47.0, 45.0, 97.0, 148.0, 178.0, 164.0, 124.0, 87.0, 44.0, 29.0, 7.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00017212591774296016, -0.00016852229600772262, -0.0001649186888244003, -0.00016131506708916277, -0.00015771145990584046, -0.00015410783817060292, -0.0001505042309872806, -0.00014690060925204307, -0.00014329700206872076, -0.00013969338033348322, -0.0001360897731501609, -0.00013248615141492337, -0.00012888254423160106, -0.00012527892249636352, -0.00012167531531304121, -0.00011807169357780367, -0.00011446807911852375, -0.00011086446465924382, -0.0001072608501999639, -0.00010365723574068397, -0.00010005362128140405, -9.645000682212412e-05, -9.284638508688658e-05, -8.924277790356427e-05, -8.563915616832674e-05, -8.203554170904681e-05, -7.843192724976689e-05, -7.482831279048696e-05, -7.122469833120704e-05, -6.762108387192711e-05, -6.401746941264719e-05, -6.0413851315388456e-05, -5.6810244132066146e-05, -5.320662967278622e-05, -4.9603015213506296e-05, -4.5999397116247565e-05, -4.239578265696764e-05, -3.8792168197687715e-05, -3.518855373840779e-05, -3.1584939279127866e-05, -2.798132481984794e-05, -2.4377710360568017e-05, -2.0774095901288092e-05, -1.7170479623018764e-05, -1.356686516373884e-05, -9.963250704458915e-06, -6.3596344261895865e-06, -2.756019966909662e-06, 8.475944923702627e-07, 4.451209406397538e-06, 8.054824320424814e-06, 1.165843968919944e-05, 1.5262054148479365e-05, 1.886566860775929e-05, 2.2469284886028618e-05, 2.6072899345308542e-05, 2.9676513804588467e-05, 3.328012826386839e-05, 3.6883742723148316e-05, 4.048735718242824e-05, 4.4090971641708165e-05, 4.769458610098809e-05, 5.129820419824682e-05, 5.4901818657526746e-05, 5.850543311680667e-05]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 10.0, 10.0, 11.0, 16.0, 15.0, 19.0, 17.0, 21.0, 12.0, 27.0, 38.0, 24.0, 36.0, 31.0, 39.0, 46.0, 40.0, 38.0, 38.0, 45.0, 38.0, 37.0, 39.0, 41.0, 26.0, 32.0, 46.0, 26.0, 36.0, 18.0, 16.0, 22.0, 19.0, 12.0, 11.0, 11.0, 5.0, 8.0, 4.0, 6.0, 5.0, 6.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.396936416625977e-05, -7.145106792449951e-05, -6.893277168273926e-05, -6.6414475440979e-05, -6.389617919921875e-05, -6.13778829574585e-05, -5.885958671569824e-05, -5.634129047393799e-05, -5.3822994232177734e-05, -5.130469799041748e-05, -4.8786401748657227e-05, -4.626810550689697e-05, -4.374980926513672e-05, -4.1231513023376465e-05, -3.871321678161621e-05, -3.619492053985596e-05, -3.36766242980957e-05, -3.115832805633545e-05, -2.8640031814575195e-05, -2.612173557281494e-05, -2.3603439331054688e-05, -2.1085143089294434e-05, -1.856684684753418e-05, -1.6048550605773926e-05, -1.3530254364013672e-05, -1.1011958122253418e-05, -8.493661880493164e-06, -5.97536563873291e-06, -3.4570693969726562e-06, -9.387731552124023e-07, 1.5795230865478516e-06, 4.0978193283081055e-06, 6.616115570068359e-06, 9.134411811828613e-06, 1.1652708053588867e-05, 1.4171004295349121e-05, 1.6689300537109375e-05, 1.920759677886963e-05, 2.1725893020629883e-05, 2.4244189262390137e-05, 2.676248550415039e-05, 2.9280781745910645e-05, 3.17990779876709e-05, 3.431737422943115e-05, 3.6835670471191406e-05, 3.935396671295166e-05, 4.1872262954711914e-05, 4.439055919647217e-05, 4.690885543823242e-05, 4.9427151679992676e-05, 5.194544792175293e-05, 5.4463744163513184e-05, 5.698204040527344e-05, 5.950033664703369e-05, 6.201863288879395e-05, 6.45369291305542e-05, 6.705522537231445e-05, 6.957352161407471e-05, 7.209181785583496e-05, 7.461011409759521e-05, 7.712841033935547e-05, 7.964670658111572e-05, 8.216500282287598e-05, 8.468329906463623e-05, 8.720159530639648e-05]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 1.0, 2.0, 6.0, 9.0, 5.0, 13.0, 9.0, 8.0, 14.0, 19.0, 27.0, 24.0, 27.0, 33.0, 17.0, 34.0, 34.0, 30.0, 37.0, 28.0, 43.0, 54.0, 27.0, 39.0, 39.0, 39.0, 37.0, 40.0, 26.0, 31.0, 21.0, 30.0, 23.0, 21.0, 21.0, 25.0, 12.0, 16.0, 21.0, 8.0, 15.0, 12.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.609375, -3.4932861328125, -3.377197265625, -3.2611083984375, -3.14501953125, -3.0289306640625, -2.912841796875, -2.7967529296875, -2.6806640625, -2.5645751953125, -2.448486328125, -2.3323974609375, -2.21630859375, -2.1002197265625, -1.984130859375, -1.8680419921875, -1.751953125, -1.6358642578125, -1.519775390625, -1.4036865234375, -1.28759765625, -1.1715087890625, -1.055419921875, -0.9393310546875, -0.8232421875, -0.7071533203125, -0.591064453125, -0.4749755859375, -0.35888671875, -0.2427978515625, -0.126708984375, -0.0106201171875, 0.10546875, 0.2215576171875, 0.337646484375, 0.4537353515625, 0.56982421875, 0.6859130859375, 0.802001953125, 0.9180908203125, 1.0341796875, 1.1502685546875, 1.266357421875, 1.3824462890625, 1.49853515625, 1.6146240234375, 1.730712890625, 1.8468017578125, 1.962890625, 2.0789794921875, 2.195068359375, 2.3111572265625, 2.42724609375, 2.5433349609375, 2.659423828125, 2.7755126953125, 2.8916015625, 3.0076904296875, 3.123779296875, 3.2398681640625, 3.35595703125, 3.4720458984375, 3.588134765625, 3.7042236328125, 3.8203125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 10.0, 4.0, 7.0, 16.0, 10.0, 11.0, 22.0, 31.0, 50.0, 54.0, 68.0, 93.0, 106.0, 156.0, 250.0, 439.0, 923.0, 2376.0, 6225.0, 16749.0, 45198.0, 115421.0, 278323.0, 347228.0, 143335.0, 56751.0, 21298.0, 7899.0, 2887.0, 1156.0, 494.0, 277.0, 167.0, 117.0, 93.0, 75.0, 47.0, 38.0, 39.0, 23.0, 22.0, 15.0, 12.0, 9.0, 11.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.84765625, -3.71990966796875, -3.5921630859375, -3.46441650390625, -3.336669921875, -3.20892333984375, -3.0811767578125, -2.95343017578125, -2.82568359375, -2.69793701171875, -2.5701904296875, -2.44244384765625, -2.314697265625, -2.18695068359375, -2.0592041015625, -1.93145751953125, -1.8037109375, -1.67596435546875, -1.5482177734375, -1.42047119140625, -1.292724609375, -1.16497802734375, -1.0372314453125, -0.90948486328125, -0.78173828125, -0.65399169921875, -0.5262451171875, -0.39849853515625, -0.270751953125, -0.14300537109375, -0.0152587890625, 0.11248779296875, 0.240234375, 0.36798095703125, 0.4957275390625, 0.62347412109375, 0.751220703125, 0.87896728515625, 1.0067138671875, 1.13446044921875, 1.26220703125, 1.38995361328125, 1.5177001953125, 1.64544677734375, 1.773193359375, 1.90093994140625, 2.0286865234375, 2.15643310546875, 2.2841796875, 2.41192626953125, 2.5396728515625, 2.66741943359375, 2.795166015625, 2.92291259765625, 3.0506591796875, 3.17840576171875, 3.30615234375, 3.43389892578125, 3.5616455078125, 3.68939208984375, 3.817138671875, 3.94488525390625, 4.0726318359375, 4.20037841796875, 4.328125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 3.0, 0.0, 4.0, 5.0, 12.0, 11.0, 11.0, 8.0, 16.0, 21.0, 21.0, 20.0, 27.0, 22.0, 37.0, 41.0, 41.0, 57.0, 65.0, 166.0, 1440.0, 415.0, 128.0, 75.0, 50.0, 58.0, 41.0, 42.0, 29.0, 33.0, 35.0, 15.0, 16.0, 9.0, 14.0, 9.0, 10.0, 9.0, 7.0, 9.0, 1.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.421875, -11.0272216796875, -10.632568359375, -10.2379150390625, -9.84326171875, -9.4486083984375, -9.053955078125, -8.6593017578125, -8.2646484375, -7.8699951171875, -7.475341796875, -7.0806884765625, -6.68603515625, -6.2913818359375, -5.896728515625, -5.5020751953125, -5.107421875, -4.7127685546875, -4.318115234375, -3.9234619140625, -3.52880859375, -3.1341552734375, -2.739501953125, -2.3448486328125, -1.9501953125, -1.5555419921875, -1.160888671875, -0.7662353515625, -0.37158203125, 0.0230712890625, 0.417724609375, 0.8123779296875, 1.20703125, 1.6016845703125, 1.996337890625, 2.3909912109375, 2.78564453125, 3.1802978515625, 3.574951171875, 3.9696044921875, 4.3642578125, 4.7589111328125, 5.153564453125, 5.5482177734375, 5.94287109375, 6.3375244140625, 6.732177734375, 7.1268310546875, 7.521484375, 7.9161376953125, 8.310791015625, 8.7054443359375, 9.10009765625, 9.4947509765625, 9.889404296875, 10.2840576171875, 10.6787109375, 11.0733642578125, 11.468017578125, 11.8626708984375, 12.25732421875, 12.6519775390625, 13.046630859375, 13.4412841796875, 13.8359375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 2.0, 7.0, 3.0, 4.0, 13.0, 20.0, 32.0, 25.0, 35.0, 32.0, 59.0, 96.0, 110.0, 187.0, 347.0, 779.0, 3974.0, 3117233.0, 20501.0, 1138.0, 451.0, 198.0, 137.0, 94.0, 67.0, 45.0, 29.0, 16.0, 20.0, 9.0, 13.0, 7.0, 10.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.4375, -48.7373046875, -47.037109375, -45.3369140625, -43.63671875, -41.9365234375, -40.236328125, -38.5361328125, -36.8359375, -35.1357421875, -33.435546875, -31.7353515625, -30.03515625, -28.3349609375, -26.634765625, -24.9345703125, -23.234375, -21.5341796875, -19.833984375, -18.1337890625, -16.43359375, -14.7333984375, -13.033203125, -11.3330078125, -9.6328125, -7.9326171875, -6.232421875, -4.5322265625, -2.83203125, -1.1318359375, 0.568359375, 2.2685546875, 3.96875, 5.6689453125, 7.369140625, 9.0693359375, 10.76953125, 12.4697265625, 14.169921875, 15.8701171875, 17.5703125, 19.2705078125, 20.970703125, 22.6708984375, 24.37109375, 26.0712890625, 27.771484375, 29.4716796875, 31.171875, 32.8720703125, 34.572265625, 36.2724609375, 37.97265625, 39.6728515625, 41.373046875, 43.0732421875, 44.7734375, 46.4736328125, 48.173828125, 49.8740234375, 51.57421875, 53.2744140625, 54.974609375, 56.6748046875, 58.375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 21.0, 55.0, 128.0, 214.0, 257.0, 196.0, 90.0, 35.0, 10.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.67979621887207, -16.764461517333984, -15.849126815795898, -14.933792114257812, -14.018457412719727, -13.10312271118164, -12.187788009643555, -11.272453308105469, -10.357118606567383, -9.441783905029297, -8.526449203491211, -7.611114501953125, -6.695779800415039, -5.780445098876953, -4.865110397338867, -3.9497756958007812, -3.0344409942626953, -2.1191062927246094, -1.2037715911865234, -0.2884368896484375, 0.6268978118896484, 1.5422325134277344, 2.4575672149658203, 3.3729019165039062, 4.288236618041992, 5.203571319580078, 6.118906021118164, 7.03424072265625, 7.949575424194336, 8.864910125732422, 9.780244827270508, 10.695579528808594, 11.610912322998047, 12.526247024536133, 13.441581726074219, 14.356916427612305, 15.27225112915039, 16.187585830688477, 17.102920532226562, 18.01825523376465, 18.933589935302734, 19.84892463684082, 20.764259338378906, 21.679594039916992, 22.594928741455078, 23.510263442993164, 24.42559814453125, 25.340932846069336, 26.256267547607422, 27.171602249145508, 28.086936950683594, 29.00227165222168, 29.917606353759766, 30.83294105529785, 31.748275756835938, 32.663612365722656, 33.57894515991211, 34.49427795410156, 35.40961456298828, 36.324951171875, 37.24028396606445, 38.155616760253906, 39.070953369140625, 39.986289978027344, 40.9016227722168]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 9.0, 9.0, 10.0, 12.0, 11.0, 13.0, 14.0, 27.0, 32.0, 27.0, 36.0, 34.0, 46.0, 37.0, 31.0, 28.0, 39.0, 55.0, 42.0, 37.0, 48.0, 44.0, 38.0, 44.0, 37.0, 31.0, 27.0, 24.0, 25.0, 22.0, 26.0, 18.0, 9.0, 13.0, 7.0, 4.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.4241828918457, -31.450801849365234, -30.477420806884766, -29.504039764404297, -28.530658721923828, -27.55727767944336, -26.583898544311523, -25.610517501831055, -24.637136459350586, -23.663755416870117, -22.69037437438965, -21.71699333190918, -20.743614196777344, -19.770233154296875, -18.796852111816406, -17.823471069335938, -16.85009002685547, -15.876708984375, -14.903327941894531, -13.929947853088379, -12.95656681060791, -11.983185768127441, -11.009805679321289, -10.03642463684082, -9.063043594360352, -8.089662551879883, -7.116281986236572, -6.142901420593262, -5.169520378112793, -4.196139335632324, -3.2227587699890137, -2.249378204345703, -1.2759971618652344, -0.3026163578033447, 0.6707644462585449, 1.6441452503204346, 2.617526054382324, 3.590907096862793, 4.5642876625061035, 5.537668228149414, 6.511049270629883, 7.484430313110352, 8.45781135559082, 9.431191444396973, 10.404572486877441, 11.37795352935791, 12.351333618164062, 13.324714660644531, 14.298095703125, 15.271476745605469, 16.244857788085938, 17.218238830566406, 18.191619873046875, 19.165000915527344, 20.13838005065918, 21.11176109313965, 22.085142135620117, 23.058523178100586, 24.031904220581055, 25.005285263061523, 25.97866439819336, 26.952045440673828, 27.925426483154297, 28.898807525634766, 29.872188568115234]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 6.0, 1.0, 7.0, 8.0, 8.0, 6.0, 7.0, 10.0, 14.0, 12.0, 24.0, 25.0, 20.0, 26.0, 26.0, 40.0, 22.0, 27.0, 41.0, 33.0, 27.0, 47.0, 39.0, 36.0, 38.0, 26.0, 38.0, 45.0, 40.0, 31.0, 22.0, 33.0, 22.0, 26.0, 26.0, 17.0, 17.0, 12.0, 13.0, 19.0, 13.0, 12.0, 13.0, 8.0, 3.0, 5.0, 6.0, 1.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.70703125, -3.5831298828125, -3.459228515625, -3.3353271484375, -3.21142578125, -3.0875244140625, -2.963623046875, -2.8397216796875, -2.7158203125, -2.5919189453125, -2.468017578125, -2.3441162109375, -2.22021484375, -2.0963134765625, -1.972412109375, -1.8485107421875, -1.724609375, -1.6007080078125, -1.476806640625, -1.3529052734375, -1.22900390625, -1.1051025390625, -0.981201171875, -0.8572998046875, -0.7333984375, -0.6094970703125, -0.485595703125, -0.3616943359375, -0.23779296875, -0.1138916015625, 0.010009765625, 0.1339111328125, 0.2578125, 0.3817138671875, 0.505615234375, 0.6295166015625, 0.75341796875, 0.8773193359375, 1.001220703125, 1.1251220703125, 1.2490234375, 1.3729248046875, 1.496826171875, 1.6207275390625, 1.74462890625, 1.8685302734375, 1.992431640625, 2.1163330078125, 2.240234375, 2.3641357421875, 2.488037109375, 2.6119384765625, 2.73583984375, 2.8597412109375, 2.983642578125, 3.1075439453125, 3.2314453125, 3.3553466796875, 3.479248046875, 3.6031494140625, 3.72705078125, 3.8509521484375, 3.974853515625, 4.0987548828125, 4.22265625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 7.0, 9.0, 11.0, 9.0, 9.0, 18.0, 19.0, 25.0, 31.0, 29.0, 41.0, 62.0, 66.0, 67.0, 95.0, 118.0, 152.0, 259.0, 923.0, 9554.0, 457803.0, 3304912.0, 409136.0, 8970.0, 924.0, 272.0, 155.0, 121.0, 71.0, 77.0, 56.0, 45.0, 48.0, 35.0, 35.0, 22.0, 15.0, 21.0, 10.0, 18.0, 4.0, 8.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.359375, -11.9539794921875, -11.548583984375, -11.1431884765625, -10.73779296875, -10.3323974609375, -9.927001953125, -9.5216064453125, -9.1162109375, -8.7108154296875, -8.305419921875, -7.9000244140625, -7.49462890625, -7.0892333984375, -6.683837890625, -6.2784423828125, -5.873046875, -5.4676513671875, -5.062255859375, -4.6568603515625, -4.25146484375, -3.8460693359375, -3.440673828125, -3.0352783203125, -2.6298828125, -2.2244873046875, -1.819091796875, -1.4136962890625, -1.00830078125, -0.6029052734375, -0.197509765625, 0.2078857421875, 0.61328125, 1.0186767578125, 1.424072265625, 1.8294677734375, 2.23486328125, 2.6402587890625, 3.045654296875, 3.4510498046875, 3.8564453125, 4.2618408203125, 4.667236328125, 5.0726318359375, 5.47802734375, 5.8834228515625, 6.288818359375, 6.6942138671875, 7.099609375, 7.5050048828125, 7.910400390625, 8.3157958984375, 8.72119140625, 9.1265869140625, 9.531982421875, 9.9373779296875, 10.3427734375, 10.7481689453125, 11.153564453125, 11.5589599609375, 11.96435546875, 12.3697509765625, 12.775146484375, 13.1805419921875, 13.5859375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 9.0, 6.0, 8.0, 6.0, 8.0, 12.0, 13.0, 23.0, 23.0, 41.0, 56.0, 76.0, 78.0, 139.0, 163.0, 214.0, 248.0, 319.0, 370.0, 382.0, 387.0, 350.0, 257.0, 210.0, 143.0, 115.0, 101.0, 63.0, 54.0, 47.0, 39.0, 29.0, 22.0, 18.0, 11.0, 3.0, 6.0, 10.0, 3.0, 1.0, 2.0, 5.0, 0.0, 1.0, 2.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.98046875, -4.7862548828125, -4.592041015625, -4.3978271484375, -4.20361328125, -4.0093994140625, -3.815185546875, -3.6209716796875, -3.4267578125, -3.2325439453125, -3.038330078125, -2.8441162109375, -2.64990234375, -2.4556884765625, -2.261474609375, -2.0672607421875, -1.873046875, -1.6788330078125, -1.484619140625, -1.2904052734375, -1.09619140625, -0.9019775390625, -0.707763671875, -0.5135498046875, -0.3193359375, -0.1251220703125, 0.069091796875, 0.2633056640625, 0.45751953125, 0.6517333984375, 0.845947265625, 1.0401611328125, 1.234375, 1.4285888671875, 1.622802734375, 1.8170166015625, 2.01123046875, 2.2054443359375, 2.399658203125, 2.5938720703125, 2.7880859375, 2.9822998046875, 3.176513671875, 3.3707275390625, 3.56494140625, 3.7591552734375, 3.953369140625, 4.1475830078125, 4.341796875, 4.5360107421875, 4.730224609375, 4.9244384765625, 5.11865234375, 5.3128662109375, 5.507080078125, 5.7012939453125, 5.8955078125, 6.0897216796875, 6.283935546875, 6.4781494140625, 6.67236328125, 6.8665771484375, 7.060791015625, 7.2550048828125, 7.44921875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 5.0, 4.0, 3.0, 11.0, 13.0, 24.0, 18.0, 39.0, 43.0, 63.0, 65.0, 110.0, 127.0, 162.0, 198.0, 271.0, 409.0, 836.0, 42163.0, 4076390.0, 70640.0, 975.0, 405.0, 313.0, 243.0, 185.0, 149.0, 110.0, 70.0, 56.0, 40.0, 40.0, 22.0, 13.0, 12.0, 9.0, 11.0, 7.0, 6.0, 5.0, 1.0, 1.0, 4.0, 3.0, 1.0], "bins": [-39.28125, -38.261962890625, -37.24267578125, -36.223388671875, -35.2041015625, -34.184814453125, -33.16552734375, -32.146240234375, -31.126953125, -30.107666015625, -29.08837890625, -28.069091796875, -27.0498046875, -26.030517578125, -25.01123046875, -23.991943359375, -22.97265625, -21.953369140625, -20.93408203125, -19.914794921875, -18.8955078125, -17.876220703125, -16.85693359375, -15.837646484375, -14.818359375, -13.799072265625, -12.77978515625, -11.760498046875, -10.7412109375, -9.721923828125, -8.70263671875, -7.683349609375, -6.6640625, -5.644775390625, -4.62548828125, -3.606201171875, -2.5869140625, -1.567626953125, -0.54833984375, 0.470947265625, 1.490234375, 2.509521484375, 3.52880859375, 4.548095703125, 5.5673828125, 6.586669921875, 7.60595703125, 8.625244140625, 9.64453125, 10.663818359375, 11.68310546875, 12.702392578125, 13.7216796875, 14.740966796875, 15.76025390625, 16.779541015625, 17.798828125, 18.818115234375, 19.83740234375, 20.856689453125, 21.8759765625, 22.895263671875, 23.91455078125, 24.933837890625, 25.953125]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 25.0, 177.0, 391.0, 309.0, 98.0, 10.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.38491439819336, -19.52646827697754, -16.66802215576172, -13.809574127197266, -10.951128005981445, -8.092681884765625, -5.234233856201172, -2.3757877349853516, 0.48265838623046875, 3.3411049842834473, 6.199551582336426, 9.057998657226562, 11.916444778442383, 14.774890899658203, 17.633338928222656, 20.491785049438477, 23.350231170654297, 26.208677291870117, 29.067123413085938, 31.92557144165039, 34.784019470214844, 37.64246368408203, 40.500911712646484, 43.35935974121094, 46.217803955078125, 49.07625198364258, 51.934696197509766, 54.79314422607422, 57.651588439941406, 60.51003646850586, 63.36848449707031, 66.2269287109375, 69.08537292480469, 71.94381713867188, 74.8022689819336, 77.66071319580078, 80.51915740966797, 83.37760925292969, 86.23605346679688, 89.09449768066406, 91.95294189453125, 94.81138610839844, 97.66983795166016, 100.52828216552734, 103.38672637939453, 106.24517822265625, 109.10362243652344, 111.96206665039062, 114.82051849365234, 117.67896270751953, 120.53741455078125, 123.39585876464844, 126.25430297851562, 129.1127471923828, 131.97119140625, 134.82965087890625, 137.68809509277344, 140.54653930664062, 143.4049835205078, 146.263427734375, 149.12188720703125, 151.98033142089844, 154.83877563476562, 157.6972198486328, 160.5556640625]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 3.0, 5.0, 9.0, 4.0, 12.0, 18.0, 19.0, 21.0, 23.0, 19.0, 17.0, 30.0, 24.0, 37.0, 34.0, 39.0, 36.0, 50.0, 43.0, 41.0, 42.0, 53.0, 38.0, 42.0, 38.0, 37.0, 25.0, 30.0, 24.0, 30.0, 24.0, 24.0, 16.0, 9.0, 20.0, 15.0, 10.0, 7.0, 11.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.612600326538086, -23.874149322509766, -23.135698318481445, -22.397247314453125, -21.658796310424805, -20.920345306396484, -20.181894302368164, -19.443443298339844, -18.704992294311523, -17.966541290283203, -17.228090286254883, -16.489639282226562, -15.751188278198242, -15.012737274169922, -14.274286270141602, -13.535835266113281, -12.797384262084961, -12.05893325805664, -11.32048225402832, -10.58203125, -9.84358024597168, -9.10512924194336, -8.366678237915039, -7.628227233886719, -6.889776229858398, -6.151325225830078, -5.412874221801758, -4.6744232177734375, -3.935972213745117, -3.197521209716797, -2.4590702056884766, -1.7206192016601562, -0.9821662902832031, -0.2437152862548828, 0.4947357177734375, 1.2331867218017578, 1.9716377258300781, 2.7100887298583984, 3.4485397338867188, 4.186990737915039, 4.925441741943359, 5.66389274597168, 6.40234375, 7.14079475402832, 7.879245758056641, 8.617696762084961, 9.356147766113281, 10.094598770141602, 10.833049774169922, 11.571500778198242, 12.309951782226562, 13.048402786254883, 13.786853790283203, 14.525304794311523, 15.263755798339844, 16.002206802368164, 16.740657806396484, 17.479108810424805, 18.217559814453125, 18.956010818481445, 19.694461822509766, 20.432912826538086, 21.171363830566406, 21.909814834594727, 22.648265838623047]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 8.0, 3.0, 8.0, 5.0, 9.0, 7.0, 18.0, 24.0, 23.0, 19.0, 26.0, 22.0, 24.0, 23.0, 29.0, 32.0, 28.0, 37.0, 42.0, 36.0, 41.0, 39.0, 33.0, 29.0, 33.0, 28.0, 30.0, 33.0, 26.0, 34.0, 21.0, 27.0, 25.0, 25.0, 18.0, 23.0, 15.0, 20.0, 11.0, 11.0, 7.0, 11.0, 7.0, 7.0, 8.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 3.0], "bins": [-3.7734375, -3.6602783203125, -3.547119140625, -3.4339599609375, -3.32080078125, -3.2076416015625, -3.094482421875, -2.9813232421875, -2.8681640625, -2.7550048828125, -2.641845703125, -2.5286865234375, -2.41552734375, -2.3023681640625, -2.189208984375, -2.0760498046875, -1.962890625, -1.8497314453125, -1.736572265625, -1.6234130859375, -1.51025390625, -1.3970947265625, -1.283935546875, -1.1707763671875, -1.0576171875, -0.9444580078125, -0.831298828125, -0.7181396484375, -0.60498046875, -0.4918212890625, -0.378662109375, -0.2655029296875, -0.15234375, -0.0391845703125, 0.073974609375, 0.1871337890625, 0.30029296875, 0.4134521484375, 0.526611328125, 0.6397705078125, 0.7529296875, 0.8660888671875, 0.979248046875, 1.0924072265625, 1.20556640625, 1.3187255859375, 1.431884765625, 1.5450439453125, 1.658203125, 1.7713623046875, 1.884521484375, 1.9976806640625, 2.11083984375, 2.2239990234375, 2.337158203125, 2.4503173828125, 2.5634765625, 2.6766357421875, 2.789794921875, 2.9029541015625, 3.01611328125, 3.1292724609375, 3.242431640625, 3.3555908203125, 3.46875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 7.0, 5.0, 8.0, 9.0, 19.0, 25.0, 42.0, 62.0, 84.0, 120.0, 151.0, 260.0, 352.0, 507.0, 688.0, 1011.0, 1506.0, 2230.0, 3264.0, 4652.0, 7097.0, 10605.0, 15781.0, 23820.0, 35868.0, 54690.0, 88325.0, 152243.0, 249742.0, 148529.0, 85824.0, 54057.0, 35536.0, 23500.0, 15678.0, 10435.0, 7023.0, 4729.0, 3144.0, 2149.0, 1497.0, 1033.0, 669.0, 448.0, 375.0, 242.0, 174.0, 117.0, 79.0, 53.0, 32.0, 33.0, 12.0, 7.0, 13.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.5927734375, -0.573944091796875, -0.55511474609375, -0.536285400390625, -0.5174560546875, -0.498626708984375, -0.47979736328125, -0.460968017578125, -0.442138671875, -0.423309326171875, -0.40447998046875, -0.385650634765625, -0.3668212890625, -0.347991943359375, -0.32916259765625, -0.310333251953125, -0.29150390625, -0.272674560546875, -0.25384521484375, -0.235015869140625, -0.2161865234375, -0.197357177734375, -0.17852783203125, -0.159698486328125, -0.140869140625, -0.122039794921875, -0.10321044921875, -0.084381103515625, -0.0655517578125, -0.046722412109375, -0.02789306640625, -0.009063720703125, 0.009765625, 0.028594970703125, 0.04742431640625, 0.066253662109375, 0.0850830078125, 0.103912353515625, 0.12274169921875, 0.141571044921875, 0.160400390625, 0.179229736328125, 0.19805908203125, 0.216888427734375, 0.2357177734375, 0.254547119140625, 0.27337646484375, 0.292205810546875, 0.31103515625, 0.329864501953125, 0.34869384765625, 0.367523193359375, 0.3863525390625, 0.405181884765625, 0.42401123046875, 0.442840576171875, 0.461669921875, 0.480499267578125, 0.49932861328125, 0.518157958984375, 0.5369873046875, 0.555816650390625, 0.57464599609375, 0.593475341796875, 0.6123046875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 3.0, 8.0, 4.0, 14.0, 15.0, 9.0, 8.0, 23.0, 19.0, 20.0, 34.0, 26.0, 41.0, 44.0, 38.0, 31.0, 52.0, 40.0, 51.0, 1069.0, 46.0, 37.0, 50.0, 39.0, 47.0, 40.0, 40.0, 25.0, 32.0, 17.0, 17.0, 22.0, 12.0, 7.0, 12.0, 8.0, 8.0, 8.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8515625, -2.76025390625, -2.6689453125, -2.57763671875, -2.486328125, -2.39501953125, -2.3037109375, -2.21240234375, -2.12109375, -2.02978515625, -1.9384765625, -1.84716796875, -1.755859375, -1.66455078125, -1.5732421875, -1.48193359375, -1.390625, -1.29931640625, -1.2080078125, -1.11669921875, -1.025390625, -0.93408203125, -0.8427734375, -0.75146484375, -0.66015625, -0.56884765625, -0.4775390625, -0.38623046875, -0.294921875, -0.20361328125, -0.1123046875, -0.02099609375, 0.0703125, 0.16162109375, 0.2529296875, 0.34423828125, 0.435546875, 0.52685546875, 0.6181640625, 0.70947265625, 0.80078125, 0.89208984375, 0.9833984375, 1.07470703125, 1.166015625, 1.25732421875, 1.3486328125, 1.43994140625, 1.53125, 1.62255859375, 1.7138671875, 1.80517578125, 1.896484375, 1.98779296875, 2.0791015625, 2.17041015625, 2.26171875, 2.35302734375, 2.4443359375, 2.53564453125, 2.626953125, 2.71826171875, 2.8095703125, 2.90087890625, 2.9921875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 8.0, 2.0, 8.0, 5.0, 12.0, 6.0, 30.0, 27.0, 48.0, 76.0, 134.0, 156.0, 272.0, 411.0, 576.0, 837.0, 1210.0, 1838.0, 2604.0, 3868.0, 5675.0, 8281.0, 12679.0, 18822.0, 29571.0, 46929.0, 79271.0, 149763.0, 1339434.0, 166250.0, 85518.0, 50654.0, 31304.0, 20156.0, 13057.0, 8719.0, 6085.0, 4072.0, 2782.0, 1880.0, 1359.0, 888.0, 610.0, 390.0, 281.0, 199.0, 118.0, 98.0, 62.0, 39.0, 21.0, 18.0, 12.0, 8.0, 5.0, 1.0, 3.0, 2.0, 1.0, 3.0], "bins": [-0.64208984375, -0.62237548828125, -0.6026611328125, -0.58294677734375, -0.563232421875, -0.54351806640625, -0.5238037109375, -0.50408935546875, -0.484375, -0.46466064453125, -0.4449462890625, -0.42523193359375, -0.405517578125, -0.38580322265625, -0.3660888671875, -0.34637451171875, -0.32666015625, -0.30694580078125, -0.2872314453125, -0.26751708984375, -0.247802734375, -0.22808837890625, -0.2083740234375, -0.18865966796875, -0.1689453125, -0.14923095703125, -0.1295166015625, -0.10980224609375, -0.090087890625, -0.07037353515625, -0.0506591796875, -0.03094482421875, -0.01123046875, 0.00848388671875, 0.0281982421875, 0.04791259765625, 0.067626953125, 0.08734130859375, 0.1070556640625, 0.12677001953125, 0.146484375, 0.16619873046875, 0.1859130859375, 0.20562744140625, 0.225341796875, 0.24505615234375, 0.2647705078125, 0.28448486328125, 0.30419921875, 0.32391357421875, 0.3436279296875, 0.36334228515625, 0.383056640625, 0.40277099609375, 0.4224853515625, 0.44219970703125, 0.4619140625, 0.48162841796875, 0.5013427734375, 0.52105712890625, 0.540771484375, 0.56048583984375, 0.5802001953125, 0.59991455078125, 0.61962890625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 8.0, 10.0, 9.0, 14.0, 5.0, 10.0, 17.0, 22.0, 32.0, 30.0, 44.0, 55.0, 68.0, 63.0, 59.0, 62.0, 63.0, 55.0, 71.0, 63.0, 47.0, 40.0, 32.0, 24.0, 25.0, 23.0, 14.0, 11.0, 6.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011867284774780273, -0.0001133875921368599, -0.00010810233652591705, -0.00010281708091497421, -9.753182530403137e-05, -9.224656969308853e-05, -8.696131408214569e-05, -8.167605847120285e-05, -7.639080286026001e-05, -7.110554724931717e-05, -6.582029163837433e-05, -6.053503602743149e-05, -5.524978041648865e-05, -4.996452480554581e-05, -4.4679269194602966e-05, -3.9394013583660126e-05, -3.4108757972717285e-05, -2.8823502361774445e-05, -2.3538246750831604e-05, -1.8252991139888763e-05, -1.2967735528945923e-05, -7.682479918003082e-06, -2.3972243070602417e-06, 2.888031303882599e-06, 8.17328691482544e-06, 1.345854252576828e-05, 1.874379813671112e-05, 2.402905374765396e-05, 2.9314309358596802e-05, 3.459956496953964e-05, 3.988482058048248e-05, 4.5170076191425323e-05, 5.0455331802368164e-05, 5.5740587413311005e-05, 6.1025843024253845e-05, 6.631109863519669e-05, 7.159635424613953e-05, 7.688160985708237e-05, 8.216686546802521e-05, 8.745212107896805e-05, 9.273737668991089e-05, 9.802263230085373e-05, 0.00010330788791179657, 0.00010859314352273941, 0.00011387839913368225, 0.00011916365474462509, 0.00012444891035556793, 0.00012973416596651077, 0.0001350194215774536, 0.00014030467718839645, 0.0001455899327993393, 0.00015087518841028214, 0.00015616044402122498, 0.00016144569963216782, 0.00016673095524311066, 0.0001720162108540535, 0.00017730146646499634, 0.00018258672207593918, 0.00018787197768688202, 0.00019315723329782486, 0.0001984424889087677, 0.00020372774451971054, 0.00020901300013065338, 0.00021429825574159622, 0.00021958351135253906]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 2.0, 9.0, 10.0, 19.0, 17.0, 35.0, 38.0, 50.0, 60.0, 87.0, 123.0, 196.0, 332.0, 818.0, 12382.0, 1030579.0, 2435.0, 602.0, 251.0, 137.0, 90.0, 59.0, 54.0, 40.0, 27.0, 16.0, 14.0, 15.0, 15.0, 13.0, 5.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0], "bins": [-0.004535675048828125, -0.004423230886459351, -0.004310786724090576, -0.004198342561721802, -0.004085898399353027, -0.003973454236984253, -0.0038610100746154785, -0.003748565912246704, -0.0036361217498779297, -0.0035236775875091553, -0.003411233425140381, -0.0032987892627716064, -0.003186345100402832, -0.0030739009380340576, -0.002961456775665283, -0.002849012613296509, -0.0027365684509277344, -0.00262412428855896, -0.0025116801261901855, -0.002399235963821411, -0.0022867918014526367, -0.0021743476390838623, -0.002061903476715088, -0.0019494593143463135, -0.001837015151977539, -0.0017245709896087646, -0.0016121268272399902, -0.0014996826648712158, -0.0013872385025024414, -0.001274794340133667, -0.0011623501777648926, -0.0010499060153961182, -0.0009374618530273438, -0.0008250176906585693, -0.0007125735282897949, -0.0006001293659210205, -0.0004876852035522461, -0.0003752410411834717, -0.00026279687881469727, -0.00015035271644592285, -3.790855407714844e-05, 7.453560829162598e-05, 0.0001869797706604004, 0.0002994239330291748, 0.0004118680953979492, 0.0005243122577667236, 0.000636756420135498, 0.0007492005825042725, 0.0008616447448730469, 0.0009740889072418213, 0.0010865330696105957, 0.0011989772319793701, 0.0013114213943481445, 0.001423865556716919, 0.0015363097190856934, 0.0016487538814544678, 0.0017611980438232422, 0.0018736422061920166, 0.001986086368560791, 0.0020985305309295654, 0.00221097469329834, 0.0023234188556671143, 0.0024358630180358887, 0.002548307180404663, 0.0026607513427734375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 219.0, 568.0, 200.0, 15.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022592559980694205, -0.00021223867952357978, -0.00019855177379213274, -0.00018486485350877047, -0.0001711779332254082, -0.00015749101294204593, -0.00014380409265868366, -0.00013011718692723662, -0.00011643026664387435, -0.00010274334636051208, -8.905643335310742e-05, -7.536952034570277e-05, -6.16826000623405e-05, -4.799567977897823e-05, -3.430876677157357e-05, -2.0621853764168918e-05, -6.934933480806649e-06, 6.751983164576814e-06, 2.0438899809960276e-05, 3.412581645534374e-05, 4.78127331007272e-05, 6.149965338408947e-05, 7.518656639149413e-05, 8.887347939889878e-05, 0.00010256039968226105, 0.00011624731996562332, 0.00012993422569707036, 0.00014362114598043263, 0.0001573080662637949, 0.00017099498654715717, 0.00018468190683051944, 0.00019836881256196648, 0.00021205574739724398, 0.00022574266768060625, 0.00023942958796396852, 0.0002531165082473308, 0.00026680342853069305, 0.00028049031971022487, 0.00029417723999358714, 0.0003078641602769494, 0.0003215510805603117, 0.00033523800084367394, 0.0003489249211270362, 0.0003626118414103985, 0.0003762987325899303, 0.000389985681977123, 0.00040367257315665483, 0.0004173594934400171, 0.0004310464137233794, 0.00044473333400674164, 0.0004584202542901039, 0.0004721071745734662, 0.00048579409485682845, 0.0004994809860363603, 0.000513167935423553, 0.0005268548266030848, 0.0005405417177826166, 0.0005542286089621484, 0.0005679155583493412, 0.000581602449528873, 0.0005952893989160657, 0.0006089762900955975, 0.0006226632394827902, 0.000636350130662322, 0.0006500370800495148]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 11.0, 8.0, 9.0, 11.0, 15.0, 12.0, 13.0, 18.0, 15.0, 18.0, 35.0, 33.0, 18.0, 27.0, 36.0, 41.0, 35.0, 39.0, 41.0, 26.0, 37.0, 38.0, 45.0, 29.0, 38.0, 31.0, 45.0, 23.0, 24.0, 20.0, 37.0, 20.0, 29.0, 24.0, 15.0, 15.0, 11.0, 15.0, 9.0, 5.0, 7.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-7.963180541992188e-05, -7.73230567574501e-05, -7.501430809497833e-05, -7.270555943250656e-05, -7.039681077003479e-05, -6.808806210756302e-05, -6.577931344509125e-05, -6.347056478261948e-05, -6.11618161201477e-05, -5.8853067457675934e-05, -5.654431879520416e-05, -5.423557013273239e-05, -5.192682147026062e-05, -4.961807280778885e-05, -4.730932414531708e-05, -4.5000575482845306e-05, -4.2691826820373535e-05, -4.0383078157901764e-05, -3.807432949542999e-05, -3.576558083295822e-05, -3.345683217048645e-05, -3.114808350801468e-05, -2.8839334845542908e-05, -2.6530586183071136e-05, -2.4221837520599365e-05, -2.1913088858127594e-05, -1.9604340195655823e-05, -1.729559153318405e-05, -1.498684287071228e-05, -1.2678094208240509e-05, -1.0369345545768738e-05, -8.060596883296967e-06, -5.751848220825195e-06, -3.443099558353424e-06, -1.1343508958816528e-06, 1.1743977665901184e-06, 3.4831464290618896e-06, 5.791895091533661e-06, 8.100643754005432e-06, 1.0409392416477203e-05, 1.2718141078948975e-05, 1.5026889741420746e-05, 1.7335638403892517e-05, 1.964438706636429e-05, 2.195313572883606e-05, 2.426188439130783e-05, 2.6570633053779602e-05, 2.8879381716251373e-05, 3.1188130378723145e-05, 3.3496879041194916e-05, 3.580562770366669e-05, 3.811437636613846e-05, 4.042312502861023e-05, 4.2731873691082e-05, 4.504062235355377e-05, 4.734937101602554e-05, 4.9658119678497314e-05, 5.1966868340969086e-05, 5.427561700344086e-05, 5.658436566591263e-05, 5.88931143283844e-05, 6.120186299085617e-05, 6.351061165332794e-05, 6.581936031579971e-05, 6.812810897827148e-05]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 8.0, 3.0, 8.0, 5.0, 9.0, 7.0, 18.0, 24.0, 23.0, 19.0, 26.0, 22.0, 24.0, 23.0, 29.0, 32.0, 28.0, 37.0, 42.0, 36.0, 41.0, 39.0, 33.0, 29.0, 33.0, 28.0, 30.0, 33.0, 26.0, 34.0, 21.0, 27.0, 25.0, 25.0, 18.0, 23.0, 15.0, 20.0, 11.0, 11.0, 7.0, 11.0, 7.0, 7.0, 8.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 3.0], "bins": [-3.7734375, -3.6602783203125, -3.547119140625, -3.4339599609375, -3.32080078125, -3.2076416015625, -3.094482421875, -2.9813232421875, -2.8681640625, -2.7550048828125, -2.641845703125, -2.5286865234375, -2.41552734375, -2.3023681640625, -2.189208984375, -2.0760498046875, -1.962890625, -1.8497314453125, -1.736572265625, -1.6234130859375, -1.51025390625, -1.3970947265625, -1.283935546875, -1.1707763671875, -1.0576171875, -0.9444580078125, -0.831298828125, -0.7181396484375, -0.60498046875, -0.4918212890625, -0.378662109375, -0.2655029296875, -0.15234375, -0.0391845703125, 0.073974609375, 0.1871337890625, 0.30029296875, 0.4134521484375, 0.526611328125, 0.6397705078125, 0.7529296875, 0.8660888671875, 0.979248046875, 1.0924072265625, 1.20556640625, 1.3187255859375, 1.431884765625, 1.5450439453125, 1.658203125, 1.7713623046875, 1.884521484375, 1.9976806640625, 2.11083984375, 2.2239990234375, 2.337158203125, 2.4503173828125, 2.5634765625, 2.6766357421875, 2.789794921875, 2.9029541015625, 3.01611328125, 3.1292724609375, 3.242431640625, 3.3555908203125, 3.46875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 7.0, 5.0, 4.0, 8.0, 5.0, 7.0, 18.0, 20.0, 22.0, 18.0, 45.0, 46.0, 54.0, 62.0, 87.0, 156.0, 184.0, 292.0, 449.0, 900.0, 3007.0, 20259.0, 154733.0, 692278.0, 150685.0, 19966.0, 2872.0, 871.0, 501.0, 264.0, 186.0, 125.0, 93.0, 65.0, 54.0, 53.0, 23.0, 31.0, 24.0, 13.0, 16.0, 11.0, 5.0, 13.0, 4.0, 2.0, 7.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0], "bins": [-8.3203125, -8.0718994140625, -7.823486328125, -7.5750732421875, -7.32666015625, -7.0782470703125, -6.829833984375, -6.5814208984375, -6.3330078125, -6.0845947265625, -5.836181640625, -5.5877685546875, -5.33935546875, -5.0909423828125, -4.842529296875, -4.5941162109375, -4.345703125, -4.0972900390625, -3.848876953125, -3.6004638671875, -3.35205078125, -3.1036376953125, -2.855224609375, -2.6068115234375, -2.3583984375, -2.1099853515625, -1.861572265625, -1.6131591796875, -1.36474609375, -1.1163330078125, -0.867919921875, -0.6195068359375, -0.37109375, -0.1226806640625, 0.125732421875, 0.3741455078125, 0.62255859375, 0.8709716796875, 1.119384765625, 1.3677978515625, 1.6162109375, 1.8646240234375, 2.113037109375, 2.3614501953125, 2.60986328125, 2.8582763671875, 3.106689453125, 3.3551025390625, 3.603515625, 3.8519287109375, 4.100341796875, 4.3487548828125, 4.59716796875, 4.8455810546875, 5.093994140625, 5.3424072265625, 5.5908203125, 5.8392333984375, 6.087646484375, 6.3360595703125, 6.58447265625, 6.8328857421875, 7.081298828125, 7.3297119140625, 7.578125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 1.0, 1.0, 4.0, 9.0, 5.0, 13.0, 6.0, 9.0, 8.0, 9.0, 14.0, 18.0, 12.0, 36.0, 32.0, 32.0, 28.0, 45.0, 29.0, 39.0, 48.0, 86.0, 200.0, 1520.0, 252.0, 116.0, 61.0, 50.0, 45.0, 40.0, 38.0, 43.0, 33.0, 30.0, 26.0, 15.0, 16.0, 14.0, 20.0, 13.0, 3.0, 9.0, 6.0, 9.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2265625, -9.8436279296875, -9.460693359375, -9.0777587890625, -8.69482421875, -8.3118896484375, -7.928955078125, -7.5460205078125, -7.1630859375, -6.7801513671875, -6.397216796875, -6.0142822265625, -5.63134765625, -5.2484130859375, -4.865478515625, -4.4825439453125, -4.099609375, -3.7166748046875, -3.333740234375, -2.9508056640625, -2.56787109375, -2.1849365234375, -1.802001953125, -1.4190673828125, -1.0361328125, -0.6531982421875, -0.270263671875, 0.1126708984375, 0.49560546875, 0.8785400390625, 1.261474609375, 1.6444091796875, 2.02734375, 2.4102783203125, 2.793212890625, 3.1761474609375, 3.55908203125, 3.9420166015625, 4.324951171875, 4.7078857421875, 5.0908203125, 5.4737548828125, 5.856689453125, 6.2396240234375, 6.62255859375, 7.0054931640625, 7.388427734375, 7.7713623046875, 8.154296875, 8.5372314453125, 8.920166015625, 9.3031005859375, 9.68603515625, 10.0689697265625, 10.451904296875, 10.8348388671875, 11.2177734375, 11.6007080078125, 11.983642578125, 12.3665771484375, 12.74951171875, 13.1324462890625, 13.515380859375, 13.8983154296875, 14.28125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 4.0, 4.0, 10.0, 11.0, 9.0, 17.0, 24.0, 34.0, 28.0, 32.0, 56.0, 52.0, 83.0, 102.0, 124.0, 187.0, 391.0, 914.0, 5363.0, 3092426.0, 43141.0, 1323.0, 525.0, 232.0, 147.0, 101.0, 65.0, 62.0, 50.0, 48.0, 22.0, 25.0, 19.0, 11.0, 16.0, 12.0, 9.0, 5.0, 6.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.21875, -40.96533203125, -39.7119140625, -38.45849609375, -37.205078125, -35.95166015625, -34.6982421875, -33.44482421875, -32.19140625, -30.93798828125, -29.6845703125, -28.43115234375, -27.177734375, -25.92431640625, -24.6708984375, -23.41748046875, -22.1640625, -20.91064453125, -19.6572265625, -18.40380859375, -17.150390625, -15.89697265625, -14.6435546875, -13.39013671875, -12.13671875, -10.88330078125, -9.6298828125, -8.37646484375, -7.123046875, -5.86962890625, -4.6162109375, -3.36279296875, -2.109375, -0.85595703125, 0.3974609375, 1.65087890625, 2.904296875, 4.15771484375, 5.4111328125, 6.66455078125, 7.91796875, 9.17138671875, 10.4248046875, 11.67822265625, 12.931640625, 14.18505859375, 15.4384765625, 16.69189453125, 17.9453125, 19.19873046875, 20.4521484375, 21.70556640625, 22.958984375, 24.21240234375, 25.4658203125, 26.71923828125, 27.97265625, 29.22607421875, 30.4794921875, 31.73291015625, 32.986328125, 34.23974609375, 35.4931640625, 36.74658203125, 38.0]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [38.0, 489.0, 461.0, 28.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.029485702514648, -2.5264501571655273, -0.02341461181640625, 2.479620933532715, 4.982656478881836, 7.485692024230957, 9.988727569580078, 12.491762161254883, 14.99479866027832, 17.497833251953125, 20.000869750976562, 22.50390625, 25.006940841674805, 27.50997543334961, 30.013011932373047, 32.51604461669922, 35.019081115722656, 37.522117614746094, 40.02515411376953, 42.5281867980957, 45.03122329711914, 47.53425979614258, 50.03729248046875, 52.54032897949219, 55.043365478515625, 57.54640197753906, 60.0494384765625, 62.55247116088867, 65.05551147460938, 67.55854034423828, 70.06157684326172, 72.56461334228516, 75.06765747070312, 77.57069396972656, 80.07373046875, 82.57676696777344, 85.07980346679688, 87.58283233642578, 90.08586883544922, 92.58890533447266, 95.0919418334961, 97.59497833251953, 100.09801483154297, 102.6010513305664, 105.10408020019531, 107.60711669921875, 110.11015319824219, 112.61318969726562, 115.11622619628906, 117.6192626953125, 120.12229919433594, 122.62533569335938, 125.12837219238281, 127.63140106201172, 130.1344451904297, 132.63748168945312, 135.1405029296875, 137.64353942871094, 140.14657592773438, 142.6496124267578, 145.15264892578125, 147.6556854248047, 150.15872192382812, 152.6617431640625, 155.164794921875]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 8.0, 7.0, 12.0, 8.0, 7.0, 9.0, 18.0, 19.0, 22.0, 13.0, 23.0, 20.0, 36.0, 25.0, 35.0, 32.0, 32.0, 30.0, 46.0, 51.0, 38.0, 49.0, 46.0, 39.0, 39.0, 44.0, 41.0, 34.0, 34.0, 24.0, 20.0, 17.0, 12.0, 19.0, 15.0, 16.0, 8.0, 13.0, 9.0, 11.0, 7.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.94292449951172, -32.890628814697266, -31.838335037231445, -30.786041259765625, -29.733745574951172, -28.68145179748535, -27.62915802001953, -26.576862335205078, -25.524568557739258, -24.472274780273438, -23.419979095458984, -22.367685317993164, -21.315391540527344, -20.26309585571289, -19.21080207824707, -18.15850830078125, -17.106212615966797, -16.053918838500977, -15.001623153686523, -13.949329376220703, -12.897034645080566, -11.84473991394043, -10.79244613647461, -9.740151405334473, -8.687856674194336, -7.635561943054199, -6.583267688751221, -5.530973434448242, -4.4786787033081055, -3.4263839721679688, -2.3740897178649902, -1.3217954635620117, -0.2695045471191406, 0.782789945602417, 1.8350844383239746, 2.8873789310455322, 3.93967342376709, 4.991968154907227, 6.044262409210205, 7.096556663513184, 8.14885139465332, 9.201146125793457, 10.253440856933594, 11.305734634399414, 12.35802936553955, 13.410324096679688, 14.462617874145508, 15.514912605285645, 16.56720733642578, 17.6195011138916, 18.671796798706055, 19.724090576171875, 20.776386260986328, 21.82868003845215, 22.88097381591797, 23.933269500732422, 24.985563278198242, 26.037857055664062, 27.090152740478516, 28.142446517944336, 29.194740295410156, 30.24703598022461, 31.29932975769043, 32.35162353515625, 33.4039192199707]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 6.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 7.0, 11.0, 7.0, 13.0, 15.0, 17.0, 23.0, 19.0, 26.0, 23.0, 15.0, 29.0, 34.0, 29.0, 39.0, 33.0, 33.0, 32.0, 30.0, 41.0, 27.0, 43.0, 38.0, 34.0, 27.0, 34.0, 37.0, 33.0, 26.0, 20.0, 27.0, 20.0, 36.0, 17.0, 12.0, 14.0, 16.0, 10.0, 5.0, 5.0, 5.0, 6.0, 6.0, 4.0, 4.0, 0.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.0625, -3.9361572265625, -3.809814453125, -3.6834716796875, -3.55712890625, -3.4307861328125, -3.304443359375, -3.1781005859375, -3.0517578125, -2.9254150390625, -2.799072265625, -2.6727294921875, -2.54638671875, -2.4200439453125, -2.293701171875, -2.1673583984375, -2.041015625, -1.9146728515625, -1.788330078125, -1.6619873046875, -1.53564453125, -1.4093017578125, -1.282958984375, -1.1566162109375, -1.0302734375, -0.9039306640625, -0.777587890625, -0.6512451171875, -0.52490234375, -0.3985595703125, -0.272216796875, -0.1458740234375, -0.01953125, 0.1068115234375, 0.233154296875, 0.3594970703125, 0.48583984375, 0.6121826171875, 0.738525390625, 0.8648681640625, 0.9912109375, 1.1175537109375, 1.243896484375, 1.3702392578125, 1.49658203125, 1.6229248046875, 1.749267578125, 1.8756103515625, 2.001953125, 2.1282958984375, 2.254638671875, 2.3809814453125, 2.50732421875, 2.6336669921875, 2.760009765625, 2.8863525390625, 3.0126953125, 3.1390380859375, 3.265380859375, 3.3917236328125, 3.51806640625, 3.6444091796875, 3.770751953125, 3.8970947265625, 4.0234375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 6.0, 7.0, 11.0, 8.0, 10.0, 22.0, 24.0, 24.0, 42.0, 53.0, 72.0, 102.0, 155.0, 254.0, 443.0, 745.0, 2124.0, 7306.0, 36950.0, 213098.0, 896093.0, 1688518.0, 1022831.0, 263615.0, 47616.0, 9314.0, 2558.0, 963.0, 465.0, 253.0, 177.0, 117.0, 88.0, 49.0, 32.0, 32.0, 29.0, 20.0, 12.0, 7.0, 5.0, 3.0, 5.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0], "bins": [-6.16015625, -5.98193359375, -5.8037109375, -5.62548828125, -5.447265625, -5.26904296875, -5.0908203125, -4.91259765625, -4.734375, -4.55615234375, -4.3779296875, -4.19970703125, -4.021484375, -3.84326171875, -3.6650390625, -3.48681640625, -3.30859375, -3.13037109375, -2.9521484375, -2.77392578125, -2.595703125, -2.41748046875, -2.2392578125, -2.06103515625, -1.8828125, -1.70458984375, -1.5263671875, -1.34814453125, -1.169921875, -0.99169921875, -0.8134765625, -0.63525390625, -0.45703125, -0.27880859375, -0.1005859375, 0.07763671875, 0.255859375, 0.43408203125, 0.6123046875, 0.79052734375, 0.96875, 1.14697265625, 1.3251953125, 1.50341796875, 1.681640625, 1.85986328125, 2.0380859375, 2.21630859375, 2.39453125, 2.57275390625, 2.7509765625, 2.92919921875, 3.107421875, 3.28564453125, 3.4638671875, 3.64208984375, 3.8203125, 3.99853515625, 4.1767578125, 4.35498046875, 4.533203125, 4.71142578125, 4.8896484375, 5.06787109375, 5.24609375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 7.0, 20.0, 12.0, 14.0, 23.0, 39.0, 62.0, 74.0, 104.0, 128.0, 182.0, 209.0, 351.0, 443.0, 426.0, 446.0, 325.0, 315.0, 224.0, 144.0, 144.0, 85.0, 67.0, 69.0, 28.0, 39.0, 20.0, 13.0, 10.0, 12.0, 5.0, 9.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.359375, -7.111572265625, -6.86376953125, -6.615966796875, -6.3681640625, -6.120361328125, -5.87255859375, -5.624755859375, -5.376953125, -5.129150390625, -4.88134765625, -4.633544921875, -4.3857421875, -4.137939453125, -3.89013671875, -3.642333984375, -3.39453125, -3.146728515625, -2.89892578125, -2.651123046875, -2.4033203125, -2.155517578125, -1.90771484375, -1.659912109375, -1.412109375, -1.164306640625, -0.91650390625, -0.668701171875, -0.4208984375, -0.173095703125, 0.07470703125, 0.322509765625, 0.5703125, 0.818115234375, 1.06591796875, 1.313720703125, 1.5615234375, 1.809326171875, 2.05712890625, 2.304931640625, 2.552734375, 2.800537109375, 3.04833984375, 3.296142578125, 3.5439453125, 3.791748046875, 4.03955078125, 4.287353515625, 4.53515625, 4.782958984375, 5.03076171875, 5.278564453125, 5.5263671875, 5.774169921875, 6.02197265625, 6.269775390625, 6.517578125, 6.765380859375, 7.01318359375, 7.260986328125, 7.5087890625, 7.756591796875, 8.00439453125, 8.252197265625, 8.5]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 9.0, 9.0, 11.0, 15.0, 21.0, 27.0, 47.0, 60.0, 89.0, 129.0, 163.0, 193.0, 281.0, 388.0, 668.0, 1518.0, 7074.0, 1264850.0, 2902863.0, 11882.0, 1730.0, 711.0, 472.0, 304.0, 204.0, 161.0, 107.0, 77.0, 59.0, 50.0, 26.0, 21.0, 16.0, 6.0, 10.0, 8.0, 5.0, 0.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-28.625, -27.78515625, -26.9453125, -26.10546875, -25.265625, -24.42578125, -23.5859375, -22.74609375, -21.90625, -21.06640625, -20.2265625, -19.38671875, -18.546875, -17.70703125, -16.8671875, -16.02734375, -15.1875, -14.34765625, -13.5078125, -12.66796875, -11.828125, -10.98828125, -10.1484375, -9.30859375, -8.46875, -7.62890625, -6.7890625, -5.94921875, -5.109375, -4.26953125, -3.4296875, -2.58984375, -1.75, -0.91015625, -0.0703125, 0.76953125, 1.609375, 2.44921875, 3.2890625, 4.12890625, 4.96875, 5.80859375, 6.6484375, 7.48828125, 8.328125, 9.16796875, 10.0078125, 10.84765625, 11.6875, 12.52734375, 13.3671875, 14.20703125, 15.046875, 15.88671875, 16.7265625, 17.56640625, 18.40625, 19.24609375, 20.0859375, 20.92578125, 21.765625, 22.60546875, 23.4453125, 24.28515625, 25.125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 56.0, 759.0, 194.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.14484405517578, -55.700927734375, -49.25700759887695, -42.813087463378906, -36.369171142578125, -29.925254821777344, -23.481334686279297, -17.03741455078125, -10.593498229980469, -4.149580001831055, 2.2943382263183594, 8.738256454467773, 15.182174682617188, 21.62609100341797, 28.070011138916016, 34.51393127441406, 40.957847595214844, 47.401763916015625, 53.84568405151367, 60.28960418701172, 66.7335205078125, 73.17743682861328, 79.62135314941406, 86.06527709960938, 92.50919342041016, 98.95310974121094, 105.39703369140625, 111.84095001220703, 118.28486633300781, 124.7287826538086, 131.17269897460938, 137.6166229248047, 144.060546875, 150.5044708251953, 156.94837951660156, 163.39230346679688, 169.83621215820312, 176.28013610839844, 182.72406005859375, 189.16796875, 195.6118927001953, 202.05581665039062, 208.49972534179688, 214.9436492919922, 221.3875732421875, 227.83148193359375, 234.27540588378906, 240.71932983398438, 247.16323852539062, 253.60716247558594, 260.05108642578125, 266.4949951171875, 272.93890380859375, 279.3828125, 285.8267517089844, 292.2706604003906, 298.714599609375, 305.15850830078125, 311.6024475097656, 318.0463562011719, 324.4902648925781, 330.9342041015625, 337.37811279296875, 343.822021484375, 350.26593017578125]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 6.0, 8.0, 7.0, 12.0, 17.0, 26.0, 21.0, 17.0, 24.0, 20.0, 28.0, 31.0, 32.0, 36.0, 36.0, 39.0, 43.0, 52.0, 36.0, 34.0, 34.0, 42.0, 45.0, 45.0, 33.0, 30.0, 24.0, 27.0, 31.0, 15.0, 26.0, 24.0, 18.0, 16.0, 20.0, 7.0, 10.0, 7.0, 11.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.00054931640625, -26.189193725585938, -25.377838134765625, -24.566482543945312, -23.755126953125, -22.943771362304688, -22.132417678833008, -21.321062088012695, -20.509706497192383, -19.69835090637207, -18.886995315551758, -18.075639724731445, -17.264286041259766, -16.452930450439453, -15.64157485961914, -14.830219268798828, -14.018863677978516, -13.207508087158203, -12.39615249633789, -11.584797859191895, -10.773442268371582, -9.96208667755127, -9.150732040405273, -8.339376449584961, -7.528020858764648, -6.716665267944336, -5.905310153961182, -5.093955039978027, -4.282599449157715, -3.4712438583374023, -2.659888744354248, -1.8485336303710938, -1.0371780395507812, -0.22582268714904785, 0.5855326652526855, 1.396888017654419, 2.2082433700561523, 3.019598960876465, 3.830954074859619, 4.642309188842773, 5.453664779663086, 6.265020370483398, 7.076375484466553, 7.887730598449707, 8.69908618927002, 9.510441780090332, 10.321796417236328, 11.13315200805664, 11.944507598876953, 12.755863189697266, 13.567218780517578, 14.378573417663574, 15.189929008483887, 16.001285552978516, 16.812639236450195, 17.623994827270508, 18.43535041809082, 19.246706008911133, 20.058061599731445, 20.869417190551758, 21.680770874023438, 22.49212646484375, 23.303482055664062, 24.114837646484375, 24.926193237304688]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 5.0, 5.0, 9.0, 5.0, 12.0, 12.0, 13.0, 16.0, 28.0, 22.0, 27.0, 31.0, 36.0, 38.0, 29.0, 33.0, 43.0, 39.0, 43.0, 43.0, 48.0, 42.0, 41.0, 44.0, 34.0, 40.0, 26.0, 35.0, 36.0, 23.0, 22.0, 23.0, 14.0, 17.0, 19.0, 11.0, 6.0, 7.0, 8.0, 1.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.36328125, -4.23126220703125, -4.0992431640625, -3.96722412109375, -3.835205078125, -3.70318603515625, -3.5711669921875, -3.43914794921875, -3.30712890625, -3.17510986328125, -3.0430908203125, -2.91107177734375, -2.779052734375, -2.64703369140625, -2.5150146484375, -2.38299560546875, -2.2509765625, -2.11895751953125, -1.9869384765625, -1.85491943359375, -1.722900390625, -1.59088134765625, -1.4588623046875, -1.32684326171875, -1.19482421875, -1.06280517578125, -0.9307861328125, -0.79876708984375, -0.666748046875, -0.53472900390625, -0.4027099609375, -0.27069091796875, -0.138671875, -0.00665283203125, 0.1253662109375, 0.25738525390625, 0.389404296875, 0.52142333984375, 0.6534423828125, 0.78546142578125, 0.91748046875, 1.04949951171875, 1.1815185546875, 1.31353759765625, 1.445556640625, 1.57757568359375, 1.7095947265625, 1.84161376953125, 1.9736328125, 2.10565185546875, 2.2376708984375, 2.36968994140625, 2.501708984375, 2.63372802734375, 2.7657470703125, 2.89776611328125, 3.02978515625, 3.16180419921875, 3.2938232421875, 3.42584228515625, 3.557861328125, 3.68988037109375, 3.8218994140625, 3.95391845703125, 4.0859375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 6.0, 7.0, 7.0, 12.0, 12.0, 26.0, 47.0, 55.0, 99.0, 136.0, 177.0, 248.0, 399.0, 606.0, 890.0, 1254.0, 1811.0, 2903.0, 4249.0, 6536.0, 10035.0, 15318.0, 24244.0, 39754.0, 67255.0, 127335.0, 266843.0, 218477.0, 105644.0, 58215.0, 34381.0, 21679.0, 13657.0, 8706.0, 5826.0, 3851.0, 2616.0, 1762.0, 1104.0, 735.0, 514.0, 372.0, 235.0, 170.0, 110.0, 77.0, 64.0, 30.0, 23.0, 22.0, 12.0, 10.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.6630859375, -0.6416015625, -0.6201171875, -0.5986328125, -0.5771484375, -0.5556640625, -0.5341796875, -0.5126953125, -0.4912109375, -0.4697265625, -0.4482421875, -0.4267578125, -0.4052734375, -0.3837890625, -0.3623046875, -0.3408203125, -0.3193359375, -0.2978515625, -0.2763671875, -0.2548828125, -0.2333984375, -0.2119140625, -0.1904296875, -0.1689453125, -0.1474609375, -0.1259765625, -0.1044921875, -0.0830078125, -0.0615234375, -0.0400390625, -0.0185546875, 0.0029296875, 0.0244140625, 0.0458984375, 0.0673828125, 0.0888671875, 0.1103515625, 0.1318359375, 0.1533203125, 0.1748046875, 0.1962890625, 0.2177734375, 0.2392578125, 0.2607421875, 0.2822265625, 0.3037109375, 0.3251953125, 0.3466796875, 0.3681640625, 0.3896484375, 0.4111328125, 0.4326171875, 0.4541015625, 0.4755859375, 0.4970703125, 0.5185546875, 0.5400390625, 0.5615234375, 0.5830078125, 0.6044921875, 0.6259765625, 0.6474609375, 0.6689453125, 0.6904296875, 0.7119140625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 6.0, 12.0, 10.0, 12.0, 11.0, 10.0, 10.0, 11.0, 22.0, 26.0, 24.0, 24.0, 29.0, 29.0, 38.0, 28.0, 38.0, 30.0, 35.0, 36.0, 44.0, 1062.0, 34.0, 38.0, 36.0, 29.0, 29.0, 35.0, 32.0, 31.0, 27.0, 24.0, 18.0, 18.0, 24.0, 13.0, 17.0, 12.0, 7.0, 8.0, 8.0, 5.0, 7.0, 6.0, 5.0, 5.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.181640625, -2.107940673828125, -2.03424072265625, -1.960540771484375, -1.8868408203125, -1.813140869140625, -1.73944091796875, -1.665740966796875, -1.592041015625, -1.518341064453125, -1.44464111328125, -1.370941162109375, -1.2972412109375, -1.223541259765625, -1.14984130859375, -1.076141357421875, -1.00244140625, -0.928741455078125, -0.85504150390625, -0.781341552734375, -0.7076416015625, -0.633941650390625, -0.56024169921875, -0.486541748046875, -0.412841796875, -0.339141845703125, -0.26544189453125, -0.191741943359375, -0.1180419921875, -0.044342041015625, 0.02935791015625, 0.103057861328125, 0.1767578125, 0.250457763671875, 0.32415771484375, 0.397857666015625, 0.4715576171875, 0.545257568359375, 0.61895751953125, 0.692657470703125, 0.766357421875, 0.840057373046875, 0.91375732421875, 0.987457275390625, 1.0611572265625, 1.134857177734375, 1.20855712890625, 1.282257080078125, 1.35595703125, 1.429656982421875, 1.50335693359375, 1.577056884765625, 1.6507568359375, 1.724456787109375, 1.79815673828125, 1.871856689453125, 1.945556640625, 2.019256591796875, 2.09295654296875, 2.166656494140625, 2.2403564453125, 2.314056396484375, 2.38775634765625, 2.461456298828125, 2.53515625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 5.0, 6.0, 14.0, 20.0, 26.0, 41.0, 70.0, 87.0, 108.0, 172.0, 242.0, 351.0, 448.0, 652.0, 857.0, 1235.0, 1754.0, 2458.0, 3445.0, 4893.0, 6828.0, 9757.0, 14197.0, 20310.0, 30465.0, 46073.0, 72057.0, 126517.0, 1296555.0, 184485.0, 94911.0, 57443.0, 37951.0, 25332.0, 17099.0, 11805.0, 8160.0, 5905.0, 4155.0, 2987.0, 2072.0, 1581.0, 1107.0, 841.0, 530.0, 353.0, 266.0, 157.0, 111.0, 94.0, 65.0, 35.0, 19.0, 16.0, 9.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.5537109375, -0.5362777709960938, -0.5188446044921875, -0.5014114379882812, -0.483978271484375, -0.46654510498046875, -0.4491119384765625, -0.43167877197265625, -0.41424560546875, -0.39681243896484375, -0.3793792724609375, -0.36194610595703125, -0.344512939453125, -0.32707977294921875, -0.3096466064453125, -0.29221343994140625, -0.2747802734375, -0.25734710693359375, -0.2399139404296875, -0.22248077392578125, -0.205047607421875, -0.18761444091796875, -0.1701812744140625, -0.15274810791015625, -0.13531494140625, -0.11788177490234375, -0.1004486083984375, -0.08301544189453125, -0.065582275390625, -0.04814910888671875, -0.0307159423828125, -0.01328277587890625, 0.004150390625, 0.02158355712890625, 0.0390167236328125, 0.05644989013671875, 0.073883056640625, 0.09131622314453125, 0.1087493896484375, 0.12618255615234375, 0.14361572265625, 0.16104888916015625, 0.1784820556640625, 0.19591522216796875, 0.213348388671875, 0.23078155517578125, 0.2482147216796875, 0.26564788818359375, 0.2830810546875, 0.30051422119140625, 0.3179473876953125, 0.33538055419921875, 0.352813720703125, 0.37024688720703125, 0.3876800537109375, 0.40511322021484375, 0.42254638671875, 0.43997955322265625, 0.4574127197265625, 0.47484588623046875, 0.492279052734375, 0.5097122192382812, 0.5271453857421875, 0.5445785522460938, 0.56201171875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 3.0, 8.0, 7.0, 5.0, 10.0, 10.0, 15.0, 19.0, 29.0, 22.0, 23.0, 26.0, 21.0, 35.0, 45.0, 40.0, 53.0, 58.0, 57.0, 54.0, 42.0, 46.0, 44.0, 40.0, 39.0, 50.0, 32.0, 29.0, 20.0, 24.0, 19.0, 12.0, 9.0, 7.0, 11.0, 8.0, 10.0, 2.0, 1.0, 1.0, 7.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00011557340621948242, -0.00011192634701728821, -0.000108279287815094, -0.00010463222861289978, -0.00010098516941070557, -9.733811020851135e-05, -9.369105100631714e-05, -9.004399180412292e-05, -8.639693260192871e-05, -8.27498733997345e-05, -7.910281419754028e-05, -7.545575499534607e-05, -7.180869579315186e-05, -6.816163659095764e-05, -6.451457738876343e-05, -6.0867518186569214e-05, -5.7220458984375e-05, -5.3573399782180786e-05, -4.992634057998657e-05, -4.627928137779236e-05, -4.2632222175598145e-05, -3.898516297340393e-05, -3.533810377120972e-05, -3.16910445690155e-05, -2.804398536682129e-05, -2.4396926164627075e-05, -2.074986696243286e-05, -1.7102807760238647e-05, -1.3455748558044434e-05, -9.80868935585022e-06, -6.161630153656006e-06, -2.514570951461792e-06, 1.1324882507324219e-06, 4.779547452926636e-06, 8.42660665512085e-06, 1.2073665857315063e-05, 1.5720725059509277e-05, 1.936778426170349e-05, 2.3014843463897705e-05, 2.666190266609192e-05, 3.0308961868286133e-05, 3.395602107048035e-05, 3.760308027267456e-05, 4.1250139474868774e-05, 4.489719867706299e-05, 4.85442578792572e-05, 5.2191317081451416e-05, 5.583837628364563e-05, 5.9485435485839844e-05, 6.313249468803406e-05, 6.677955389022827e-05, 7.042661309242249e-05, 7.40736722946167e-05, 7.772073149681091e-05, 8.136779069900513e-05, 8.501484990119934e-05, 8.866190910339355e-05, 9.230896830558777e-05, 9.595602750778198e-05, 9.96030867099762e-05, 0.00010325014591217041, 0.00010689720511436462, 0.00011054426431655884, 0.00011419132351875305, 0.00011783838272094727]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 4.0, 4.0, 4.0, 11.0, 8.0, 13.0, 11.0, 19.0, 23.0, 42.0, 22.0, 45.0, 47.0, 73.0, 122.0, 151.0, 247.0, 462.0, 1118.0, 73407.0, 968189.0, 2732.0, 716.0, 320.0, 191.0, 130.0, 110.0, 52.0, 57.0, 29.0, 38.0, 32.0, 32.0, 22.0, 13.0, 17.0, 6.0, 9.0, 3.0, 10.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024871826171875, -0.002407550811767578, -0.0023279190063476562, -0.0022482872009277344, -0.0021686553955078125, -0.0020890235900878906, -0.0020093917846679688, -0.0019297599792480469, -0.001850128173828125, -0.0017704963684082031, -0.0016908645629882812, -0.0016112327575683594, -0.0015316009521484375, -0.0014519691467285156, -0.0013723373413085938, -0.0012927055358886719, -0.00121307373046875, -0.0011334419250488281, -0.0010538101196289062, -0.0009741783142089844, -0.0008945465087890625, -0.0008149147033691406, -0.0007352828979492188, -0.0006556510925292969, -0.000576019287109375, -0.0004963874816894531, -0.00041675567626953125, -0.0003371238708496094, -0.0002574920654296875, -0.00017786026000976562, -9.822845458984375e-05, -1.8596649169921875e-05, 6.103515625e-05, 0.00014066696166992188, 0.00022029876708984375, 0.0002999305725097656, 0.0003795623779296875, 0.0004591941833496094, 0.0005388259887695312, 0.0006184577941894531, 0.000698089599609375, 0.0007777214050292969, 0.0008573532104492188, 0.0009369850158691406, 0.0010166168212890625, 0.0010962486267089844, 0.0011758804321289062, 0.0012555122375488281, 0.00133514404296875, 0.0014147758483886719, 0.0014944076538085938, 0.0015740394592285156, 0.0016536712646484375, 0.0017333030700683594, 0.0018129348754882812, 0.0018925666809082031, 0.001972198486328125, 0.002051830291748047, 0.0021314620971679688, 0.0022110939025878906, 0.0022907257080078125, 0.0023703575134277344, 0.0024499893188476562, 0.002529621124267578, 0.0026092529296875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 102.0, 530.0, 331.0, 44.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026377395261079073, -0.0002510901540517807, -0.00023840635549277067, -0.00022572255693376064, -0.00021303874382283539, -0.00020035494526382536, -0.00018767114670481533, -0.00017498733359389007, -0.00016230353503488004, -0.00014961973647587, -0.00013693593791685998, -0.00012425213935784996, -0.0001115683262469247, -9.888452768791467e-05, -8.620072912890464e-05, -7.3516923293937e-05, -6.083313201088458e-05, -4.814932981389575e-05, -3.546552761690691e-05, -2.2781729057896882e-05, -1.0097926860908046e-05, 2.5858753360807896e-06, 1.526967389509082e-05, 2.795347973005846e-05, 4.063727828906849e-05, 5.3321080486057326e-05, 6.600488268304616e-05, 7.868868124205619e-05, 9.137247980106622e-05, 0.00010405628563603386, 0.00011674008419504389, 0.00012942389003001153, 0.00014210768858902156, 0.0001547914871480316, 0.00016747528570704162, 0.00018015908426605165, 0.0001928428973769769, 0.00020552669593598694, 0.00021821049449499696, 0.00023089430760592222, 0.00024357810616493225, 0.0002562619047239423, 0.0002689457032829523, 0.00028162950184196234, 0.00029431330040097237, 0.0003069970989599824, 0.0003196808975189924, 0.0003323647251818329, 0.0003450484946370125, 0.0003577322931960225, 0.00037041609175503254, 0.00038309989031404257, 0.0003957836888730526, 0.0004084674874320626, 0.00042115128599107265, 0.00043383511365391314, 0.00044651891221292317, 0.0004592027107719332, 0.0004718865093309432, 0.00048457030788995326, 0.0004972541355527937, 0.0005099379341118038, 0.0005226217326708138, 0.0005353055312298238, 0.0005479893297888339]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 4.0, 5.0, 14.0, 9.0, 23.0, 23.0, 23.0, 30.0, 24.0, 26.0, 35.0, 32.0, 31.0, 35.0, 32.0, 40.0, 57.0, 50.0, 38.0, 39.0, 31.0, 42.0, 34.0, 36.0, 46.0, 32.0, 27.0, 27.0, 22.0, 31.0, 17.0, 14.0, 13.0, 10.0, 14.0, 7.0, 8.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.580352783203125e-05, -6.354041397571564e-05, -6.127730011940002e-05, -5.901418626308441e-05, -5.67510724067688e-05, -5.4487958550453186e-05, -5.222484469413757e-05, -4.996173083782196e-05, -4.769861698150635e-05, -4.5435503125190735e-05, -4.317238926887512e-05, -4.090927541255951e-05, -3.8646161556243896e-05, -3.6383047699928284e-05, -3.411993384361267e-05, -3.185681998729706e-05, -2.9593706130981445e-05, -2.7330592274665833e-05, -2.506747841835022e-05, -2.2804364562034607e-05, -2.0541250705718994e-05, -1.827813684940338e-05, -1.601502299308777e-05, -1.3751909136772156e-05, -1.1488795280456543e-05, -9.22568142414093e-06, -6.962567567825317e-06, -4.699453711509705e-06, -2.436339855194092e-06, -1.73225998878479e-07, 2.089887857437134e-06, 4.353001713752747e-06, 6.616115570068359e-06, 8.879229426383972e-06, 1.1142343282699585e-05, 1.3405457139015198e-05, 1.566857099533081e-05, 1.7931684851646423e-05, 2.0194798707962036e-05, 2.245791256427765e-05, 2.4721026420593262e-05, 2.6984140276908875e-05, 2.9247254133224487e-05, 3.15103679895401e-05, 3.377348184585571e-05, 3.6036595702171326e-05, 3.829970955848694e-05, 4.056282341480255e-05, 4.2825937271118164e-05, 4.508905112743378e-05, 4.735216498374939e-05, 4.9615278840065e-05, 5.1878392696380615e-05, 5.414150655269623e-05, 5.640462040901184e-05, 5.8667734265327454e-05, 6.0930848121643066e-05, 6.319396197795868e-05, 6.545707583427429e-05, 6.77201896905899e-05, 6.998330354690552e-05, 7.224641740322113e-05, 7.450953125953674e-05, 7.677264511585236e-05, 7.903575897216797e-05]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 5.0, 5.0, 9.0, 5.0, 12.0, 12.0, 13.0, 16.0, 28.0, 22.0, 27.0, 31.0, 36.0, 38.0, 29.0, 33.0, 43.0, 39.0, 43.0, 43.0, 48.0, 42.0, 41.0, 44.0, 34.0, 40.0, 26.0, 35.0, 36.0, 23.0, 22.0, 23.0, 14.0, 17.0, 19.0, 11.0, 6.0, 7.0, 8.0, 1.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.36328125, -4.23126220703125, -4.0992431640625, -3.96722412109375, -3.835205078125, -3.70318603515625, -3.5711669921875, -3.43914794921875, -3.30712890625, -3.17510986328125, -3.0430908203125, -2.91107177734375, -2.779052734375, -2.64703369140625, -2.5150146484375, -2.38299560546875, -2.2509765625, -2.11895751953125, -1.9869384765625, -1.85491943359375, -1.722900390625, -1.59088134765625, -1.4588623046875, -1.32684326171875, -1.19482421875, -1.06280517578125, -0.9307861328125, -0.79876708984375, -0.666748046875, -0.53472900390625, -0.4027099609375, -0.27069091796875, -0.138671875, -0.00665283203125, 0.1253662109375, 0.25738525390625, 0.389404296875, 0.52142333984375, 0.6534423828125, 0.78546142578125, 0.91748046875, 1.04949951171875, 1.1815185546875, 1.31353759765625, 1.445556640625, 1.57757568359375, 1.7095947265625, 1.84161376953125, 1.9736328125, 2.10565185546875, 2.2376708984375, 2.36968994140625, 2.501708984375, 2.63372802734375, 2.7657470703125, 2.89776611328125, 3.02978515625, 3.16180419921875, 3.2938232421875, 3.42584228515625, 3.557861328125, 3.68988037109375, 3.8218994140625, 3.95391845703125, 4.0859375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 1.0, 7.0, 7.0, 7.0, 14.0, 11.0, 12.0, 25.0, 37.0, 47.0, 68.0, 112.0, 226.0, 531.0, 1334.0, 3906.0, 10967.0, 30497.0, 86200.0, 253510.0, 393450.0, 174426.0, 59552.0, 21470.0, 7690.0, 2683.0, 951.0, 356.0, 166.0, 97.0, 52.0, 25.0, 26.0, 22.0, 15.0, 14.0, 11.0, 6.0, 9.0, 2.0, 3.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.22265625, -5.07049560546875, -4.9183349609375, -4.76617431640625, -4.614013671875, -4.46185302734375, -4.3096923828125, -4.15753173828125, -4.00537109375, -3.85321044921875, -3.7010498046875, -3.54888916015625, -3.396728515625, -3.24456787109375, -3.0924072265625, -2.94024658203125, -2.7880859375, -2.63592529296875, -2.4837646484375, -2.33160400390625, -2.179443359375, -2.02728271484375, -1.8751220703125, -1.72296142578125, -1.57080078125, -1.41864013671875, -1.2664794921875, -1.11431884765625, -0.962158203125, -0.80999755859375, -0.6578369140625, -0.50567626953125, -0.353515625, -0.20135498046875, -0.0491943359375, 0.10296630859375, 0.255126953125, 0.40728759765625, 0.5594482421875, 0.71160888671875, 0.86376953125, 1.01593017578125, 1.1680908203125, 1.32025146484375, 1.472412109375, 1.62457275390625, 1.7767333984375, 1.92889404296875, 2.0810546875, 2.23321533203125, 2.3853759765625, 2.53753662109375, 2.689697265625, 2.84185791015625, 2.9940185546875, 3.14617919921875, 3.29833984375, 3.45050048828125, 3.6026611328125, 3.75482177734375, 3.906982421875, 4.05914306640625, 4.2113037109375, 4.36346435546875, 4.515625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 4.0, 4.0, 5.0, 5.0, 9.0, 8.0, 10.0, 15.0, 26.0, 22.0, 23.0, 25.0, 23.0, 43.0, 40.0, 50.0, 43.0, 71.0, 141.0, 244.0, 1458.0, 245.0, 108.0, 64.0, 57.0, 30.0, 43.0, 27.0, 36.0, 36.0, 37.0, 19.0, 18.0, 12.0, 16.0, 9.0, 8.0, 4.0, 4.0, 6.0, 5.0, 1.0, 2.0, 1.0, 5.0], "bins": [-17.34375, -16.9039306640625, -16.464111328125, -16.0242919921875, -15.58447265625, -15.1446533203125, -14.704833984375, -14.2650146484375, -13.8251953125, -13.3853759765625, -12.945556640625, -12.5057373046875, -12.06591796875, -11.6260986328125, -11.186279296875, -10.7464599609375, -10.306640625, -9.8668212890625, -9.427001953125, -8.9871826171875, -8.54736328125, -8.1075439453125, -7.667724609375, -7.2279052734375, -6.7880859375, -6.3482666015625, -5.908447265625, -5.4686279296875, -5.02880859375, -4.5889892578125, -4.149169921875, -3.7093505859375, -3.26953125, -2.8297119140625, -2.389892578125, -1.9500732421875, -1.51025390625, -1.0704345703125, -0.630615234375, -0.1907958984375, 0.2490234375, 0.6888427734375, 1.128662109375, 1.5684814453125, 2.00830078125, 2.4481201171875, 2.887939453125, 3.3277587890625, 3.767578125, 4.2073974609375, 4.647216796875, 5.0870361328125, 5.52685546875, 5.9666748046875, 6.406494140625, 6.8463134765625, 7.2861328125, 7.7259521484375, 8.165771484375, 8.6055908203125, 9.04541015625, 9.4852294921875, 9.925048828125, 10.3648681640625, 10.8046875]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 1.0, 5.0, 5.0, 9.0, 16.0, 15.0, 17.0, 25.0, 24.0, 45.0, 59.0, 84.0, 107.0, 163.0, 224.0, 371.0, 683.0, 1848.0, 46398.0, 3058544.0, 33674.0, 1589.0, 678.0, 353.0, 228.0, 135.0, 114.0, 70.0, 57.0, 35.0, 29.0, 19.0, 15.0, 11.0, 15.0, 5.0, 10.0, 7.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0], "bins": [-32.75, -31.82666015625, -30.9033203125, -29.97998046875, -29.056640625, -28.13330078125, -27.2099609375, -26.28662109375, -25.36328125, -24.43994140625, -23.5166015625, -22.59326171875, -21.669921875, -20.74658203125, -19.8232421875, -18.89990234375, -17.9765625, -17.05322265625, -16.1298828125, -15.20654296875, -14.283203125, -13.35986328125, -12.4365234375, -11.51318359375, -10.58984375, -9.66650390625, -8.7431640625, -7.81982421875, -6.896484375, -5.97314453125, -5.0498046875, -4.12646484375, -3.203125, -2.27978515625, -1.3564453125, -0.43310546875, 0.490234375, 1.41357421875, 2.3369140625, 3.26025390625, 4.18359375, 5.10693359375, 6.0302734375, 6.95361328125, 7.876953125, 8.80029296875, 9.7236328125, 10.64697265625, 11.5703125, 12.49365234375, 13.4169921875, 14.34033203125, 15.263671875, 16.18701171875, 17.1103515625, 18.03369140625, 18.95703125, 19.88037109375, 20.8037109375, 21.72705078125, 22.650390625, 23.57373046875, 24.4970703125, 25.42041015625, 26.34375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 94.0, 547.0, 347.0, 22.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.10516357421875, -51.50600814819336, -48.9068489074707, -46.30769348144531, -43.708534240722656, -41.109378814697266, -38.510223388671875, -35.91106414794922, -33.31190872192383, -30.712751388549805, -28.11359405517578, -25.51443862915039, -22.915281295776367, -20.316123962402344, -17.716968536376953, -15.11781120300293, -12.518653869628906, -9.919496536254883, -7.320340156555176, -4.7211833000183105, -2.1220264434814453, 0.4771308898925781, 3.076287269592285, 5.675443649291992, 8.274600982666016, 10.873758316040039, 13.472914695739746, 16.072071075439453, 18.671228408813477, 21.2703857421875, 23.86954116821289, 26.468698501586914, 29.067855834960938, 31.66701316833496, 34.266170501708984, 36.865325927734375, 39.46448516845703, 42.06364059448242, 44.66279602050781, 47.26195526123047, 49.86111068725586, 52.46026611328125, 55.059425354003906, 57.6585807800293, 60.25773620605469, 62.856895446777344, 65.4560546875, 68.05520629882812, 70.65436553955078, 73.25352478027344, 75.85267639160156, 78.45183563232422, 81.05099487304688, 83.650146484375, 86.24930572509766, 88.84846496582031, 91.44761657714844, 94.0467758178711, 96.64592742919922, 99.24508666992188, 101.84424591064453, 104.44340515136719, 107.04255676269531, 109.64171600341797, 112.24087524414062]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 9.0, 10.0, 7.0, 18.0, 7.0, 5.0, 12.0, 15.0, 23.0, 15.0, 18.0, 27.0, 36.0, 31.0, 44.0, 37.0, 37.0, 31.0, 37.0, 42.0, 37.0, 40.0, 39.0, 34.0, 48.0, 22.0, 40.0, 23.0, 23.0, 28.0, 17.0, 26.0, 21.0, 22.0, 16.0, 14.0, 13.0, 11.0, 5.0, 8.0, 8.0, 5.0, 7.0, 6.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0], "bins": [-29.64960479736328, -28.7479305267334, -27.84625816345215, -26.944583892822266, -26.042911529541016, -25.141237258911133, -24.23956298828125, -23.337890625, -22.43621826171875, -21.534543991088867, -20.632871627807617, -19.731197357177734, -18.829524993896484, -17.9278507232666, -17.02617645263672, -16.12450408935547, -15.222829818725586, -14.32115650177002, -13.419483184814453, -12.51780891418457, -11.61613655090332, -10.714462280273438, -9.812788963317871, -8.911115646362305, -8.009442329406738, -7.107769012451172, -6.2060956954956055, -5.304421901702881, -4.4027485847473145, -3.501075267791748, -2.5994014739990234, -1.697728157043457, -0.7960567474365234, 0.10561668872833252, 1.0072901248931885, 1.908963680267334, 2.8106369972229004, 3.712310314178467, 4.613984107971191, 5.515657424926758, 6.417330741882324, 7.319004058837891, 8.220677375793457, 9.122350692749023, 10.024024963378906, 10.925697326660156, 11.827371597290039, 12.729044914245605, 13.630718231201172, 14.532391548156738, 15.434064865112305, 16.335739135742188, 17.237411499023438, 18.13908576965332, 19.040760040283203, 19.942432403564453, 20.844104766845703, 21.745779037475586, 22.647451400756836, 23.54912567138672, 24.45079803466797, 25.35247230529785, 26.254146575927734, 27.155818939208984, 28.057493209838867]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 4.0, 1.0, 1.0, 5.0, 3.0, 8.0, 16.0, 13.0, 14.0, 21.0, 27.0, 25.0, 25.0, 24.0, 35.0, 25.0, 42.0, 40.0, 37.0, 35.0, 48.0, 47.0, 45.0, 43.0, 46.0, 48.0, 40.0, 31.0, 42.0, 31.0, 32.0, 28.0, 15.0, 14.0, 17.0, 10.0, 13.0, 5.0, 12.0, 12.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.65625, -4.51470947265625, -4.3731689453125, -4.23162841796875, -4.090087890625, -3.94854736328125, -3.8070068359375, -3.66546630859375, -3.52392578125, -3.38238525390625, -3.2408447265625, -3.09930419921875, -2.957763671875, -2.81622314453125, -2.6746826171875, -2.53314208984375, -2.3916015625, -2.25006103515625, -2.1085205078125, -1.96697998046875, -1.825439453125, -1.68389892578125, -1.5423583984375, -1.40081787109375, -1.25927734375, -1.11773681640625, -0.9761962890625, -0.83465576171875, -0.693115234375, -0.55157470703125, -0.4100341796875, -0.26849365234375, -0.126953125, 0.01458740234375, 0.1561279296875, 0.29766845703125, 0.439208984375, 0.58074951171875, 0.7222900390625, 0.86383056640625, 1.00537109375, 1.14691162109375, 1.2884521484375, 1.42999267578125, 1.571533203125, 1.71307373046875, 1.8546142578125, 1.99615478515625, 2.1376953125, 2.27923583984375, 2.4207763671875, 2.56231689453125, 2.703857421875, 2.84539794921875, 2.9869384765625, 3.12847900390625, 3.27001953125, 3.41156005859375, 3.5531005859375, 3.69464111328125, 3.836181640625, 3.97772216796875, 4.1192626953125, 4.26080322265625, 4.40234375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 3.0, 3.0, 5.0, 7.0, 15.0, 13.0, 25.0, 11.0, 26.0, 28.0, 35.0, 37.0, 50.0, 58.0, 64.0, 127.0, 225.0, 736.0, 7214.0, 514826.0, 3455447.0, 210064.0, 4025.0, 523.0, 201.0, 132.0, 65.0, 69.0, 48.0, 38.0, 30.0, 23.0, 16.0, 15.0, 12.0, 11.0, 5.0, 4.0, 13.0, 8.0, 8.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0546875, -13.6070556640625, -13.159423828125, -12.7117919921875, -12.26416015625, -11.8165283203125, -11.368896484375, -10.9212646484375, -10.4736328125, -10.0260009765625, -9.578369140625, -9.1307373046875, -8.68310546875, -8.2354736328125, -7.787841796875, -7.3402099609375, -6.892578125, -6.4449462890625, -5.997314453125, -5.5496826171875, -5.10205078125, -4.6544189453125, -4.206787109375, -3.7591552734375, -3.3115234375, -2.8638916015625, -2.416259765625, -1.9686279296875, -1.52099609375, -1.0733642578125, -0.625732421875, -0.1781005859375, 0.26953125, 0.7171630859375, 1.164794921875, 1.6124267578125, 2.06005859375, 2.5076904296875, 2.955322265625, 3.4029541015625, 3.8505859375, 4.2982177734375, 4.745849609375, 5.1934814453125, 5.64111328125, 6.0887451171875, 6.536376953125, 6.9840087890625, 7.431640625, 7.8792724609375, 8.326904296875, 8.7745361328125, 9.22216796875, 9.6697998046875, 10.117431640625, 10.5650634765625, 11.0126953125, 11.4603271484375, 11.907958984375, 12.3555908203125, 12.80322265625, 13.2508544921875, 13.698486328125, 14.1461181640625, 14.59375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 9.0, 9.0, 13.0, 23.0, 19.0, 36.0, 64.0, 74.0, 113.0, 166.0, 236.0, 354.0, 460.0, 503.0, 512.0, 418.0, 295.0, 236.0, 174.0, 96.0, 83.0, 49.0, 40.0, 25.0, 16.0, 16.0, 7.0, 11.0, 7.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.0859375, -7.8328857421875, -7.579833984375, -7.3267822265625, -7.07373046875, -6.8206787109375, -6.567626953125, -6.3145751953125, -6.0615234375, -5.8084716796875, -5.555419921875, -5.3023681640625, -5.04931640625, -4.7962646484375, -4.543212890625, -4.2901611328125, -4.037109375, -3.7840576171875, -3.531005859375, -3.2779541015625, -3.02490234375, -2.7718505859375, -2.518798828125, -2.2657470703125, -2.0126953125, -1.7596435546875, -1.506591796875, -1.2535400390625, -1.00048828125, -0.7474365234375, -0.494384765625, -0.2413330078125, 0.01171875, 0.2647705078125, 0.517822265625, 0.7708740234375, 1.02392578125, 1.2769775390625, 1.530029296875, 1.7830810546875, 2.0361328125, 2.2891845703125, 2.542236328125, 2.7952880859375, 3.04833984375, 3.3013916015625, 3.554443359375, 3.8074951171875, 4.060546875, 4.3135986328125, 4.566650390625, 4.8197021484375, 5.07275390625, 5.3258056640625, 5.578857421875, 5.8319091796875, 6.0849609375, 6.3380126953125, 6.591064453125, 6.8441162109375, 7.09716796875, 7.3502197265625, 7.603271484375, 7.8563232421875, 8.109375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 13.0, 8.0, 7.0, 18.0, 30.0, 37.0, 47.0, 30.0, 63.0, 130.0, 138.0, 166.0, 223.0, 359.0, 629.0, 1496.0, 30957.0, 3783034.0, 370671.0, 3899.0, 878.0, 415.0, 266.0, 171.0, 143.0, 114.0, 83.0, 70.0, 43.0, 40.0, 24.0, 19.0, 19.0, 9.0, 10.0, 9.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.03125, -25.210693359375, -24.39013671875, -23.569580078125, -22.7490234375, -21.928466796875, -21.10791015625, -20.287353515625, -19.466796875, -18.646240234375, -17.82568359375, -17.005126953125, -16.1845703125, -15.364013671875, -14.54345703125, -13.722900390625, -12.90234375, -12.081787109375, -11.26123046875, -10.440673828125, -9.6201171875, -8.799560546875, -7.97900390625, -7.158447265625, -6.337890625, -5.517333984375, -4.69677734375, -3.876220703125, -3.0556640625, -2.235107421875, -1.41455078125, -0.593994140625, 0.2265625, 1.047119140625, 1.86767578125, 2.688232421875, 3.5087890625, 4.329345703125, 5.14990234375, 5.970458984375, 6.791015625, 7.611572265625, 8.43212890625, 9.252685546875, 10.0732421875, 10.893798828125, 11.71435546875, 12.534912109375, 13.35546875, 14.176025390625, 14.99658203125, 15.817138671875, 16.6376953125, 17.458251953125, 18.27880859375, 19.099365234375, 19.919921875, 20.740478515625, 21.56103515625, 22.381591796875, 23.2021484375, 24.022705078125, 24.84326171875, 25.663818359375, 26.484375]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 36.0, 342.0, 479.0, 141.0, 12.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.917238235473633, -18.39624786376953, -14.87525749206543, -11.354267120361328, -7.833276748657227, -4.312286376953125, -0.7912960052490234, 2.729694366455078, 6.25068473815918, 9.771675109863281, 13.292665481567383, 16.813655853271484, 20.334646224975586, 23.855636596679688, 27.37662696838379, 30.89761734008789, 34.418609619140625, 37.939598083496094, 41.46059036254883, 44.98158264160156, 48.50257110595703, 52.0235595703125, 55.544551849365234, 59.06554412841797, 62.58653259277344, 66.1075210571289, 69.62850952148438, 73.14950561523438, 76.67049407958984, 80.19148254394531, 83.71247863769531, 87.23346710205078, 90.75445556640625, 94.27544403076172, 97.79643249511719, 101.31742858886719, 104.83841705322266, 108.35940551757812, 111.88040161132812, 115.4013900756836, 118.92237854003906, 122.44336700439453, 125.96435546875, 129.4853515625, 133.00634765625, 136.52732849121094, 140.04832458496094, 143.56930541992188, 147.09030151367188, 150.61129760742188, 154.1322784423828, 157.6532745361328, 161.17425537109375, 164.69525146484375, 168.21624755859375, 171.7372283935547, 175.2582244873047, 178.7792205810547, 182.30020141601562, 185.82119750976562, 189.34219360351562, 192.86317443847656, 196.38417053222656, 199.9051513671875, 203.4261474609375]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 10.0, 8.0, 15.0, 9.0, 16.0, 5.0, 18.0, 14.0, 28.0, 15.0, 25.0, 30.0, 32.0, 20.0, 27.0, 35.0, 38.0, 44.0, 43.0, 36.0, 36.0, 39.0, 27.0, 30.0, 40.0, 36.0, 32.0, 34.0, 35.0, 35.0, 21.0, 21.0, 18.0, 14.0, 15.0, 17.0, 15.0, 11.0, 8.0, 10.0, 9.0, 6.0, 7.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.458660125732422, -19.81545066833496, -19.1722412109375, -18.529033660888672, -17.88582420349121, -17.24261474609375, -16.59940528869629, -15.956195831298828, -15.312986373901367, -14.669776916503906, -14.026568412780762, -13.3833589553833, -12.74014949798584, -12.096940994262695, -11.453731536865234, -10.810522079467773, -10.167313575744629, -9.524104118347168, -8.880895614624023, -8.237686157226562, -7.594476699829102, -6.951267719268799, -6.308058738708496, -5.664849281311035, -5.021640300750732, -4.37843132019043, -3.7352218627929688, -3.092012882232666, -2.448803663253784, -1.8055944442749023, -1.1623854637145996, -0.5191760063171387, 0.12403297424316406, 0.7672421336174011, 1.4104512929916382, 2.0536603927612305, 2.6968696117401123, 3.340078830718994, 3.983287811279297, 4.626497268676758, 5.2697062492370605, 5.912915229797363, 6.556124687194824, 7.199333667755127, 7.84254264831543, 8.48575210571289, 9.128961563110352, 9.772171020507812, 10.415379524230957, 11.058588981628418, 11.701797485351562, 12.345006942749023, 12.988216400146484, 13.631425857543945, 14.27463436126709, 14.91784381866455, 15.561052322387695, 16.204261779785156, 16.847471237182617, 17.490680694580078, 18.133888244628906, 18.777097702026367, 19.420307159423828, 20.06351661682129, 20.70672607421875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 5.0, 9.0, 11.0, 11.0, 14.0, 13.0, 22.0, 27.0, 27.0, 27.0, 21.0, 36.0, 28.0, 43.0, 37.0, 39.0, 51.0, 44.0, 35.0, 38.0, 42.0, 30.0, 47.0, 36.0, 30.0, 43.0, 33.0, 34.0, 28.0, 27.0, 17.0, 22.0, 13.0, 13.0, 11.0, 8.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-4.45703125, -4.32073974609375, -4.1844482421875, -4.04815673828125, -3.911865234375, -3.77557373046875, -3.6392822265625, -3.50299072265625, -3.36669921875, -3.23040771484375, -3.0941162109375, -2.95782470703125, -2.821533203125, -2.68524169921875, -2.5489501953125, -2.41265869140625, -2.2763671875, -2.14007568359375, -2.0037841796875, -1.86749267578125, -1.731201171875, -1.59490966796875, -1.4586181640625, -1.32232666015625, -1.18603515625, -1.04974365234375, -0.9134521484375, -0.77716064453125, -0.640869140625, -0.50457763671875, -0.3682861328125, -0.23199462890625, -0.095703125, 0.04058837890625, 0.1768798828125, 0.31317138671875, 0.449462890625, 0.58575439453125, 0.7220458984375, 0.85833740234375, 0.99462890625, 1.13092041015625, 1.2672119140625, 1.40350341796875, 1.539794921875, 1.67608642578125, 1.8123779296875, 1.94866943359375, 2.0849609375, 2.22125244140625, 2.3575439453125, 2.49383544921875, 2.630126953125, 2.76641845703125, 2.9027099609375, 3.03900146484375, 3.17529296875, 3.31158447265625, 3.4478759765625, 3.58416748046875, 3.720458984375, 3.85675048828125, 3.9930419921875, 4.12933349609375, 4.265625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 11.0, 9.0, 11.0, 19.0, 38.0, 61.0, 79.0, 114.0, 146.0, 288.0, 398.0, 623.0, 918.0, 1522.0, 2353.0, 3876.0, 6192.0, 10061.0, 16516.0, 27754.0, 49080.0, 89129.0, 176299.0, 307770.0, 160572.0, 82205.0, 45618.0, 26117.0, 15547.0, 9432.0, 5853.0, 3637.0, 2205.0, 1457.0, 932.0, 572.0, 414.0, 259.0, 155.0, 108.0, 78.0, 45.0, 27.0, 17.0, 14.0, 7.0, 8.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.83154296875, -0.805908203125, -0.7802734375, -0.754638671875, -0.72900390625, -0.703369140625, -0.677734375, -0.652099609375, -0.62646484375, -0.600830078125, -0.5751953125, -0.549560546875, -0.52392578125, -0.498291015625, -0.47265625, -0.447021484375, -0.42138671875, -0.395751953125, -0.3701171875, -0.344482421875, -0.31884765625, -0.293212890625, -0.267578125, -0.241943359375, -0.21630859375, -0.190673828125, -0.1650390625, -0.139404296875, -0.11376953125, -0.088134765625, -0.0625, -0.036865234375, -0.01123046875, 0.014404296875, 0.0400390625, 0.065673828125, 0.09130859375, 0.116943359375, 0.142578125, 0.168212890625, 0.19384765625, 0.219482421875, 0.2451171875, 0.270751953125, 0.29638671875, 0.322021484375, 0.34765625, 0.373291015625, 0.39892578125, 0.424560546875, 0.4501953125, 0.475830078125, 0.50146484375, 0.527099609375, 0.552734375, 0.578369140625, 0.60400390625, 0.629638671875, 0.6552734375, 0.680908203125, 0.70654296875, 0.732177734375, 0.7578125, 0.783447265625, 0.80908203125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 4.0, 0.0, 4.0, 9.0, 10.0, 7.0, 10.0, 6.0, 18.0, 30.0, 22.0, 22.0, 29.0, 38.0, 37.0, 37.0, 30.0, 34.0, 35.0, 43.0, 37.0, 1083.0, 49.0, 44.0, 45.0, 47.0, 39.0, 25.0, 29.0, 33.0, 28.0, 21.0, 15.0, 17.0, 15.0, 13.0, 8.0, 12.0, 16.0, 7.0, 7.0, 7.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.009765625, -2.92327880859375, -2.8367919921875, -2.75030517578125, -2.663818359375, -2.57733154296875, -2.4908447265625, -2.40435791015625, -2.31787109375, -2.23138427734375, -2.1448974609375, -2.05841064453125, -1.971923828125, -1.88543701171875, -1.7989501953125, -1.71246337890625, -1.6259765625, -1.53948974609375, -1.4530029296875, -1.36651611328125, -1.280029296875, -1.19354248046875, -1.1070556640625, -1.02056884765625, -0.93408203125, -0.84759521484375, -0.7611083984375, -0.67462158203125, -0.588134765625, -0.50164794921875, -0.4151611328125, -0.32867431640625, -0.2421875, -0.15570068359375, -0.0692138671875, 0.01727294921875, 0.103759765625, 0.19024658203125, 0.2767333984375, 0.36322021484375, 0.44970703125, 0.53619384765625, 0.6226806640625, 0.70916748046875, 0.795654296875, 0.88214111328125, 0.9686279296875, 1.05511474609375, 1.1416015625, 1.22808837890625, 1.3145751953125, 1.40106201171875, 1.487548828125, 1.57403564453125, 1.6605224609375, 1.74700927734375, 1.83349609375, 1.91998291015625, 2.0064697265625, 2.09295654296875, 2.179443359375, 2.26593017578125, 2.3524169921875, 2.43890380859375, 2.525390625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 13.0, 13.0, 25.0, 30.0, 66.0, 82.0, 118.0, 185.0, 303.0, 466.0, 630.0, 1001.0, 1454.0, 2077.0, 3025.0, 4581.0, 6555.0, 9994.0, 15320.0, 23663.0, 37109.0, 60167.0, 106324.0, 237747.0, 1300611.0, 112307.0, 62186.0, 38409.0, 24360.0, 16066.0, 10575.0, 7176.0, 4752.0, 3138.0, 2116.0, 1446.0, 955.0, 642.0, 452.0, 291.0, 230.0, 159.0, 91.0, 66.0, 44.0, 48.0, 28.0, 9.0, 8.0, 9.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.65576171875, -0.6352920532226562, -0.6148223876953125, -0.5943527221679688, -0.573883056640625, -0.5534133911132812, -0.5329437255859375, -0.5124740600585938, -0.49200439453125, -0.47153472900390625, -0.4510650634765625, -0.43059539794921875, -0.410125732421875, -0.38965606689453125, -0.3691864013671875, -0.34871673583984375, -0.3282470703125, -0.30777740478515625, -0.2873077392578125, -0.26683807373046875, -0.246368408203125, -0.22589874267578125, -0.2054290771484375, -0.18495941162109375, -0.16448974609375, -0.14402008056640625, -0.1235504150390625, -0.10308074951171875, -0.082611083984375, -0.06214141845703125, -0.0416717529296875, -0.02120208740234375, -0.000732421875, 0.01973724365234375, 0.0402069091796875, 0.06067657470703125, 0.081146240234375, 0.10161590576171875, 0.1220855712890625, 0.14255523681640625, 0.16302490234375, 0.18349456787109375, 0.2039642333984375, 0.22443389892578125, 0.244903564453125, 0.26537322998046875, 0.2858428955078125, 0.30631256103515625, 0.3267822265625, 0.34725189208984375, 0.3677215576171875, 0.38819122314453125, 0.408660888671875, 0.42913055419921875, 0.4496002197265625, 0.47006988525390625, 0.49053955078125, 0.5110092163085938, 0.5314788818359375, 0.5519485473632812, 0.572418212890625, 0.5928878784179688, 0.6133575439453125, 0.6338272094726562, 0.654296875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 16.0, 2.0, 7.0, 7.0, 13.0, 21.0, 24.0, 26.0, 26.0, 50.0, 51.0, 70.0, 67.0, 71.0, 81.0, 68.0, 69.0, 71.0, 63.0, 44.0, 31.0, 18.0, 24.0, 12.0, 15.0, 12.0, 8.0, 7.0, 8.0, 2.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001919269561767578, -0.0001860298216342926, -0.0001801326870918274, -0.00017423555254936218, -0.00016833841800689697, -0.00016244128346443176, -0.00015654414892196655, -0.00015064701437950134, -0.00014474987983703613, -0.00013885274529457092, -0.0001329556107521057, -0.0001270584762096405, -0.00012116134166717529, -0.00011526420712471008, -0.00010936707258224487, -0.00010346993803977966, -9.757280349731445e-05, -9.167566895484924e-05, -8.577853441238403e-05, -7.988139986991882e-05, -7.398426532745361e-05, -6.80871307849884e-05, -6.21899962425232e-05, -5.6292861700057983e-05, -5.0395727157592773e-05, -4.4498592615127563e-05, -3.8601458072662354e-05, -3.2704323530197144e-05, -2.6807188987731934e-05, -2.0910054445266724e-05, -1.5012919902801514e-05, -9.115785360336304e-06, -3.2186508178710938e-06, 2.678483724594116e-06, 8.575618267059326e-06, 1.4472752809524536e-05, 2.0369887351989746e-05, 2.6267021894454956e-05, 3.2164156436920166e-05, 3.8061290979385376e-05, 4.3958425521850586e-05, 4.9855560064315796e-05, 5.5752694606781006e-05, 6.164982914924622e-05, 6.754696369171143e-05, 7.344409823417664e-05, 7.934123277664185e-05, 8.523836731910706e-05, 9.113550186157227e-05, 9.703263640403748e-05, 0.00010292977094650269, 0.0001088269054889679, 0.0001147240400314331, 0.00012062117457389832, 0.00012651830911636353, 0.00013241544365882874, 0.00013831257820129395, 0.00014420971274375916, 0.00015010684728622437, 0.00015600398182868958, 0.00016190111637115479, 0.00016779825091362, 0.0001736953854560852, 0.00017959251999855042, 0.00018548965454101562]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 4.0, 8.0, 13.0, 23.0, 9.0, 18.0, 29.0, 36.0, 53.0, 82.0, 134.0, 225.0, 459.0, 1338.0, 1010530.0, 33897.0, 818.0, 340.0, 154.0, 124.0, 59.0, 45.0, 35.0, 32.0, 24.0, 13.0, 10.0, 11.0, 8.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004161834716796875, -0.0040267109870910645, -0.003891587257385254, -0.0037564635276794434, -0.003621339797973633, -0.0034862160682678223, -0.0033510923385620117, -0.003215968608856201, -0.0030808448791503906, -0.00294572114944458, -0.0028105974197387695, -0.002675473690032959, -0.0025403499603271484, -0.002405226230621338, -0.0022701025009155273, -0.002134978771209717, -0.0019998550415039062, -0.0018647313117980957, -0.0017296075820922852, -0.0015944838523864746, -0.001459360122680664, -0.0013242363929748535, -0.001189112663269043, -0.0010539889335632324, -0.0009188652038574219, -0.0007837414741516113, -0.0006486177444458008, -0.0005134940147399902, -0.0003783702850341797, -0.00024324655532836914, -0.0001081228256225586, 2.7000904083251953e-05, 0.0001621246337890625, 0.00029724836349487305, 0.0004323720932006836, 0.0005674958229064941, 0.0007026195526123047, 0.0008377432823181152, 0.0009728670120239258, 0.0011079907417297363, 0.0012431144714355469, 0.0013782382011413574, 0.001513361930847168, 0.0016484856605529785, 0.001783609390258789, 0.0019187331199645996, 0.00205385684967041, 0.0021889805793762207, 0.0023241043090820312, 0.002459228038787842, 0.0025943517684936523, 0.002729475498199463, 0.0028645992279052734, 0.002999722957611084, 0.0031348466873168945, 0.003269970417022705, 0.0034050941467285156, 0.003540217876434326, 0.0036753416061401367, 0.0038104653358459473, 0.003945589065551758, 0.004080712795257568, 0.004215836524963379, 0.0043509602546691895, 0.004486083984375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 15.0, 29.0, 64.0, 106.0, 143.0, 172.0, 154.0, 144.0, 94.0, 41.0, 25.0, 14.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00010209299944108352, -9.857855911832303e-05, -9.506411879556254e-05, -9.154967847280204e-05, -8.803523815004155e-05, -8.452079782728106e-05, -8.100636478047818e-05, -7.749191718176007e-05, -7.39774841349572e-05, -7.04630438121967e-05, -6.694860348943621e-05, -6.343416316667572e-05, -5.9919722843915224e-05, -5.640528252115473e-05, -5.2890845836373046e-05, -4.9376405513612553e-05, -4.5861961552873254e-05, -4.234752123011276e-05, -3.883308090735227e-05, -3.5318640584591776e-05, -3.1804200261831284e-05, -2.8289761758060195e-05, -2.4775323254289106e-05, -2.1260882931528613e-05, -1.774644260876812e-05, -1.4232002286007628e-05, -1.0717562872741837e-05, -7.203123459476046e-06, -3.6886831367155537e-06, -1.7424281395506114e-07, 3.340195689816028e-06, 6.8546360125765204e-06, 1.0369083611294627e-05, 1.388352393405512e-05, 1.7397964256815612e-05, 2.09124027605867e-05, 2.4426843083347194e-05, 2.7941283406107686e-05, 3.1455721909878775e-05, 3.497016223263927e-05, 3.848460255539976e-05, 4.199904287816025e-05, 4.5513483200920746e-05, 4.902791988570243e-05, 5.2542360208462924e-05, 5.6056800531223416e-05, 5.957124085398391e-05, 6.30856811767444e-05, 6.66001214995049e-05, 7.011456182226539e-05, 7.362900214502588e-05, 7.714344246778637e-05, 8.065788279054686e-05, 8.417232311330736e-05, 8.768675616011024e-05, 9.120120375882834e-05, 9.471563680563122e-05, 9.823007712839171e-05, 0.0001017445174511522, 0.0001052589577739127, 0.00010877339809667319, 0.00011228783841943368, 0.00011580227874219418, 0.00011931671178899705, 0.00012283115938771516]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 4.0, 3.0, 2.0, 4.0, 8.0, 10.0, 6.0, 13.0, 10.0, 18.0, 11.0, 25.0, 13.0, 23.0, 21.0, 31.0, 34.0, 26.0, 32.0, 42.0, 35.0, 33.0, 41.0, 29.0, 44.0, 35.0, 36.0, 31.0, 40.0, 34.0, 38.0, 23.0, 28.0, 33.0, 28.0, 28.0, 17.0, 10.0, 19.0, 15.0, 14.0, 8.0, 8.0, 10.0, 6.0, 7.0, 3.0, 5.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.575750350952148e-05, -7.341057062149048e-05, -7.106363773345947e-05, -6.871670484542847e-05, -6.636977195739746e-05, -6.402283906936646e-05, -6.167590618133545e-05, -5.932897329330444e-05, -5.698204040527344e-05, -5.463510751724243e-05, -5.2288174629211426e-05, -4.994124174118042e-05, -4.7594308853149414e-05, -4.524737596511841e-05, -4.29004430770874e-05, -4.0553510189056396e-05, -3.820657730102539e-05, -3.5859644412994385e-05, -3.351271152496338e-05, -3.116577863693237e-05, -2.8818845748901367e-05, -2.647191286087036e-05, -2.4124979972839355e-05, -2.177804708480835e-05, -1.9431114196777344e-05, -1.7084181308746338e-05, -1.4737248420715332e-05, -1.2390315532684326e-05, -1.004338264465332e-05, -7.696449756622314e-06, -5.349516868591309e-06, -3.0025839805603027e-06, -6.556510925292969e-07, 1.691281795501709e-06, 4.038214683532715e-06, 6.385147571563721e-06, 8.732080459594727e-06, 1.1079013347625732e-05, 1.3425946235656738e-05, 1.5772879123687744e-05, 1.811981201171875e-05, 2.0466744899749756e-05, 2.2813677787780762e-05, 2.5160610675811768e-05, 2.7507543563842773e-05, 2.985447645187378e-05, 3.2201409339904785e-05, 3.454834222793579e-05, 3.68952751159668e-05, 3.92422080039978e-05, 4.158914089202881e-05, 4.3936073780059814e-05, 4.628300666809082e-05, 4.8629939556121826e-05, 5.097687244415283e-05, 5.332380533218384e-05, 5.5670738220214844e-05, 5.801767110824585e-05, 6.0364603996276855e-05, 6.271153688430786e-05, 6.505846977233887e-05, 6.740540266036987e-05, 6.975233554840088e-05, 7.209926843643188e-05, 7.444620132446289e-05]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 5.0, 9.0, 11.0, 11.0, 14.0, 13.0, 22.0, 27.0, 27.0, 27.0, 21.0, 36.0, 28.0, 43.0, 37.0, 39.0, 51.0, 44.0, 35.0, 38.0, 42.0, 30.0, 47.0, 36.0, 30.0, 43.0, 33.0, 34.0, 28.0, 27.0, 17.0, 22.0, 13.0, 13.0, 11.0, 8.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-4.45703125, -4.32073974609375, -4.1844482421875, -4.04815673828125, -3.911865234375, -3.77557373046875, -3.6392822265625, -3.50299072265625, -3.36669921875, -3.23040771484375, -3.0941162109375, -2.95782470703125, -2.821533203125, -2.68524169921875, -2.5489501953125, -2.41265869140625, -2.2763671875, -2.14007568359375, -2.0037841796875, -1.86749267578125, -1.731201171875, -1.59490966796875, -1.4586181640625, -1.32232666015625, -1.18603515625, -1.04974365234375, -0.9134521484375, -0.77716064453125, -0.640869140625, -0.50457763671875, -0.3682861328125, -0.23199462890625, -0.095703125, 0.04058837890625, 0.1768798828125, 0.31317138671875, 0.449462890625, 0.58575439453125, 0.7220458984375, 0.85833740234375, 0.99462890625, 1.13092041015625, 1.2672119140625, 1.40350341796875, 1.539794921875, 1.67608642578125, 1.8123779296875, 1.94866943359375, 2.0849609375, 2.22125244140625, 2.3575439453125, 2.49383544921875, 2.630126953125, 2.76641845703125, 2.9027099609375, 3.03900146484375, 3.17529296875, 3.31158447265625, 3.4478759765625, 3.58416748046875, 3.720458984375, 3.85675048828125, 3.9930419921875, 4.12933349609375, 4.265625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 2.0, 8.0, 9.0, 9.0, 19.0, 21.0, 24.0, 36.0, 44.0, 66.0, 97.0, 126.0, 190.0, 276.0, 430.0, 835.0, 2827.0, 13082.0, 65420.0, 489034.0, 406361.0, 54177.0, 10874.0, 2460.0, 807.0, 407.0, 268.0, 184.0, 122.0, 88.0, 64.0, 43.0, 40.0, 33.0, 21.0, 12.0, 7.0, 11.0, 8.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.296875, -8.0450439453125, -7.793212890625, -7.5413818359375, -7.28955078125, -7.0377197265625, -6.785888671875, -6.5340576171875, -6.2822265625, -6.0303955078125, -5.778564453125, -5.5267333984375, -5.27490234375, -5.0230712890625, -4.771240234375, -4.5194091796875, -4.267578125, -4.0157470703125, -3.763916015625, -3.5120849609375, -3.26025390625, -3.0084228515625, -2.756591796875, -2.5047607421875, -2.2529296875, -2.0010986328125, -1.749267578125, -1.4974365234375, -1.24560546875, -0.9937744140625, -0.741943359375, -0.4901123046875, -0.23828125, 0.0135498046875, 0.265380859375, 0.5172119140625, 0.76904296875, 1.0208740234375, 1.272705078125, 1.5245361328125, 1.7763671875, 2.0281982421875, 2.280029296875, 2.5318603515625, 2.78369140625, 3.0355224609375, 3.287353515625, 3.5391845703125, 3.791015625, 4.0428466796875, 4.294677734375, 4.5465087890625, 4.79833984375, 5.0501708984375, 5.302001953125, 5.5538330078125, 5.8056640625, 6.0574951171875, 6.309326171875, 6.5611572265625, 6.81298828125, 7.0648193359375, 7.316650390625, 7.5684814453125, 7.8203125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 0.0, 1.0, 5.0, 5.0, 7.0, 7.0, 5.0, 12.0, 12.0, 10.0, 10.0, 18.0, 17.0, 21.0, 23.0, 29.0, 30.0, 43.0, 42.0, 56.0, 58.0, 75.0, 134.0, 391.0, 1411.0, 168.0, 69.0, 52.0, 46.0, 40.0, 41.0, 36.0, 23.0, 28.0, 20.0, 17.0, 12.0, 17.0, 11.0, 14.0, 11.0, 9.0, 6.0, 2.0, 3.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.015625, -12.5960693359375, -12.176513671875, -11.7569580078125, -11.33740234375, -10.9178466796875, -10.498291015625, -10.0787353515625, -9.6591796875, -9.2396240234375, -8.820068359375, -8.4005126953125, -7.98095703125, -7.5614013671875, -7.141845703125, -6.7222900390625, -6.302734375, -5.8831787109375, -5.463623046875, -5.0440673828125, -4.62451171875, -4.2049560546875, -3.785400390625, -3.3658447265625, -2.9462890625, -2.5267333984375, -2.107177734375, -1.6876220703125, -1.26806640625, -0.8485107421875, -0.428955078125, -0.0093994140625, 0.41015625, 0.8297119140625, 1.249267578125, 1.6688232421875, 2.08837890625, 2.5079345703125, 2.927490234375, 3.3470458984375, 3.7666015625, 4.1861572265625, 4.605712890625, 5.0252685546875, 5.44482421875, 5.8643798828125, 6.283935546875, 6.7034912109375, 7.123046875, 7.5426025390625, 7.962158203125, 8.3817138671875, 8.80126953125, 9.2208251953125, 9.640380859375, 10.0599365234375, 10.4794921875, 10.8990478515625, 11.318603515625, 11.7381591796875, 12.15771484375, 12.5772705078125, 12.996826171875, 13.4163818359375, 13.8359375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 10.0, 3.0, 9.0, 10.0, 14.0, 23.0, 24.0, 20.0, 21.0, 38.0, 49.0, 49.0, 82.0, 119.0, 192.0, 254.0, 505.0, 1212.0, 7902.0, 2965328.0, 165133.0, 2709.0, 812.0, 384.0, 235.0, 121.0, 83.0, 70.0, 63.0, 41.0, 45.0, 21.0, 24.0, 20.0, 16.0, 10.0, 11.0, 11.0, 9.0, 4.0, 6.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.09375, -29.08349609375, -28.0732421875, -27.06298828125, -26.052734375, -25.04248046875, -24.0322265625, -23.02197265625, -22.01171875, -21.00146484375, -19.9912109375, -18.98095703125, -17.970703125, -16.96044921875, -15.9501953125, -14.93994140625, -13.9296875, -12.91943359375, -11.9091796875, -10.89892578125, -9.888671875, -8.87841796875, -7.8681640625, -6.85791015625, -5.84765625, -4.83740234375, -3.8271484375, -2.81689453125, -1.806640625, -0.79638671875, 0.2138671875, 1.22412109375, 2.234375, 3.24462890625, 4.2548828125, 5.26513671875, 6.275390625, 7.28564453125, 8.2958984375, 9.30615234375, 10.31640625, 11.32666015625, 12.3369140625, 13.34716796875, 14.357421875, 15.36767578125, 16.3779296875, 17.38818359375, 18.3984375, 19.40869140625, 20.4189453125, 21.42919921875, 22.439453125, 23.44970703125, 24.4599609375, 25.47021484375, 26.48046875, 27.49072265625, 28.5009765625, 29.51123046875, 30.521484375, 31.53173828125, 32.5419921875, 33.55224609375, 34.5625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 364.0, 639.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-182.357666015625, -178.4025115966797, -174.44735717773438, -170.49220275878906, -166.53704833984375, -162.58189392089844, -158.62673950195312, -154.6715850830078, -150.7164306640625, -146.7612762451172, -142.80612182617188, -138.85096740722656, -134.89581298828125, -130.94065856933594, -126.98550415039062, -123.03034973144531, -119.0751953125, -115.12004089355469, -111.16488647460938, -107.20973205566406, -103.25457763671875, -99.29942321777344, -95.34426879882812, -91.38911437988281, -87.43396759033203, -83.47881317138672, -79.5236587524414, -75.5685043334961, -71.61334991455078, -67.65819549560547, -63.703041076660156, -59.747886657714844, -55.79273223876953, -51.83757781982422, -47.882423400878906, -43.927268981933594, -39.97211456298828, -36.01696014404297, -32.061805725097656, -28.106653213500977, -24.151498794555664, -20.19634437561035, -16.24118995666504, -12.286036491394043, -8.33088207244873, -4.375728607177734, -0.4205741882324219, 3.5345802307128906, 7.489734649658203, 11.444889068603516, 15.400043487548828, 19.35519790649414, 23.310352325439453, 27.265504837036133, 31.220659255981445, 35.175811767578125, 39.13096618652344, 43.08612060546875, 47.04127502441406, 50.996429443359375, 54.95158386230469, 58.90673828125, 62.86189270019531, 66.81704711914062, 70.77220153808594]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 4.0, 5.0, 4.0, 10.0, 9.0, 5.0, 9.0, 5.0, 10.0, 14.0, 18.0, 21.0, 35.0, 27.0, 22.0, 31.0, 37.0, 32.0, 45.0, 61.0, 34.0, 42.0, 38.0, 39.0, 28.0, 43.0, 38.0, 33.0, 30.0, 35.0, 23.0, 23.0, 34.0, 22.0, 24.0, 17.0, 11.0, 17.0, 9.0, 7.0, 8.0, 10.0, 7.0, 5.0, 6.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.35193634033203, -27.443452835083008, -26.534971237182617, -25.626487731933594, -24.71800422668457, -23.809520721435547, -22.901039123535156, -21.992555618286133, -21.08407211303711, -20.175588607788086, -19.267107009887695, -18.358623504638672, -17.45013999938965, -16.541656494140625, -15.633174896240234, -14.724691390991211, -13.81620979309082, -12.907727241516113, -11.99924373626709, -11.090761184692383, -10.18227767944336, -9.273795127868652, -8.365312576293945, -7.45682954788208, -6.548346519470215, -5.63986349105835, -4.731380462646484, -3.8228979110717773, -2.914414882659912, -2.005931854248047, -1.0974493026733398, -0.1889662742614746, 0.7195186614990234, 1.6280015707015991, 2.536484479904175, 3.444967269897461, 4.353450298309326, 5.261933326721191, 6.170415878295898, 7.078898906707764, 7.987381935119629, 8.895864486694336, 9.80434799194336, 10.712830543518066, 11.621313095092773, 12.529796600341797, 13.438279151916504, 14.346761703491211, 15.255245208740234, 16.163728713989258, 17.07221031188965, 17.980693817138672, 18.889177322387695, 19.79766082763672, 20.70614242553711, 21.614625930786133, 22.523109436035156, 23.43159294128418, 24.34007453918457, 25.248558044433594, 26.157041549682617, 27.06552505493164, 27.97400665283203, 28.882490158081055, 29.790971755981445]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 7.0, 8.0, 12.0, 9.0, 9.0, 16.0, 9.0, 22.0, 20.0, 28.0, 23.0, 38.0, 31.0, 21.0, 31.0, 33.0, 45.0, 40.0, 40.0, 41.0, 44.0, 44.0, 40.0, 38.0, 38.0, 30.0, 35.0, 36.0, 29.0, 26.0, 22.0, 14.0, 21.0, 13.0, 12.0, 9.0, 11.0, 17.0, 6.0, 8.0, 1.0, 4.0, 4.0, 1.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.03515625, -3.90496826171875, -3.7747802734375, -3.64459228515625, -3.514404296875, -3.38421630859375, -3.2540283203125, -3.12384033203125, -2.99365234375, -2.86346435546875, -2.7332763671875, -2.60308837890625, -2.472900390625, -2.34271240234375, -2.2125244140625, -2.08233642578125, -1.9521484375, -1.82196044921875, -1.6917724609375, -1.56158447265625, -1.431396484375, -1.30120849609375, -1.1710205078125, -1.04083251953125, -0.91064453125, -0.78045654296875, -0.6502685546875, -0.52008056640625, -0.389892578125, -0.25970458984375, -0.1295166015625, 0.00067138671875, 0.130859375, 0.26104736328125, 0.3912353515625, 0.52142333984375, 0.651611328125, 0.78179931640625, 0.9119873046875, 1.04217529296875, 1.17236328125, 1.30255126953125, 1.4327392578125, 1.56292724609375, 1.693115234375, 1.82330322265625, 1.9534912109375, 2.08367919921875, 2.2138671875, 2.34405517578125, 2.4742431640625, 2.60443115234375, 2.734619140625, 2.86480712890625, 2.9949951171875, 3.12518310546875, 3.25537109375, 3.38555908203125, 3.5157470703125, 3.64593505859375, 3.776123046875, 3.90631103515625, 4.0364990234375, 4.16668701171875, 4.296875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 4.0, 6.0, 10.0, 9.0, 13.0, 14.0, 16.0, 29.0, 22.0, 24.0, 47.0, 47.0, 61.0, 82.0, 135.0, 203.0, 562.0, 2274.0, 33292.0, 874831.0, 2891512.0, 375191.0, 13414.0, 1408.0, 405.0, 190.0, 109.0, 80.0, 50.0, 47.0, 33.0, 24.0, 22.0, 15.0, 17.0, 16.0, 8.0, 13.0, 7.0, 6.0, 9.0, 3.0, 5.0, 1.0, 6.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0], "bins": [-11.125, -10.79150390625, -10.4580078125, -10.12451171875, -9.791015625, -9.45751953125, -9.1240234375, -8.79052734375, -8.45703125, -8.12353515625, -7.7900390625, -7.45654296875, -7.123046875, -6.78955078125, -6.4560546875, -6.12255859375, -5.7890625, -5.45556640625, -5.1220703125, -4.78857421875, -4.455078125, -4.12158203125, -3.7880859375, -3.45458984375, -3.12109375, -2.78759765625, -2.4541015625, -2.12060546875, -1.787109375, -1.45361328125, -1.1201171875, -0.78662109375, -0.453125, -0.11962890625, 0.2138671875, 0.54736328125, 0.880859375, 1.21435546875, 1.5478515625, 1.88134765625, 2.21484375, 2.54833984375, 2.8818359375, 3.21533203125, 3.548828125, 3.88232421875, 4.2158203125, 4.54931640625, 4.8828125, 5.21630859375, 5.5498046875, 5.88330078125, 6.216796875, 6.55029296875, 6.8837890625, 7.21728515625, 7.55078125, 7.88427734375, 8.2177734375, 8.55126953125, 8.884765625, 9.21826171875, 9.5517578125, 9.88525390625, 10.21875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 6.0, 2.0, 6.0, 12.0, 9.0, 15.0, 18.0, 17.0, 32.0, 31.0, 66.0, 70.0, 109.0, 145.0, 194.0, 209.0, 297.0, 348.0, 351.0, 408.0, 367.0, 275.0, 223.0, 213.0, 158.0, 106.0, 85.0, 75.0, 50.0, 36.0, 33.0, 16.0, 16.0, 13.0, 13.0, 21.0, 13.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-6.10546875, -5.92706298828125, -5.7486572265625, -5.57025146484375, -5.391845703125, -5.21343994140625, -5.0350341796875, -4.85662841796875, -4.67822265625, -4.49981689453125, -4.3214111328125, -4.14300537109375, -3.964599609375, -3.78619384765625, -3.6077880859375, -3.42938232421875, -3.2509765625, -3.07257080078125, -2.8941650390625, -2.71575927734375, -2.537353515625, -2.35894775390625, -2.1805419921875, -2.00213623046875, -1.82373046875, -1.64532470703125, -1.4669189453125, -1.28851318359375, -1.110107421875, -0.93170166015625, -0.7532958984375, -0.57489013671875, -0.396484375, -0.21807861328125, -0.0396728515625, 0.13873291015625, 0.317138671875, 0.49554443359375, 0.6739501953125, 0.85235595703125, 1.03076171875, 1.20916748046875, 1.3875732421875, 1.56597900390625, 1.744384765625, 1.92279052734375, 2.1011962890625, 2.27960205078125, 2.4580078125, 2.63641357421875, 2.8148193359375, 2.99322509765625, 3.171630859375, 3.35003662109375, 3.5284423828125, 3.70684814453125, 3.88525390625, 4.06365966796875, 4.2420654296875, 4.42047119140625, 4.598876953125, 4.77728271484375, 4.9556884765625, 5.13409423828125, 5.3125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 7.0, 2.0, 10.0, 7.0, 16.0, 19.0, 23.0, 26.0, 54.0, 70.0, 77.0, 96.0, 130.0, 176.0, 261.0, 433.0, 759.0, 2264.0, 28945.0, 2603854.0, 1535414.0, 17784.0, 1820.0, 729.0, 416.0, 238.0, 169.0, 123.0, 73.0, 62.0, 56.0, 47.0, 38.0, 30.0, 14.0, 13.0, 12.0, 12.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.046875, -17.423095703125, -16.79931640625, -16.175537109375, -15.5517578125, -14.927978515625, -14.30419921875, -13.680419921875, -13.056640625, -12.432861328125, -11.80908203125, -11.185302734375, -10.5615234375, -9.937744140625, -9.31396484375, -8.690185546875, -8.06640625, -7.442626953125, -6.81884765625, -6.195068359375, -5.5712890625, -4.947509765625, -4.32373046875, -3.699951171875, -3.076171875, -2.452392578125, -1.82861328125, -1.204833984375, -0.5810546875, 0.042724609375, 0.66650390625, 1.290283203125, 1.9140625, 2.537841796875, 3.16162109375, 3.785400390625, 4.4091796875, 5.032958984375, 5.65673828125, 6.280517578125, 6.904296875, 7.528076171875, 8.15185546875, 8.775634765625, 9.3994140625, 10.023193359375, 10.64697265625, 11.270751953125, 11.89453125, 12.518310546875, 13.14208984375, 13.765869140625, 14.3896484375, 15.013427734375, 15.63720703125, 16.260986328125, 16.884765625, 17.508544921875, 18.13232421875, 18.756103515625, 19.3798828125, 20.003662109375, 20.62744140625, 21.251220703125, 21.875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 25.0, 129.0, 367.0, 356.0, 115.0, 22.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.33060455322266, -105.81037902832031, -103.2901611328125, -100.76993560791016, -98.24971008300781, -95.7294921875, -93.20926666259766, -90.68904113769531, -88.1688232421875, -85.64859771728516, -83.12837982177734, -80.608154296875, -78.08793640136719, -75.56771087646484, -73.0474853515625, -70.52726745605469, -68.00704193115234, -65.48681640625, -62.96659851074219, -60.446372985839844, -57.926151275634766, -55.40592956542969, -52.885704040527344, -50.365482330322266, -47.84526062011719, -45.32503890991211, -42.80481719970703, -40.28459167480469, -37.76436996459961, -35.24414825439453, -32.72392272949219, -30.20370101928711, -27.6834716796875, -25.163249969482422, -22.64302635192871, -20.122802734375, -17.602581024169922, -15.082358360290527, -12.562135696411133, -10.041912078857422, -7.521690368652344, -5.001467704772949, -2.4812450408935547, 0.038977622985839844, 2.5592002868652344, 5.079422950744629, 7.599645614624023, 10.119869232177734, 12.640090942382812, 15.160313606262207, 17.6805362701416, 20.200759887695312, 22.72098159790039, 25.24120330810547, 27.76142692565918, 30.28165054321289, 32.80187225341797, 35.32209396362305, 37.842315673828125, 40.36254119873047, 42.88276290893555, 45.402984619140625, 47.92321014404297, 50.44343185424805, 52.963653564453125]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 6.0, 4.0, 9.0, 7.0, 7.0, 13.0, 10.0, 16.0, 11.0, 13.0, 25.0, 27.0, 25.0, 21.0, 32.0, 41.0, 41.0, 42.0, 30.0, 43.0, 39.0, 42.0, 41.0, 33.0, 30.0, 35.0, 34.0, 35.0, 24.0, 38.0, 32.0, 30.0, 22.0, 25.0, 16.0, 11.0, 15.0, 14.0, 11.0, 14.0, 6.0, 7.0, 5.0, 4.0, 7.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.28722381591797, -19.64261245727539, -18.998001098632812, -18.353389739990234, -17.708778381347656, -17.064167022705078, -16.4195556640625, -15.774945259094238, -15.13033390045166, -14.485722541809082, -13.841111183166504, -13.196499824523926, -12.551889419555664, -11.907278060913086, -11.262666702270508, -10.61805534362793, -9.973443984985352, -9.328832626342773, -8.684221267700195, -8.039609909057617, -7.394999027252197, -6.750387668609619, -6.105776786804199, -5.461165428161621, -4.816554069519043, -4.171942710876465, -3.527331590652466, -2.882720470428467, -2.2381091117858887, -1.5934977531433105, -0.9488866329193115, -0.3042755126953125, 0.3403358459472656, 0.9849470853805542, 1.6295583248138428, 2.274169445037842, 2.91878080368042, 3.563392162322998, 4.208003044128418, 4.852614402770996, 5.497225761413574, 6.141837120056152, 6.7864484786987305, 7.43105936050415, 8.07567024230957, 8.720281600952148, 9.364892959594727, 10.009504318237305, 10.654115676879883, 11.298727035522461, 11.943338394165039, 12.587949752807617, 13.232561111450195, 13.877172470092773, 14.521782875061035, 15.166394233703613, 15.811005592346191, 16.455615997314453, 17.10022735595703, 17.74483871459961, 18.389450073242188, 19.034061431884766, 19.678672790527344, 20.323284149169922, 20.9678955078125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 3.0, 1.0, 8.0, 3.0, 7.0, 11.0, 11.0, 14.0, 23.0, 22.0, 19.0, 20.0, 29.0, 26.0, 24.0, 30.0, 39.0, 40.0, 42.0, 30.0, 36.0, 41.0, 50.0, 54.0, 43.0, 37.0, 44.0, 25.0, 30.0, 44.0, 20.0, 20.0, 25.0, 22.0, 16.0, 20.0, 15.0, 12.0, 9.0, 7.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.93505859375, -3.7998046875, -3.66455078125, -3.529296875, -3.39404296875, -3.2587890625, -3.12353515625, -2.98828125, -2.85302734375, -2.7177734375, -2.58251953125, -2.447265625, -2.31201171875, -2.1767578125, -2.04150390625, -1.90625, -1.77099609375, -1.6357421875, -1.50048828125, -1.365234375, -1.22998046875, -1.0947265625, -0.95947265625, -0.82421875, -0.68896484375, -0.5537109375, -0.41845703125, -0.283203125, -0.14794921875, -0.0126953125, 0.12255859375, 0.2578125, 0.39306640625, 0.5283203125, 0.66357421875, 0.798828125, 0.93408203125, 1.0693359375, 1.20458984375, 1.33984375, 1.47509765625, 1.6103515625, 1.74560546875, 1.880859375, 2.01611328125, 2.1513671875, 2.28662109375, 2.421875, 2.55712890625, 2.6923828125, 2.82763671875, 2.962890625, 3.09814453125, 3.2333984375, 3.36865234375, 3.50390625, 3.63916015625, 3.7744140625, 3.90966796875, 4.044921875, 4.18017578125, 4.3154296875, 4.45068359375, 4.5859375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 5.0, 12.0, 10.0, 22.0, 33.0, 35.0, 53.0, 77.0, 88.0, 145.0, 197.0, 299.0, 445.0, 591.0, 846.0, 1119.0, 1700.0, 2478.0, 3691.0, 5147.0, 7644.0, 11462.0, 16878.0, 25331.0, 39336.0, 63173.0, 111476.0, 227193.0, 232062.0, 113448.0, 64365.0, 39703.0, 26063.0, 17163.0, 11343.0, 7709.0, 5298.0, 3700.0, 2454.0, 1723.0, 1136.0, 876.0, 596.0, 449.0, 273.0, 205.0, 157.0, 112.0, 92.0, 47.0, 26.0, 32.0, 19.0, 8.0, 3.0, 8.0, 3.0, 4.0, 0.0, 0.0, 3.0], "bins": [-0.63818359375, -0.6176071166992188, -0.5970306396484375, -0.5764541625976562, -0.555877685546875, -0.5353012084960938, -0.5147247314453125, -0.49414825439453125, -0.47357177734375, -0.45299530029296875, -0.4324188232421875, -0.41184234619140625, -0.391265869140625, -0.37068939208984375, -0.3501129150390625, -0.32953643798828125, -0.3089599609375, -0.28838348388671875, -0.2678070068359375, -0.24723052978515625, -0.226654052734375, -0.20607757568359375, -0.1855010986328125, -0.16492462158203125, -0.14434814453125, -0.12377166748046875, -0.1031951904296875, -0.08261871337890625, -0.062042236328125, -0.04146575927734375, -0.0208892822265625, -0.00031280517578125, 0.020263671875, 0.04084014892578125, 0.0614166259765625, 0.08199310302734375, 0.102569580078125, 0.12314605712890625, 0.1437225341796875, 0.16429901123046875, 0.18487548828125, 0.20545196533203125, 0.2260284423828125, 0.24660491943359375, 0.267181396484375, 0.28775787353515625, 0.3083343505859375, 0.32891082763671875, 0.3494873046875, 0.37006378173828125, 0.3906402587890625, 0.41121673583984375, 0.431793212890625, 0.45236968994140625, 0.4729461669921875, 0.49352264404296875, 0.51409912109375, 0.5346755981445312, 0.5552520751953125, 0.5758285522460938, 0.596405029296875, 0.6169815063476562, 0.6375579833984375, 0.6581344604492188, 0.6787109375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 7.0, 7.0, 6.0, 12.0, 13.0, 6.0, 18.0, 15.0, 20.0, 19.0, 29.0, 27.0, 32.0, 29.0, 28.0, 34.0, 32.0, 43.0, 32.0, 43.0, 34.0, 1062.0, 33.0, 42.0, 31.0, 27.0, 44.0, 32.0, 31.0, 32.0, 29.0, 26.0, 14.0, 19.0, 14.0, 19.0, 18.0, 9.0, 6.0, 10.0, 7.0, 6.0, 6.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.55078125, -2.46875, -2.38671875, -2.3046875, -2.22265625, -2.140625, -2.05859375, -1.9765625, -1.89453125, -1.8125, -1.73046875, -1.6484375, -1.56640625, -1.484375, -1.40234375, -1.3203125, -1.23828125, -1.15625, -1.07421875, -0.9921875, -0.91015625, -0.828125, -0.74609375, -0.6640625, -0.58203125, -0.5, -0.41796875, -0.3359375, -0.25390625, -0.171875, -0.08984375, -0.0078125, 0.07421875, 0.15625, 0.23828125, 0.3203125, 0.40234375, 0.484375, 0.56640625, 0.6484375, 0.73046875, 0.8125, 0.89453125, 0.9765625, 1.05859375, 1.140625, 1.22265625, 1.3046875, 1.38671875, 1.46875, 1.55078125, 1.6328125, 1.71484375, 1.796875, 1.87890625, 1.9609375, 2.04296875, 2.125, 2.20703125, 2.2890625, 2.37109375, 2.453125, 2.53515625, 2.6171875, 2.69921875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 6.0, 8.0, 9.0, 15.0, 27.0, 35.0, 47.0, 90.0, 96.0, 161.0, 230.0, 350.0, 457.0, 631.0, 919.0, 1223.0, 1695.0, 2372.0, 3250.0, 4538.0, 6129.0, 8601.0, 12288.0, 17421.0, 24979.0, 36658.0, 55438.0, 88723.0, 162438.0, 1294168.0, 136133.0, 78001.0, 49088.0, 32632.0, 22693.0, 15733.0, 11342.0, 8061.0, 5804.0, 4123.0, 2940.0, 2132.0, 1559.0, 1095.0, 827.0, 595.0, 421.0, 274.0, 210.0, 155.0, 101.0, 74.0, 56.0, 38.0, 23.0, 17.0, 8.0, 5.0, 3.0, 1.0, 2.0], "bins": [-0.5810546875, -0.5631027221679688, -0.5451507568359375, -0.5271987915039062, -0.509246826171875, -0.49129486083984375, -0.4733428955078125, -0.45539093017578125, -0.43743896484375, -0.41948699951171875, -0.4015350341796875, -0.38358306884765625, -0.365631103515625, -0.34767913818359375, -0.3297271728515625, -0.31177520751953125, -0.2938232421875, -0.27587127685546875, -0.2579193115234375, -0.23996734619140625, -0.222015380859375, -0.20406341552734375, -0.1861114501953125, -0.16815948486328125, -0.15020751953125, -0.13225555419921875, -0.1143035888671875, -0.09635162353515625, -0.078399658203125, -0.06044769287109375, -0.0424957275390625, -0.02454376220703125, -0.006591796875, 0.01136016845703125, 0.0293121337890625, 0.04726409912109375, 0.065216064453125, 0.08316802978515625, 0.1011199951171875, 0.11907196044921875, 0.13702392578125, 0.15497589111328125, 0.1729278564453125, 0.19087982177734375, 0.208831787109375, 0.22678375244140625, 0.2447357177734375, 0.26268768310546875, 0.2806396484375, 0.29859161376953125, 0.3165435791015625, 0.33449554443359375, 0.352447509765625, 0.37039947509765625, 0.3883514404296875, 0.40630340576171875, 0.42425537109375, 0.44220733642578125, 0.4601593017578125, 0.47811126708984375, 0.496063232421875, 0.5140151977539062, 0.5319671630859375, 0.5499191284179688, 0.56787109375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 4.0, 8.0, 10.0, 8.0, 10.0, 11.0, 16.0, 18.0, 15.0, 29.0, 26.0, 42.0, 50.0, 44.0, 58.0, 76.0, 51.0, 65.0, 56.0, 64.0, 51.0, 49.0, 60.0, 46.0, 27.0, 26.0, 17.0, 11.0, 10.0, 9.0, 9.0, 5.0, 3.0, 6.0, 5.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019121170043945312, -0.00018531642854213715, -0.00017942115664482117, -0.0001735258847475052, -0.0001676306128501892, -0.00016173534095287323, -0.00015584006905555725, -0.00014994479715824127, -0.0001440495252609253, -0.00013815425336360931, -0.00013225898146629333, -0.00012636370956897736, -0.00012046843767166138, -0.0001145731657743454, -0.00010867789387702942, -0.00010278262197971344, -9.688735008239746e-05, -9.099207818508148e-05, -8.50968062877655e-05, -7.920153439044952e-05, -7.330626249313354e-05, -6.741099059581757e-05, -6.151571869850159e-05, -5.562044680118561e-05, -4.972517490386963e-05, -4.382990300655365e-05, -3.793463110923767e-05, -3.203935921192169e-05, -2.6144087314605713e-05, -2.0248815417289734e-05, -1.4353543519973755e-05, -8.458271622657776e-06, -2.562999725341797e-06, 3.332272171974182e-06, 9.227544069290161e-06, 1.512281596660614e-05, 2.101808786392212e-05, 2.6913359761238098e-05, 3.280863165855408e-05, 3.8703903555870056e-05, 4.4599175453186035e-05, 5.0494447350502014e-05, 5.638971924781799e-05, 6.228499114513397e-05, 6.818026304244995e-05, 7.407553493976593e-05, 7.997080683708191e-05, 8.586607873439789e-05, 9.176135063171387e-05, 9.765662252902985e-05, 0.00010355189442634583, 0.0001094471663236618, 0.00011534243822097778, 0.00012123771011829376, 0.00012713298201560974, 0.00013302825391292572, 0.0001389235258102417, 0.00014481879770755768, 0.00015071406960487366, 0.00015660934150218964, 0.00016250461339950562, 0.0001683998852968216, 0.00017429515719413757, 0.00018019042909145355, 0.00018608570098876953]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 7.0, 7.0, 12.0, 17.0, 17.0, 24.0, 26.0, 39.0, 57.0, 91.0, 147.0, 224.0, 341.0, 674.0, 2570.0, 1036095.0, 6239.0, 818.0, 396.0, 214.0, 162.0, 76.0, 73.0, 50.0, 33.0, 37.0, 23.0, 19.0, 22.0, 12.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004161834716796875, -0.004034161567687988, -0.0039064884185791016, -0.003778815269470215, -0.003651142120361328, -0.0035234689712524414, -0.0033957958221435547, -0.003268122673034668, -0.0031404495239257812, -0.0030127763748168945, -0.002885103225708008, -0.002757430076599121, -0.0026297569274902344, -0.0025020837783813477, -0.002374410629272461, -0.0022467374801635742, -0.0021190643310546875, -0.0019913911819458008, -0.001863718032836914, -0.0017360448837280273, -0.0016083717346191406, -0.001480698585510254, -0.0013530254364013672, -0.0012253522872924805, -0.0010976791381835938, -0.000970005989074707, -0.0008423328399658203, -0.0007146596908569336, -0.0005869865417480469, -0.00045931339263916016, -0.00033164024353027344, -0.00020396709442138672, -7.62939453125e-05, 5.137920379638672e-05, 0.00017905235290527344, 0.00030672550201416016, 0.0004343986511230469, 0.0005620718002319336, 0.0006897449493408203, 0.000817418098449707, 0.0009450912475585938, 0.0010727643966674805, 0.0012004375457763672, 0.001328110694885254, 0.0014557838439941406, 0.0015834569931030273, 0.001711130142211914, 0.0018388032913208008, 0.0019664764404296875, 0.0020941495895385742, 0.002221822738647461, 0.0023494958877563477, 0.0024771690368652344, 0.002604842185974121, 0.002732515335083008, 0.0028601884841918945, 0.0029878616333007812, 0.003115534782409668, 0.0032432079315185547, 0.0033708810806274414, 0.003498554229736328, 0.003626227378845215, 0.0037539005279541016, 0.0038815736770629883, 0.004009246826171875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 34.0, 154.0, 245.0, 302.0, 182.0, 71.0, 16.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027681791107170284, -0.0002701149496715516, -0.0002634120173752308, -0.00025670905597507954, -0.00025000612367875874, -0.0002433031622786075, -0.00023660021543037146, -0.00022989726858213544, -0.00022319432173389941, -0.0002164913748856634, -0.00020978842803742737, -0.00020308548118919134, -0.0001963825197890401, -0.0001896795874927193, -0.00018297662609256804, -0.00017627367924433202, -0.000169570732396096, -0.00016286778554785997, -0.00015616483869962394, -0.00014946189185138792, -0.0001427589450031519, -0.00013605598360300064, -0.00012935303675476462, -0.0001226500899065286, -0.00011594714305829257, -0.00010924419621005654, -0.00010254124936182052, -9.583829523762688e-05, -8.913534838939086e-05, -8.243240154115483e-05, -7.572944741696119e-05, -6.902650056872517e-05, -6.232355372048914e-05, -5.562060687225312e-05, -4.891765638603829e-05, -4.221470589982346e-05, -3.551175905158743e-05, -2.8808812203351408e-05, -2.2105861717136577e-05, -1.5402911230921745e-05, -8.699964382685721e-06, -1.997015715460293e-06, 4.705932951765135e-06, 1.1408881618990563e-05, 1.811183028621599e-05, 2.4814777134452015e-05, 3.151772762066685e-05, 3.822067810688168e-05, 4.49236249551177e-05, 5.162657180335373e-05, 5.832952228956856e-05, 6.503247277578339e-05, 7.173541962401941e-05, 7.843836647225544e-05, 8.514132059644908e-05, 9.18442674446851e-05, 9.854721429292113e-05, 0.00010525016114115715, 0.00011195310798939317, 0.00011865606211358681, 0.00012535901623778045, 0.00013206194853410125, 0.0001387649099342525, 0.00014546785678248852, 0.00015217080363072455]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 7.0, 5.0, 5.0, 9.0, 20.0, 14.0, 26.0, 27.0, 29.0, 22.0, 35.0, 35.0, 35.0, 48.0, 56.0, 47.0, 59.0, 45.0, 54.0, 52.0, 43.0, 42.0, 50.0, 38.0, 26.0, 37.0, 31.0, 20.0, 20.0, 16.0, 10.0, 14.0, 6.0, 2.0, 6.0, 5.0, 1.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011771917343139648, -0.00011443905532360077, -0.00011115893721580505, -0.00010787881910800934, -0.00010459870100021362, -0.00010131858289241791, -9.803846478462219e-05, -9.475834667682648e-05, -9.147822856903076e-05, -8.819811046123505e-05, -8.491799235343933e-05, -8.163787424564362e-05, -7.83577561378479e-05, -7.507763803005219e-05, -7.179751992225647e-05, -6.851740181446075e-05, -6.523728370666504e-05, -6.195716559886932e-05, -5.867704749107361e-05, -5.539692938327789e-05, -5.211681127548218e-05, -4.883669316768646e-05, -4.555657505989075e-05, -4.227645695209503e-05, -3.8996338844299316e-05, -3.57162207365036e-05, -3.2436102628707886e-05, -2.915598452091217e-05, -2.5875866413116455e-05, -2.259574830532074e-05, -1.9315630197525024e-05, -1.603551208972931e-05, -1.2755393981933594e-05, -9.475275874137878e-06, -6.195157766342163e-06, -2.9150396585464478e-06, 3.650784492492676e-07, 3.645196557044983e-06, 6.925314664840698e-06, 1.0205432772636414e-05, 1.3485550880432129e-05, 1.6765668988227844e-05, 2.004578709602356e-05, 2.3325905203819275e-05, 2.660602331161499e-05, 2.9886141419410706e-05, 3.316625952720642e-05, 3.6446377635002136e-05, 3.972649574279785e-05, 4.300661385059357e-05, 4.628673195838928e-05, 4.9566850066185e-05, 5.284696817398071e-05, 5.612708628177643e-05, 5.9407204389572144e-05, 6.268732249736786e-05, 6.596744060516357e-05, 6.924755871295929e-05, 7.2527676820755e-05, 7.580779492855072e-05, 7.908791303634644e-05, 8.236803114414215e-05, 8.564814925193787e-05, 8.892826735973358e-05, 9.22083854675293e-05]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 3.0, 1.0, 8.0, 3.0, 7.0, 11.0, 11.0, 14.0, 23.0, 22.0, 19.0, 20.0, 29.0, 26.0, 24.0, 30.0, 39.0, 40.0, 42.0, 30.0, 36.0, 41.0, 50.0, 54.0, 43.0, 37.0, 44.0, 25.0, 30.0, 44.0, 20.0, 20.0, 25.0, 22.0, 16.0, 20.0, 15.0, 12.0, 9.0, 7.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.93505859375, -3.7998046875, -3.66455078125, -3.529296875, -3.39404296875, -3.2587890625, -3.12353515625, -2.98828125, -2.85302734375, -2.7177734375, -2.58251953125, -2.447265625, -2.31201171875, -2.1767578125, -2.04150390625, -1.90625, -1.77099609375, -1.6357421875, -1.50048828125, -1.365234375, -1.22998046875, -1.0947265625, -0.95947265625, -0.82421875, -0.68896484375, -0.5537109375, -0.41845703125, -0.283203125, -0.14794921875, -0.0126953125, 0.12255859375, 0.2578125, 0.39306640625, 0.5283203125, 0.66357421875, 0.798828125, 0.93408203125, 1.0693359375, 1.20458984375, 1.33984375, 1.47509765625, 1.6103515625, 1.74560546875, 1.880859375, 2.01611328125, 2.1513671875, 2.28662109375, 2.421875, 2.55712890625, 2.6923828125, 2.82763671875, 2.962890625, 3.09814453125, 3.2333984375, 3.36865234375, 3.50390625, 3.63916015625, 3.7744140625, 3.90966796875, 4.044921875, 4.18017578125, 4.3154296875, 4.45068359375, 4.5859375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 7.0, 2.0, 2.0, 13.0, 3.0, 8.0, 26.0, 20.0, 39.0, 57.0, 76.0, 88.0, 104.0, 149.0, 189.0, 258.0, 351.0, 503.0, 707.0, 1485.0, 5258.0, 28272.0, 287266.0, 658501.0, 51419.0, 8833.0, 2008.0, 821.0, 571.0, 387.0, 292.0, 219.0, 134.0, 122.0, 93.0, 70.0, 48.0, 41.0, 26.0, 22.0, 19.0, 12.0, 9.0, 6.0, 6.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.2265625, -9.887451171875, -9.54833984375, -9.209228515625, -8.8701171875, -8.531005859375, -8.19189453125, -7.852783203125, -7.513671875, -7.174560546875, -6.83544921875, -6.496337890625, -6.1572265625, -5.818115234375, -5.47900390625, -5.139892578125, -4.80078125, -4.461669921875, -4.12255859375, -3.783447265625, -3.4443359375, -3.105224609375, -2.76611328125, -2.427001953125, -2.087890625, -1.748779296875, -1.40966796875, -1.070556640625, -0.7314453125, -0.392333984375, -0.05322265625, 0.285888671875, 0.625, 0.964111328125, 1.30322265625, 1.642333984375, 1.9814453125, 2.320556640625, 2.65966796875, 2.998779296875, 3.337890625, 3.677001953125, 4.01611328125, 4.355224609375, 4.6943359375, 5.033447265625, 5.37255859375, 5.711669921875, 6.05078125, 6.389892578125, 6.72900390625, 7.068115234375, 7.4072265625, 7.746337890625, 8.08544921875, 8.424560546875, 8.763671875, 9.102783203125, 9.44189453125, 9.781005859375, 10.1201171875, 10.459228515625, 10.79833984375, 11.137451171875, 11.4765625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 8.0, 3.0, 4.0, 7.0, 10.0, 5.0, 12.0, 17.0, 25.0, 32.0, 38.0, 45.0, 56.0, 59.0, 68.0, 91.0, 315.0, 1663.0, 153.0, 72.0, 65.0, 57.0, 37.0, 41.0, 30.0, 33.0, 22.0, 16.0, 17.0, 10.0, 9.0, 11.0, 2.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-19.734375, -19.158447265625, -18.58251953125, -18.006591796875, -17.4306640625, -16.854736328125, -16.27880859375, -15.702880859375, -15.126953125, -14.551025390625, -13.97509765625, -13.399169921875, -12.8232421875, -12.247314453125, -11.67138671875, -11.095458984375, -10.51953125, -9.943603515625, -9.36767578125, -8.791748046875, -8.2158203125, -7.639892578125, -7.06396484375, -6.488037109375, -5.912109375, -5.336181640625, -4.76025390625, -4.184326171875, -3.6083984375, -3.032470703125, -2.45654296875, -1.880615234375, -1.3046875, -0.728759765625, -0.15283203125, 0.423095703125, 0.9990234375, 1.574951171875, 2.15087890625, 2.726806640625, 3.302734375, 3.878662109375, 4.45458984375, 5.030517578125, 5.6064453125, 6.182373046875, 6.75830078125, 7.334228515625, 7.91015625, 8.486083984375, 9.06201171875, 9.637939453125, 10.2138671875, 10.789794921875, 11.36572265625, 11.941650390625, 12.517578125, 13.093505859375, 13.66943359375, 14.245361328125, 14.8212890625, 15.397216796875, 15.97314453125, 16.549072265625, 17.125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 5.0, 13.0, 17.0, 28.0, 56.0, 50.0, 85.0, 160.0, 344.0, 1796.0, 2785039.0, 355834.0, 1523.0, 324.0, 157.0, 102.0, 49.0, 38.0, 24.0, 19.0, 9.0, 6.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.625, -92.3232421875, -89.021484375, -85.7197265625, -82.41796875, -79.1162109375, -75.814453125, -72.5126953125, -69.2109375, -65.9091796875, -62.607421875, -59.3056640625, -56.00390625, -52.7021484375, -49.400390625, -46.0986328125, -42.796875, -39.4951171875, -36.193359375, -32.8916015625, -29.58984375, -26.2880859375, -22.986328125, -19.6845703125, -16.3828125, -13.0810546875, -9.779296875, -6.4775390625, -3.17578125, 0.1259765625, 3.427734375, 6.7294921875, 10.03125, 13.3330078125, 16.634765625, 19.9365234375, 23.23828125, 26.5400390625, 29.841796875, 33.1435546875, 36.4453125, 39.7470703125, 43.048828125, 46.3505859375, 49.65234375, 52.9541015625, 56.255859375, 59.5576171875, 62.859375, 66.1611328125, 69.462890625, 72.7646484375, 76.06640625, 79.3681640625, 82.669921875, 85.9716796875, 89.2734375, 92.5751953125, 95.876953125, 99.1787109375, 102.48046875, 105.7822265625, 109.083984375, 112.3857421875, 115.6875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 10.0, 57.0, 283.0, 473.0, 155.0, 32.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.85395812988281, -62.91175079345703, -60.969547271728516, -59.027339935302734, -57.08513259887695, -55.14292907714844, -53.200721740722656, -51.258514404296875, -49.316307067871094, -47.37409973144531, -45.4318962097168, -43.489688873291016, -41.547481536865234, -39.60527801513672, -37.66307067871094, -35.720863342285156, -33.77865982055664, -31.836454391479492, -29.89424705505371, -27.952041625976562, -26.00983428955078, -24.067628860473633, -22.125423431396484, -20.183216094970703, -18.241010665893555, -16.298805236816406, -14.356597900390625, -12.414392471313477, -10.472186088562012, -8.529979705810547, -6.587774276733398, -4.645567893981934, -2.703357696533203, -0.7611515522003174, 1.1810545921325684, 3.123260498046875, 5.06546688079834, 7.007673263549805, 8.949878692626953, 10.892085075378418, 12.834291458129883, 14.776497840881348, 16.718704223632812, 18.66090965270996, 20.60311508178711, 22.54532241821289, 24.48752784729004, 26.429733276367188, 28.37194061279297, 30.314146041870117, 32.256351470947266, 34.19855880737305, 36.14076614379883, 38.082969665527344, 40.025177001953125, 41.967384338378906, 43.90959167480469, 45.85179901123047, 47.794002532958984, 49.736209869384766, 51.67841720581055, 53.62062072753906, 55.562828063964844, 57.505035400390625, 59.44723892211914]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 4.0, 2.0, 6.0, 3.0, 4.0, 12.0, 8.0, 5.0, 15.0, 14.0, 15.0, 17.0, 23.0, 25.0, 20.0, 35.0, 37.0, 38.0, 37.0, 31.0, 37.0, 38.0, 48.0, 41.0, 40.0, 45.0, 38.0, 41.0, 51.0, 40.0, 23.0, 23.0, 24.0, 22.0, 31.0, 20.0, 25.0, 10.0, 8.0, 12.0, 14.0, 7.0, 5.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.744325637817383, -28.76934242248535, -27.794361114501953, -26.819377899169922, -25.84439468383789, -24.869413375854492, -23.89443016052246, -22.919448852539062, -21.94446563720703, -20.969482421875, -19.9945011138916, -19.01951789855957, -18.044536590576172, -17.06955337524414, -16.09457015991211, -15.119587898254395, -14.14460563659668, -13.169623374938965, -12.19464111328125, -11.219657897949219, -10.244675636291504, -9.269693374633789, -8.294710159301758, -7.319727897644043, -6.344745635986328, -5.369763374328613, -4.39478063583374, -3.4197981357574463, -2.4448156356811523, -1.4698333740234375, -0.49485063552856445, 0.4801321029663086, 1.4551162719726562, 2.43009877204895, 3.405081272125244, 4.380064010620117, 5.355046272277832, 6.330028533935547, 7.30501127243042, 8.279994010925293, 9.254976272583008, 10.229958534240723, 11.204940795898438, 12.179924011230469, 13.154906272888184, 14.129888534545898, 15.10487174987793, 16.079853057861328, 17.05483627319336, 18.02981948852539, 19.00480079650879, 19.97978401184082, 20.95476531982422, 21.92974853515625, 22.90473175048828, 23.879714965820312, 24.85469627380371, 25.829679489135742, 26.80466079711914, 27.779644012451172, 28.754627227783203, 29.7296085357666, 30.704591751098633, 31.67957305908203, 32.65455627441406]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 7.0, 6.0, 6.0, 4.0, 6.0, 11.0, 12.0, 13.0, 17.0, 14.0, 19.0, 39.0, 24.0, 27.0, 31.0, 22.0, 46.0, 45.0, 42.0, 49.0, 45.0, 52.0, 49.0, 36.0, 33.0, 41.0, 34.0, 34.0, 27.0, 20.0, 26.0, 25.0, 18.0, 20.0, 19.0, 13.0, 16.0, 16.0, 6.0, 8.0, 8.0, 4.0, 8.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.390625, -4.24755859375, -4.1044921875, -3.96142578125, -3.818359375, -3.67529296875, -3.5322265625, -3.38916015625, -3.24609375, -3.10302734375, -2.9599609375, -2.81689453125, -2.673828125, -2.53076171875, -2.3876953125, -2.24462890625, -2.1015625, -1.95849609375, -1.8154296875, -1.67236328125, -1.529296875, -1.38623046875, -1.2431640625, -1.10009765625, -0.95703125, -0.81396484375, -0.6708984375, -0.52783203125, -0.384765625, -0.24169921875, -0.0986328125, 0.04443359375, 0.1875, 0.33056640625, 0.4736328125, 0.61669921875, 0.759765625, 0.90283203125, 1.0458984375, 1.18896484375, 1.33203125, 1.47509765625, 1.6181640625, 1.76123046875, 1.904296875, 2.04736328125, 2.1904296875, 2.33349609375, 2.4765625, 2.61962890625, 2.7626953125, 2.90576171875, 3.048828125, 3.19189453125, 3.3349609375, 3.47802734375, 3.62109375, 3.76416015625, 3.9072265625, 4.05029296875, 4.193359375, 4.33642578125, 4.4794921875, 4.62255859375, 4.765625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 6.0, 9.0, 11.0, 12.0, 21.0, 30.0, 38.0, 32.0, 53.0, 66.0, 74.0, 102.0, 119.0, 182.0, 253.0, 381.0, 704.0, 1891.0, 9696.0, 113570.0, 1128531.0, 2375736.0, 515372.0, 39855.0, 4585.0, 1121.0, 559.0, 320.0, 211.0, 184.0, 122.0, 94.0, 71.0, 48.0, 49.0, 45.0, 32.0, 23.0, 16.0, 16.0, 9.0, 11.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.63671875, -7.37615966796875, -7.1156005859375, -6.85504150390625, -6.594482421875, -6.33392333984375, -6.0733642578125, -5.81280517578125, -5.55224609375, -5.29168701171875, -5.0311279296875, -4.77056884765625, -4.510009765625, -4.24945068359375, -3.9888916015625, -3.72833251953125, -3.4677734375, -3.20721435546875, -2.9466552734375, -2.68609619140625, -2.425537109375, -2.16497802734375, -1.9044189453125, -1.64385986328125, -1.38330078125, -1.12274169921875, -0.8621826171875, -0.60162353515625, -0.341064453125, -0.08050537109375, 0.1800537109375, 0.44061279296875, 0.701171875, 0.96173095703125, 1.2222900390625, 1.48284912109375, 1.743408203125, 2.00396728515625, 2.2645263671875, 2.52508544921875, 2.78564453125, 3.04620361328125, 3.3067626953125, 3.56732177734375, 3.827880859375, 4.08843994140625, 4.3489990234375, 4.60955810546875, 4.8701171875, 5.13067626953125, 5.3912353515625, 5.65179443359375, 5.912353515625, 6.17291259765625, 6.4334716796875, 6.69403076171875, 6.95458984375, 7.21514892578125, 7.4757080078125, 7.73626708984375, 7.996826171875, 8.25738525390625, 8.5179443359375, 8.77850341796875, 9.0390625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 5.0, 6.0, 9.0, 6.0, 19.0, 21.0, 26.0, 41.0, 49.0, 99.0, 107.0, 166.0, 224.0, 327.0, 407.0, 457.0, 444.0, 406.0, 332.0, 236.0, 197.0, 122.0, 96.0, 76.0, 61.0, 34.0, 31.0, 20.0, 17.0, 4.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.53515625, -5.33050537109375, -5.1258544921875, -4.92120361328125, -4.716552734375, -4.51190185546875, -4.3072509765625, -4.10260009765625, -3.89794921875, -3.69329833984375, -3.4886474609375, -3.28399658203125, -3.079345703125, -2.87469482421875, -2.6700439453125, -2.46539306640625, -2.2607421875, -2.05609130859375, -1.8514404296875, -1.64678955078125, -1.442138671875, -1.23748779296875, -1.0328369140625, -0.82818603515625, -0.62353515625, -0.41888427734375, -0.2142333984375, -0.00958251953125, 0.195068359375, 0.39971923828125, 0.6043701171875, 0.80902099609375, 1.013671875, 1.21832275390625, 1.4229736328125, 1.62762451171875, 1.832275390625, 2.03692626953125, 2.2415771484375, 2.44622802734375, 2.65087890625, 2.85552978515625, 3.0601806640625, 3.26483154296875, 3.469482421875, 3.67413330078125, 3.8787841796875, 4.08343505859375, 4.2880859375, 4.49273681640625, 4.6973876953125, 4.90203857421875, 5.106689453125, 5.31134033203125, 5.5159912109375, 5.72064208984375, 5.92529296875, 6.12994384765625, 6.3345947265625, 6.53924560546875, 6.743896484375, 6.94854736328125, 7.1531982421875, 7.35784912109375, 7.5625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 4.0, 5.0, 6.0, 8.0, 18.0, 11.0, 22.0, 28.0, 37.0, 46.0, 62.0, 60.0, 87.0, 141.0, 180.0, 284.0, 431.0, 739.0, 1584.0, 6721.0, 88911.0, 3037941.0, 1020543.0, 29854.0, 3638.0, 1121.0, 569.0, 373.0, 240.0, 148.0, 125.0, 73.0, 61.0, 54.0, 41.0, 27.0, 29.0, 14.0, 14.0, 9.0, 4.0, 4.0, 3.0, 8.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.6484375, -15.1566162109375, -14.664794921875, -14.1729736328125, -13.68115234375, -13.1893310546875, -12.697509765625, -12.2056884765625, -11.7138671875, -11.2220458984375, -10.730224609375, -10.2384033203125, -9.74658203125, -9.2547607421875, -8.762939453125, -8.2711181640625, -7.779296875, -7.2874755859375, -6.795654296875, -6.3038330078125, -5.81201171875, -5.3201904296875, -4.828369140625, -4.3365478515625, -3.8447265625, -3.3529052734375, -2.861083984375, -2.3692626953125, -1.87744140625, -1.3856201171875, -0.893798828125, -0.4019775390625, 0.08984375, 0.5816650390625, 1.073486328125, 1.5653076171875, 2.05712890625, 2.5489501953125, 3.040771484375, 3.5325927734375, 4.0244140625, 4.5162353515625, 5.008056640625, 5.4998779296875, 5.99169921875, 6.4835205078125, 6.975341796875, 7.4671630859375, 7.958984375, 8.4508056640625, 8.942626953125, 9.4344482421875, 9.92626953125, 10.4180908203125, 10.909912109375, 11.4017333984375, 11.8935546875, 12.3853759765625, 12.877197265625, 13.3690185546875, 13.86083984375, 14.3526611328125, 14.844482421875, 15.3363037109375, 15.828125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 56.0, 401.0, 436.0, 111.0, 10.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.4868392944336, -84.95323181152344, -81.41963195800781, -77.88602447509766, -74.35242462158203, -70.81881713867188, -67.28521728515625, -63.751609802246094, -60.2180061340332, -56.68440246582031, -53.15079879760742, -49.61719512939453, -46.083587646484375, -42.54998779296875, -39.016380310058594, -35.4827766418457, -31.949172973632812, -28.415569305419922, -24.88196563720703, -21.348360061645508, -17.814756393432617, -14.281152725219727, -10.747547149658203, -7.2139434814453125, -3.680339813232422, -0.14673566818237305, 3.386868476867676, 6.920473098754883, 10.454076766967773, 13.987680435180664, 17.521286010742188, 21.054889678955078, 24.5885009765625, 28.12210464477539, 31.65570831298828, 35.18931579589844, 38.72291564941406, 42.25652313232422, 45.79012680053711, 49.32373046875, 52.85733413696289, 56.39093780517578, 59.92454147338867, 63.45814514160156, 66.99175262451172, 70.52535247802734, 74.0589599609375, 77.59255981445312, 81.12616729736328, 84.65977478027344, 88.19337463378906, 91.72698211669922, 95.26058197021484, 98.794189453125, 102.32778930664062, 105.86139678955078, 109.39500427246094, 112.9286117553711, 116.46221160888672, 119.99581909179688, 123.5294189453125, 127.06302642822266, 130.5966339111328, 134.13023376464844, 137.66383361816406]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 2.0, 6.0, 12.0, 7.0, 4.0, 8.0, 13.0, 10.0, 12.0, 14.0, 23.0, 16.0, 26.0, 24.0, 21.0, 20.0, 29.0, 33.0, 40.0, 34.0, 45.0, 37.0, 36.0, 42.0, 33.0, 42.0, 37.0, 38.0, 41.0, 36.0, 32.0, 34.0, 39.0, 19.0, 28.0, 10.0, 14.0, 22.0, 13.0, 10.0, 9.0, 7.0, 3.0, 7.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-21.181427001953125, -20.560644149780273, -19.93985939025879, -19.319076538085938, -18.698291778564453, -18.0775089263916, -17.456724166870117, -16.835941314697266, -16.21515655517578, -15.594372749328613, -14.973588943481445, -14.352805137634277, -13.73202133178711, -13.111237525939941, -12.490453720092773, -11.869670867919922, -11.248887062072754, -10.628103256225586, -10.007319450378418, -9.38653564453125, -8.765751838684082, -8.144968032836914, -7.524184703826904, -6.903400897979736, -6.282617092132568, -5.6618332862854, -5.041049480438232, -4.420266151428223, -3.7994821071624756, -3.1786983013153076, -2.5579147338867188, -1.9371309280395508, -1.3163471221923828, -0.6955633759498596, -0.07477962970733643, 0.546004056930542, 1.16678786277771, 1.787571668624878, 2.408355236053467, 3.0291390419006348, 3.6499228477478027, 4.270706653594971, 4.891490459442139, 5.512273788452148, 6.133057594299316, 6.753841400146484, 7.374625205993652, 7.99540901184082, 8.616192817687988, 9.236976623535156, 9.857760429382324, 10.478544235229492, 11.09932804107666, 11.720111846923828, 12.34089469909668, 12.961679458618164, 13.582462310791016, 14.203246116638184, 14.824029922485352, 15.44481372833252, 16.065597534179688, 16.68638038635254, 17.307165145874023, 17.927947998046875, 18.54873275756836]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 9.0, 12.0, 10.0, 12.0, 13.0, 12.0, 14.0, 18.0, 15.0, 20.0, 22.0, 28.0, 25.0, 25.0, 31.0, 40.0, 41.0, 39.0, 44.0, 43.0, 46.0, 51.0, 50.0, 31.0, 38.0, 29.0, 40.0, 23.0, 31.0, 20.0, 19.0, 22.0, 22.0, 12.0, 16.0, 13.0, 6.0, 12.0, 10.0, 10.0, 8.0, 5.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.998046875, -3.866058349609375, -3.73406982421875, -3.602081298828125, -3.4700927734375, -3.338104248046875, -3.20611572265625, -3.074127197265625, -2.942138671875, -2.810150146484375, -2.67816162109375, -2.546173095703125, -2.4141845703125, -2.282196044921875, -2.15020751953125, -2.018218994140625, -1.88623046875, -1.754241943359375, -1.62225341796875, -1.490264892578125, -1.3582763671875, -1.226287841796875, -1.09429931640625, -0.962310791015625, -0.830322265625, -0.698333740234375, -0.56634521484375, -0.434356689453125, -0.3023681640625, -0.170379638671875, -0.03839111328125, 0.093597412109375, 0.2255859375, 0.357574462890625, 0.48956298828125, 0.621551513671875, 0.7535400390625, 0.885528564453125, 1.01751708984375, 1.149505615234375, 1.281494140625, 1.413482666015625, 1.54547119140625, 1.677459716796875, 1.8094482421875, 1.941436767578125, 2.07342529296875, 2.205413818359375, 2.33740234375, 2.469390869140625, 2.60137939453125, 2.733367919921875, 2.8653564453125, 2.997344970703125, 3.12933349609375, 3.261322021484375, 3.393310546875, 3.525299072265625, 3.65728759765625, 3.789276123046875, 3.9212646484375, 4.053253173828125, 4.18524169921875, 4.317230224609375, 4.44921875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 9.0, 10.0, 15.0, 10.0, 18.0, 28.0, 62.0, 65.0, 95.0, 116.0, 193.0, 272.0, 386.0, 555.0, 808.0, 1175.0, 1706.0, 2307.0, 3343.0, 4906.0, 6985.0, 10183.0, 14410.0, 21493.0, 32622.0, 51399.0, 88973.0, 173683.0, 273284.0, 144206.0, 77320.0, 45575.0, 29187.0, 19608.0, 13146.0, 9155.0, 6410.0, 4516.0, 3137.0, 2180.0, 1536.0, 1033.0, 763.0, 527.0, 369.0, 263.0, 153.0, 120.0, 75.0, 64.0, 36.0, 27.0, 17.0, 13.0, 7.0, 6.0, 7.0, 2.0], "bins": [-0.7099609375, -0.6893081665039062, -0.6686553955078125, -0.6480026245117188, -0.627349853515625, -0.6066970825195312, -0.5860443115234375, -0.5653915405273438, -0.54473876953125, -0.5240859985351562, -0.5034332275390625, -0.48278045654296875, -0.462127685546875, -0.44147491455078125, -0.4208221435546875, -0.40016937255859375, -0.3795166015625, -0.35886383056640625, -0.3382110595703125, -0.31755828857421875, -0.296905517578125, -0.27625274658203125, -0.2555999755859375, -0.23494720458984375, -0.21429443359375, -0.19364166259765625, -0.1729888916015625, -0.15233612060546875, -0.131683349609375, -0.11103057861328125, -0.0903778076171875, -0.06972503662109375, -0.049072265625, -0.02841949462890625, -0.0077667236328125, 0.01288604736328125, 0.033538818359375, 0.05419158935546875, 0.0748443603515625, 0.09549713134765625, 0.11614990234375, 0.13680267333984375, 0.1574554443359375, 0.17810821533203125, 0.198760986328125, 0.21941375732421875, 0.2400665283203125, 0.26071929931640625, 0.2813720703125, 0.30202484130859375, 0.3226776123046875, 0.34333038330078125, 0.363983154296875, 0.38463592529296875, 0.4052886962890625, 0.42594146728515625, 0.44659423828125, 0.46724700927734375, 0.4878997802734375, 0.5085525512695312, 0.529205322265625, 0.5498580932617188, 0.5705108642578125, 0.5911636352539062, 0.61181640625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 6.0, 10.0, 7.0, 13.0, 15.0, 15.0, 16.0, 15.0, 21.0, 36.0, 24.0, 27.0, 32.0, 21.0, 28.0, 29.0, 39.0, 39.0, 43.0, 1066.0, 48.0, 41.0, 40.0, 35.0, 33.0, 37.0, 40.0, 24.0, 34.0, 24.0, 26.0, 17.0, 15.0, 15.0, 17.0, 10.0, 13.0, 7.0, 5.0, 8.0, 7.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.65234375, -2.57147216796875, -2.4906005859375, -2.40972900390625, -2.328857421875, -2.24798583984375, -2.1671142578125, -2.08624267578125, -2.00537109375, -1.92449951171875, -1.8436279296875, -1.76275634765625, -1.681884765625, -1.60101318359375, -1.5201416015625, -1.43927001953125, -1.3583984375, -1.27752685546875, -1.1966552734375, -1.11578369140625, -1.034912109375, -0.95404052734375, -0.8731689453125, -0.79229736328125, -0.71142578125, -0.63055419921875, -0.5496826171875, -0.46881103515625, -0.387939453125, -0.30706787109375, -0.2261962890625, -0.14532470703125, -0.064453125, 0.01641845703125, 0.0972900390625, 0.17816162109375, 0.259033203125, 0.33990478515625, 0.4207763671875, 0.50164794921875, 0.58251953125, 0.66339111328125, 0.7442626953125, 0.82513427734375, 0.906005859375, 0.98687744140625, 1.0677490234375, 1.14862060546875, 1.2294921875, 1.31036376953125, 1.3912353515625, 1.47210693359375, 1.552978515625, 1.63385009765625, 1.7147216796875, 1.79559326171875, 1.87646484375, 1.95733642578125, 2.0382080078125, 2.11907958984375, 2.199951171875, 2.28082275390625, 2.3616943359375, 2.44256591796875, 2.5234375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 1.0, 4.0, 5.0, 5.0, 11.0, 24.0, 33.0, 48.0, 70.0, 95.0, 155.0, 196.0, 304.0, 406.0, 589.0, 830.0, 1164.0, 1562.0, 2259.0, 3053.0, 4276.0, 5930.0, 8246.0, 11620.0, 16549.0, 23908.0, 34651.0, 51949.0, 83824.0, 156674.0, 1299881.0, 147336.0, 79667.0, 50167.0, 33188.0, 22601.0, 15993.0, 11285.0, 8066.0, 5751.0, 4084.0, 3018.0, 2191.0, 1529.0, 1165.0, 782.0, 565.0, 440.0, 301.0, 202.0, 161.0, 114.0, 77.0, 41.0, 27.0, 28.0, 17.0, 9.0, 10.0, 4.0, 2.0, 3.0, 1.0], "bins": [-0.54638671875, -0.5290145874023438, -0.5116424560546875, -0.49427032470703125, -0.476898193359375, -0.45952606201171875, -0.4421539306640625, -0.42478179931640625, -0.40740966796875, -0.39003753662109375, -0.3726654052734375, -0.35529327392578125, -0.337921142578125, -0.32054901123046875, -0.3031768798828125, -0.28580474853515625, -0.2684326171875, -0.25106048583984375, -0.2336883544921875, -0.21631622314453125, -0.198944091796875, -0.18157196044921875, -0.1641998291015625, -0.14682769775390625, -0.12945556640625, -0.11208343505859375, -0.0947113037109375, -0.07733917236328125, -0.059967041015625, -0.04259490966796875, -0.0252227783203125, -0.00785064697265625, 0.009521484375, 0.02689361572265625, 0.0442657470703125, 0.06163787841796875, 0.079010009765625, 0.09638214111328125, 0.1137542724609375, 0.13112640380859375, 0.14849853515625, 0.16587066650390625, 0.1832427978515625, 0.20061492919921875, 0.217987060546875, 0.23535919189453125, 0.2527313232421875, 0.27010345458984375, 0.2874755859375, 0.30484771728515625, 0.3222198486328125, 0.33959197998046875, 0.356964111328125, 0.37433624267578125, 0.3917083740234375, 0.40908050537109375, 0.42645263671875, 0.44382476806640625, 0.4611968994140625, 0.47856903076171875, 0.495941162109375, 0.5133132934570312, 0.5306854248046875, 0.5480575561523438, 0.5654296875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 7.0, 6.0, 9.0, 11.0, 16.0, 6.0, 18.0, 12.0, 31.0, 28.0, 35.0, 32.0, 46.0, 63.0, 47.0, 61.0, 85.0, 79.0, 64.0, 72.0, 41.0, 44.0, 37.0, 33.0, 22.0, 12.0, 20.0, 17.0, 9.0, 8.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00020456314086914062, -0.00019867345690727234, -0.00019278377294540405, -0.00018689408898353577, -0.00018100440502166748, -0.0001751147210597992, -0.0001692250370979309, -0.00016333535313606262, -0.00015744566917419434, -0.00015155598521232605, -0.00014566630125045776, -0.00013977661728858948, -0.0001338869333267212, -0.0001279972493648529, -0.00012210756540298462, -0.00011621788144111633, -0.00011032819747924805, -0.00010443851351737976, -9.854882955551147e-05, -9.265914559364319e-05, -8.67694616317749e-05, -8.087977766990662e-05, -7.499009370803833e-05, -6.910040974617004e-05, -6.321072578430176e-05, -5.732104182243347e-05, -5.1431357860565186e-05, -4.55416738986969e-05, -3.965198993682861e-05, -3.376230597496033e-05, -2.787262201309204e-05, -2.1982938051223755e-05, -1.609325408935547e-05, -1.0203570127487183e-05, -4.3138861656188965e-06, 1.5757977962493896e-06, 7.465481758117676e-06, 1.3355165719985962e-05, 1.9244849681854248e-05, 2.5134533643722534e-05, 3.102421760559082e-05, 3.6913901567459106e-05, 4.280358552932739e-05, 4.869326949119568e-05, 5.4582953453063965e-05, 6.047263741493225e-05, 6.636232137680054e-05, 7.225200533866882e-05, 7.814168930053711e-05, 8.40313732624054e-05, 8.992105722427368e-05, 9.581074118614197e-05, 0.00010170042514801025, 0.00010759010910987854, 0.00011347979307174683, 0.00011936947703361511, 0.0001252591609954834, 0.00013114884495735168, 0.00013703852891921997, 0.00014292821288108826, 0.00014881789684295654, 0.00015470758080482483, 0.00016059726476669312, 0.0001664869487285614, 0.0001723766326904297]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 5.0, 6.0, 8.0, 11.0, 12.0, 21.0, 33.0, 34.0, 34.0, 44.0, 76.0, 102.0, 128.0, 169.0, 326.0, 570.0, 1350.0, 642215.0, 400605.0, 1194.0, 552.0, 284.0, 192.0, 134.0, 104.0, 79.0, 48.0, 33.0, 40.0, 25.0, 22.0, 13.0, 17.0, 15.0, 11.0, 12.0, 6.0, 9.0, 1.0, 3.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0032215118408203125, -0.0031140148639678955, -0.0030065178871154785, -0.0028990209102630615, -0.0027915239334106445, -0.0026840269565582275, -0.0025765299797058105, -0.0024690330028533936, -0.0023615360260009766, -0.0022540390491485596, -0.0021465420722961426, -0.0020390450954437256, -0.0019315481185913086, -0.0018240511417388916, -0.0017165541648864746, -0.0016090571880340576, -0.0015015602111816406, -0.0013940632343292236, -0.0012865662574768066, -0.0011790692806243896, -0.0010715723037719727, -0.0009640753269195557, -0.0008565783500671387, -0.0007490813732147217, -0.0006415843963623047, -0.0005340874195098877, -0.0004265904426574707, -0.0003190934658050537, -0.00021159648895263672, -0.00010409951210021973, 3.3974647521972656e-06, 0.00011089444160461426, 0.00021839141845703125, 0.00032588839530944824, 0.00043338537216186523, 0.0005408823490142822, 0.0006483793258666992, 0.0007558763027191162, 0.0008633732795715332, 0.0009708702564239502, 0.0010783672332763672, 0.0011858642101287842, 0.0012933611869812012, 0.0014008581638336182, 0.0015083551406860352, 0.0016158521175384521, 0.0017233490943908691, 0.0018308460712432861, 0.0019383430480957031, 0.00204584002494812, 0.002153337001800537, 0.002260833978652954, 0.002368330955505371, 0.002475827932357788, 0.002583324909210205, 0.002690821886062622, 0.002798318862915039, 0.002905815839767456, 0.003013312816619873, 0.00312080979347229, 0.003228306770324707, 0.003335803747177124, 0.003443300724029541, 0.003550797700881958, 0.003658294677734375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 14.0, 402.0, 562.0, 32.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.0011356903705745935, -0.0011161316651850939, -0.0010965729597955942, -0.0010770141379907727, -0.001057455432601273, -0.0010378967272117734, -0.0010183380218222737, -0.0009987792000174522, -0.0009792204946279526, -0.0009596617892384529, -0.0009401030256412923, -0.0009205443202517927, -0.0009009855566546321, -0.0008814268512651324, -0.0008618680876679718, -0.0008423093822784722, -0.0008227506186813116, -0.0008031919132918119, -0.0007836331496946514, -0.0007640744443051517, -0.0007445156807079911, -0.0007249569753184915, -0.0007053982117213309, -0.0006858395063318312, -0.0006662808009423316, -0.0006467220955528319, -0.0006271633319556713, -0.0006076046265661716, -0.0005880458629690111, -0.0005684871575795114, -0.0005489283939823508, -0.0005293696885928512, -0.0005098109249956906, -0.0004902522196061909, -0.00047069345600903034, -0.0004511347215157002, -0.0004315759870223701, -0.00041201725252904, -0.00039245851803570986, -0.0003728998126462102, -0.00035334107815288007, -0.00033378234365954995, -0.00031422360916621983, -0.0002946648746728897, -0.0002751061401795596, -0.00025554740568622947, -0.00023598868574481457, -0.00021642995125148445, -0.00019687121675815433, -0.0001773124822648242, -0.0001577537477714941, -0.0001381950278300792, -0.00011863628606079146, -9.907755156746134e-05, -7.951882435008883e-05, -5.9960089856758714e-05, -4.040135536342859e-05, -2.0842622689087875e-05, -1.2838900147471577e-06, 1.8274840840604156e-05, 3.783357533393428e-05, 5.73923098272644e-05, 7.69510370446369e-05, 9.650977153796703e-05, 0.00011606850603129715]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 4.0, 5.0, 2.0, 10.0, 8.0, 14.0, 14.0, 10.0, 14.0, 24.0, 17.0, 29.0, 14.0, 39.0, 35.0, 27.0, 28.0, 32.0, 44.0, 44.0, 37.0, 31.0, 34.0, 39.0, 43.0, 28.0, 41.0, 26.0, 41.0, 23.0, 38.0, 28.0, 16.0, 21.0, 21.0, 24.0, 14.0, 19.0, 11.0, 10.0, 12.0, 11.0, 9.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.445978164672852e-05, -8.176174014806747e-05, -7.906369864940643e-05, -7.636565715074539e-05, -7.366761565208435e-05, -7.096957415342331e-05, -6.827153265476227e-05, -6.557349115610123e-05, -6.287544965744019e-05, -6.0177408158779144e-05, -5.74793666601181e-05, -5.478132516145706e-05, -5.208328366279602e-05, -4.938524216413498e-05, -4.668720066547394e-05, -4.39891591668129e-05, -4.1291117668151855e-05, -3.8593076169490814e-05, -3.589503467082977e-05, -3.319699317216873e-05, -3.049895167350769e-05, -2.780091017484665e-05, -2.5102868676185608e-05, -2.2404827177524567e-05, -1.9706785678863525e-05, -1.7008744180202484e-05, -1.4310702681541443e-05, -1.1612661182880402e-05, -8.91461968421936e-06, -6.216578185558319e-06, -3.518536686897278e-06, -8.204951882362366e-07, 1.8775463104248047e-06, 4.575587809085846e-06, 7.273629307746887e-06, 9.971670806407928e-06, 1.266971230506897e-05, 1.536775380373001e-05, 1.8065795302391052e-05, 2.0763836801052094e-05, 2.3461878299713135e-05, 2.6159919798374176e-05, 2.8857961297035217e-05, 3.155600279569626e-05, 3.42540442943573e-05, 3.695208579301834e-05, 3.965012729167938e-05, 4.2348168790340424e-05, 4.5046210289001465e-05, 4.7744251787662506e-05, 5.044229328632355e-05, 5.314033478498459e-05, 5.583837628364563e-05, 5.853641778230667e-05, 6.123445928096771e-05, 6.393250077962875e-05, 6.66305422782898e-05, 6.932858377695084e-05, 7.202662527561188e-05, 7.472466677427292e-05, 7.742270827293396e-05, 8.0120749771595e-05, 8.281879127025604e-05, 8.551683276891708e-05, 8.821487426757812e-05]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 9.0, 12.0, 10.0, 12.0, 13.0, 12.0, 14.0, 18.0, 15.0, 20.0, 22.0, 28.0, 25.0, 25.0, 31.0, 40.0, 41.0, 39.0, 44.0, 43.0, 46.0, 51.0, 50.0, 31.0, 38.0, 29.0, 40.0, 23.0, 31.0, 20.0, 19.0, 22.0, 22.0, 12.0, 16.0, 13.0, 6.0, 12.0, 10.0, 10.0, 8.0, 5.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.998046875, -3.866058349609375, -3.73406982421875, -3.602081298828125, -3.4700927734375, -3.338104248046875, -3.20611572265625, -3.074127197265625, -2.942138671875, -2.810150146484375, -2.67816162109375, -2.546173095703125, -2.4141845703125, -2.282196044921875, -2.15020751953125, -2.018218994140625, -1.88623046875, -1.754241943359375, -1.62225341796875, -1.490264892578125, -1.3582763671875, -1.226287841796875, -1.09429931640625, -0.962310791015625, -0.830322265625, -0.698333740234375, -0.56634521484375, -0.434356689453125, -0.3023681640625, -0.170379638671875, -0.03839111328125, 0.093597412109375, 0.2255859375, 0.357574462890625, 0.48956298828125, 0.621551513671875, 0.7535400390625, 0.885528564453125, 1.01751708984375, 1.149505615234375, 1.281494140625, 1.413482666015625, 1.54547119140625, 1.677459716796875, 1.8094482421875, 1.941436767578125, 2.07342529296875, 2.205413818359375, 2.33740234375, 2.469390869140625, 2.60137939453125, 2.733367919921875, 2.8653564453125, 2.997344970703125, 3.12933349609375, 3.261322021484375, 3.393310546875, 3.525299072265625, 3.65728759765625, 3.789276123046875, 3.9212646484375, 4.053253173828125, 4.18524169921875, 4.317230224609375, 4.44921875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 7.0, 6.0, 16.0, 16.0, 27.0, 38.0, 42.0, 46.0, 73.0, 88.0, 119.0, 166.0, 261.0, 383.0, 617.0, 1319.0, 2698.0, 6302.0, 15533.0, 39812.0, 104766.0, 293639.0, 360212.0, 136816.0, 50866.0, 19676.0, 7780.0, 3447.0, 1536.0, 803.0, 467.0, 256.0, 189.0, 137.0, 102.0, 74.0, 46.0, 39.0, 37.0, 29.0, 18.0, 13.0, 7.0, 10.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.171875, -5.0057373046875, -4.839599609375, -4.6734619140625, -4.50732421875, -4.3411865234375, -4.175048828125, -4.0089111328125, -3.8427734375, -3.6766357421875, -3.510498046875, -3.3443603515625, -3.17822265625, -3.0120849609375, -2.845947265625, -2.6798095703125, -2.513671875, -2.3475341796875, -2.181396484375, -2.0152587890625, -1.84912109375, -1.6829833984375, -1.516845703125, -1.3507080078125, -1.1845703125, -1.0184326171875, -0.852294921875, -0.6861572265625, -0.52001953125, -0.3538818359375, -0.187744140625, -0.0216064453125, 0.14453125, 0.3106689453125, 0.476806640625, 0.6429443359375, 0.80908203125, 0.9752197265625, 1.141357421875, 1.3074951171875, 1.4736328125, 1.6397705078125, 1.805908203125, 1.9720458984375, 2.13818359375, 2.3043212890625, 2.470458984375, 2.6365966796875, 2.802734375, 2.9688720703125, 3.135009765625, 3.3011474609375, 3.46728515625, 3.6334228515625, 3.799560546875, 3.9656982421875, 4.1318359375, 4.2979736328125, 4.464111328125, 4.6302490234375, 4.79638671875, 4.9625244140625, 5.128662109375, 5.2947998046875, 5.4609375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 12.0, 8.0, 17.0, 15.0, 34.0, 23.0, 25.0, 34.0, 28.0, 33.0, 54.0, 59.0, 64.0, 91.0, 244.0, 1514.0, 264.0, 127.0, 73.0, 56.0, 42.0, 31.0, 36.0, 42.0, 25.0, 16.0, 23.0, 11.0, 8.0, 7.0, 4.0, 9.0, 10.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1015625, -11.6475830078125, -11.193603515625, -10.7396240234375, -10.28564453125, -9.8316650390625, -9.377685546875, -8.9237060546875, -8.4697265625, -8.0157470703125, -7.561767578125, -7.1077880859375, -6.65380859375, -6.1998291015625, -5.745849609375, -5.2918701171875, -4.837890625, -4.3839111328125, -3.929931640625, -3.4759521484375, -3.02197265625, -2.5679931640625, -2.114013671875, -1.6600341796875, -1.2060546875, -0.7520751953125, -0.298095703125, 0.1558837890625, 0.60986328125, 1.0638427734375, 1.517822265625, 1.9718017578125, 2.42578125, 2.8797607421875, 3.333740234375, 3.7877197265625, 4.24169921875, 4.6956787109375, 5.149658203125, 5.6036376953125, 6.0576171875, 6.5115966796875, 6.965576171875, 7.4195556640625, 7.87353515625, 8.3275146484375, 8.781494140625, 9.2354736328125, 9.689453125, 10.1434326171875, 10.597412109375, 11.0513916015625, 11.50537109375, 11.9593505859375, 12.413330078125, 12.8673095703125, 13.3212890625, 13.7752685546875, 14.229248046875, 14.6832275390625, 15.13720703125, 15.5911865234375, 16.045166015625, 16.4991455078125, 16.953125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 2.0, 5.0, 2.0, 7.0, 14.0, 17.0, 21.0, 27.0, 34.0, 54.0, 92.0, 127.0, 217.0, 349.0, 636.0, 1489.0, 24383.0, 2959476.0, 153736.0, 2895.0, 881.0, 425.0, 275.0, 184.0, 119.0, 73.0, 43.0, 27.0, 23.0, 10.0, 12.0, 7.0, 12.0, 9.0, 2.0, 5.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.265625, -28.39697265625, -27.5283203125, -26.65966796875, -25.791015625, -24.92236328125, -24.0537109375, -23.18505859375, -22.31640625, -21.44775390625, -20.5791015625, -19.71044921875, -18.841796875, -17.97314453125, -17.1044921875, -16.23583984375, -15.3671875, -14.49853515625, -13.6298828125, -12.76123046875, -11.892578125, -11.02392578125, -10.1552734375, -9.28662109375, -8.41796875, -7.54931640625, -6.6806640625, -5.81201171875, -4.943359375, -4.07470703125, -3.2060546875, -2.33740234375, -1.46875, -0.60009765625, 0.2685546875, 1.13720703125, 2.005859375, 2.87451171875, 3.7431640625, 4.61181640625, 5.48046875, 6.34912109375, 7.2177734375, 8.08642578125, 8.955078125, 9.82373046875, 10.6923828125, 11.56103515625, 12.4296875, 13.29833984375, 14.1669921875, 15.03564453125, 15.904296875, 16.77294921875, 17.6416015625, 18.51025390625, 19.37890625, 20.24755859375, 21.1162109375, 21.98486328125, 22.853515625, 23.72216796875, 24.5908203125, 25.45947265625, 26.328125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 22.0, 102.0, 259.0, 361.0, 198.0, 52.0, 12.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.3653564453125, -27.031261444091797, -25.69716453552246, -24.363067626953125, -23.028972625732422, -21.69487762451172, -20.360780715942383, -19.026683807373047, -17.692588806152344, -16.35849380493164, -15.024396896362305, -13.690300941467285, -12.356204986572266, -11.022109031677246, -9.688013076782227, -8.353917121887207, -7.0198211669921875, -5.685725212097168, -4.351629257202148, -3.017533302307129, -1.6834373474121094, -0.34934139251708984, 0.9847545623779297, 2.318850517272949, 3.6529464721679688, 4.987042427062988, 6.321138381958008, 7.655234336853027, 8.989330291748047, 10.323426246643066, 11.657522201538086, 12.991618156433105, 14.32571029663086, 15.659806251525879, 16.9939022064209, 18.327999114990234, 19.662094116210938, 20.99618911743164, 22.330286026000977, 23.664382934570312, 24.998477935791016, 26.33257293701172, 27.666669845581055, 29.00076675415039, 30.334861755371094, 31.668956756591797, 33.0030517578125, 34.33715057373047, 35.67124557495117, 37.005340576171875, 38.339439392089844, 39.67353439331055, 41.00762939453125, 42.34172439575195, 43.675819396972656, 45.009918212890625, 46.34401321411133, 47.67810821533203, 49.01220703125, 50.3463020324707, 51.680397033691406, 53.01449203491211, 54.34858703613281, 55.68268585205078, 57.016780853271484]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 8.0, 10.0, 10.0, 9.0, 13.0, 12.0, 19.0, 21.0, 25.0, 30.0, 26.0, 24.0, 25.0, 34.0, 34.0, 55.0, 29.0, 27.0, 44.0, 42.0, 41.0, 44.0, 44.0, 34.0, 32.0, 32.0, 23.0, 33.0, 28.0, 17.0, 22.0, 16.0, 17.0, 14.0, 17.0, 19.0, 12.0, 12.0, 6.0, 8.0, 8.0, 4.0, 4.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-26.375974655151367, -25.584087371826172, -24.79220199584961, -24.000316619873047, -23.20842933654785, -22.416542053222656, -21.624656677246094, -20.83277130126953, -20.040884017944336, -19.24899673461914, -18.457111358642578, -17.665225982666016, -16.87333869934082, -16.081451416015625, -15.289566040039062, -14.497679710388184, -13.705793380737305, -12.913907051086426, -12.122020721435547, -11.330134391784668, -10.538248062133789, -9.74636173248291, -8.954475402832031, -8.162589073181152, -7.370702743530273, -6.5788164138793945, -5.786930084228516, -4.995043754577637, -4.203157424926758, -3.411271095275879, -2.619384765625, -1.827498435974121, -1.035614013671875, -0.2437276840209961, 0.5481586456298828, 1.3400449752807617, 2.1319313049316406, 2.9238176345825195, 3.7157039642333984, 4.507590293884277, 5.299476623535156, 6.091362953186035, 6.883249282836914, 7.675135612487793, 8.467021942138672, 9.25890827178955, 10.05079460144043, 10.842680931091309, 11.634567260742188, 12.426453590393066, 13.218339920043945, 14.010226249694824, 14.802112579345703, 15.593998908996582, 16.38588523864746, 17.177772521972656, 17.96965789794922, 18.76154327392578, 19.553430557250977, 20.345317840576172, 21.137203216552734, 21.929088592529297, 22.720975875854492, 23.512863159179688, 24.30474853515625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 3.0, 7.0, 5.0, 6.0, 10.0, 10.0, 12.0, 17.0, 13.0, 19.0, 14.0, 17.0, 21.0, 18.0, 26.0, 23.0, 24.0, 39.0, 39.0, 46.0, 49.0, 40.0, 51.0, 47.0, 42.0, 41.0, 34.0, 34.0, 30.0, 34.0, 32.0, 27.0, 20.0, 23.0, 22.0, 17.0, 16.0, 17.0, 17.0, 4.0, 8.0, 11.0, 3.0, 4.0, 4.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.0078125, -3.873779296875, -3.73974609375, -3.605712890625, -3.4716796875, -3.337646484375, -3.20361328125, -3.069580078125, -2.935546875, -2.801513671875, -2.66748046875, -2.533447265625, -2.3994140625, -2.265380859375, -2.13134765625, -1.997314453125, -1.86328125, -1.729248046875, -1.59521484375, -1.461181640625, -1.3271484375, -1.193115234375, -1.05908203125, -0.925048828125, -0.791015625, -0.656982421875, -0.52294921875, -0.388916015625, -0.2548828125, -0.120849609375, 0.01318359375, 0.147216796875, 0.28125, 0.415283203125, 0.54931640625, 0.683349609375, 0.8173828125, 0.951416015625, 1.08544921875, 1.219482421875, 1.353515625, 1.487548828125, 1.62158203125, 1.755615234375, 1.8896484375, 2.023681640625, 2.15771484375, 2.291748046875, 2.42578125, 2.559814453125, 2.69384765625, 2.827880859375, 2.9619140625, 3.095947265625, 3.22998046875, 3.364013671875, 3.498046875, 3.632080078125, 3.76611328125, 3.900146484375, 4.0341796875, 4.168212890625, 4.30224609375, 4.436279296875, 4.5703125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 6.0, 5.0, 8.0, 5.0, 10.0, 8.0, 14.0, 18.0, 26.0, 37.0, 40.0, 65.0, 114.0, 180.0, 349.0, 854.0, 3003.0, 23423.0, 317797.0, 2213932.0, 1476141.0, 143437.0, 11528.0, 1891.0, 614.0, 279.0, 135.0, 89.0, 65.0, 40.0, 22.0, 20.0, 29.0, 17.0, 19.0, 9.0, 7.0, 7.0, 4.0, 6.0, 5.0, 5.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.734375, -9.46282958984375, -9.1912841796875, -8.91973876953125, -8.648193359375, -8.37664794921875, -8.1051025390625, -7.83355712890625, -7.56201171875, -7.29046630859375, -7.0189208984375, -6.74737548828125, -6.475830078125, -6.20428466796875, -5.9327392578125, -5.66119384765625, -5.3896484375, -5.11810302734375, -4.8465576171875, -4.57501220703125, -4.303466796875, -4.03192138671875, -3.7603759765625, -3.48883056640625, -3.21728515625, -2.94573974609375, -2.6741943359375, -2.40264892578125, -2.131103515625, -1.85955810546875, -1.5880126953125, -1.31646728515625, -1.044921875, -0.77337646484375, -0.5018310546875, -0.23028564453125, 0.041259765625, 0.31280517578125, 0.5843505859375, 0.85589599609375, 1.12744140625, 1.39898681640625, 1.6705322265625, 1.94207763671875, 2.213623046875, 2.48516845703125, 2.7567138671875, 3.02825927734375, 3.2998046875, 3.57135009765625, 3.8428955078125, 4.11444091796875, 4.385986328125, 4.65753173828125, 4.9290771484375, 5.20062255859375, 5.47216796875, 5.74371337890625, 6.0152587890625, 6.28680419921875, 6.558349609375, 6.82989501953125, 7.1014404296875, 7.37298583984375, 7.64453125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 1.0, 7.0, 5.0, 9.0, 12.0, 16.0, 26.0, 36.0, 58.0, 68.0, 89.0, 143.0, 193.0, 311.0, 387.0, 521.0, 501.0, 453.0, 372.0, 262.0, 187.0, 139.0, 79.0, 57.0, 44.0, 27.0, 20.0, 17.0, 8.0, 6.0, 5.0, 4.0, 2.0, 4.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.81640625, -7.6064453125, -7.396484375, -7.1865234375, -6.9765625, -6.7666015625, -6.556640625, -6.3466796875, -6.13671875, -5.9267578125, -5.716796875, -5.5068359375, -5.296875, -5.0869140625, -4.876953125, -4.6669921875, -4.45703125, -4.2470703125, -4.037109375, -3.8271484375, -3.6171875, -3.4072265625, -3.197265625, -2.9873046875, -2.77734375, -2.5673828125, -2.357421875, -2.1474609375, -1.9375, -1.7275390625, -1.517578125, -1.3076171875, -1.09765625, -0.8876953125, -0.677734375, -0.4677734375, -0.2578125, -0.0478515625, 0.162109375, 0.3720703125, 0.58203125, 0.7919921875, 1.001953125, 1.2119140625, 1.421875, 1.6318359375, 1.841796875, 2.0517578125, 2.26171875, 2.4716796875, 2.681640625, 2.8916015625, 3.1015625, 3.3115234375, 3.521484375, 3.7314453125, 3.94140625, 4.1513671875, 4.361328125, 4.5712890625, 4.78125, 4.9912109375, 5.201171875, 5.4111328125, 5.62109375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 15.0, 12.0, 15.0, 20.0, 19.0, 31.0, 52.0, 58.0, 86.0, 148.0, 272.0, 433.0, 831.0, 1994.0, 6699.0, 34452.0, 300883.0, 2794559.0, 952082.0, 82890.0, 12979.0, 3232.0, 1144.0, 512.0, 281.0, 171.0, 129.0, 75.0, 47.0, 33.0, 18.0, 19.0, 20.0, 19.0, 2.0, 14.0, 11.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.6796875, -9.37451171875, -9.0693359375, -8.76416015625, -8.458984375, -8.15380859375, -7.8486328125, -7.54345703125, -7.23828125, -6.93310546875, -6.6279296875, -6.32275390625, -6.017578125, -5.71240234375, -5.4072265625, -5.10205078125, -4.796875, -4.49169921875, -4.1865234375, -3.88134765625, -3.576171875, -3.27099609375, -2.9658203125, -2.66064453125, -2.35546875, -2.05029296875, -1.7451171875, -1.43994140625, -1.134765625, -0.82958984375, -0.5244140625, -0.21923828125, 0.0859375, 0.39111328125, 0.6962890625, 1.00146484375, 1.306640625, 1.61181640625, 1.9169921875, 2.22216796875, 2.52734375, 2.83251953125, 3.1376953125, 3.44287109375, 3.748046875, 4.05322265625, 4.3583984375, 4.66357421875, 4.96875, 5.27392578125, 5.5791015625, 5.88427734375, 6.189453125, 6.49462890625, 6.7998046875, 7.10498046875, 7.41015625, 7.71533203125, 8.0205078125, 8.32568359375, 8.630859375, 8.93603515625, 9.2412109375, 9.54638671875, 9.8515625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 16.0, 49.0, 76.0, 154.0, 205.0, 198.0, 148.0, 95.0, 43.0, 13.0, 9.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-51.798091888427734, -50.645545959472656, -49.49299621582031, -48.34044647216797, -47.18790054321289, -46.03535461425781, -44.88280487060547, -43.730255126953125, -42.57770919799805, -41.42516326904297, -40.272613525390625, -39.12006378173828, -37.9675178527832, -36.814971923828125, -35.66242218017578, -34.50987243652344, -33.35732650756836, -32.20478057861328, -31.052230834960938, -29.899682998657227, -28.747135162353516, -27.594587326049805, -26.442039489746094, -25.289491653442383, -24.136943817138672, -22.98439598083496, -21.83184814453125, -20.67930030822754, -19.526752471923828, -18.374204635620117, -17.221656799316406, -16.069108963012695, -14.916557312011719, -13.764009475708008, -12.611461639404297, -11.458913803100586, -10.306365966796875, -9.153818130493164, -8.001270294189453, -6.848722457885742, -5.696174621582031, -4.54362678527832, -3.3910789489746094, -2.2385311126708984, -1.0859832763671875, 0.06656455993652344, 1.2191123962402344, 2.3716602325439453, 3.5242080688476562, 4.676755905151367, 5.829303741455078, 6.981851577758789, 8.1343994140625, 9.286947250366211, 10.439495086669922, 11.592042922973633, 12.744590759277344, 13.897138595581055, 15.049686431884766, 16.202234268188477, 17.354782104492188, 18.5073299407959, 19.65987777709961, 20.81242561340332, 21.96497344970703]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 5.0, 3.0, 3.0, 3.0, 9.0, 5.0, 10.0, 13.0, 13.0, 10.0, 16.0, 17.0, 22.0, 19.0, 21.0, 43.0, 26.0, 27.0, 35.0, 38.0, 30.0, 32.0, 41.0, 43.0, 31.0, 55.0, 45.0, 30.0, 36.0, 28.0, 32.0, 24.0, 29.0, 22.0, 27.0, 27.0, 20.0, 17.0, 20.0, 14.0, 11.0, 12.0, 13.0, 7.0, 7.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.560039520263672, -16.944480895996094, -16.328920364379883, -15.713360786437988, -15.097801208496094, -14.4822416305542, -13.866682052612305, -13.25112247467041, -12.635562896728516, -12.020003318786621, -11.404443740844727, -10.788884162902832, -10.173324584960938, -9.557765007019043, -8.942205429077148, -8.326645851135254, -7.711086273193359, -7.095526695251465, -6.47996711730957, -5.864407539367676, -5.248847961425781, -4.633288383483887, -4.017728805541992, -3.4021692276000977, -2.786609649658203, -2.1710500717163086, -1.555490493774414, -0.9399309158325195, -0.324371337890625, 0.29118824005126953, 0.9067478179931641, 1.5223073959350586, 2.1378650665283203, 2.753424644470215, 3.3689842224121094, 3.984543800354004, 4.600103378295898, 5.215662956237793, 5.8312225341796875, 6.446782112121582, 7.062341690063477, 7.677901268005371, 8.293460845947266, 8.90902042388916, 9.524580001831055, 10.14013957977295, 10.755699157714844, 11.371258735656738, 11.986818313598633, 12.602377891540527, 13.217937469482422, 13.833497047424316, 14.449056625366211, 15.064616203308105, 15.68017578125, 16.295734405517578, 16.91129493713379, 17.52685546875, 18.142414093017578, 18.757972717285156, 19.373533248901367, 19.989093780517578, 20.604652404785156, 21.220211029052734, 21.835771560668945]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 5.0, 2.0, 8.0, 11.0, 9.0, 7.0, 11.0, 12.0, 16.0, 12.0, 21.0, 22.0, 26.0, 24.0, 21.0, 33.0, 40.0, 35.0, 35.0, 52.0, 45.0, 52.0, 42.0, 44.0, 55.0, 32.0, 31.0, 28.0, 30.0, 33.0, 23.0, 32.0, 27.0, 25.0, 23.0, 14.0, 13.0, 7.0, 11.0, 9.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.958984375, -3.817779541015625, -3.67657470703125, -3.535369873046875, -3.3941650390625, -3.252960205078125, -3.11175537109375, -2.970550537109375, -2.829345703125, -2.688140869140625, -2.54693603515625, -2.405731201171875, -2.2645263671875, -2.123321533203125, -1.98211669921875, -1.840911865234375, -1.69970703125, -1.558502197265625, -1.41729736328125, -1.276092529296875, -1.1348876953125, -0.993682861328125, -0.85247802734375, -0.711273193359375, -0.570068359375, -0.428863525390625, -0.28765869140625, -0.146453857421875, -0.0052490234375, 0.135955810546875, 0.27716064453125, 0.418365478515625, 0.5595703125, 0.700775146484375, 0.84197998046875, 0.983184814453125, 1.1243896484375, 1.265594482421875, 1.40679931640625, 1.548004150390625, 1.689208984375, 1.830413818359375, 1.97161865234375, 2.112823486328125, 2.2540283203125, 2.395233154296875, 2.53643798828125, 2.677642822265625, 2.81884765625, 2.960052490234375, 3.10125732421875, 3.242462158203125, 3.3836669921875, 3.524871826171875, 3.66607666015625, 3.807281494140625, 3.948486328125, 4.089691162109375, 4.23089599609375, 4.372100830078125, 4.5133056640625, 4.654510498046875, 4.79571533203125, 4.936920166015625, 5.078125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 8.0, 13.0, 9.0, 34.0, 37.0, 53.0, 66.0, 104.0, 124.0, 197.0, 284.0, 407.0, 639.0, 980.0, 1485.0, 2391.0, 3576.0, 5662.0, 8590.0, 13762.0, 22120.0, 37738.0, 68805.0, 146387.0, 338385.0, 195465.0, 85335.0, 45172.0, 26877.0, 16042.0, 9828.0, 6109.0, 4041.0, 2577.0, 1662.0, 1168.0, 813.0, 542.0, 361.0, 262.0, 149.0, 113.0, 67.0, 36.0, 31.0, 20.0, 12.0, 6.0, 7.0, 3.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.74951171875, -0.723358154296875, -0.69720458984375, -0.671051025390625, -0.6448974609375, -0.618743896484375, -0.59259033203125, -0.566436767578125, -0.540283203125, -0.514129638671875, -0.48797607421875, -0.461822509765625, -0.4356689453125, -0.409515380859375, -0.38336181640625, -0.357208251953125, -0.3310546875, -0.304901123046875, -0.27874755859375, -0.252593994140625, -0.2264404296875, -0.200286865234375, -0.17413330078125, -0.147979736328125, -0.121826171875, -0.095672607421875, -0.06951904296875, -0.043365478515625, -0.0172119140625, 0.008941650390625, 0.03509521484375, 0.061248779296875, 0.08740234375, 0.113555908203125, 0.13970947265625, 0.165863037109375, 0.1920166015625, 0.218170166015625, 0.24432373046875, 0.270477294921875, 0.296630859375, 0.322784423828125, 0.34893798828125, 0.375091552734375, 0.4012451171875, 0.427398681640625, 0.45355224609375, 0.479705810546875, 0.505859375, 0.532012939453125, 0.55816650390625, 0.584320068359375, 0.6104736328125, 0.636627197265625, 0.66278076171875, 0.688934326171875, 0.715087890625, 0.741241455078125, 0.76739501953125, 0.793548583984375, 0.8197021484375, 0.845855712890625, 0.87200927734375, 0.898162841796875, 0.92431640625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 4.0, 6.0, 3.0, 5.0, 8.0, 14.0, 19.0, 15.0, 14.0, 24.0, 16.0, 28.0, 30.0, 23.0, 29.0, 36.0, 36.0, 39.0, 42.0, 47.0, 35.0, 1059.0, 42.0, 43.0, 42.0, 34.0, 43.0, 28.0, 29.0, 27.0, 32.0, 21.0, 27.0, 19.0, 17.0, 14.0, 10.0, 12.0, 10.0, 9.0, 13.0, 4.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.771484375, -2.683319091796875, -2.59515380859375, -2.506988525390625, -2.4188232421875, -2.330657958984375, -2.24249267578125, -2.154327392578125, -2.066162109375, -1.977996826171875, -1.88983154296875, -1.801666259765625, -1.7135009765625, -1.625335693359375, -1.53717041015625, -1.449005126953125, -1.36083984375, -1.272674560546875, -1.18450927734375, -1.096343994140625, -1.0081787109375, -0.920013427734375, -0.83184814453125, -0.743682861328125, -0.655517578125, -0.567352294921875, -0.47918701171875, -0.391021728515625, -0.3028564453125, -0.214691162109375, -0.12652587890625, -0.038360595703125, 0.0498046875, 0.137969970703125, 0.22613525390625, 0.314300537109375, 0.4024658203125, 0.490631103515625, 0.57879638671875, 0.666961669921875, 0.755126953125, 0.843292236328125, 0.93145751953125, 1.019622802734375, 1.1077880859375, 1.195953369140625, 1.28411865234375, 1.372283935546875, 1.46044921875, 1.548614501953125, 1.63677978515625, 1.724945068359375, 1.8131103515625, 1.901275634765625, 1.98944091796875, 2.077606201171875, 2.165771484375, 2.253936767578125, 2.34210205078125, 2.430267333984375, 2.5184326171875, 2.606597900390625, 2.69476318359375, 2.782928466796875, 2.87109375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 7.0, 7.0, 5.0, 18.0, 25.0, 31.0, 44.0, 71.0, 108.0, 145.0, 173.0, 276.0, 438.0, 538.0, 840.0, 1106.0, 1594.0, 2130.0, 3022.0, 4334.0, 5965.0, 8396.0, 11791.0, 17051.0, 24694.0, 36409.0, 56100.0, 93852.0, 178821.0, 1294533.0, 133273.0, 73839.0, 45952.0, 30884.0, 20708.0, 14551.0, 10255.0, 7274.0, 5114.0, 3603.0, 2629.0, 1942.0, 1343.0, 943.0, 628.0, 486.0, 354.0, 278.0, 167.0, 124.0, 96.0, 61.0, 42.0, 23.0, 18.0, 12.0, 8.0, 4.0, 3.0, 0.0, 6.0], "bins": [-0.61572265625, -0.596649169921875, -0.57757568359375, -0.558502197265625, -0.5394287109375, -0.520355224609375, -0.50128173828125, -0.482208251953125, -0.463134765625, -0.444061279296875, -0.42498779296875, -0.405914306640625, -0.3868408203125, -0.367767333984375, -0.34869384765625, -0.329620361328125, -0.310546875, -0.291473388671875, -0.27239990234375, -0.253326416015625, -0.2342529296875, -0.215179443359375, -0.19610595703125, -0.177032470703125, -0.157958984375, -0.138885498046875, -0.11981201171875, -0.100738525390625, -0.0816650390625, -0.062591552734375, -0.04351806640625, -0.024444580078125, -0.00537109375, 0.013702392578125, 0.03277587890625, 0.051849365234375, 0.0709228515625, 0.089996337890625, 0.10906982421875, 0.128143310546875, 0.147216796875, 0.166290283203125, 0.18536376953125, 0.204437255859375, 0.2235107421875, 0.242584228515625, 0.26165771484375, 0.280731201171875, 0.2998046875, 0.318878173828125, 0.33795166015625, 0.357025146484375, 0.3760986328125, 0.395172119140625, 0.41424560546875, 0.433319091796875, 0.452392578125, 0.471466064453125, 0.49053955078125, 0.509613037109375, 0.5286865234375, 0.547760009765625, 0.56683349609375, 0.585906982421875, 0.60498046875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 5.0, 6.0, 4.0, 10.0, 8.0, 5.0, 8.0, 20.0, 17.0, 24.0, 20.0, 20.0, 32.0, 31.0, 44.0, 45.0, 54.0, 55.0, 62.0, 75.0, 58.0, 66.0, 49.0, 39.0, 44.0, 42.0, 36.0, 22.0, 20.0, 18.0, 12.0, 11.0, 9.0, 7.0, 5.0, 4.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015115737915039062, -0.0001463666558265686, -0.00014157593250274658, -0.00013678520917892456, -0.00013199448585510254, -0.00012720376253128052, -0.0001224130392074585, -0.00011762231588363647, -0.00011283159255981445, -0.00010804086923599243, -0.00010325014591217041, -9.845942258834839e-05, -9.366869926452637e-05, -8.887797594070435e-05, -8.408725261688232e-05, -7.92965292930603e-05, -7.450580596923828e-05, -6.971508264541626e-05, -6.492435932159424e-05, -6.013363599777222e-05, -5.5342912673950195e-05, -5.0552189350128174e-05, -4.576146602630615e-05, -4.097074270248413e-05, -3.618001937866211e-05, -3.138929605484009e-05, -2.6598572731018066e-05, -2.1807849407196045e-05, -1.7017126083374023e-05, -1.2226402759552002e-05, -7.4356794357299805e-06, -2.644956111907959e-06, 2.1457672119140625e-06, 6.936490535736084e-06, 1.1727213859558105e-05, 1.6517937183380127e-05, 2.130866050720215e-05, 2.609938383102417e-05, 3.089010715484619e-05, 3.568083047866821e-05, 4.0471553802490234e-05, 4.5262277126312256e-05, 5.005300045013428e-05, 5.48437237739563e-05, 5.963444709777832e-05, 6.442517042160034e-05, 6.921589374542236e-05, 7.400661706924438e-05, 7.87973403930664e-05, 8.358806371688843e-05, 8.837878704071045e-05, 9.316951036453247e-05, 9.796023368835449e-05, 0.00010275095701217651, 0.00010754168033599854, 0.00011233240365982056, 0.00011712312698364258, 0.0001219138503074646, 0.00012670457363128662, 0.00013149529695510864, 0.00013628602027893066, 0.00014107674360275269, 0.0001458674669265747, 0.00015065819025039673, 0.00015544891357421875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 7.0, 7.0, 12.0, 7.0, 9.0, 21.0, 18.0, 33.0, 30.0, 53.0, 63.0, 104.0, 114.0, 202.0, 276.0, 526.0, 1109.0, 119431.0, 922748.0, 1920.0, 683.0, 350.0, 230.0, 137.0, 86.0, 86.0, 60.0, 42.0, 45.0, 31.0, 24.0, 10.0, 19.0, 12.0, 13.0, 6.0, 7.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.003078460693359375, -0.002985656261444092, -0.0028928518295288086, -0.0028000473976135254, -0.002707242965698242, -0.002614438533782959, -0.0025216341018676758, -0.0024288296699523926, -0.0023360252380371094, -0.002243220806121826, -0.002150416374206543, -0.0020576119422912598, -0.0019648075103759766, -0.0018720030784606934, -0.0017791986465454102, -0.001686394214630127, -0.0015935897827148438, -0.0015007853507995605, -0.0014079809188842773, -0.0013151764869689941, -0.001222372055053711, -0.0011295676231384277, -0.0010367631912231445, -0.0009439587593078613, -0.0008511543273925781, -0.0007583498954772949, -0.0006655454635620117, -0.0005727410316467285, -0.0004799365997314453, -0.0003871321678161621, -0.0002943277359008789, -0.0002015233039855957, -0.0001087188720703125, -1.5914440155029297e-05, 7.68899917602539e-05, 0.0001696944236755371, 0.0002624988555908203, 0.0003553032875061035, 0.0004481077194213867, 0.0005409121513366699, 0.0006337165832519531, 0.0007265210151672363, 0.0008193254470825195, 0.0009121298789978027, 0.001004934310913086, 0.0010977387428283691, 0.0011905431747436523, 0.0012833476066589355, 0.0013761520385742188, 0.001468956470489502, 0.0015617609024047852, 0.0016545653343200684, 0.0017473697662353516, 0.0018401741981506348, 0.001932978630065918, 0.002025783061981201, 0.0021185874938964844, 0.0022113919258117676, 0.0023041963577270508, 0.002397000789642334, 0.002489805221557617, 0.0025826096534729004, 0.0026754140853881836, 0.002768218517303467, 0.00286102294921875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 43.0, 173.0, 395.0, 281.0, 103.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014769290282856673, -0.0001383087655995041, -0.00012892464292235672, -0.00011954050569329411, -0.00011015638301614672, -0.0001007722457870841, -9.13881158339791e-05, -8.20039858808741e-05, -7.26198559277691e-05, -6.323572597466409e-05, -5.385159602155909e-05, -4.446746243047528e-05, -3.508333247737028e-05, -2.5699202524265274e-05, -1.6315068933181465e-05, -6.930938980076462e-06, 2.4531909730285406e-06, 1.1837321835628245e-05, 2.122145269822795e-05, 3.0605584470322356e-05, 3.998971442342736e-05, 4.937384437653236e-05, 5.875797796761617e-05, 6.814210792072117e-05, 7.752623787382618e-05, 8.691036782693118e-05, 9.629449778003618e-05, 0.00010567862773314118, 0.0001150627649622038, 0.0001244468876393512, 0.0001338310248684138, 0.0001432151475455612, 0.00015259927022270858, 0.0001619834074517712, 0.0001713675301289186, 0.0001807516673579812, 0.0001901357900351286, 0.0001995199272641912, 0.00020890406449325383, 0.00021828818717040122, 0.0002276723098475486, 0.00023705644707661122, 0.00024644058430567384, 0.0002558247069828212, 0.0002652088296599686, 0.000274592952337116, 0.00028397710411809385, 0.00029336122679524124, 0.0003027453785762191, 0.00031212950125336647, 0.0003215136530343443, 0.0003308977757114917, 0.0003402818983886391, 0.0003496660210657865, 0.0003590501728467643, 0.0003684342955239117, 0.0003778184182010591, 0.0003872025408782065, 0.00039658669265918434, 0.0004059708153363317, 0.0004153549380134791, 0.0004247390606906265, 0.00043412321247160435, 0.00044350733514875174, 0.0004528914578258991]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 16.0, 10.0, 11.0, 14.0, 17.0, 11.0, 23.0, 22.0, 25.0, 22.0, 27.0, 26.0, 36.0, 51.0, 40.0, 42.0, 49.0, 41.0, 44.0, 38.0, 36.0, 35.0, 33.0, 34.0, 35.0, 42.0, 36.0, 24.0, 32.0, 27.0, 18.0, 16.0, 16.0, 6.0, 6.0, 11.0, 13.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.143352508544922e-05, -8.877180516719818e-05, -8.611008524894714e-05, -8.34483653306961e-05, -8.078664541244507e-05, -7.812492549419403e-05, -7.546320557594299e-05, -7.280148565769196e-05, -7.013976573944092e-05, -6.747804582118988e-05, -6.481632590293884e-05, -6.21546059846878e-05, -5.949288606643677e-05, -5.683116614818573e-05, -5.416944622993469e-05, -5.1507726311683655e-05, -4.884600639343262e-05, -4.618428647518158e-05, -4.352256655693054e-05, -4.0860846638679504e-05, -3.819912672042847e-05, -3.553740680217743e-05, -3.287568688392639e-05, -3.0213966965675354e-05, -2.7552247047424316e-05, -2.489052712917328e-05, -2.222880721092224e-05, -1.9567087292671204e-05, -1.6905367374420166e-05, -1.4243647456169128e-05, -1.158192753791809e-05, -8.920207619667053e-06, -6.258487701416016e-06, -3.596767783164978e-06, -9.350478649139404e-07, 1.7266720533370972e-06, 4.388391971588135e-06, 7.050111889839172e-06, 9.71183180809021e-06, 1.2373551726341248e-05, 1.5035271644592285e-05, 1.7696991562843323e-05, 2.035871148109436e-05, 2.3020431399345398e-05, 2.5682151317596436e-05, 2.8343871235847473e-05, 3.100559115409851e-05, 3.366731107234955e-05, 3.6329030990600586e-05, 3.8990750908851624e-05, 4.165247082710266e-05, 4.43141907453537e-05, 4.6975910663604736e-05, 4.9637630581855774e-05, 5.229935050010681e-05, 5.496107041835785e-05, 5.762279033660889e-05, 6.0284510254859924e-05, 6.294623017311096e-05, 6.5607950091362e-05, 6.826967000961304e-05, 7.093138992786407e-05, 7.359310984611511e-05, 7.625482976436615e-05, 7.891654968261719e-05]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 5.0, 2.0, 8.0, 11.0, 9.0, 7.0, 11.0, 12.0, 16.0, 12.0, 21.0, 22.0, 26.0, 24.0, 21.0, 33.0, 40.0, 35.0, 35.0, 52.0, 45.0, 52.0, 42.0, 44.0, 55.0, 32.0, 31.0, 28.0, 30.0, 33.0, 23.0, 32.0, 27.0, 25.0, 23.0, 14.0, 13.0, 7.0, 11.0, 9.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.958984375, -3.817779541015625, -3.67657470703125, -3.535369873046875, -3.3941650390625, -3.252960205078125, -3.11175537109375, -2.970550537109375, -2.829345703125, -2.688140869140625, -2.54693603515625, -2.405731201171875, -2.2645263671875, -2.123321533203125, -1.98211669921875, -1.840911865234375, -1.69970703125, -1.558502197265625, -1.41729736328125, -1.276092529296875, -1.1348876953125, -0.993682861328125, -0.85247802734375, -0.711273193359375, -0.570068359375, -0.428863525390625, -0.28765869140625, -0.146453857421875, -0.0052490234375, 0.135955810546875, 0.27716064453125, 0.418365478515625, 0.5595703125, 0.700775146484375, 0.84197998046875, 0.983184814453125, 1.1243896484375, 1.265594482421875, 1.40679931640625, 1.548004150390625, 1.689208984375, 1.830413818359375, 1.97161865234375, 2.112823486328125, 2.2540283203125, 2.395233154296875, 2.53643798828125, 2.677642822265625, 2.81884765625, 2.960052490234375, 3.10125732421875, 3.242462158203125, 3.3836669921875, 3.524871826171875, 3.66607666015625, 3.807281494140625, 3.948486328125, 4.089691162109375, 4.23089599609375, 4.372100830078125, 4.5133056640625, 4.654510498046875, 4.79571533203125, 4.936920166015625, 5.078125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 5.0, 5.0, 6.0, 10.0, 17.0, 26.0, 33.0, 33.0, 53.0, 70.0, 112.0, 152.0, 164.0, 228.0, 289.0, 473.0, 762.0, 1406.0, 3040.0, 8072.0, 27515.0, 97773.0, 301902.0, 389639.0, 152294.0, 43365.0, 12243.0, 4185.0, 1858.0, 904.0, 542.0, 357.0, 245.0, 226.0, 145.0, 112.0, 69.0, 57.0, 57.0, 30.0, 22.0, 11.0, 13.0, 12.0, 7.0, 4.0, 7.0, 3.0, 2.0, 2.0, 1.0, 3.0], "bins": [-6.8046875, -6.61126708984375, -6.4178466796875, -6.22442626953125, -6.031005859375, -5.83758544921875, -5.6441650390625, -5.45074462890625, -5.25732421875, -5.06390380859375, -4.8704833984375, -4.67706298828125, -4.483642578125, -4.29022216796875, -4.0968017578125, -3.90338134765625, -3.7099609375, -3.51654052734375, -3.3231201171875, -3.12969970703125, -2.936279296875, -2.74285888671875, -2.5494384765625, -2.35601806640625, -2.16259765625, -1.96917724609375, -1.7757568359375, -1.58233642578125, -1.388916015625, -1.19549560546875, -1.0020751953125, -0.80865478515625, -0.615234375, -0.42181396484375, -0.2283935546875, -0.03497314453125, 0.158447265625, 0.35186767578125, 0.5452880859375, 0.73870849609375, 0.93212890625, 1.12554931640625, 1.3189697265625, 1.51239013671875, 1.705810546875, 1.89923095703125, 2.0926513671875, 2.28607177734375, 2.4794921875, 2.67291259765625, 2.8663330078125, 3.05975341796875, 3.253173828125, 3.44659423828125, 3.6400146484375, 3.83343505859375, 4.02685546875, 4.22027587890625, 4.4136962890625, 4.60711669921875, 4.800537109375, 4.99395751953125, 5.1873779296875, 5.38079833984375, 5.57421875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 7.0, 6.0, 12.0, 11.0, 18.0, 29.0, 25.0, 21.0, 45.0, 40.0, 36.0, 74.0, 92.0, 157.0, 358.0, 1460.0, 173.0, 90.0, 70.0, 53.0, 46.0, 43.0, 35.0, 27.0, 19.0, 23.0, 12.0, 8.0, 12.0, 6.0, 17.0, 5.0, 5.0, 1.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.578125, -13.1263427734375, -12.674560546875, -12.2227783203125, -11.77099609375, -11.3192138671875, -10.867431640625, -10.4156494140625, -9.9638671875, -9.5120849609375, -9.060302734375, -8.6085205078125, -8.15673828125, -7.7049560546875, -7.253173828125, -6.8013916015625, -6.349609375, -5.8978271484375, -5.446044921875, -4.9942626953125, -4.54248046875, -4.0906982421875, -3.638916015625, -3.1871337890625, -2.7353515625, -2.2835693359375, -1.831787109375, -1.3800048828125, -0.92822265625, -0.4764404296875, -0.024658203125, 0.4271240234375, 0.87890625, 1.3306884765625, 1.782470703125, 2.2342529296875, 2.68603515625, 3.1378173828125, 3.589599609375, 4.0413818359375, 4.4931640625, 4.9449462890625, 5.396728515625, 5.8485107421875, 6.30029296875, 6.7520751953125, 7.203857421875, 7.6556396484375, 8.107421875, 8.5592041015625, 9.010986328125, 9.4627685546875, 9.91455078125, 10.3663330078125, 10.818115234375, 11.2698974609375, 11.7216796875, 12.1734619140625, 12.625244140625, 13.0770263671875, 13.52880859375, 13.9805908203125, 14.432373046875, 14.8841552734375, 15.3359375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 2.0, 3.0, 5.0, 6.0, 7.0, 10.0, 12.0, 15.0, 25.0, 27.0, 41.0, 41.0, 93.0, 75.0, 104.0, 146.0, 204.0, 309.0, 434.0, 716.0, 1402.0, 11715.0, 2271148.0, 848604.0, 7320.0, 1223.0, 643.0, 361.0, 269.0, 210.0, 132.0, 123.0, 61.0, 35.0, 42.0, 29.0, 30.0, 24.0, 9.0, 8.0, 8.0, 8.0, 8.0, 9.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-26.03125, -25.306640625, -24.58203125, -23.857421875, -23.1328125, -22.408203125, -21.68359375, -20.958984375, -20.234375, -19.509765625, -18.78515625, -18.060546875, -17.3359375, -16.611328125, -15.88671875, -15.162109375, -14.4375, -13.712890625, -12.98828125, -12.263671875, -11.5390625, -10.814453125, -10.08984375, -9.365234375, -8.640625, -7.916015625, -7.19140625, -6.466796875, -5.7421875, -5.017578125, -4.29296875, -3.568359375, -2.84375, -2.119140625, -1.39453125, -0.669921875, 0.0546875, 0.779296875, 1.50390625, 2.228515625, 2.953125, 3.677734375, 4.40234375, 5.126953125, 5.8515625, 6.576171875, 7.30078125, 8.025390625, 8.75, 9.474609375, 10.19921875, 10.923828125, 11.6484375, 12.373046875, 13.09765625, 13.822265625, 14.546875, 15.271484375, 15.99609375, 16.720703125, 17.4453125, 18.169921875, 18.89453125, 19.619140625, 20.34375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 41.0, 79.0, 191.0, 248.0, 255.0, 125.0, 54.0, 10.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.88557243347168, -22.83837127685547, -21.79117202758789, -20.74397087097168, -19.69676971435547, -18.649568557739258, -17.602367401123047, -16.55516815185547, -15.507966995239258, -14.460765838623047, -13.413565635681152, -12.366365432739258, -11.319164276123047, -10.271963119506836, -9.224762916564941, -8.177562713623047, -7.130361557006836, -6.083160877227783, -5.0359601974487305, -3.9887595176696777, -2.941558837890625, -1.8943581581115723, -0.8471574783325195, 0.2000432014465332, 1.247243881225586, 2.2944445610046387, 3.3416452407836914, 4.388845920562744, 5.436046600341797, 6.48324728012085, 7.530447959899902, 8.577648162841797, 9.624847412109375, 10.672048568725586, 11.71924877166748, 12.766448974609375, 13.813650131225586, 14.860851287841797, 15.908051490783691, 16.955251693725586, 18.002452850341797, 19.049654006958008, 20.09685516357422, 21.144054412841797, 22.191255569458008, 23.23845672607422, 24.285655975341797, 25.332857131958008, 26.38005828857422, 27.42725944519043, 28.47446060180664, 29.52165985107422, 30.56886100769043, 31.61606216430664, 32.66326141357422, 33.71046447753906, 34.75766372680664, 35.80486297607422, 36.85206604003906, 37.89926528930664, 38.94646453857422, 39.99366760253906, 41.04086685180664, 42.088069915771484, 43.13526916503906]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 8.0, 3.0, 7.0, 7.0, 10.0, 10.0, 8.0, 13.0, 17.0, 20.0, 23.0, 23.0, 25.0, 27.0, 25.0, 30.0, 31.0, 40.0, 45.0, 38.0, 39.0, 31.0, 30.0, 35.0, 33.0, 38.0, 27.0, 41.0, 34.0, 31.0, 21.0, 23.0, 20.0, 20.0, 23.0, 16.0, 19.0, 22.0, 8.0, 15.0, 10.0, 11.0, 10.0, 8.0, 6.0, 5.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-21.802602767944336, -21.121204376220703, -20.43980598449707, -19.758407592773438, -19.077009201049805, -18.395610809326172, -17.714214324951172, -17.03281593322754, -16.351417541503906, -15.670019149780273, -14.98862075805664, -14.307222366333008, -13.625824928283691, -12.944426536560059, -12.263028144836426, -11.58163070678711, -10.90023136138916, -10.218832969665527, -9.537434577941895, -8.856037139892578, -8.174638748168945, -7.4932403564453125, -6.81184196472168, -6.130444049835205, -5.449045658111572, -4.7676472663879395, -4.086249351501465, -3.404850959777832, -2.7234528064727783, -2.0420546531677246, -1.3606562614440918, -0.6792583465576172, 0.002140045166015625, 0.6835382580757141, 1.3649364709854126, 2.046334743499756, 2.7277328968048096, 3.4091310501098633, 4.090529441833496, 4.771927356719971, 5.4533257484436035, 6.134724140167236, 6.816122055053711, 7.497520446777344, 8.178918838500977, 8.86031723022461, 9.541715621948242, 10.223113059997559, 10.904511451721191, 11.585909843444824, 12.267308235168457, 12.948705673217773, 13.630104064941406, 14.311502456665039, 14.992900848388672, 15.674299240112305, 16.355697631835938, 17.03709602355957, 17.718494415283203, 18.399892807006836, 19.08129119873047, 19.76268768310547, 20.444087982177734, 21.125484466552734, 21.806882858276367]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 11.0, 4.0, 7.0, 7.0, 1.0, 11.0, 10.0, 10.0, 20.0, 13.0, 14.0, 19.0, 12.0, 19.0, 22.0, 29.0, 25.0, 31.0, 40.0, 39.0, 54.0, 30.0, 37.0, 35.0, 57.0, 38.0, 37.0, 36.0, 28.0, 26.0, 34.0, 33.0, 31.0, 14.0, 33.0, 15.0, 17.0, 18.0, 18.0, 11.0, 14.0, 10.0, 7.0, 6.0, 7.0, 3.0, 5.0, 1.0, 7.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.0078125, -3.874267578125, -3.74072265625, -3.607177734375, -3.4736328125, -3.340087890625, -3.20654296875, -3.072998046875, -2.939453125, -2.805908203125, -2.67236328125, -2.538818359375, -2.4052734375, -2.271728515625, -2.13818359375, -2.004638671875, -1.87109375, -1.737548828125, -1.60400390625, -1.470458984375, -1.3369140625, -1.203369140625, -1.06982421875, -0.936279296875, -0.802734375, -0.669189453125, -0.53564453125, -0.402099609375, -0.2685546875, -0.135009765625, -0.00146484375, 0.132080078125, 0.265625, 0.399169921875, 0.53271484375, 0.666259765625, 0.7998046875, 0.933349609375, 1.06689453125, 1.200439453125, 1.333984375, 1.467529296875, 1.60107421875, 1.734619140625, 1.8681640625, 2.001708984375, 2.13525390625, 2.268798828125, 2.40234375, 2.535888671875, 2.66943359375, 2.802978515625, 2.9365234375, 3.070068359375, 3.20361328125, 3.337158203125, 3.470703125, 3.604248046875, 3.73779296875, 3.871337890625, 4.0048828125, 4.138427734375, 4.27197265625, 4.405517578125, 4.5390625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 3.0, 7.0, 7.0, 7.0, 12.0, 3.0, 8.0, 12.0, 21.0, 26.0, 30.0, 40.0, 43.0, 65.0, 93.0, 115.0, 135.0, 185.0, 280.0, 382.0, 532.0, 4753.0, 4183987.0, 1605.0, 469.0, 369.0, 257.0, 216.0, 149.0, 106.0, 83.0, 70.0, 38.0, 29.0, 26.0, 28.0, 24.0, 15.0, 11.0, 10.0, 7.0, 5.0, 4.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-80.0625, -77.80078125, -75.5390625, -73.27734375, -71.015625, -68.75390625, -66.4921875, -64.23046875, -61.96875, -59.70703125, -57.4453125, -55.18359375, -52.921875, -50.66015625, -48.3984375, -46.13671875, -43.875, -41.61328125, -39.3515625, -37.08984375, -34.828125, -32.56640625, -30.3046875, -28.04296875, -25.78125, -23.51953125, -21.2578125, -18.99609375, -16.734375, -14.47265625, -12.2109375, -9.94921875, -7.6875, -5.42578125, -3.1640625, -0.90234375, 1.359375, 3.62109375, 5.8828125, 8.14453125, 10.40625, 12.66796875, 14.9296875, 17.19140625, 19.453125, 21.71484375, 23.9765625, 26.23828125, 28.5, 30.76171875, 33.0234375, 35.28515625, 37.546875, 39.80859375, 42.0703125, 44.33203125, 46.59375, 48.85546875, 51.1171875, 53.37890625, 55.640625, 57.90234375, 60.1640625, 62.42578125, 64.6875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 7.0, 6.0, 10.0, 11.0, 11.0, 9.0, 22.0, 36.0, 36.0, 52.0, 57.0, 86.0, 118.0, 180.0, 231.0, 352.0, 456.0, 513.0, 487.0, 402.0, 273.0, 214.0, 130.0, 87.0, 69.0, 48.0, 47.0, 26.0, 30.0, 8.0, 13.0, 13.0, 6.0, 4.0, 10.0, 2.0, 4.0, 0.0, 8.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.23046875, -7.021484375, -6.8125, -6.603515625, -6.39453125, -6.185546875, -5.9765625, -5.767578125, -5.55859375, -5.349609375, -5.140625, -4.931640625, -4.72265625, -4.513671875, -4.3046875, -4.095703125, -3.88671875, -3.677734375, -3.46875, -3.259765625, -3.05078125, -2.841796875, -2.6328125, -2.423828125, -2.21484375, -2.005859375, -1.796875, -1.587890625, -1.37890625, -1.169921875, -0.9609375, -0.751953125, -0.54296875, -0.333984375, -0.125, 0.083984375, 0.29296875, 0.501953125, 0.7109375, 0.919921875, 1.12890625, 1.337890625, 1.546875, 1.755859375, 1.96484375, 2.173828125, 2.3828125, 2.591796875, 2.80078125, 3.009765625, 3.21875, 3.427734375, 3.63671875, 3.845703125, 4.0546875, 4.263671875, 4.47265625, 4.681640625, 4.890625, 5.099609375, 5.30859375, 5.517578125, 5.7265625, 5.935546875, 6.14453125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 0.0, 11.0, 7.0, 19.0, 26.0, 31.0, 35.0, 47.0, 63.0, 82.0, 159.0, 603.0, 57261.0, 4132131.0, 3075.0, 334.0, 117.0, 75.0, 44.0, 36.0, 42.0, 24.0, 25.0, 16.0, 7.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-68.4375, -66.7392578125, -65.041015625, -63.3427734375, -61.64453125, -59.9462890625, -58.248046875, -56.5498046875, -54.8515625, -53.1533203125, -51.455078125, -49.7568359375, -48.05859375, -46.3603515625, -44.662109375, -42.9638671875, -41.265625, -39.5673828125, -37.869140625, -36.1708984375, -34.47265625, -32.7744140625, -31.076171875, -29.3779296875, -27.6796875, -25.9814453125, -24.283203125, -22.5849609375, -20.88671875, -19.1884765625, -17.490234375, -15.7919921875, -14.09375, -12.3955078125, -10.697265625, -8.9990234375, -7.30078125, -5.6025390625, -3.904296875, -2.2060546875, -0.5078125, 1.1904296875, 2.888671875, 4.5869140625, 6.28515625, 7.9833984375, 9.681640625, 11.3798828125, 13.078125, 14.7763671875, 16.474609375, 18.1728515625, 19.87109375, 21.5693359375, 23.267578125, 24.9658203125, 26.6640625, 28.3623046875, 30.060546875, 31.7587890625, 33.45703125, 35.1552734375, 36.853515625, 38.5517578125, 40.25]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 33.0, 90.0, 174.0, 269.0, 257.0, 123.0, 41.0, 13.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.711305618286133, -30.176977157592773, -28.642648696899414, -27.108318328857422, -25.573989868164062, -24.039661407470703, -22.505332946777344, -20.971004486083984, -19.436676025390625, -17.902347564697266, -16.368019104003906, -14.83368968963623, -13.299361228942871, -11.765032768249512, -10.230703353881836, -8.696374893188477, -7.162046432495117, -5.627717971801758, -4.09338903427124, -2.5590600967407227, -1.0247316360473633, 0.5095968246459961, 2.043926239013672, 3.5782546997070312, 5.112583160400391, 6.64691162109375, 8.18124008178711, 9.715569496154785, 11.249897956848145, 12.784226417541504, 14.31855583190918, 15.852884292602539, 17.38721466064453, 18.92154312133789, 20.45587158203125, 21.99020004272461, 23.52452850341797, 25.058856964111328, 26.59318733215332, 28.12751579284668, 29.66184425354004, 31.1961727142334, 32.73050308227539, 34.26483154296875, 35.79916000366211, 37.33348846435547, 38.86781692504883, 40.40214538574219, 41.93647384643555, 43.470802307128906, 45.005130767822266, 46.539459228515625, 48.073787689208984, 49.608116149902344, 51.14244842529297, 52.67677307128906, 54.21110534667969, 55.74543380737305, 57.279762268066406, 58.814090728759766, 60.348419189453125, 61.882747650146484, 63.417076110839844, 64.95140838623047, 66.48573303222656]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 8.0, 2.0, 1.0, 7.0, 5.0, 11.0, 14.0, 14.0, 12.0, 13.0, 17.0, 32.0, 18.0, 23.0, 21.0, 37.0, 40.0, 40.0, 43.0, 41.0, 31.0, 44.0, 38.0, 44.0, 38.0, 36.0, 39.0, 33.0, 38.0, 35.0, 30.0, 26.0, 29.0, 24.0, 20.0, 17.0, 19.0, 14.0, 14.0, 6.0, 5.0, 7.0, 2.0, 5.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.36933135986328, -19.69687271118164, -19.024415969848633, -18.351957321166992, -17.679500579833984, -17.007041931152344, -16.334583282470703, -15.662125587463379, -14.989667892456055, -14.31721019744873, -13.644752502441406, -12.972293853759766, -12.299836158752441, -11.627378463745117, -10.954919815063477, -10.282462120056152, -9.610004425048828, -8.937546730041504, -8.26508903503418, -7.592630386352539, -6.920172691345215, -6.247714996337891, -5.575256824493408, -4.902798652648926, -4.230340957641602, -3.5578830242156982, -2.885425090789795, -2.2129671573638916, -1.5405092239379883, -0.868051290512085, -0.19559335708618164, 0.4768648147583008, 1.1493244171142578, 1.8217823505401611, 2.4942402839660645, 3.1666982173919678, 3.839156150817871, 4.511613845825195, 5.184072017669678, 5.85653018951416, 6.528987884521484, 7.201445579528809, 7.873903751373291, 8.546361923217773, 9.218819618225098, 9.891277313232422, 10.563735961914062, 11.236193656921387, 11.908651351928711, 12.581109046936035, 13.25356674194336, 13.926025390625, 14.598483085632324, 15.270940780639648, 15.943399429321289, 16.615856170654297, 17.288314819335938, 17.960773468017578, 18.633230209350586, 19.305688858032227, 19.978145599365234, 20.650604248046875, 21.323062896728516, 21.995521545410156, 22.667978286743164]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 6.0, 5.0, 4.0, 9.0, 12.0, 14.0, 10.0, 15.0, 21.0, 23.0, 28.0, 29.0, 28.0, 41.0, 49.0, 37.0, 41.0, 45.0, 49.0, 48.0, 56.0, 45.0, 43.0, 37.0, 27.0, 28.0, 40.0, 28.0, 23.0, 24.0, 35.0, 23.0, 18.0, 8.0, 11.0, 20.0, 7.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.73046875, -4.5816650390625, -4.432861328125, -4.2840576171875, -4.13525390625, -3.9864501953125, -3.837646484375, -3.6888427734375, -3.5400390625, -3.3912353515625, -3.242431640625, -3.0936279296875, -2.94482421875, -2.7960205078125, -2.647216796875, -2.4984130859375, -2.349609375, -2.2008056640625, -2.052001953125, -1.9031982421875, -1.75439453125, -1.6055908203125, -1.456787109375, -1.3079833984375, -1.1591796875, -1.0103759765625, -0.861572265625, -0.7127685546875, -0.56396484375, -0.4151611328125, -0.266357421875, -0.1175537109375, 0.03125, 0.1800537109375, 0.328857421875, 0.4776611328125, 0.62646484375, 0.7752685546875, 0.924072265625, 1.0728759765625, 1.2216796875, 1.3704833984375, 1.519287109375, 1.6680908203125, 1.81689453125, 1.9656982421875, 2.114501953125, 2.2633056640625, 2.412109375, 2.5609130859375, 2.709716796875, 2.8585205078125, 3.00732421875, 3.1561279296875, 3.304931640625, 3.4537353515625, 3.6025390625, 3.7513427734375, 3.900146484375, 4.0489501953125, 4.19775390625, 4.3465576171875, 4.495361328125, 4.6441650390625, 4.79296875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 13.0, 16.0, 20.0, 20.0, 42.0, 61.0, 107.0, 176.0, 287.0, 441.0, 682.0, 1094.0, 1808.0, 2872.0, 4967.0, 8218.0, 14205.0, 24703.0, 45471.0, 88549.0, 211727.0, 355444.0, 140102.0, 65701.0, 34644.0, 19234.0, 11110.0, 6573.0, 3967.0, 2435.0, 1484.0, 880.0, 510.0, 345.0, 229.0, 162.0, 92.0, 52.0, 37.0, 15.0, 20.0, 18.0, 9.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.916015625, -0.8867340087890625, -0.857452392578125, -0.8281707763671875, -0.79888916015625, -0.7696075439453125, -0.740325927734375, -0.7110443115234375, -0.6817626953125, -0.6524810791015625, -0.623199462890625, -0.5939178466796875, -0.56463623046875, -0.5353546142578125, -0.506072998046875, -0.4767913818359375, -0.447509765625, -0.4182281494140625, -0.388946533203125, -0.3596649169921875, -0.33038330078125, -0.3011016845703125, -0.271820068359375, -0.2425384521484375, -0.2132568359375, -0.1839752197265625, -0.154693603515625, -0.1254119873046875, -0.09613037109375, -0.0668487548828125, -0.037567138671875, -0.0082855224609375, 0.02099609375, 0.0502777099609375, 0.079559326171875, 0.1088409423828125, 0.13812255859375, 0.1674041748046875, 0.196685791015625, 0.2259674072265625, 0.2552490234375, 0.2845306396484375, 0.313812255859375, 0.3430938720703125, 0.37237548828125, 0.4016571044921875, 0.430938720703125, 0.4602203369140625, 0.489501953125, 0.5187835693359375, 0.548065185546875, 0.5773468017578125, 0.60662841796875, 0.6359100341796875, 0.665191650390625, 0.6944732666015625, 0.7237548828125, 0.7530364990234375, 0.782318115234375, 0.8115997314453125, 0.84088134765625, 0.8701629638671875, 0.899444580078125, 0.9287261962890625, 0.9580078125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 8.0, 3.0, 1.0, 5.0, 4.0, 7.0, 9.0, 12.0, 11.0, 13.0, 21.0, 11.0, 15.0, 22.0, 24.0, 17.0, 30.0, 36.0, 29.0, 31.0, 40.0, 19.0, 27.0, 36.0, 35.0, 1063.0, 27.0, 34.0, 47.0, 40.0, 24.0, 23.0, 29.0, 20.0, 32.0, 26.0, 30.0, 26.0, 18.0, 17.0, 12.0, 24.0, 13.0, 7.0, 8.0, 7.0, 9.0, 4.0, 5.0, 5.0, 4.0, 8.0, 2.0, 1.0, 2.0, 2.0], "bins": [-2.453125, -2.380157470703125, -2.30718994140625, -2.234222412109375, -2.1612548828125, -2.088287353515625, -2.01531982421875, -1.942352294921875, -1.869384765625, -1.796417236328125, -1.72344970703125, -1.650482177734375, -1.5775146484375, -1.504547119140625, -1.43157958984375, -1.358612060546875, -1.28564453125, -1.212677001953125, -1.13970947265625, -1.066741943359375, -0.9937744140625, -0.920806884765625, -0.84783935546875, -0.774871826171875, -0.701904296875, -0.628936767578125, -0.55596923828125, -0.483001708984375, -0.4100341796875, -0.337066650390625, -0.26409912109375, -0.191131591796875, -0.1181640625, -0.045196533203125, 0.02777099609375, 0.100738525390625, 0.1737060546875, 0.246673583984375, 0.31964111328125, 0.392608642578125, 0.465576171875, 0.538543701171875, 0.61151123046875, 0.684478759765625, 0.7574462890625, 0.830413818359375, 0.90338134765625, 0.976348876953125, 1.04931640625, 1.122283935546875, 1.19525146484375, 1.268218994140625, 1.3411865234375, 1.414154052734375, 1.48712158203125, 1.560089111328125, 1.633056640625, 1.706024169921875, 1.77899169921875, 1.851959228515625, 1.9249267578125, 1.997894287109375, 2.07086181640625, 2.143829345703125, 2.216796875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 8.0, 8.0, 14.0, 12.0, 25.0, 47.0, 70.0, 103.0, 147.0, 209.0, 294.0, 399.0, 607.0, 792.0, 1069.0, 1427.0, 2007.0, 2809.0, 3647.0, 5212.0, 7164.0, 9896.0, 13937.0, 19318.0, 28089.0, 40646.0, 60953.0, 98211.0, 185831.0, 1271084.0, 118985.0, 70079.0, 45654.0, 31314.0, 21984.0, 15521.0, 10995.0, 7936.0, 5678.0, 4133.0, 2934.0, 2211.0, 1576.0, 1152.0, 789.0, 616.0, 443.0, 286.0, 237.0, 180.0, 110.0, 88.0, 70.0, 48.0, 38.0, 17.0, 15.0, 10.0, 6.0, 3.0, 2.0], "bins": [-0.541015625, -0.5241928100585938, -0.5073699951171875, -0.49054718017578125, -0.473724365234375, -0.45690155029296875, -0.4400787353515625, -0.42325592041015625, -0.40643310546875, -0.38961029052734375, -0.3727874755859375, -0.35596466064453125, -0.339141845703125, -0.32231903076171875, -0.3054962158203125, -0.28867340087890625, -0.2718505859375, -0.25502777099609375, -0.2382049560546875, -0.22138214111328125, -0.204559326171875, -0.18773651123046875, -0.1709136962890625, -0.15409088134765625, -0.13726806640625, -0.12044525146484375, -0.1036224365234375, -0.08679962158203125, -0.069976806640625, -0.05315399169921875, -0.0363311767578125, -0.01950836181640625, -0.002685546875, 0.01413726806640625, 0.0309600830078125, 0.04778289794921875, 0.064605712890625, 0.08142852783203125, 0.0982513427734375, 0.11507415771484375, 0.13189697265625, 0.14871978759765625, 0.1655426025390625, 0.18236541748046875, 0.199188232421875, 0.21601104736328125, 0.2328338623046875, 0.24965667724609375, 0.2664794921875, 0.28330230712890625, 0.3001251220703125, 0.31694793701171875, 0.333770751953125, 0.35059356689453125, 0.3674163818359375, 0.38423919677734375, 0.40106201171875, 0.41788482666015625, 0.4347076416015625, 0.45153045654296875, 0.468353271484375, 0.48517608642578125, 0.5019989013671875, 0.5188217163085938, 0.53564453125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 4.0, 11.0, 8.0, 14.0, 14.0, 11.0, 18.0, 27.0, 43.0, 44.0, 52.0, 42.0, 69.0, 70.0, 54.0, 68.0, 60.0, 66.0, 54.0, 49.0, 42.0, 49.0, 33.0, 19.0, 15.0, 18.0, 8.0, 8.0, 7.0, 2.0, 6.0, 2.0, 3.0, 3.0, 0.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013589859008789062, -0.00013083219528198242, -0.00012576580047607422, -0.00012069940567016602, -0.00011563301086425781, -0.00011056661605834961, -0.0001055002212524414, -0.0001004338264465332, -9.5367431640625e-05, -9.03010368347168e-05, -8.52346420288086e-05, -8.016824722290039e-05, -7.510185241699219e-05, -7.003545761108398e-05, -6.496906280517578e-05, -5.990266799926758e-05, -5.4836273193359375e-05, -4.976987838745117e-05, -4.470348358154297e-05, -3.9637088775634766e-05, -3.457069396972656e-05, -2.950429916381836e-05, -2.4437904357910156e-05, -1.9371509552001953e-05, -1.430511474609375e-05, -9.238719940185547e-06, -4.172325134277344e-06, 8.940696716308594e-07, 5.9604644775390625e-06, 1.1026859283447266e-05, 1.609325408935547e-05, 2.1159648895263672e-05, 2.6226043701171875e-05, 3.129243850708008e-05, 3.635883331298828e-05, 4.1425228118896484e-05, 4.649162292480469e-05, 5.155801773071289e-05, 5.6624412536621094e-05, 6.16908073425293e-05, 6.67572021484375e-05, 7.18235969543457e-05, 7.68899917602539e-05, 8.195638656616211e-05, 8.702278137207031e-05, 9.208917617797852e-05, 9.715557098388672e-05, 0.00010222196578979492, 0.00010728836059570312, 0.00011235475540161133, 0.00011742115020751953, 0.00012248754501342773, 0.00012755393981933594, 0.00013262033462524414, 0.00013768672943115234, 0.00014275312423706055, 0.00014781951904296875, 0.00015288591384887695, 0.00015795230865478516, 0.00016301870346069336, 0.00016808509826660156, 0.00017315149307250977, 0.00017821788787841797, 0.00018328428268432617, 0.00018835067749023438]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 7.0, 6.0, 8.0, 11.0, 7.0, 10.0, 8.0, 17.0, 15.0, 27.0, 29.0, 36.0, 67.0, 97.0, 128.0, 195.0, 258.0, 432.0, 774.0, 1519.0, 472519.0, 568710.0, 1632.0, 766.0, 413.0, 274.0, 195.0, 104.0, 75.0, 54.0, 37.0, 30.0, 30.0, 21.0, 11.0, 10.0, 11.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030765533447265625, -0.0029861032962799072, -0.002895653247833252, -0.0028052031993865967, -0.0027147531509399414, -0.002624303102493286, -0.002533853054046631, -0.0024434030055999756, -0.0023529529571533203, -0.002262502908706665, -0.0021720528602600098, -0.0020816028118133545, -0.0019911527633666992, -0.001900702714920044, -0.0018102526664733887, -0.0017198026180267334, -0.0016293525695800781, -0.0015389025211334229, -0.0014484524726867676, -0.0013580024242401123, -0.001267552375793457, -0.0011771023273468018, -0.0010866522789001465, -0.0009962022304534912, -0.0009057521820068359, -0.0008153021335601807, -0.0007248520851135254, -0.0006344020366668701, -0.0005439519882202148, -0.00045350193977355957, -0.0003630518913269043, -0.000272601842880249, -0.00018215179443359375, -9.170174598693848e-05, -1.2516975402832031e-06, 8.919835090637207e-05, 0.00017964839935302734, 0.0002700984477996826, 0.0003605484962463379, 0.00045099854469299316, 0.0005414485931396484, 0.0006318986415863037, 0.000722348690032959, 0.0008127987384796143, 0.0009032487869262695, 0.0009936988353729248, 0.00108414888381958, 0.0011745989322662354, 0.0012650489807128906, 0.001355499029159546, 0.0014459490776062012, 0.0015363991260528564, 0.0016268491744995117, 0.001717299222946167, 0.0018077492713928223, 0.0018981993198394775, 0.001988649368286133, 0.002079099416732788, 0.0021695494651794434, 0.0022599995136260986, 0.002350449562072754, 0.002440899610519409, 0.0025313496589660645, 0.0026217997074127197, 0.002712249755859375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 8.0, 25.0, 100.0, 281.0, 348.0, 175.0, 59.0, 14.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003797558892983943, -0.00037220411468297243, -0.00036465234006755054, -0.00035710056545212865, -0.00034954879083670676, -0.00034199701622128487, -0.000334445241605863, -0.0003268934669904411, -0.0003193416923750192, -0.0003117899177595973, -0.0003042381431441754, -0.0002966863685287535, -0.00028913459391333163, -0.00028158281929790974, -0.00027403104468248785, -0.00026647927006706595, -0.0002589275245554745, -0.00025137574994005263, -0.00024382397532463074, -0.00023627220070920885, -0.00022872042609378695, -0.00022116865147836506, -0.00021361687686294317, -0.00020606510224752128, -0.0001985133276320994, -0.0001909615530166775, -0.0001834097784012556, -0.00017585800378583372, -0.00016830622917041183, -0.00016075445455498993, -0.00015320267993956804, -0.00014565090532414615, -0.0001380991452606395, -0.0001305473706452176, -0.0001229955960297957, -0.00011544382141437382, -0.00010789204679895192, -0.00010034027218353003, -9.278850484406576e-05, -8.523673022864386e-05, -7.768495561322197e-05, -7.013318099780008e-05, -6.258140638237819e-05, -5.502963540493511e-05, -4.7477860789513215e-05, -3.9926086174091324e-05, -3.237431519664824e-05, -2.482254058122635e-05, -1.7270765965804458e-05, -9.718992259877268e-06, -2.1672185539500788e-06, 5.384554242482409e-06, 1.29363288579043e-05, 2.048810347332619e-05, 2.8039874450769275e-05, 3.559164906619117e-05, 4.314342368161306e-05, 5.069519829703495e-05, 5.824697291245684e-05, 6.579874025192112e-05, 7.335051486734301e-05, 8.09022894827649e-05, 8.845406409818679e-05, 9.600583871360868e-05, 0.00010355761332903057]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 0.0, 5.0, 6.0, 8.0, 2.0, 6.0, 11.0, 12.0, 12.0, 22.0, 21.0, 24.0, 28.0, 28.0, 32.0, 27.0, 46.0, 37.0, 42.0, 48.0, 41.0, 49.0, 40.0, 38.0, 51.0, 39.0, 41.0, 46.0, 39.0, 34.0, 38.0, 22.0, 26.0, 19.0, 11.0, 10.0, 13.0, 4.0, 7.0, 8.0, 2.0, 5.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.176399230957031e-05, -6.916001439094543e-05, -6.655603647232056e-05, -6.395205855369568e-05, -6.13480806350708e-05, -5.874410271644592e-05, -5.6140124797821045e-05, -5.353614687919617e-05, -5.093216896057129e-05, -4.832819104194641e-05, -4.572421312332153e-05, -4.3120235204696655e-05, -4.051625728607178e-05, -3.79122793674469e-05, -3.530830144882202e-05, -3.2704323530197144e-05, -3.0100345611572266e-05, -2.7496367692947388e-05, -2.489238977432251e-05, -2.2288411855697632e-05, -1.9684433937072754e-05, -1.7080456018447876e-05, -1.4476478099822998e-05, -1.187250018119812e-05, -9.268522262573242e-06, -6.664544343948364e-06, -4.060566425323486e-06, -1.4565885066986084e-06, 1.1473894119262695e-06, 3.7513673305511475e-06, 6.355345249176025e-06, 8.959323167800903e-06, 1.1563301086425781e-05, 1.416727900505066e-05, 1.6771256923675537e-05, 1.9375234842300415e-05, 2.1979212760925293e-05, 2.458319067955017e-05, 2.718716859817505e-05, 2.9791146516799927e-05, 3.2395124435424805e-05, 3.499910235404968e-05, 3.760308027267456e-05, 4.020705819129944e-05, 4.2811036109924316e-05, 4.5415014028549194e-05, 4.801899194717407e-05, 5.062296986579895e-05, 5.322694778442383e-05, 5.5830925703048706e-05, 5.8434903621673584e-05, 6.103888154029846e-05, 6.364285945892334e-05, 6.624683737754822e-05, 6.88508152961731e-05, 7.145479321479797e-05, 7.405877113342285e-05, 7.666274905204773e-05, 7.926672697067261e-05, 8.187070488929749e-05, 8.447468280792236e-05, 8.707866072654724e-05, 8.968263864517212e-05, 9.2286616563797e-05, 9.489059448242188e-05]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 6.0, 5.0, 4.0, 9.0, 12.0, 14.0, 10.0, 15.0, 21.0, 23.0, 28.0, 29.0, 28.0, 41.0, 49.0, 37.0, 41.0, 45.0, 49.0, 48.0, 56.0, 45.0, 43.0, 37.0, 27.0, 28.0, 40.0, 28.0, 23.0, 24.0, 35.0, 23.0, 18.0, 8.0, 11.0, 20.0, 7.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.73046875, -4.5816650390625, -4.432861328125, -4.2840576171875, -4.13525390625, -3.9864501953125, -3.837646484375, -3.6888427734375, -3.5400390625, -3.3912353515625, -3.242431640625, -3.0936279296875, -2.94482421875, -2.7960205078125, -2.647216796875, -2.4984130859375, -2.349609375, -2.2008056640625, -2.052001953125, -1.9031982421875, -1.75439453125, -1.6055908203125, -1.456787109375, -1.3079833984375, -1.1591796875, -1.0103759765625, -0.861572265625, -0.7127685546875, -0.56396484375, -0.4151611328125, -0.266357421875, -0.1175537109375, 0.03125, 0.1800537109375, 0.328857421875, 0.4776611328125, 0.62646484375, 0.7752685546875, 0.924072265625, 1.0728759765625, 1.2216796875, 1.3704833984375, 1.519287109375, 1.6680908203125, 1.81689453125, 1.9656982421875, 2.114501953125, 2.2633056640625, 2.412109375, 2.5609130859375, 2.709716796875, 2.8585205078125, 3.00732421875, 3.1561279296875, 3.304931640625, 3.4537353515625, 3.6025390625, 3.7513427734375, 3.900146484375, 4.0489501953125, 4.19775390625, 4.3465576171875, 4.495361328125, 4.6441650390625, 4.79296875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 12.0, 16.0, 19.0, 19.0, 18.0, 26.0, 43.0, 62.0, 68.0, 90.0, 122.0, 179.0, 239.0, 318.0, 472.0, 610.0, 846.0, 1183.0, 1632.0, 3414.0, 18014.0, 152932.0, 598307.0, 230494.0, 28526.0, 4403.0, 1937.0, 1221.0, 888.0, 654.0, 446.0, 360.0, 257.0, 190.0, 135.0, 95.0, 99.0, 58.0, 47.0, 23.0, 25.0, 15.0, 12.0, 12.0, 10.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.4609375, -9.1707763671875, -8.880615234375, -8.5904541015625, -8.30029296875, -8.0101318359375, -7.719970703125, -7.4298095703125, -7.1396484375, -6.8494873046875, -6.559326171875, -6.2691650390625, -5.97900390625, -5.6888427734375, -5.398681640625, -5.1085205078125, -4.818359375, -4.5281982421875, -4.238037109375, -3.9478759765625, -3.65771484375, -3.3675537109375, -3.077392578125, -2.7872314453125, -2.4970703125, -2.2069091796875, -1.916748046875, -1.6265869140625, -1.33642578125, -1.0462646484375, -0.756103515625, -0.4659423828125, -0.17578125, 0.1143798828125, 0.404541015625, 0.6947021484375, 0.98486328125, 1.2750244140625, 1.565185546875, 1.8553466796875, 2.1455078125, 2.4356689453125, 2.725830078125, 3.0159912109375, 3.30615234375, 3.5963134765625, 3.886474609375, 4.1766357421875, 4.466796875, 4.7569580078125, 5.047119140625, 5.3372802734375, 5.62744140625, 5.9176025390625, 6.207763671875, 6.4979248046875, 6.7880859375, 7.0782470703125, 7.368408203125, 7.6585693359375, 7.94873046875, 8.2388916015625, 8.529052734375, 8.8192138671875, 9.109375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 9.0, 9.0, 10.0, 11.0, 12.0, 25.0, 16.0, 17.0, 19.0, 25.0, 26.0, 35.0, 46.0, 48.0, 43.0, 45.0, 73.0, 188.0, 1437.0, 354.0, 169.0, 81.0, 54.0, 60.0, 32.0, 29.0, 28.0, 17.0, 11.0, 22.0, 17.0, 16.0, 9.0, 14.0, 11.0, 4.0, 4.0, 3.0, 5.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0], "bins": [-11.2890625, -10.9656982421875, -10.642333984375, -10.3189697265625, -9.99560546875, -9.6722412109375, -9.348876953125, -9.0255126953125, -8.7021484375, -8.3787841796875, -8.055419921875, -7.7320556640625, -7.40869140625, -7.0853271484375, -6.761962890625, -6.4385986328125, -6.115234375, -5.7918701171875, -5.468505859375, -5.1451416015625, -4.82177734375, -4.4984130859375, -4.175048828125, -3.8516845703125, -3.5283203125, -3.2049560546875, -2.881591796875, -2.5582275390625, -2.23486328125, -1.9114990234375, -1.588134765625, -1.2647705078125, -0.94140625, -0.6180419921875, -0.294677734375, 0.0286865234375, 0.35205078125, 0.6754150390625, 0.998779296875, 1.3221435546875, 1.6455078125, 1.9688720703125, 2.292236328125, 2.6156005859375, 2.93896484375, 3.2623291015625, 3.585693359375, 3.9090576171875, 4.232421875, 4.5557861328125, 4.879150390625, 5.2025146484375, 5.52587890625, 5.8492431640625, 6.172607421875, 6.4959716796875, 6.8193359375, 7.1427001953125, 7.466064453125, 7.7894287109375, 8.11279296875, 8.4361572265625, 8.759521484375, 9.0828857421875, 9.40625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 6.0, 4.0, 9.0, 5.0, 14.0, 19.0, 30.0, 34.0, 55.0, 63.0, 98.0, 131.0, 209.0, 354.0, 569.0, 1210.0, 10126.0, 3127372.0, 2985.0, 980.0, 458.0, 301.0, 194.0, 121.0, 98.0, 59.0, 58.0, 32.0, 16.0, 27.0, 9.0, 11.0, 9.0, 9.0, 4.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.78125, -49.107421875, -47.43359375, -45.759765625, -44.0859375, -42.412109375, -40.73828125, -39.064453125, -37.390625, -35.716796875, -34.04296875, -32.369140625, -30.6953125, -29.021484375, -27.34765625, -25.673828125, -24.0, -22.326171875, -20.65234375, -18.978515625, -17.3046875, -15.630859375, -13.95703125, -12.283203125, -10.609375, -8.935546875, -7.26171875, -5.587890625, -3.9140625, -2.240234375, -0.56640625, 1.107421875, 2.78125, 4.455078125, 6.12890625, 7.802734375, 9.4765625, 11.150390625, 12.82421875, 14.498046875, 16.171875, 17.845703125, 19.51953125, 21.193359375, 22.8671875, 24.541015625, 26.21484375, 27.888671875, 29.5625, 31.236328125, 32.91015625, 34.583984375, 36.2578125, 37.931640625, 39.60546875, 41.279296875, 42.953125, 44.626953125, 46.30078125, 47.974609375, 49.6484375, 51.322265625, 52.99609375, 54.669921875, 56.34375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 11.0, 18.0, 61.0, 138.0, 180.0, 224.0, 186.0, 109.0, 52.0, 17.0, 8.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.63885498046875, -28.664894104003906, -27.690933227539062, -26.71697425842285, -25.743013381958008, -24.769052505493164, -23.795093536376953, -22.82113265991211, -21.847171783447266, -20.873210906982422, -19.899250030517578, -18.925291061401367, -17.951330184936523, -16.97736930847168, -16.00341033935547, -15.029449462890625, -14.055488586425781, -13.081527709960938, -12.10756778717041, -11.133607864379883, -10.159646987915039, -9.185686111450195, -8.211726188659668, -7.237765789031982, -6.263805389404297, -5.289844989776611, -4.315884590148926, -3.3419241905212402, -2.3679637908935547, -1.3940033912658691, -0.4200429916381836, 0.553917407989502, 1.5278778076171875, 2.501838207244873, 3.4757986068725586, 4.449759006500244, 5.42371940612793, 6.397679805755615, 7.371640205383301, 8.345600128173828, 9.319561004638672, 10.293521881103516, 11.267481803894043, 12.24144172668457, 13.215402603149414, 14.189363479614258, 15.163323402404785, 16.137283325195312, 17.111244201660156, 18.085205078125, 19.059165954589844, 20.033124923706055, 21.0070858001709, 21.981046676635742, 22.955005645751953, 23.928966522216797, 24.90292739868164, 25.876888275146484, 26.850849151611328, 27.82480812072754, 28.798768997192383, 29.772729873657227, 30.746688842773438, 31.72064971923828, 32.694610595703125]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 10.0, 9.0, 14.0, 16.0, 26.0, 19.0, 24.0, 31.0, 24.0, 28.0, 27.0, 29.0, 37.0, 55.0, 44.0, 46.0, 51.0, 46.0, 50.0, 48.0, 30.0, 49.0, 26.0, 34.0, 31.0, 23.0, 19.0, 19.0, 26.0, 12.0, 15.0, 14.0, 12.0, 3.0, 8.0, 10.0, 5.0, 10.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.97964096069336, -22.160324096679688, -21.341007232666016, -20.521690368652344, -19.702373504638672, -18.883056640625, -18.06374168395996, -17.24442481994629, -16.425107955932617, -15.605791091918945, -14.786474227905273, -13.967158317565918, -13.147841453552246, -12.328524589538574, -11.509208679199219, -10.689891815185547, -9.870574951171875, -9.051258087158203, -8.231941223144531, -7.412625312805176, -6.593308448791504, -5.773991584777832, -4.954675197601318, -4.135358810424805, -3.316041946411133, -2.49672532081604, -1.6774086952209473, -0.8580920696258545, -0.03877544403076172, 0.7805414199829102, 1.5998578071594238, 2.4191741943359375, 3.2384910583496094, 4.057807922363281, 4.877124309539795, 5.696440696716309, 6.5157575607299805, 7.335074424743652, 8.154390335083008, 8.97370719909668, 9.793024063110352, 10.612340927124023, 11.431657791137695, 12.25097370147705, 13.070290565490723, 13.889607429504395, 14.70892333984375, 15.528240203857422, 16.347557067871094, 17.166873931884766, 17.986190795898438, 18.80550765991211, 19.62482452392578, 20.444141387939453, 21.263456344604492, 22.082773208618164, 22.902090072631836, 23.721406936645508, 24.54072380065918, 25.36004066467285, 26.17935562133789, 26.998672485351562, 27.817989349365234, 28.637306213378906, 29.456623077392578]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 0.0, 2.0, 6.0, 4.0, 7.0, 12.0, 12.0, 13.0, 19.0, 11.0, 16.0, 26.0, 28.0, 30.0, 32.0, 40.0, 41.0, 37.0, 34.0, 54.0, 43.0, 41.0, 48.0, 44.0, 42.0, 29.0, 39.0, 31.0, 32.0, 38.0, 30.0, 22.0, 17.0, 24.0, 26.0, 12.0, 19.0, 12.0, 6.0, 14.0, 4.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71875, -4.5714111328125, -4.424072265625, -4.2767333984375, -4.12939453125, -3.9820556640625, -3.834716796875, -3.6873779296875, -3.5400390625, -3.3927001953125, -3.245361328125, -3.0980224609375, -2.95068359375, -2.8033447265625, -2.656005859375, -2.5086669921875, -2.361328125, -2.2139892578125, -2.066650390625, -1.9193115234375, -1.77197265625, -1.6246337890625, -1.477294921875, -1.3299560546875, -1.1826171875, -1.0352783203125, -0.887939453125, -0.7406005859375, -0.59326171875, -0.4459228515625, -0.298583984375, -0.1512451171875, -0.00390625, 0.1434326171875, 0.290771484375, 0.4381103515625, 0.58544921875, 0.7327880859375, 0.880126953125, 1.0274658203125, 1.1748046875, 1.3221435546875, 1.469482421875, 1.6168212890625, 1.76416015625, 1.9114990234375, 2.058837890625, 2.2061767578125, 2.353515625, 2.5008544921875, 2.648193359375, 2.7955322265625, 2.94287109375, 3.0902099609375, 3.237548828125, 3.3848876953125, 3.5322265625, 3.6795654296875, 3.826904296875, 3.9742431640625, 4.12158203125, 4.2689208984375, 4.416259765625, 4.5635986328125, 4.7109375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 3.0, 4.0, 14.0, 13.0, 7.0, 17.0, 24.0, 21.0, 21.0, 44.0, 39.0, 45.0, 60.0, 77.0, 113.0, 155.0, 249.0, 479.0, 924.0, 2442.0, 7143.0, 28631.0, 184307.0, 1103989.0, 2109387.0, 638601.0, 92257.0, 16847.0, 4689.0, 1660.0, 765.0, 384.0, 217.0, 150.0, 113.0, 81.0, 68.0, 48.0, 51.0, 32.0, 23.0, 29.0, 11.0, 15.0, 9.0, 8.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.64453125, -7.4151611328125, -7.185791015625, -6.9564208984375, -6.72705078125, -6.4976806640625, -6.268310546875, -6.0389404296875, -5.8095703125, -5.5802001953125, -5.350830078125, -5.1214599609375, -4.89208984375, -4.6627197265625, -4.433349609375, -4.2039794921875, -3.974609375, -3.7452392578125, -3.515869140625, -3.2864990234375, -3.05712890625, -2.8277587890625, -2.598388671875, -2.3690185546875, -2.1396484375, -1.9102783203125, -1.680908203125, -1.4515380859375, -1.22216796875, -0.9927978515625, -0.763427734375, -0.5340576171875, -0.3046875, -0.0753173828125, 0.154052734375, 0.3834228515625, 0.61279296875, 0.8421630859375, 1.071533203125, 1.3009033203125, 1.5302734375, 1.7596435546875, 1.989013671875, 2.2183837890625, 2.44775390625, 2.6771240234375, 2.906494140625, 3.1358642578125, 3.365234375, 3.5946044921875, 3.823974609375, 4.0533447265625, 4.28271484375, 4.5120849609375, 4.741455078125, 4.9708251953125, 5.2001953125, 5.4295654296875, 5.658935546875, 5.8883056640625, 6.11767578125, 6.3470458984375, 6.576416015625, 6.8057861328125, 7.03515625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 9.0, 6.0, 10.0, 13.0, 22.0, 33.0, 35.0, 43.0, 65.0, 78.0, 75.0, 94.0, 134.0, 174.0, 237.0, 321.0, 391.0, 468.0, 423.0, 352.0, 292.0, 186.0, 147.0, 88.0, 88.0, 57.0, 46.0, 47.0, 33.0, 26.0, 22.0, 14.0, 14.0, 6.0, 4.0, 6.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.91015625, -5.696533203125, -5.48291015625, -5.269287109375, -5.0556640625, -4.842041015625, -4.62841796875, -4.414794921875, -4.201171875, -3.987548828125, -3.77392578125, -3.560302734375, -3.3466796875, -3.133056640625, -2.91943359375, -2.705810546875, -2.4921875, -2.278564453125, -2.06494140625, -1.851318359375, -1.6376953125, -1.424072265625, -1.21044921875, -0.996826171875, -0.783203125, -0.569580078125, -0.35595703125, -0.142333984375, 0.0712890625, 0.284912109375, 0.49853515625, 0.712158203125, 0.92578125, 1.139404296875, 1.35302734375, 1.566650390625, 1.7802734375, 1.993896484375, 2.20751953125, 2.421142578125, 2.634765625, 2.848388671875, 3.06201171875, 3.275634765625, 3.4892578125, 3.702880859375, 3.91650390625, 4.130126953125, 4.34375, 4.557373046875, 4.77099609375, 4.984619140625, 5.1982421875, 5.411865234375, 5.62548828125, 5.839111328125, 6.052734375, 6.266357421875, 6.47998046875, 6.693603515625, 6.9072265625, 7.120849609375, 7.33447265625, 7.548095703125, 7.76171875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 6.0, 7.0, 14.0, 30.0, 37.0, 68.0, 99.0, 175.0, 243.0, 477.0, 900.0, 1992.0, 8836.0, 222658.0, 3645602.0, 297902.0, 10776.0, 2266.0, 959.0, 488.0, 302.0, 153.0, 104.0, 69.0, 43.0, 31.0, 14.0, 14.0, 6.0, 3.0, 6.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.84375, -15.307373046875, -14.77099609375, -14.234619140625, -13.6982421875, -13.161865234375, -12.62548828125, -12.089111328125, -11.552734375, -11.016357421875, -10.47998046875, -9.943603515625, -9.4072265625, -8.870849609375, -8.33447265625, -7.798095703125, -7.26171875, -6.725341796875, -6.18896484375, -5.652587890625, -5.1162109375, -4.579833984375, -4.04345703125, -3.507080078125, -2.970703125, -2.434326171875, -1.89794921875, -1.361572265625, -0.8251953125, -0.288818359375, 0.24755859375, 0.783935546875, 1.3203125, 1.856689453125, 2.39306640625, 2.929443359375, 3.4658203125, 4.002197265625, 4.53857421875, 5.074951171875, 5.611328125, 6.147705078125, 6.68408203125, 7.220458984375, 7.7568359375, 8.293212890625, 8.82958984375, 9.365966796875, 9.90234375, 10.438720703125, 10.97509765625, 11.511474609375, 12.0478515625, 12.584228515625, 13.12060546875, 13.656982421875, 14.193359375, 14.729736328125, 15.26611328125, 15.802490234375, 16.3388671875, 16.875244140625, 17.41162109375, 17.947998046875, 18.484375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 26.0, 199.0, 446.0, 270.0, 64.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.316314697265625, -53.8779182434082, -50.43952178955078, -47.00112533569336, -43.56272888183594, -40.124332427978516, -36.685935974121094, -33.24753952026367, -29.80914306640625, -26.370746612548828, -22.932350158691406, -19.493953704833984, -16.055557250976562, -12.61716079711914, -9.178764343261719, -5.740367889404297, -2.301971435546875, 1.1364250183105469, 4.574821472167969, 8.01321792602539, 11.451614379882812, 14.890010833740234, 18.328407287597656, 21.766803741455078, 25.2052001953125, 28.643596649169922, 32.081993103027344, 35.520389556884766, 38.95878601074219, 42.39718246459961, 45.83557891845703, 49.27397537231445, 52.712371826171875, 56.1507682800293, 59.58916473388672, 63.02756118774414, 66.46595764160156, 69.90435791015625, 73.3427505493164, 76.78114318847656, 80.21954345703125, 83.65794372558594, 87.0963363647461, 90.53472900390625, 93.97312927246094, 97.41152954101562, 100.84992218017578, 104.28831481933594, 107.72671508789062, 111.16511535644531, 114.60350799560547, 118.04190063476562, 121.48030090332031, 124.918701171875, 128.35708618164062, 131.7954864501953, 135.23388671875, 138.6722869873047, 142.11068725585938, 145.549072265625, 148.9874725341797, 152.42587280273438, 155.8642578125, 159.3026580810547, 162.74105834960938]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 2.0, 3.0, 5.0, 7.0, 12.0, 13.0, 10.0, 19.0, 17.0, 19.0, 25.0, 32.0, 31.0, 34.0, 28.0, 33.0, 31.0, 35.0, 41.0, 36.0, 60.0, 52.0, 45.0, 38.0, 30.0, 51.0, 33.0, 32.0, 27.0, 25.0, 25.0, 29.0, 26.0, 17.0, 16.0, 7.0, 9.0, 14.0, 5.0, 3.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.326858520507812, -23.46636390686035, -22.605867385864258, -21.745372772216797, -20.884876251220703, -20.024381637573242, -19.16388702392578, -18.303390502929688, -17.442893981933594, -16.582399368286133, -15.721902847290039, -14.861408233642578, -14.000911712646484, -13.140417098999023, -12.279921531677246, -11.419425964355469, -10.558931350708008, -9.69843578338623, -8.837940216064453, -7.977445125579834, -7.116949558258057, -6.256453990936279, -5.39595890045166, -4.535463333129883, -3.6749677658081055, -2.814472198486328, -1.9539768695831299, -1.0934815406799316, -0.2329859733581543, 0.627509593963623, 1.4880046844482422, 2.3485002517700195, 3.208995819091797, 4.069491386413574, 4.929986953735352, 5.790482044219971, 6.650977611541748, 7.511473178863525, 8.371968269348145, 9.232463836669922, 10.0929594039917, 10.953454971313477, 11.813950538635254, 12.674446105957031, 13.534940719604492, 14.395437240600586, 15.255931854248047, 16.11642837524414, 16.9769229888916, 17.837417602539062, 18.697914123535156, 19.558408737182617, 20.41890525817871, 21.279399871826172, 22.139896392822266, 23.000391006469727, 23.860885620117188, 24.72138023376465, 25.581876754760742, 26.442371368408203, 27.302867889404297, 28.163362503051758, 29.02385711669922, 29.884353637695312, 30.744850158691406]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 2.0, 4.0, 1.0, 7.0, 7.0, 12.0, 8.0, 16.0, 17.0, 19.0, 22.0, 22.0, 28.0, 30.0, 38.0, 28.0, 40.0, 32.0, 44.0, 46.0, 43.0, 46.0, 43.0, 39.0, 41.0, 28.0, 33.0, 39.0, 32.0, 29.0, 34.0, 33.0, 28.0, 24.0, 16.0, 11.0, 8.0, 15.0, 9.0, 12.0, 6.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-3.75, -3.642120361328125, -3.53424072265625, -3.426361083984375, -3.3184814453125, -3.210601806640625, -3.10272216796875, -2.994842529296875, -2.886962890625, -2.779083251953125, -2.67120361328125, -2.563323974609375, -2.4554443359375, -2.347564697265625, -2.23968505859375, -2.131805419921875, -2.02392578125, -1.916046142578125, -1.80816650390625, -1.700286865234375, -1.5924072265625, -1.484527587890625, -1.37664794921875, -1.268768310546875, -1.160888671875, -1.053009033203125, -0.94512939453125, -0.837249755859375, -0.7293701171875, -0.621490478515625, -0.51361083984375, -0.405731201171875, -0.2978515625, -0.189971923828125, -0.08209228515625, 0.025787353515625, 0.1336669921875, 0.241546630859375, 0.34942626953125, 0.457305908203125, 0.565185546875, 0.673065185546875, 0.78094482421875, 0.888824462890625, 0.9967041015625, 1.104583740234375, 1.21246337890625, 1.320343017578125, 1.42822265625, 1.536102294921875, 1.64398193359375, 1.751861572265625, 1.8597412109375, 1.967620849609375, 2.07550048828125, 2.183380126953125, 2.291259765625, 2.399139404296875, 2.50701904296875, 2.614898681640625, 2.7227783203125, 2.830657958984375, 2.93853759765625, 3.046417236328125, 3.154296875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 13.0, 17.0, 12.0, 27.0, 34.0, 54.0, 72.0, 97.0, 140.0, 200.0, 303.0, 390.0, 618.0, 846.0, 1261.0, 1798.0, 2649.0, 4028.0, 5927.0, 9059.0, 13681.0, 20999.0, 32979.0, 52282.0, 87002.0, 162845.0, 273763.0, 152757.0, 82898.0, 49863.0, 31667.0, 20475.0, 13361.0, 8658.0, 5738.0, 3786.0, 2630.0, 1734.0, 1176.0, 870.0, 586.0, 388.0, 251.0, 187.0, 128.0, 91.0, 63.0, 62.0, 40.0, 14.0, 19.0, 11.0, 4.0, 5.0, 4.0, 2.0, 1.0, 3.0], "bins": [-0.53955078125, -0.5229263305664062, -0.5063018798828125, -0.48967742919921875, -0.473052978515625, -0.45642852783203125, -0.4398040771484375, -0.42317962646484375, -0.40655517578125, -0.38993072509765625, -0.3733062744140625, -0.35668182373046875, -0.340057373046875, -0.32343292236328125, -0.3068084716796875, -0.29018402099609375, -0.2735595703125, -0.25693511962890625, -0.2403106689453125, -0.22368621826171875, -0.207061767578125, -0.19043731689453125, -0.1738128662109375, -0.15718841552734375, -0.14056396484375, -0.12393951416015625, -0.1073150634765625, -0.09069061279296875, -0.074066162109375, -0.05744171142578125, -0.0408172607421875, -0.02419281005859375, -0.007568359375, 0.00905609130859375, 0.0256805419921875, 0.04230499267578125, 0.058929443359375, 0.07555389404296875, 0.0921783447265625, 0.10880279541015625, 0.12542724609375, 0.14205169677734375, 0.1586761474609375, 0.17530059814453125, 0.191925048828125, 0.20854949951171875, 0.2251739501953125, 0.24179840087890625, 0.2584228515625, 0.27504730224609375, 0.2916717529296875, 0.30829620361328125, 0.324920654296875, 0.34154510498046875, 0.3581695556640625, 0.37479400634765625, 0.39141845703125, 0.40804290771484375, 0.4246673583984375, 0.44129180908203125, 0.457916259765625, 0.47454071044921875, 0.4911651611328125, 0.5077896118164062, 0.5244140625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 8.0, 6.0, 13.0, 5.0, 10.0, 8.0, 10.0, 16.0, 16.0, 25.0, 13.0, 23.0, 31.0, 26.0, 26.0, 32.0, 35.0, 39.0, 26.0, 47.0, 35.0, 26.0, 1057.0, 37.0, 31.0, 39.0, 27.0, 41.0, 28.0, 28.0, 31.0, 32.0, 22.0, 18.0, 24.0, 21.0, 18.0, 9.0, 19.0, 14.0, 8.0, 12.0, 6.0, 6.0, 6.0, 4.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.8974609375, -1.8379364013671875, -1.778411865234375, -1.7188873291015625, -1.65936279296875, -1.5998382568359375, -1.540313720703125, -1.4807891845703125, -1.4212646484375, -1.3617401123046875, -1.302215576171875, -1.2426910400390625, -1.18316650390625, -1.1236419677734375, -1.064117431640625, -1.0045928955078125, -0.945068359375, -0.8855438232421875, -0.826019287109375, -0.7664947509765625, -0.70697021484375, -0.6474456787109375, -0.587921142578125, -0.5283966064453125, -0.4688720703125, -0.4093475341796875, -0.349822998046875, -0.2902984619140625, -0.23077392578125, -0.1712493896484375, -0.111724853515625, -0.0522003173828125, 0.00732421875, 0.0668487548828125, 0.126373291015625, 0.1858978271484375, 0.24542236328125, 0.3049468994140625, 0.364471435546875, 0.4239959716796875, 0.4835205078125, 0.5430450439453125, 0.602569580078125, 0.6620941162109375, 0.72161865234375, 0.7811431884765625, 0.840667724609375, 0.9001922607421875, 0.959716796875, 1.0192413330078125, 1.078765869140625, 1.1382904052734375, 1.19781494140625, 1.2573394775390625, 1.316864013671875, 1.3763885498046875, 1.4359130859375, 1.4954376220703125, 1.554962158203125, 1.6144866943359375, 1.67401123046875, 1.7335357666015625, 1.793060302734375, 1.8525848388671875, 1.912109375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 6.0, 9.0, 10.0, 10.0, 28.0, 32.0, 56.0, 61.0, 98.0, 129.0, 165.0, 220.0, 311.0, 451.0, 597.0, 867.0, 1146.0, 1628.0, 2249.0, 3137.0, 4200.0, 5771.0, 7903.0, 10796.0, 14930.0, 21391.0, 30365.0, 44537.0, 68000.0, 111024.0, 1249338.0, 194253.0, 108419.0, 66211.0, 43511.0, 30001.0, 20944.0, 14915.0, 10754.0, 7745.0, 5613.0, 4149.0, 3028.0, 2179.0, 1611.0, 1139.0, 887.0, 688.0, 469.0, 365.0, 239.0, 182.0, 112.0, 79.0, 64.0, 37.0, 37.0, 18.0, 15.0, 7.0, 5.0, 2.0, 6.0], "bins": [-0.4130859375, -0.4001655578613281, -0.38724517822265625, -0.3743247985839844, -0.3614044189453125, -0.3484840393066406, -0.33556365966796875, -0.3226432800292969, -0.309722900390625, -0.2968025207519531, -0.28388214111328125, -0.2709617614746094, -0.2580413818359375, -0.24512100219726562, -0.23220062255859375, -0.21928024291992188, -0.20635986328125, -0.19343948364257812, -0.18051910400390625, -0.16759872436523438, -0.1546783447265625, -0.14175796508789062, -0.12883758544921875, -0.11591720581054688, -0.102996826171875, -0.09007644653320312, -0.07715606689453125, -0.06423568725585938, -0.0513153076171875, -0.038394927978515625, -0.02547454833984375, -0.012554168701171875, 0.0003662109375, 0.013286590576171875, 0.02620697021484375, 0.039127349853515625, 0.0520477294921875, 0.06496810913085938, 0.07788848876953125, 0.09080886840820312, 0.103729248046875, 0.11664962768554688, 0.12957000732421875, 0.14249038696289062, 0.1554107666015625, 0.16833114624023438, 0.18125152587890625, 0.19417190551757812, 0.20709228515625, 0.22001266479492188, 0.23293304443359375, 0.24585342407226562, 0.2587738037109375, 0.2716941833496094, 0.28461456298828125, 0.2975349426269531, 0.310455322265625, 0.3233757019042969, 0.33629608154296875, 0.3492164611816406, 0.3621368408203125, 0.3750572204589844, 0.38797760009765625, 0.4008979797363281, 0.413818359375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 5.0, 1.0, 3.0, 8.0, 12.0, 9.0, 18.0, 29.0, 26.0, 25.0, 29.0, 39.0, 38.0, 46.0, 58.0, 64.0, 54.0, 61.0, 70.0, 38.0, 54.0, 42.0, 39.0, 40.0, 35.0, 37.0, 24.0, 13.0, 20.0, 14.0, 17.0, 4.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.28640365600586e-05, -8.961278945207596e-05, -8.636154234409332e-05, -8.311029523611069e-05, -7.985904812812805e-05, -7.660780102014542e-05, -7.335655391216278e-05, -7.010530680418015e-05, -6.685405969619751e-05, -6.360281258821487e-05, -6.035156548023224e-05, -5.71003183722496e-05, -5.384907126426697e-05, -5.059782415628433e-05, -4.73465770483017e-05, -4.409532994031906e-05, -4.0844082832336426e-05, -3.759283572435379e-05, -3.4341588616371155e-05, -3.109034150838852e-05, -2.7839094400405884e-05, -2.4587847292423248e-05, -2.1336600184440613e-05, -1.8085353076457977e-05, -1.4834105968475342e-05, -1.1582858860492706e-05, -8.33161175251007e-06, -5.080364644527435e-06, -1.8291175365447998e-06, 1.4221295714378357e-06, 4.673376679420471e-06, 7.924623787403107e-06, 1.1175870895385742e-05, 1.4427118003368378e-05, 1.7678365111351013e-05, 2.092961221933365e-05, 2.4180859327316284e-05, 2.743210643529892e-05, 3.0683353543281555e-05, 3.393460065126419e-05, 3.7185847759246826e-05, 4.043709486722946e-05, 4.36883419752121e-05, 4.693958908319473e-05, 5.019083619117737e-05, 5.3442083299160004e-05, 5.669333040714264e-05, 5.9944577515125275e-05, 6.319582462310791e-05, 6.644707173109055e-05, 6.969831883907318e-05, 7.294956594705582e-05, 7.620081305503845e-05, 7.945206016302109e-05, 8.270330727100372e-05, 8.595455437898636e-05, 8.9205801486969e-05, 9.245704859495163e-05, 9.570829570293427e-05, 9.89595428109169e-05, 0.00010221078991889954, 0.00010546203702688217, 0.00010871328413486481, 0.00011196453124284744, 0.00011521577835083008]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 1.0, 6.0, 6.0, 5.0, 7.0, 16.0, 11.0, 19.0, 28.0, 26.0, 44.0, 52.0, 65.0, 101.0, 135.0, 179.0, 273.0, 409.0, 677.0, 1531.0, 184699.0, 854589.0, 3281.0, 839.0, 486.0, 311.0, 205.0, 127.0, 117.0, 80.0, 65.0, 41.0, 31.0, 24.0, 15.0, 12.0, 9.0, 7.0, 12.0, 1.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.0023288726806640625, -0.0022678375244140625, -0.0022068023681640625, -0.0021457672119140625, -0.0020847320556640625, -0.0020236968994140625, -0.0019626617431640625, -0.0019016265869140625, -0.0018405914306640625, -0.0017795562744140625, -0.0017185211181640625, -0.0016574859619140625, -0.0015964508056640625, -0.0015354156494140625, -0.0014743804931640625, -0.0014133453369140625, -0.0013523101806640625, -0.0012912750244140625, -0.0012302398681640625, -0.0011692047119140625, -0.0011081695556640625, -0.0010471343994140625, -0.0009860992431640625, -0.0009250640869140625, -0.0008640289306640625, -0.0008029937744140625, -0.0007419586181640625, -0.0006809234619140625, -0.0006198883056640625, -0.0005588531494140625, -0.0004978179931640625, -0.0004367828369140625, -0.0003757476806640625, -0.0003147125244140625, -0.0002536773681640625, -0.0001926422119140625, -0.0001316070556640625, -7.05718994140625e-05, -9.5367431640625e-06, 5.14984130859375e-05, 0.0001125335693359375, 0.0001735687255859375, 0.0002346038818359375, 0.0002956390380859375, 0.0003566741943359375, 0.0004177093505859375, 0.0004787445068359375, 0.0005397796630859375, 0.0006008148193359375, 0.0006618499755859375, 0.0007228851318359375, 0.0007839202880859375, 0.0008449554443359375, 0.0009059906005859375, 0.0009670257568359375, 0.0010280609130859375, 0.0010890960693359375, 0.0011501312255859375, 0.0012111663818359375, 0.0012722015380859375, 0.0013332366943359375, 0.0013942718505859375, 0.0014553070068359375, 0.0015163421630859375, 0.0015773773193359375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 26.0, 76.0, 176.0, 256.0, 246.0, 140.0, 58.0, 16.0, 6.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.349190516630188e-05, -5.8578654716257006e-05, -5.3665404266212136e-05, -4.875215017818846e-05, -4.383889972814359e-05, -3.892564927809872e-05, -3.401239519007504e-05, -2.909914474003017e-05, -2.41858942899853e-05, -1.927264383994043e-05, -1.4359391570906155e-05, -9.446140211366583e-06, -4.5328888518270105e-06, 3.8036159821785986e-07, 5.293613867252134e-06, 1.0206866136286408e-05, 1.5120116586331278e-05, 2.003336703637615e-05, 2.4946619305410422e-05, 2.9859871574444696e-05, 3.477312202448957e-05, 3.968637247453444e-05, 4.4599626562558115e-05, 4.9512877012602985e-05, 5.4426127462647855e-05, 5.9339377912692726e-05, 6.42526283627376e-05, 6.916587881278247e-05, 7.407912926282734e-05, 7.899237971287221e-05, 8.390563743887469e-05, 8.881888788891956e-05, 9.373214561492205e-05, 9.864539606496692e-05, 0.00010355864651501179, 0.00010847189696505666, 0.00011338514741510153, 0.0001182983978651464, 0.00012321164831519127, 0.00012812489876523614, 0.000133038149215281, 0.00013795139966532588, 0.00014286465011537075, 0.00014777790056541562, 0.0001526911510154605, 0.00015760440146550536, 0.00016251765191555023, 0.0001674309023655951, 0.0001723441673675552, 0.00017725741781760007, 0.00018217066826764494, 0.0001870839187176898, 0.00019199716916773468, 0.00019691041961777955, 0.00020182367006782442, 0.00020673693506978452, 0.0002116501855198294, 0.00021656343596987426, 0.00022147668641991913, 0.000226389936869964, 0.00023130318732000887, 0.00023621643777005374, 0.00024112968822009861, 0.0002460429386701435, 0.00025095618912018836]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 2.0, 11.0, 12.0, 14.0, 21.0, 17.0, 18.0, 29.0, 31.0, 19.0, 37.0, 37.0, 32.0, 43.0, 39.0, 50.0, 46.0, 48.0, 42.0, 38.0, 47.0, 40.0, 38.0, 30.0, 34.0, 36.0, 27.0, 26.0, 19.0, 26.0, 12.0, 9.0, 17.0, 11.0, 8.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-6.0558319091796875e-05, -5.88512048125267e-05, -5.714409053325653e-05, -5.543697625398636e-05, -5.3729861974716187e-05, -5.2022747695446014e-05, -5.031563341617584e-05, -4.860851913690567e-05, -4.69014048576355e-05, -4.5194290578365326e-05, -4.3487176299095154e-05, -4.178006201982498e-05, -4.007294774055481e-05, -3.836583346128464e-05, -3.6658719182014465e-05, -3.495160490274429e-05, -3.324449062347412e-05, -3.153737634420395e-05, -2.9830262064933777e-05, -2.8123147785663605e-05, -2.6416033506393433e-05, -2.470891922712326e-05, -2.300180494785309e-05, -2.1294690668582916e-05, -1.9587576389312744e-05, -1.7880462110042572e-05, -1.61733478307724e-05, -1.4466233551502228e-05, -1.2759119272232056e-05, -1.1052004992961884e-05, -9.344890713691711e-06, -7.63777643442154e-06, -5.930662155151367e-06, -4.223547875881195e-06, -2.516433596611023e-06, -8.093193173408508e-07, 8.977949619293213e-07, 2.6049092411994934e-06, 4.3120235204696655e-06, 6.019137799739838e-06, 7.72625207901001e-06, 9.433366358280182e-06, 1.1140480637550354e-05, 1.2847594916820526e-05, 1.4554709196090698e-05, 1.626182347536087e-05, 1.7968937754631042e-05, 1.9676052033901215e-05, 2.1383166313171387e-05, 2.309028059244156e-05, 2.479739487171173e-05, 2.6504509150981903e-05, 2.8211623430252075e-05, 2.9918737709522247e-05, 3.162585198879242e-05, 3.333296626806259e-05, 3.5040080547332764e-05, 3.6747194826602936e-05, 3.845430910587311e-05, 4.016142338514328e-05, 4.186853766441345e-05, 4.3575651943683624e-05, 4.5282766222953796e-05, 4.698988050222397e-05, 4.869699478149414e-05]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 2.0, 4.0, 1.0, 7.0, 7.0, 12.0, 8.0, 16.0, 17.0, 19.0, 22.0, 22.0, 28.0, 30.0, 38.0, 28.0, 40.0, 32.0, 44.0, 46.0, 43.0, 46.0, 43.0, 39.0, 41.0, 28.0, 33.0, 39.0, 32.0, 29.0, 34.0, 33.0, 28.0, 24.0, 16.0, 11.0, 8.0, 15.0, 9.0, 12.0, 6.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-3.75, -3.642120361328125, -3.53424072265625, -3.426361083984375, -3.3184814453125, -3.210601806640625, -3.10272216796875, -2.994842529296875, -2.886962890625, -2.779083251953125, -2.67120361328125, -2.563323974609375, -2.4554443359375, -2.347564697265625, -2.23968505859375, -2.131805419921875, -2.02392578125, -1.916046142578125, -1.80816650390625, -1.700286865234375, -1.5924072265625, -1.484527587890625, -1.37664794921875, -1.268768310546875, -1.160888671875, -1.053009033203125, -0.94512939453125, -0.837249755859375, -0.7293701171875, -0.621490478515625, -0.51361083984375, -0.405731201171875, -0.2978515625, -0.189971923828125, -0.08209228515625, 0.025787353515625, 0.1336669921875, 0.241546630859375, 0.34942626953125, 0.457305908203125, 0.565185546875, 0.673065185546875, 0.78094482421875, 0.888824462890625, 0.9967041015625, 1.104583740234375, 1.21246337890625, 1.320343017578125, 1.42822265625, 1.536102294921875, 1.64398193359375, 1.751861572265625, 1.8597412109375, 1.967620849609375, 2.07550048828125, 2.183380126953125, 2.291259765625, 2.399139404296875, 2.50701904296875, 2.614898681640625, 2.7227783203125, 2.830657958984375, 2.93853759765625, 3.046417236328125, 3.154296875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 8.0, 6.0, 5.0, 9.0, 9.0, 14.0, 19.0, 33.0, 34.0, 62.0, 77.0, 82.0, 128.0, 163.0, 227.0, 302.0, 364.0, 536.0, 718.0, 1019.0, 1341.0, 1891.0, 2771.0, 4779.0, 15921.0, 155685.0, 698751.0, 135045.0, 14263.0, 4526.0, 2775.0, 1932.0, 1316.0, 984.0, 734.0, 530.0, 385.0, 265.0, 238.0, 156.0, 111.0, 85.0, 65.0, 53.0, 43.0, 26.0, 20.0, 19.0, 17.0, 7.0, 7.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.6015625, -8.3282470703125, -8.054931640625, -7.7816162109375, -7.50830078125, -7.2349853515625, -6.961669921875, -6.6883544921875, -6.4150390625, -6.1417236328125, -5.868408203125, -5.5950927734375, -5.32177734375, -5.0484619140625, -4.775146484375, -4.5018310546875, -4.228515625, -3.9552001953125, -3.681884765625, -3.4085693359375, -3.13525390625, -2.8619384765625, -2.588623046875, -2.3153076171875, -2.0419921875, -1.7686767578125, -1.495361328125, -1.2220458984375, -0.94873046875, -0.6754150390625, -0.402099609375, -0.1287841796875, 0.14453125, 0.4178466796875, 0.691162109375, 0.9644775390625, 1.23779296875, 1.5111083984375, 1.784423828125, 2.0577392578125, 2.3310546875, 2.6043701171875, 2.877685546875, 3.1510009765625, 3.42431640625, 3.6976318359375, 3.970947265625, 4.2442626953125, 4.517578125, 4.7908935546875, 5.064208984375, 5.3375244140625, 5.61083984375, 5.8841552734375, 6.157470703125, 6.4307861328125, 6.7041015625, 6.9774169921875, 7.250732421875, 7.5240478515625, 7.79736328125, 8.0706787109375, 8.343994140625, 8.6173095703125, 8.890625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 7.0, 7.0, 9.0, 12.0, 19.0, 15.0, 16.0, 17.0, 32.0, 28.0, 37.0, 56.0, 61.0, 78.0, 119.0, 370.0, 1576.0, 153.0, 85.0, 52.0, 53.0, 41.0, 40.0, 34.0, 29.0, 25.0, 16.0, 11.0, 10.0, 16.0, 4.0, 8.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.859375, -10.510498046875, -10.16162109375, -9.812744140625, -9.4638671875, -9.114990234375, -8.76611328125, -8.417236328125, -8.068359375, -7.719482421875, -7.37060546875, -7.021728515625, -6.6728515625, -6.323974609375, -5.97509765625, -5.626220703125, -5.27734375, -4.928466796875, -4.57958984375, -4.230712890625, -3.8818359375, -3.532958984375, -3.18408203125, -2.835205078125, -2.486328125, -2.137451171875, -1.78857421875, -1.439697265625, -1.0908203125, -0.741943359375, -0.39306640625, -0.044189453125, 0.3046875, 0.653564453125, 1.00244140625, 1.351318359375, 1.7001953125, 2.049072265625, 2.39794921875, 2.746826171875, 3.095703125, 3.444580078125, 3.79345703125, 4.142333984375, 4.4912109375, 4.840087890625, 5.18896484375, 5.537841796875, 5.88671875, 6.235595703125, 6.58447265625, 6.933349609375, 7.2822265625, 7.631103515625, 7.97998046875, 8.328857421875, 8.677734375, 9.026611328125, 9.37548828125, 9.724365234375, 10.0732421875, 10.422119140625, 10.77099609375, 11.119873046875, 11.46875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 4.0, 6.0, 7.0, 10.0, 19.0, 42.0, 33.0, 33.0, 48.0, 72.0, 92.0, 178.0, 222.0, 432.0, 799.0, 2312.0, 249036.0, 2887497.0, 2622.0, 971.0, 425.0, 259.0, 173.0, 100.0, 81.0, 66.0, 47.0, 24.0, 17.0, 16.0, 22.0, 11.0, 5.0, 6.0, 2.0, 3.0, 3.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.375, -39.07568359375, -37.7763671875, -36.47705078125, -35.177734375, -33.87841796875, -32.5791015625, -31.27978515625, -29.98046875, -28.68115234375, -27.3818359375, -26.08251953125, -24.783203125, -23.48388671875, -22.1845703125, -20.88525390625, -19.5859375, -18.28662109375, -16.9873046875, -15.68798828125, -14.388671875, -13.08935546875, -11.7900390625, -10.49072265625, -9.19140625, -7.89208984375, -6.5927734375, -5.29345703125, -3.994140625, -2.69482421875, -1.3955078125, -0.09619140625, 1.203125, 2.50244140625, 3.8017578125, 5.10107421875, 6.400390625, 7.69970703125, 8.9990234375, 10.29833984375, 11.59765625, 12.89697265625, 14.1962890625, 15.49560546875, 16.794921875, 18.09423828125, 19.3935546875, 20.69287109375, 21.9921875, 23.29150390625, 24.5908203125, 25.89013671875, 27.189453125, 28.48876953125, 29.7880859375, 31.08740234375, 32.38671875, 33.68603515625, 34.9853515625, 36.28466796875, 37.583984375, 38.88330078125, 40.1826171875, 41.48193359375, 42.78125]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 24.0, 45.0, 97.0, 208.0, 263.0, 231.0, 86.0, 37.0, 15.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.93561553955078, -46.724857330322266, -45.514095306396484, -44.30333709716797, -43.09257888793945, -41.88181686401367, -40.671058654785156, -39.460296630859375, -38.24953842163086, -37.038780212402344, -35.82801818847656, -34.61725997924805, -33.40650177001953, -32.19573974609375, -30.984981536865234, -29.774221420288086, -28.56346321105957, -27.352703094482422, -26.141944885253906, -24.931184768676758, -23.72042465209961, -22.509666442871094, -21.298906326293945, -20.088146209716797, -18.87738800048828, -17.666627883911133, -16.455869674682617, -15.245109558105469, -14.03434944152832, -12.823590278625488, -11.612831115722656, -10.402070999145508, -9.19131088256836, -7.980551242828369, -6.769791603088379, -5.559032440185547, -4.348272800445557, -3.1375131607055664, -1.9267539978027344, -0.7159938812255859, 0.4947652816772461, 1.7055248022079468, 2.9162843227386475, 4.127043724060059, 5.337803363800049, 6.548563003540039, 7.759322166442871, 8.97008228302002, 10.180841445922852, 11.391600608825684, 12.602360725402832, 13.813119888305664, 15.023880004882812, 16.234638214111328, 17.445398330688477, 18.656158447265625, 19.86691665649414, 21.07767677307129, 22.288434982299805, 23.499195098876953, 24.7099552154541, 25.92071533203125, 27.131473541259766, 28.342233657836914, 29.552993774414062]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 6.0, 4.0, 5.0, 7.0, 16.0, 10.0, 11.0, 9.0, 12.0, 12.0, 11.0, 22.0, 16.0, 16.0, 33.0, 28.0, 30.0, 27.0, 27.0, 34.0, 31.0, 41.0, 29.0, 40.0, 40.0, 37.0, 39.0, 29.0, 25.0, 34.0, 25.0, 29.0, 30.0, 36.0, 31.0, 27.0, 30.0, 19.0, 20.0, 8.0, 20.0, 10.0, 11.0, 7.0, 3.0, 3.0, 5.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.995271682739258, -18.326915740966797, -17.658557891845703, -16.990201950073242, -16.32184600830078, -15.65349006652832, -14.985133171081543, -14.316776275634766, -13.648420333862305, -12.980064392089844, -12.311707496643066, -11.643350601196289, -10.974994659423828, -10.306638717651367, -9.63828182220459, -8.969924926757812, -8.301568984985352, -7.633212566375732, -6.964856147766113, -6.296499729156494, -5.628143310546875, -4.959786891937256, -4.291430473327637, -3.6230740547180176, -2.9547176361083984, -2.2863612174987793, -1.6180047988891602, -0.949648380279541, -0.2812919616699219, 0.38706445693969727, 1.0554208755493164, 1.7237772941589355, 2.392131805419922, 3.060488224029541, 3.72884464263916, 4.397201061248779, 5.065557479858398, 5.733913898468018, 6.402270317077637, 7.070626735687256, 7.738983154296875, 8.407339096069336, 9.075695991516113, 9.74405288696289, 10.412408828735352, 11.080764770507812, 11.74912166595459, 12.417478561401367, 13.085834503173828, 13.754190444946289, 14.422547340393066, 15.090904235839844, 15.759260177612305, 16.427616119384766, 17.09597396850586, 17.76432991027832, 18.43268585205078, 19.101041793823242, 19.769397735595703, 20.437755584716797, 21.106111526489258, 21.77446746826172, 22.442825317382812, 23.111181259155273, 23.779537200927734]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 3.0, 8.0, 6.0, 5.0, 5.0, 6.0, 12.0, 17.0, 18.0, 16.0, 24.0, 18.0, 26.0, 31.0, 23.0, 38.0, 26.0, 37.0, 43.0, 29.0, 41.0, 30.0, 42.0, 42.0, 48.0, 38.0, 32.0, 32.0, 36.0, 38.0, 35.0, 19.0, 23.0, 26.0, 26.0, 19.0, 13.0, 12.0, 17.0, 13.0, 4.0, 6.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.40234375, -3.29425048828125, -3.1861572265625, -3.07806396484375, -2.969970703125, -2.86187744140625, -2.7537841796875, -2.64569091796875, -2.53759765625, -2.42950439453125, -2.3214111328125, -2.21331787109375, -2.105224609375, -1.99713134765625, -1.8890380859375, -1.78094482421875, -1.6728515625, -1.56475830078125, -1.4566650390625, -1.34857177734375, -1.240478515625, -1.13238525390625, -1.0242919921875, -0.91619873046875, -0.80810546875, -0.70001220703125, -0.5919189453125, -0.48382568359375, -0.375732421875, -0.26763916015625, -0.1595458984375, -0.05145263671875, 0.056640625, 0.16473388671875, 0.2728271484375, 0.38092041015625, 0.489013671875, 0.59710693359375, 0.7052001953125, 0.81329345703125, 0.92138671875, 1.02947998046875, 1.1375732421875, 1.24566650390625, 1.353759765625, 1.46185302734375, 1.5699462890625, 1.67803955078125, 1.7861328125, 1.89422607421875, 2.0023193359375, 2.11041259765625, 2.218505859375, 2.32659912109375, 2.4346923828125, 2.54278564453125, 2.65087890625, 2.75897216796875, 2.8670654296875, 2.97515869140625, 3.083251953125, 3.19134521484375, 3.2994384765625, 3.40753173828125, 3.515625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 4.0, 6.0, 10.0, 11.0, 18.0, 13.0, 15.0, 20.0, 29.0, 32.0, 36.0, 44.0, 57.0, 74.0, 92.0, 156.0, 370.0, 1081.0, 3979.0, 26213.0, 529249.0, 3153552.0, 450069.0, 23380.0, 3776.0, 1027.0, 340.0, 148.0, 94.0, 82.0, 65.0, 50.0, 29.0, 28.0, 30.0, 31.0, 16.0, 8.0, 15.0, 7.0, 10.0, 8.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.5390625, -10.2042236328125, -9.869384765625, -9.5345458984375, -9.19970703125, -8.8648681640625, -8.530029296875, -8.1951904296875, -7.8603515625, -7.5255126953125, -7.190673828125, -6.8558349609375, -6.52099609375, -6.1861572265625, -5.851318359375, -5.5164794921875, -5.181640625, -4.8468017578125, -4.511962890625, -4.1771240234375, -3.84228515625, -3.5074462890625, -3.172607421875, -2.8377685546875, -2.5029296875, -2.1680908203125, -1.833251953125, -1.4984130859375, -1.16357421875, -0.8287353515625, -0.493896484375, -0.1590576171875, 0.17578125, 0.5106201171875, 0.845458984375, 1.1802978515625, 1.51513671875, 1.8499755859375, 2.184814453125, 2.5196533203125, 2.8544921875, 3.1893310546875, 3.524169921875, 3.8590087890625, 4.19384765625, 4.5286865234375, 4.863525390625, 5.1983642578125, 5.533203125, 5.8680419921875, 6.202880859375, 6.5377197265625, 6.87255859375, 7.2073974609375, 7.542236328125, 7.8770751953125, 8.2119140625, 8.5467529296875, 8.881591796875, 9.2164306640625, 9.55126953125, 9.8861083984375, 10.220947265625, 10.5557861328125, 10.890625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 10.0, 19.0, 33.0, 148.0, 409.0, 1057.0, 1474.0, 622.0, 193.0, 83.0, 27.0, 9.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.015625, -22.322509765625, -21.62939453125, -20.936279296875, -20.2431640625, -19.550048828125, -18.85693359375, -18.163818359375, -17.470703125, -16.777587890625, -16.08447265625, -15.391357421875, -14.6982421875, -14.005126953125, -13.31201171875, -12.618896484375, -11.92578125, -11.232666015625, -10.53955078125, -9.846435546875, -9.1533203125, -8.460205078125, -7.76708984375, -7.073974609375, -6.380859375, -5.687744140625, -4.99462890625, -4.301513671875, -3.6083984375, -2.915283203125, -2.22216796875, -1.529052734375, -0.8359375, -0.142822265625, 0.55029296875, 1.243408203125, 1.9365234375, 2.629638671875, 3.32275390625, 4.015869140625, 4.708984375, 5.402099609375, 6.09521484375, 6.788330078125, 7.4814453125, 8.174560546875, 8.86767578125, 9.560791015625, 10.25390625, 10.947021484375, 11.64013671875, 12.333251953125, 13.0263671875, 13.719482421875, 14.41259765625, 15.105712890625, 15.798828125, 16.491943359375, 17.18505859375, 17.878173828125, 18.5712890625, 19.264404296875, 19.95751953125, 20.650634765625, 21.34375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 11.0, 16.0, 25.0, 103.0, 313.0, 1417.0, 24152.0, 4161408.0, 5648.0, 842.0, 225.0, 61.0, 22.0, 15.0, 6.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.1875, -43.74560546875, -42.3037109375, -40.86181640625, -39.419921875, -37.97802734375, -36.5361328125, -35.09423828125, -33.65234375, -32.21044921875, -30.7685546875, -29.32666015625, -27.884765625, -26.44287109375, -25.0009765625, -23.55908203125, -22.1171875, -20.67529296875, -19.2333984375, -17.79150390625, -16.349609375, -14.90771484375, -13.4658203125, -12.02392578125, -10.58203125, -9.14013671875, -7.6982421875, -6.25634765625, -4.814453125, -3.37255859375, -1.9306640625, -0.48876953125, 0.953125, 2.39501953125, 3.8369140625, 5.27880859375, 6.720703125, 8.16259765625, 9.6044921875, 11.04638671875, 12.48828125, 13.93017578125, 15.3720703125, 16.81396484375, 18.255859375, 19.69775390625, 21.1396484375, 22.58154296875, 24.0234375, 25.46533203125, 26.9072265625, 28.34912109375, 29.791015625, 31.23291015625, 32.6748046875, 34.11669921875, 35.55859375, 37.00048828125, 38.4423828125, 39.88427734375, 41.326171875, 42.76806640625, 44.2099609375, 45.65185546875, 47.09375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 25.0, 98.0, 249.0, 301.0, 227.0, 90.0, 11.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-75.73889923095703, -73.76427459716797, -71.78964233398438, -69.81501770019531, -67.84038543701172, -65.86576080322266, -63.89113235473633, -61.91650390625, -59.94187545776367, -57.967247009277344, -55.992618560791016, -54.01799011230469, -52.043365478515625, -50.06873321533203, -48.09410858154297, -46.11948013305664, -44.14485168457031, -42.170223236083984, -40.195594787597656, -38.22096633911133, -36.246337890625, -34.27171325683594, -32.29708480834961, -30.32245635986328, -28.347827911376953, -26.373199462890625, -24.398571014404297, -22.4239444732666, -20.449316024780273, -18.474687576293945, -16.50006103515625, -14.525432586669922, -12.550804138183594, -10.576175689697266, -8.601548194885254, -6.626920223236084, -4.652292251586914, -2.677663803100586, -0.7030363082885742, 1.2715911865234375, 3.2462196350097656, 5.2208476066589355, 7.1954755783081055, 9.170103073120117, 11.144731521606445, 13.119359970092773, 15.093987464904785, 17.068614959716797, 19.043243408203125, 21.017871856689453, 22.99250030517578, 24.967126846313477, 26.941755294799805, 28.916383743286133, 30.891010284423828, 32.865638732910156, 34.840267181396484, 36.81489562988281, 38.78952407836914, 40.76415252685547, 42.73877716064453, 44.713409423828125, 46.68803405761719, 48.662662506103516, 50.637290954589844]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 4.0, 2.0, 3.0, 4.0, 6.0, 9.0, 8.0, 7.0, 13.0, 11.0, 15.0, 20.0, 22.0, 18.0, 23.0, 26.0, 29.0, 31.0, 39.0, 32.0, 44.0, 40.0, 34.0, 38.0, 45.0, 39.0, 40.0, 36.0, 34.0, 30.0, 50.0, 26.0, 24.0, 23.0, 31.0, 24.0, 20.0, 22.0, 14.0, 11.0, 8.0, 13.0, 10.0, 8.0, 8.0, 3.0, 3.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.18072509765625, -21.426908493041992, -20.6730899810791, -19.919273376464844, -19.165454864501953, -18.411638259887695, -17.657821655273438, -16.904003143310547, -16.15018653869629, -15.396368980407715, -14.64255142211914, -13.888734817504883, -13.134917259216309, -12.381099700927734, -11.62728214263916, -10.873464584350586, -10.119647026062012, -9.365829467773438, -8.612011909484863, -7.858194828033447, -7.104377746582031, -6.350560188293457, -5.596742630004883, -4.842925548553467, -4.089107990264893, -3.3352906703948975, -2.5814733505249023, -1.8276557922363281, -1.073838472366333, -0.3200211524963379, 0.43379640579223633, 1.1876134872436523, 1.9414310455322266, 2.6952483654022217, 3.449065685272217, 4.202883243560791, 4.956700325012207, 5.710517883300781, 6.4643354415893555, 7.2181525230407715, 7.971970081329346, 8.725787162780762, 9.479604721069336, 10.23342227935791, 10.987239837646484, 11.741056442260742, 12.494874954223633, 13.24869155883789, 14.002509117126465, 14.756326675415039, 15.510144233703613, 16.263961791992188, 17.017778396606445, 17.771595001220703, 18.525413513183594, 19.27923011779785, 20.033048629760742, 20.786865234375, 21.54068374633789, 22.29450035095215, 23.04831886291504, 23.802135467529297, 24.555953979492188, 25.309770584106445, 26.063587188720703]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 10.0, 3.0, 7.0, 5.0, 13.0, 16.0, 13.0, 15.0, 14.0, 28.0, 24.0, 29.0, 28.0, 28.0, 31.0, 41.0, 33.0, 39.0, 46.0, 42.0, 39.0, 52.0, 40.0, 39.0, 36.0, 37.0, 40.0, 45.0, 32.0, 19.0, 18.0, 23.0, 25.0, 15.0, 15.0, 10.0, 9.0, 8.0, 5.0, 10.0, 5.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.62640380859375, -2.5379638671875, -2.44952392578125, -2.361083984375, -2.27264404296875, -2.1842041015625, -2.09576416015625, -2.00732421875, -1.91888427734375, -1.8304443359375, -1.74200439453125, -1.653564453125, -1.56512451171875, -1.4766845703125, -1.38824462890625, -1.2998046875, -1.21136474609375, -1.1229248046875, -1.03448486328125, -0.946044921875, -0.85760498046875, -0.7691650390625, -0.68072509765625, -0.59228515625, -0.50384521484375, -0.4154052734375, -0.32696533203125, -0.238525390625, -0.15008544921875, -0.0616455078125, 0.02679443359375, 0.115234375, 0.20367431640625, 0.2921142578125, 0.38055419921875, 0.468994140625, 0.55743408203125, 0.6458740234375, 0.73431396484375, 0.82275390625, 0.91119384765625, 0.9996337890625, 1.08807373046875, 1.176513671875, 1.26495361328125, 1.3533935546875, 1.44183349609375, 1.5302734375, 1.61871337890625, 1.7071533203125, 1.79559326171875, 1.884033203125, 1.97247314453125, 2.0609130859375, 2.14935302734375, 2.23779296875, 2.32623291015625, 2.4146728515625, 2.50311279296875, 2.591552734375, 2.67999267578125, 2.7684326171875, 2.85687255859375, 2.9453125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 5.0, 4.0, 8.0, 14.0, 19.0, 34.0, 50.0, 85.0, 113.0, 142.0, 244.0, 349.0, 481.0, 759.0, 1043.0, 1478.0, 2217.0, 3054.0, 4492.0, 6541.0, 9466.0, 14099.0, 21297.0, 32713.0, 51102.0, 84628.0, 152448.0, 267379.0, 155269.0, 87134.0, 52010.0, 32948.0, 21476.0, 14252.0, 9725.0, 6584.0, 4666.0, 3179.0, 2149.0, 1536.0, 1031.0, 739.0, 454.0, 384.0, 248.0, 175.0, 104.0, 83.0, 50.0, 31.0, 25.0, 17.0, 16.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.414794921875, -0.4012031555175781, -0.38761138916015625, -0.3740196228027344, -0.3604278564453125, -0.3468360900878906, -0.33324432373046875, -0.3196525573730469, -0.306060791015625, -0.2924690246582031, -0.27887725830078125, -0.2652854919433594, -0.2516937255859375, -0.23810195922851562, -0.22451019287109375, -0.21091842651367188, -0.19732666015625, -0.18373489379882812, -0.17014312744140625, -0.15655136108398438, -0.1429595947265625, -0.12936782836914062, -0.11577606201171875, -0.10218429565429688, -0.088592529296875, -0.07500076293945312, -0.06140899658203125, -0.047817230224609375, -0.0342254638671875, -0.020633697509765625, -0.00704193115234375, 0.006549835205078125, 0.0201416015625, 0.033733367919921875, 0.04732513427734375, 0.060916900634765625, 0.0745086669921875, 0.08810043334960938, 0.10169219970703125, 0.11528396606445312, 0.128875732421875, 0.14246749877929688, 0.15605926513671875, 0.16965103149414062, 0.1832427978515625, 0.19683456420898438, 0.21042633056640625, 0.22401809692382812, 0.23760986328125, 0.2512016296386719, 0.26479339599609375, 0.2783851623535156, 0.2919769287109375, 0.3055686950683594, 0.31916046142578125, 0.3327522277832031, 0.346343994140625, 0.3599357604980469, 0.37352752685546875, 0.3871192932128906, 0.4007110595703125, 0.4143028259277344, 0.42789459228515625, 0.4414863586425781, 0.455078125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 4.0, 10.0, 7.0, 8.0, 8.0, 9.0, 15.0, 16.0, 21.0, 23.0, 20.0, 34.0, 27.0, 35.0, 49.0, 41.0, 43.0, 43.0, 51.0, 48.0, 1067.0, 46.0, 46.0, 51.0, 28.0, 36.0, 40.0, 33.0, 24.0, 17.0, 28.0, 14.0, 15.0, 15.0, 9.0, 16.0, 6.0, 6.0, 4.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.078125, -2.0189208984375, -1.959716796875, -1.9005126953125, -1.84130859375, -1.7821044921875, -1.722900390625, -1.6636962890625, -1.6044921875, -1.5452880859375, -1.486083984375, -1.4268798828125, -1.36767578125, -1.3084716796875, -1.249267578125, -1.1900634765625, -1.130859375, -1.0716552734375, -1.012451171875, -0.9532470703125, -0.89404296875, -0.8348388671875, -0.775634765625, -0.7164306640625, -0.6572265625, -0.5980224609375, -0.538818359375, -0.4796142578125, -0.42041015625, -0.3612060546875, -0.302001953125, -0.2427978515625, -0.18359375, -0.1243896484375, -0.065185546875, -0.0059814453125, 0.05322265625, 0.1124267578125, 0.171630859375, 0.2308349609375, 0.2900390625, 0.3492431640625, 0.408447265625, 0.4676513671875, 0.52685546875, 0.5860595703125, 0.645263671875, 0.7044677734375, 0.763671875, 0.8228759765625, 0.882080078125, 0.9412841796875, 1.00048828125, 1.0596923828125, 1.118896484375, 1.1781005859375, 1.2373046875, 1.2965087890625, 1.355712890625, 1.4149169921875, 1.47412109375, 1.5333251953125, 1.592529296875, 1.6517333984375, 1.7109375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 15.0, 21.0, 31.0, 44.0, 77.0, 108.0, 149.0, 215.0, 301.0, 476.0, 662.0, 1026.0, 1524.0, 2226.0, 3255.0, 4953.0, 7405.0, 10884.0, 16957.0, 26524.0, 43096.0, 74261.0, 146227.0, 1347372.0, 183777.0, 88480.0, 49971.0, 30054.0, 19195.0, 12542.0, 8164.0, 5553.0, 3660.0, 2634.0, 1704.0, 1120.0, 821.0, 523.0, 397.0, 239.0, 172.0, 112.0, 64.0, 44.0, 29.0, 21.0, 11.0, 12.0, 6.0, 10.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.4375, -0.4236717224121094, -0.40984344482421875, -0.3960151672363281, -0.3821868896484375, -0.3683586120605469, -0.35453033447265625, -0.3407020568847656, -0.326873779296875, -0.3130455017089844, -0.29921722412109375, -0.2853889465332031, -0.2715606689453125, -0.2577323913574219, -0.24390411376953125, -0.23007583618164062, -0.21624755859375, -0.20241928100585938, -0.18859100341796875, -0.17476272583007812, -0.1609344482421875, -0.14710617065429688, -0.13327789306640625, -0.11944961547851562, -0.105621337890625, -0.09179306030273438, -0.07796478271484375, -0.06413650512695312, -0.0503082275390625, -0.036479949951171875, -0.02265167236328125, -0.008823394775390625, 0.0050048828125, 0.018833160400390625, 0.03266143798828125, 0.046489715576171875, 0.0603179931640625, 0.07414627075195312, 0.08797454833984375, 0.10180282592773438, 0.115631103515625, 0.12945938110351562, 0.14328765869140625, 0.15711593627929688, 0.1709442138671875, 0.18477249145507812, 0.19860076904296875, 0.21242904663085938, 0.22625732421875, 0.24008560180664062, 0.25391387939453125, 0.2677421569824219, 0.2815704345703125, 0.2953987121582031, 0.30922698974609375, 0.3230552673339844, 0.336883544921875, 0.3507118225097656, 0.36454010009765625, 0.3783683776855469, 0.3921966552734375, 0.4060249328613281, 0.41985321044921875, 0.4336814880371094, 0.447509765625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 5.0, 8.0, 5.0, 9.0, 6.0, 13.0, 9.0, 11.0, 21.0, 32.0, 44.0, 49.0, 62.0, 56.0, 67.0, 67.0, 82.0, 78.0, 61.0, 63.0, 48.0, 50.0, 33.0, 27.0, 24.0, 23.0, 10.0, 6.0, 7.0, 5.0, 8.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010216236114501953, -9.889528155326843e-05, -9.562820196151733e-05, -9.236112236976624e-05, -8.909404277801514e-05, -8.582696318626404e-05, -8.255988359451294e-05, -7.929280400276184e-05, -7.602572441101074e-05, -7.275864481925964e-05, -6.949156522750854e-05, -6.622448563575745e-05, -6.295740604400635e-05, -5.969032645225525e-05, -5.642324686050415e-05, -5.315616726875305e-05, -4.988908767700195e-05, -4.6622008085250854e-05, -4.3354928493499756e-05, -4.008784890174866e-05, -3.682076930999756e-05, -3.355368971824646e-05, -3.028661012649536e-05, -2.7019530534744263e-05, -2.3752450942993164e-05, -2.0485371351242065e-05, -1.7218291759490967e-05, -1.3951212167739868e-05, -1.068413257598877e-05, -7.417052984237671e-06, -4.149973392486572e-06, -8.828938007354736e-07, 2.384185791015625e-06, 5.651265382766724e-06, 8.918344974517822e-06, 1.2185424566268921e-05, 1.545250415802002e-05, 1.8719583749771118e-05, 2.1986663341522217e-05, 2.5253742933273315e-05, 2.8520822525024414e-05, 3.178790211677551e-05, 3.505498170852661e-05, 3.832206130027771e-05, 4.158914089202881e-05, 4.485622048377991e-05, 4.8123300075531006e-05, 5.1390379667282104e-05, 5.46574592590332e-05, 5.79245388507843e-05, 6.11916184425354e-05, 6.44586980342865e-05, 6.77257776260376e-05, 7.09928572177887e-05, 7.42599368095398e-05, 7.75270164012909e-05, 8.079409599304199e-05, 8.406117558479309e-05, 8.732825517654419e-05, 9.059533476829529e-05, 9.386241436004639e-05, 9.712949395179749e-05, 0.00010039657354354858, 0.00010366365313529968, 0.00010693073272705078]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 4.0, 7.0, 3.0, 16.0, 10.0, 15.0, 22.0, 30.0, 35.0, 45.0, 80.0, 102.0, 160.0, 257.0, 453.0, 850.0, 2394.0, 1013478.0, 27970.0, 1150.0, 548.0, 315.0, 198.0, 134.0, 72.0, 44.0, 44.0, 25.0, 16.0, 21.0, 15.0, 11.0, 13.0, 2.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020694732666015625, -0.0020042061805725098, -0.001938939094543457, -0.0018736720085144043, -0.0018084049224853516, -0.0017431378364562988, -0.001677870750427246, -0.0016126036643981934, -0.0015473365783691406, -0.0014820694923400879, -0.0014168024063110352, -0.0013515353202819824, -0.0012862682342529297, -0.001221001148223877, -0.0011557340621948242, -0.0010904669761657715, -0.0010251998901367188, -0.000959932804107666, -0.0008946657180786133, -0.0008293986320495605, -0.0007641315460205078, -0.0006988644599914551, -0.0006335973739624023, -0.0005683302879333496, -0.0005030632019042969, -0.00043779611587524414, -0.0003725290298461914, -0.00030726194381713867, -0.00024199485778808594, -0.0001767277717590332, -0.00011146068572998047, -4.6193599700927734e-05, 1.9073486328125e-05, 8.434057235717773e-05, 0.00014960765838623047, 0.0002148747444152832, 0.00028014183044433594, 0.00034540891647338867, 0.0004106760025024414, 0.00047594308853149414, 0.0005412101745605469, 0.0006064772605895996, 0.0006717443466186523, 0.0007370114326477051, 0.0008022785186767578, 0.0008675456047058105, 0.0009328126907348633, 0.000998079776763916, 0.0010633468627929688, 0.0011286139488220215, 0.0011938810348510742, 0.001259148120880127, 0.0013244152069091797, 0.0013896822929382324, 0.0014549493789672852, 0.0015202164649963379, 0.0015854835510253906, 0.0016507506370544434, 0.001716017723083496, 0.0017812848091125488, 0.0018465518951416016, 0.0019118189811706543, 0.001977086067199707, 0.0020423531532287598, 0.0021076202392578125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 15.0, 488.0, 489.0, 19.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0006496733985841274, -0.000637414981611073, -0.0006251565064303577, -0.0006128980894573033, -0.0006006396724842489, -0.0005883811973035336, -0.0005761227803304791, -0.0005638643633574247, -0.0005516059463843703, -0.0005393475294113159, -0.0005270890542306006, -0.0005148306372575462, -0.0005025722202844918, -0.0004903137451037765, -0.00047805532813072205, -0.00046579691115766764, -0.0004535384359769523, -0.00044127998990006745, -0.00042902157292701304, -0.0004167631268501282, -0.00040450470987707376, -0.0003922462638001889, -0.00037998781772330403, -0.0003677294007502496, -0.00035547095467336476, -0.0003432125085964799, -0.0003309540916234255, -0.0003186956455465406, -0.00030643719946965575, -0.00029417878249660134, -0.0002819203364197165, -0.0002696618903428316, -0.00025740344426594675, -0.0002451449981890619, -0.00023288658121600747, -0.0002206281351391226, -0.00020836970361415297, -0.00019611127208918333, -0.00018385282601229846, -0.00017159439448732883, -0.0001593359629623592, -0.00014707753143738955, -0.00013481909991241992, -0.00012256065383553505, -0.00011030222231056541, -9.804379078559577e-05, -8.578535198466852e-05, -7.352691318374127e-05, -6.126848165877163e-05, -4.901004649582319e-05, -3.6751611332874745e-05, -2.44931761699263e-05, -1.2234741006977856e-05, 2.3690517991781235e-08, 1.2282129318919033e-05, 2.4540568119846284e-05, 3.679899964481592e-05, 4.9057434807764366e-05, 6.131586997071281e-05, 7.357430877164006e-05, 8.58327402966097e-05, 9.809117182157934e-05, 0.00011034961062250659, 0.00012260804942343384, 0.00013486648094840348]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 9.0, 6.0, 11.0, 9.0, 9.0, 20.0, 7.0, 20.0, 25.0, 22.0, 36.0, 30.0, 33.0, 20.0, 48.0, 25.0, 35.0, 38.0, 39.0, 50.0, 49.0, 38.0, 41.0, 37.0, 47.0, 38.0, 39.0, 22.0, 27.0, 31.0, 24.0, 27.0, 18.0, 15.0, 15.0, 11.0, 11.0, 4.0, 3.0, 1.0, 4.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.369020462036133e-05, -4.225224256515503e-05, -4.081428050994873e-05, -3.937631845474243e-05, -3.793835639953613e-05, -3.6500394344329834e-05, -3.5062432289123535e-05, -3.3624470233917236e-05, -3.218650817871094e-05, -3.074854612350464e-05, -2.931058406829834e-05, -2.787262201309204e-05, -2.6434659957885742e-05, -2.4996697902679443e-05, -2.3558735847473145e-05, -2.2120773792266846e-05, -2.0682811737060547e-05, -1.9244849681854248e-05, -1.780688762664795e-05, -1.636892557144165e-05, -1.4930963516235352e-05, -1.3493001461029053e-05, -1.2055039405822754e-05, -1.0617077350616455e-05, -9.179115295410156e-06, -7.741153240203857e-06, -6.303191184997559e-06, -4.86522912979126e-06, -3.427267074584961e-06, -1.989305019378662e-06, -5.513429641723633e-07, 8.866190910339355e-07, 2.3245811462402344e-06, 3.762543201446533e-06, 5.200505256652832e-06, 6.638467311859131e-06, 8.07642936706543e-06, 9.514391422271729e-06, 1.0952353477478027e-05, 1.2390315532684326e-05, 1.3828277587890625e-05, 1.5266239643096924e-05, 1.6704201698303223e-05, 1.814216375350952e-05, 1.958012580871582e-05, 2.101808786392212e-05, 2.2456049919128418e-05, 2.3894011974334717e-05, 2.5331974029541016e-05, 2.6769936084747314e-05, 2.8207898139953613e-05, 2.9645860195159912e-05, 3.108382225036621e-05, 3.252178430557251e-05, 3.395974636077881e-05, 3.539770841598511e-05, 3.6835670471191406e-05, 3.8273632526397705e-05, 3.9711594581604004e-05, 4.11495566368103e-05, 4.25875186920166e-05, 4.40254807472229e-05, 4.54634428024292e-05, 4.69014048576355e-05, 4.83393669128418e-05]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 10.0, 3.0, 7.0, 5.0, 13.0, 16.0, 13.0, 15.0, 14.0, 28.0, 24.0, 29.0, 28.0, 28.0, 31.0, 41.0, 33.0, 39.0, 46.0, 42.0, 39.0, 52.0, 40.0, 39.0, 36.0, 37.0, 40.0, 45.0, 32.0, 19.0, 18.0, 23.0, 25.0, 15.0, 15.0, 10.0, 9.0, 8.0, 5.0, 10.0, 5.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.62640380859375, -2.5379638671875, -2.44952392578125, -2.361083984375, -2.27264404296875, -2.1842041015625, -2.09576416015625, -2.00732421875, -1.91888427734375, -1.8304443359375, -1.74200439453125, -1.653564453125, -1.56512451171875, -1.4766845703125, -1.38824462890625, -1.2998046875, -1.21136474609375, -1.1229248046875, -1.03448486328125, -0.946044921875, -0.85760498046875, -0.7691650390625, -0.68072509765625, -0.59228515625, -0.50384521484375, -0.4154052734375, -0.32696533203125, -0.238525390625, -0.15008544921875, -0.0616455078125, 0.02679443359375, 0.115234375, 0.20367431640625, 0.2921142578125, 0.38055419921875, 0.468994140625, 0.55743408203125, 0.6458740234375, 0.73431396484375, 0.82275390625, 0.91119384765625, 0.9996337890625, 1.08807373046875, 1.176513671875, 1.26495361328125, 1.3533935546875, 1.44183349609375, 1.5302734375, 1.61871337890625, 1.7071533203125, 1.79559326171875, 1.884033203125, 1.97247314453125, 2.0609130859375, 2.14935302734375, 2.23779296875, 2.32623291015625, 2.4146728515625, 2.50311279296875, 2.591552734375, 2.67999267578125, 2.7684326171875, 2.85687255859375, 2.9453125]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 6.0, 4.0, 8.0, 13.0, 17.0, 29.0, 33.0, 44.0, 79.0, 92.0, 122.0, 146.0, 182.0, 265.0, 395.0, 589.0, 952.0, 1611.0, 3097.0, 7088.0, 22185.0, 115969.0, 604598.0, 234183.0, 37133.0, 10169.0, 4086.0, 2049.0, 1138.0, 656.0, 460.0, 317.0, 215.0, 157.0, 113.0, 90.0, 63.0, 49.0, 58.0, 36.0, 15.0, 14.0, 13.0, 8.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.6640625, -5.49072265625, -5.3173828125, -5.14404296875, -4.970703125, -4.79736328125, -4.6240234375, -4.45068359375, -4.27734375, -4.10400390625, -3.9306640625, -3.75732421875, -3.583984375, -3.41064453125, -3.2373046875, -3.06396484375, -2.890625, -2.71728515625, -2.5439453125, -2.37060546875, -2.197265625, -2.02392578125, -1.8505859375, -1.67724609375, -1.50390625, -1.33056640625, -1.1572265625, -0.98388671875, -0.810546875, -0.63720703125, -0.4638671875, -0.29052734375, -0.1171875, 0.05615234375, 0.2294921875, 0.40283203125, 0.576171875, 0.74951171875, 0.9228515625, 1.09619140625, 1.26953125, 1.44287109375, 1.6162109375, 1.78955078125, 1.962890625, 2.13623046875, 2.3095703125, 2.48291015625, 2.65625, 2.82958984375, 3.0029296875, 3.17626953125, 3.349609375, 3.52294921875, 3.6962890625, 3.86962890625, 4.04296875, 4.21630859375, 4.3896484375, 4.56298828125, 4.736328125, 4.90966796875, 5.0830078125, 5.25634765625, 5.4296875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 12.0, 6.0, 11.0, 3.0, 14.0, 18.0, 28.0, 24.0, 40.0, 39.0, 62.0, 62.0, 95.0, 140.0, 394.0, 1517.0, 166.0, 86.0, 60.0, 58.0, 43.0, 34.0, 32.0, 22.0, 22.0, 7.0, 13.0, 9.0, 4.0, 8.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-12.140625, -11.813232421875, -11.48583984375, -11.158447265625, -10.8310546875, -10.503662109375, -10.17626953125, -9.848876953125, -9.521484375, -9.194091796875, -8.86669921875, -8.539306640625, -8.2119140625, -7.884521484375, -7.55712890625, -7.229736328125, -6.90234375, -6.574951171875, -6.24755859375, -5.920166015625, -5.5927734375, -5.265380859375, -4.93798828125, -4.610595703125, -4.283203125, -3.955810546875, -3.62841796875, -3.301025390625, -2.9736328125, -2.646240234375, -2.31884765625, -1.991455078125, -1.6640625, -1.336669921875, -1.00927734375, -0.681884765625, -0.3544921875, -0.027099609375, 0.30029296875, 0.627685546875, 0.955078125, 1.282470703125, 1.60986328125, 1.937255859375, 2.2646484375, 2.592041015625, 2.91943359375, 3.246826171875, 3.57421875, 3.901611328125, 4.22900390625, 4.556396484375, 4.8837890625, 5.211181640625, 5.53857421875, 5.865966796875, 6.193359375, 6.520751953125, 6.84814453125, 7.175537109375, 7.5029296875, 7.830322265625, 8.15771484375, 8.485107421875, 8.8125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 1.0, 8.0, 6.0, 5.0, 15.0, 8.0, 11.0, 24.0, 35.0, 29.0, 64.0, 67.0, 101.0, 132.0, 202.0, 339.0, 778.0, 2494.0, 1414444.0, 1722491.0, 2597.0, 764.0, 371.0, 216.0, 129.0, 117.0, 59.0, 62.0, 31.0, 27.0, 25.0, 13.0, 10.0, 10.0, 11.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.90625, -17.266845703125, -16.62744140625, -15.988037109375, -15.3486328125, -14.709228515625, -14.06982421875, -13.430419921875, -12.791015625, -12.151611328125, -11.51220703125, -10.872802734375, -10.2333984375, -9.593994140625, -8.95458984375, -8.315185546875, -7.67578125, -7.036376953125, -6.39697265625, -5.757568359375, -5.1181640625, -4.478759765625, -3.83935546875, -3.199951171875, -2.560546875, -1.921142578125, -1.28173828125, -0.642333984375, -0.0029296875, 0.636474609375, 1.27587890625, 1.915283203125, 2.5546875, 3.194091796875, 3.83349609375, 4.472900390625, 5.1123046875, 5.751708984375, 6.39111328125, 7.030517578125, 7.669921875, 8.309326171875, 8.94873046875, 9.588134765625, 10.2275390625, 10.866943359375, 11.50634765625, 12.145751953125, 12.78515625, 13.424560546875, 14.06396484375, 14.703369140625, 15.3427734375, 15.982177734375, 16.62158203125, 17.260986328125, 17.900390625, 18.539794921875, 19.17919921875, 19.818603515625, 20.4580078125, 21.097412109375, 21.73681640625, 22.376220703125, 23.015625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 44.0, 489.0, 446.0, 33.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.157018661499023, -27.982383728027344, -25.807750701904297, -23.63311767578125, -21.45848274230957, -19.28384780883789, -17.109214782714844, -14.93458080291748, -12.759946823120117, -10.585312843322754, -8.41067886352539, -6.236044883728027, -4.061410903930664, -1.8867769241333008, 0.2878570556640625, 2.462491035461426, 4.637125015258789, 6.811758995056152, 8.986392974853516, 11.161026954650879, 13.335660934448242, 15.510294914245605, 17.68492889404297, 19.859561920166016, 22.034196853637695, 24.208831787109375, 26.383464813232422, 28.55809783935547, 30.73273277282715, 32.90736770629883, 35.082000732421875, 37.25663375854492, 39.4312744140625, 41.60590744018555, 43.780540466308594, 45.955177307128906, 48.12981033325195, 50.304443359375, 52.47908020019531, 54.65371322631836, 56.828346252441406, 59.00297927856445, 61.1776123046875, 63.35224914550781, 65.52688598632812, 67.7015151977539, 69.87615203857422, 72.05078125, 74.22541809082031, 76.40005493164062, 78.5746841430664, 80.74932098388672, 82.9239501953125, 85.09858703613281, 87.27322387695312, 89.4478530883789, 91.62248992919922, 93.79712677001953, 95.97175598144531, 98.14639282226562, 100.32102966308594, 102.49565887451172, 104.67029571533203, 106.84492492675781, 109.01956176757812]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 8.0, 6.0, 12.0, 9.0, 7.0, 14.0, 11.0, 25.0, 24.0, 25.0, 31.0, 25.0, 26.0, 31.0, 27.0, 36.0, 34.0, 28.0, 28.0, 43.0, 35.0, 41.0, 43.0, 50.0, 37.0, 34.0, 30.0, 26.0, 30.0, 33.0, 25.0, 24.0, 28.0, 17.0, 13.0, 6.0, 17.0, 10.0, 10.0, 9.0, 2.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0], "bins": [-17.1634521484375, -16.640655517578125, -16.11785888671875, -15.595062255859375, -15.072265625, -14.549468994140625, -14.02667236328125, -13.503875732421875, -12.9810791015625, -12.458282470703125, -11.93548583984375, -11.412689208984375, -10.889892578125, -10.367095947265625, -9.84429931640625, -9.321502685546875, -8.798705101013184, -8.275908470153809, -7.753111839294434, -7.230315208435059, -6.707518577575684, -6.184721946716309, -5.661924839019775, -5.1391282081604, -4.616331577301025, -4.09353494644165, -3.5707383155822754, -3.0479414463043213, -2.5251448154449463, -2.0023481845855713, -1.4795513153076172, -0.9567546844482422, -0.4339580535888672, 0.08883863687515259, 0.6116353273391724, 1.134432077407837, 1.657228708267212, 2.180025339126587, 2.702822208404541, 3.225618839263916, 3.748415470123291, 4.271212100982666, 4.794008731842041, 5.316805839538574, 5.839602470397949, 6.362399101257324, 6.885195732116699, 7.407992362976074, 7.930788993835449, 8.453585624694824, 8.9763822555542, 9.499178886413574, 10.02197551727295, 10.544772148132324, 11.067569732666016, 11.59036636352539, 12.113162994384766, 12.63595962524414, 13.158756256103516, 13.68155288696289, 14.204349517822266, 14.72714614868164, 15.249942779541016, 15.77273941040039, 16.295536041259766]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 3.0, 5.0, 6.0, 11.0, 10.0, 10.0, 14.0, 8.0, 13.0, 12.0, 16.0, 19.0, 26.0, 13.0, 30.0, 26.0, 31.0, 31.0, 39.0, 39.0, 38.0, 44.0, 38.0, 38.0, 36.0, 44.0, 34.0, 48.0, 32.0, 21.0, 26.0, 24.0, 26.0, 24.0, 25.0, 27.0, 19.0, 14.0, 18.0, 14.0, 9.0, 8.0, 2.0, 12.0, 7.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8515625, -2.7576904296875, -2.663818359375, -2.5699462890625, -2.47607421875, -2.3822021484375, -2.288330078125, -2.1944580078125, -2.1005859375, -2.0067138671875, -1.912841796875, -1.8189697265625, -1.72509765625, -1.6312255859375, -1.537353515625, -1.4434814453125, -1.349609375, -1.2557373046875, -1.161865234375, -1.0679931640625, -0.97412109375, -0.8802490234375, -0.786376953125, -0.6925048828125, -0.5986328125, -0.5047607421875, -0.410888671875, -0.3170166015625, -0.22314453125, -0.1292724609375, -0.035400390625, 0.0584716796875, 0.15234375, 0.2462158203125, 0.340087890625, 0.4339599609375, 0.52783203125, 0.6217041015625, 0.715576171875, 0.8094482421875, 0.9033203125, 0.9971923828125, 1.091064453125, 1.1849365234375, 1.27880859375, 1.3726806640625, 1.466552734375, 1.5604248046875, 1.654296875, 1.7481689453125, 1.842041015625, 1.9359130859375, 2.02978515625, 2.1236572265625, 2.217529296875, 2.3114013671875, 2.4052734375, 2.4991455078125, 2.593017578125, 2.6868896484375, 2.78076171875, 2.8746337890625, 2.968505859375, 3.0623779296875, 3.15625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 2.0, 9.0, 9.0, 8.0, 9.0, 7.0, 12.0, 15.0, 23.0, 23.0, 43.0, 47.0, 66.0, 78.0, 116.0, 130.0, 212.0, 253.0, 356.0, 593.0, 969.0, 1852.0, 5855.0, 135751.0, 3630405.0, 402897.0, 9023.0, 2229.0, 1074.0, 614.0, 423.0, 317.0, 237.0, 156.0, 108.0, 78.0, 64.0, 47.0, 35.0, 39.0, 14.0, 25.0, 16.0, 8.0, 11.0, 6.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-16.328125, -15.8115234375, -15.294921875, -14.7783203125, -14.26171875, -13.7451171875, -13.228515625, -12.7119140625, -12.1953125, -11.6787109375, -11.162109375, -10.6455078125, -10.12890625, -9.6123046875, -9.095703125, -8.5791015625, -8.0625, -7.5458984375, -7.029296875, -6.5126953125, -5.99609375, -5.4794921875, -4.962890625, -4.4462890625, -3.9296875, -3.4130859375, -2.896484375, -2.3798828125, -1.86328125, -1.3466796875, -0.830078125, -0.3134765625, 0.203125, 0.7197265625, 1.236328125, 1.7529296875, 2.26953125, 2.7861328125, 3.302734375, 3.8193359375, 4.3359375, 4.8525390625, 5.369140625, 5.8857421875, 6.40234375, 6.9189453125, 7.435546875, 7.9521484375, 8.46875, 8.9853515625, 9.501953125, 10.0185546875, 10.53515625, 11.0517578125, 11.568359375, 12.0849609375, 12.6015625, 13.1181640625, 13.634765625, 14.1513671875, 14.66796875, 15.1845703125, 15.701171875, 16.2177734375, 16.734375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 5.0, 6.0, 3.0, 15.0, 37.0, 62.0, 159.0, 396.0, 933.0, 1196.0, 737.0, 309.0, 130.0, 41.0, 22.0, 11.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9453125, -13.5001220703125, -13.054931640625, -12.6097412109375, -12.16455078125, -11.7193603515625, -11.274169921875, -10.8289794921875, -10.3837890625, -9.9385986328125, -9.493408203125, -9.0482177734375, -8.60302734375, -8.1578369140625, -7.712646484375, -7.2674560546875, -6.822265625, -6.3770751953125, -5.931884765625, -5.4866943359375, -5.04150390625, -4.5963134765625, -4.151123046875, -3.7059326171875, -3.2607421875, -2.8155517578125, -2.370361328125, -1.9251708984375, -1.47998046875, -1.0347900390625, -0.589599609375, -0.1444091796875, 0.30078125, 0.7459716796875, 1.191162109375, 1.6363525390625, 2.08154296875, 2.5267333984375, 2.971923828125, 3.4171142578125, 3.8623046875, 4.3074951171875, 4.752685546875, 5.1978759765625, 5.64306640625, 6.0882568359375, 6.533447265625, 6.9786376953125, 7.423828125, 7.8690185546875, 8.314208984375, 8.7593994140625, 9.20458984375, 9.6497802734375, 10.094970703125, 10.5401611328125, 10.9853515625, 11.4305419921875, 11.875732421875, 12.3209228515625, 12.76611328125, 13.2113037109375, 13.656494140625, 14.1016845703125, 14.546875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 2.0, 9.0, 10.0, 29.0, 36.0, 63.0, 70.0, 124.0, 164.0, 290.0, 402.0, 801.0, 1511.0, 3937.0, 14198.0, 118092.0, 2119326.0, 1816272.0, 99516.0, 12480.0, 3510.0, 1501.0, 742.0, 396.0, 274.0, 157.0, 117.0, 76.0, 60.0, 25.0, 24.0, 17.0, 9.0, 7.0, 8.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-9.4375, -9.17510986328125, -8.9127197265625, -8.65032958984375, -8.387939453125, -8.12554931640625, -7.8631591796875, -7.60076904296875, -7.33837890625, -7.07598876953125, -6.8135986328125, -6.55120849609375, -6.288818359375, -6.02642822265625, -5.7640380859375, -5.50164794921875, -5.2392578125, -4.97686767578125, -4.7144775390625, -4.45208740234375, -4.189697265625, -3.92730712890625, -3.6649169921875, -3.40252685546875, -3.14013671875, -2.87774658203125, -2.6153564453125, -2.35296630859375, -2.090576171875, -1.82818603515625, -1.5657958984375, -1.30340576171875, -1.041015625, -0.77862548828125, -0.5162353515625, -0.25384521484375, 0.008544921875, 0.27093505859375, 0.5333251953125, 0.79571533203125, 1.05810546875, 1.32049560546875, 1.5828857421875, 1.84527587890625, 2.107666015625, 2.37005615234375, 2.6324462890625, 2.89483642578125, 3.1572265625, 3.41961669921875, 3.6820068359375, 3.94439697265625, 4.206787109375, 4.46917724609375, 4.7315673828125, 4.99395751953125, 5.25634765625, 5.51873779296875, 5.7811279296875, 6.04351806640625, 6.305908203125, 6.56829833984375, 6.8306884765625, 7.09307861328125, 7.35546875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 7.0, 8.0, 13.0, 22.0, 27.0, 21.0, 31.0, 42.0, 50.0, 58.0, 61.0, 71.0, 84.0, 88.0, 75.0, 53.0, 48.0, 55.0, 37.0, 47.0, 23.0, 21.0, 13.0, 9.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.53204345703125, -39.5267219543457, -38.521400451660156, -37.51607894897461, -36.51075744628906, -35.505435943603516, -34.50011444091797, -33.49479293823242, -32.489471435546875, -31.484149932861328, -30.47882843017578, -29.473506927490234, -28.468185424804688, -27.46286392211914, -26.457542419433594, -25.452220916748047, -24.446901321411133, -23.441579818725586, -22.43625831604004, -21.430936813354492, -20.425615310668945, -19.4202938079834, -18.414974212646484, -17.409652709960938, -16.40433120727539, -15.399009704589844, -14.393688201904297, -13.38836669921875, -12.383045196533203, -11.377723693847656, -10.372403144836426, -9.367081642150879, -8.361759185791016, -7.356437683105469, -6.351116180419922, -5.345795154571533, -4.340473651885986, -3.3351521492004395, -2.329831123352051, -1.324509620666504, -0.31918811798095703, 0.6861332654953003, 1.6914546489715576, 2.6967759132385254, 3.7020974159240723, 4.707418918609619, 5.712739944458008, 6.718061447143555, 7.723382949829102, 8.728704452514648, 9.734025955200195, 10.739347457885742, 11.744668960571289, 12.749990463256836, 13.755311012268066, 14.760632514953613, 15.76595401763916, 16.77127456665039, 17.776596069335938, 18.781917572021484, 19.78723907470703, 20.792560577392578, 21.797882080078125, 22.803203582763672, 23.80852508544922]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 10.0, 2.0, 4.0, 9.0, 4.0, 9.0, 11.0, 13.0, 18.0, 21.0, 19.0, 26.0, 21.0, 34.0, 21.0, 32.0, 39.0, 35.0, 46.0, 47.0, 37.0, 43.0, 42.0, 49.0, 55.0, 37.0, 34.0, 26.0, 35.0, 27.0, 22.0, 32.0, 23.0, 22.0, 18.0, 16.0, 11.0, 13.0, 9.0, 11.0, 7.0, 8.0, 4.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.17300796508789, -20.441434860229492, -19.70985984802246, -18.978286743164062, -18.24671173095703, -17.515138626098633, -16.783565521240234, -16.051990509033203, -15.320416450500488, -14.588842391967773, -13.857268333435059, -13.125694274902344, -12.394121170043945, -11.662546157836914, -10.930973052978516, -10.1993989944458, -9.467824935913086, -8.736250877380371, -8.004676818847656, -7.2731032371521, -6.541529178619385, -5.80995512008667, -5.078381538391113, -4.346807479858398, -3.6152334213256836, -2.8836593627929688, -2.152085542678833, -1.4205117225646973, -0.6889376640319824, 0.04263639450073242, 0.7742099761962891, 1.505784034729004, 2.2373580932617188, 2.9689321517944336, 3.7005059719085693, 4.432079792022705, 5.16365385055542, 5.895227909088135, 6.626801490783691, 7.358375549316406, 8.089949607849121, 8.821523666381836, 9.55309772491455, 10.284671783447266, 11.016244888305664, 11.747819900512695, 12.479393005371094, 13.210967063903809, 13.942541122436523, 14.674115180969238, 15.405689239501953, 16.13726234436035, 16.868837356567383, 17.60041046142578, 18.331985473632812, 19.06355857849121, 19.79513168334961, 20.526704788208008, 21.25827980041504, 21.989852905273438, 22.72142791748047, 23.453001022338867, 24.184574127197266, 24.916149139404297, 25.647724151611328]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 11.0, 10.0, 12.0, 14.0, 17.0, 9.0, 19.0, 24.0, 17.0, 33.0, 28.0, 39.0, 35.0, 38.0, 42.0, 45.0, 45.0, 44.0, 51.0, 51.0, 47.0, 42.0, 36.0, 39.0, 33.0, 26.0, 24.0, 26.0, 25.0, 24.0, 18.0, 13.0, 16.0, 8.0, 7.0, 9.0, 4.0, 11.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.03125, -38.6982421875, -37.365234375, -36.0322265625, -34.69921875, -33.3662109375, -32.033203125, -30.7001953125, -29.3671875, -28.0341796875, -26.701171875, -25.3681640625, -24.03515625, -22.7021484375, -21.369140625, -20.0361328125, -18.703125, -17.3701171875, -16.037109375, -14.7041015625, -13.37109375, -12.0380859375, -10.705078125, -9.3720703125, -8.0390625, -6.7060546875, -5.373046875, -4.0400390625, -2.70703125, -1.3740234375, -0.041015625, 1.2919921875, 2.625, 3.9580078125, 5.291015625, 6.6240234375, 7.95703125, 9.2900390625, 10.623046875, 11.9560546875, 13.2890625, 14.6220703125, 15.955078125, 17.2880859375, 18.62109375, 19.9541015625, 21.287109375, 22.6201171875, 23.953125, 25.2861328125, 26.619140625, 27.9521484375, 29.28515625, 30.6181640625, 31.951171875, 33.2841796875, 34.6171875, 35.9501953125, 37.283203125, 38.6162109375, 39.94921875, 41.2822265625, 42.615234375, 43.9482421875, 45.28125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 2.0, 4.0, 8.0, 14.0, 12.0, 36.0, 36.0, 62.0, 103.0, 129.0, 188.0, 300.0, 398.0, 739.0, 1096.0, 1734.0, 2803.0, 4443.0, 7127.0, 11427.0, 19079.0, 32460.0, 58592.0, 117305.0, 273891.0, 264318.0, 113915.0, 57322.0, 32053.0, 18850.0, 11281.0, 6910.0, 4395.0, 2700.0, 1793.0, 1058.0, 690.0, 398.0, 283.0, 160.0, 143.0, 101.0, 75.0, 43.0, 27.0, 9.0, 13.0, 7.0, 6.0, 8.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-7.54296875, -7.31427001953125, -7.0855712890625, -6.85687255859375, -6.628173828125, -6.39947509765625, -6.1707763671875, -5.94207763671875, -5.71337890625, -5.48468017578125, -5.2559814453125, -5.02728271484375, -4.798583984375, -4.56988525390625, -4.3411865234375, -4.11248779296875, -3.8837890625, -3.65509033203125, -3.4263916015625, -3.19769287109375, -2.968994140625, -2.74029541015625, -2.5115966796875, -2.28289794921875, -2.05419921875, -1.82550048828125, -1.5968017578125, -1.36810302734375, -1.139404296875, -0.91070556640625, -0.6820068359375, -0.45330810546875, -0.224609375, 0.00408935546875, 0.2327880859375, 0.46148681640625, 0.690185546875, 0.91888427734375, 1.1475830078125, 1.37628173828125, 1.60498046875, 1.83367919921875, 2.0623779296875, 2.29107666015625, 2.519775390625, 2.74847412109375, 2.9771728515625, 3.20587158203125, 3.4345703125, 3.66326904296875, 3.8919677734375, 4.12066650390625, 4.349365234375, 4.57806396484375, 4.8067626953125, 5.03546142578125, 5.26416015625, 5.49285888671875, 5.7215576171875, 5.95025634765625, 6.178955078125, 6.40765380859375, 6.6363525390625, 6.86505126953125, 7.09375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 4.0, 9.0, 8.0, 8.0, 17.0, 13.0, 17.0, 14.0, 22.0, 21.0, 25.0, 32.0, 38.0, 34.0, 44.0, 23.0, 34.0, 51.0, 27.0, 36.0, 1059.0, 35.0, 48.0, 41.0, 33.0, 33.0, 28.0, 31.0, 39.0, 35.0, 21.0, 25.0, 12.0, 18.0, 10.0, 13.0, 10.0, 9.0, 11.0, 4.0, 11.0, 1.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.9375, -23.15625, -22.375, -21.59375, -20.8125, -20.03125, -19.25, -18.46875, -17.6875, -16.90625, -16.125, -15.34375, -14.5625, -13.78125, -13.0, -12.21875, -11.4375, -10.65625, -9.875, -9.09375, -8.3125, -7.53125, -6.75, -5.96875, -5.1875, -4.40625, -3.625, -2.84375, -2.0625, -1.28125, -0.5, 0.28125, 1.0625, 1.84375, 2.625, 3.40625, 4.1875, 4.96875, 5.75, 6.53125, 7.3125, 8.09375, 8.875, 9.65625, 10.4375, 11.21875, 12.0, 12.78125, 13.5625, 14.34375, 15.125, 15.90625, 16.6875, 17.46875, 18.25, 19.03125, 19.8125, 20.59375, 21.375, 22.15625, 22.9375, 23.71875, 24.5, 25.28125, 26.0625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 7.0, 9.0, 18.0, 17.0, 27.0, 42.0, 65.0, 86.0, 145.0, 186.0, 253.0, 356.0, 515.0, 752.0, 955.0, 1461.0, 1942.0, 2662.0, 3878.0, 5390.0, 7601.0, 11165.0, 16238.0, 23634.0, 35329.0, 54334.0, 88722.0, 163968.0, 1301107.0, 142143.0, 79405.0, 49557.0, 33055.0, 21890.0, 14980.0, 10248.0, 7179.0, 5064.0, 3624.0, 2631.0, 1850.0, 1389.0, 904.0, 681.0, 516.0, 356.0, 234.0, 189.0, 101.0, 102.0, 75.0, 43.0, 21.0, 18.0, 16.0, 3.0, 3.0, 3.0, 0.0, 2.0], "bins": [-5.609375, -5.43621826171875, -5.2630615234375, -5.08990478515625, -4.916748046875, -4.74359130859375, -4.5704345703125, -4.39727783203125, -4.22412109375, -4.05096435546875, -3.8778076171875, -3.70465087890625, -3.531494140625, -3.35833740234375, -3.1851806640625, -3.01202392578125, -2.8388671875, -2.66571044921875, -2.4925537109375, -2.31939697265625, -2.146240234375, -1.97308349609375, -1.7999267578125, -1.62677001953125, -1.45361328125, -1.28045654296875, -1.1072998046875, -0.93414306640625, -0.760986328125, -0.58782958984375, -0.4146728515625, -0.24151611328125, -0.068359375, 0.10479736328125, 0.2779541015625, 0.45111083984375, 0.624267578125, 0.79742431640625, 0.9705810546875, 1.14373779296875, 1.31689453125, 1.49005126953125, 1.6632080078125, 1.83636474609375, 2.009521484375, 2.18267822265625, 2.3558349609375, 2.52899169921875, 2.7021484375, 2.87530517578125, 3.0484619140625, 3.22161865234375, 3.394775390625, 3.56793212890625, 3.7410888671875, 3.91424560546875, 4.08740234375, 4.26055908203125, 4.4337158203125, 4.60687255859375, 4.780029296875, 4.95318603515625, 5.1263427734375, 5.29949951171875, 5.47265625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 2.0, 4.0, 6.0, 4.0, 8.0, 8.0, 10.0, 12.0, 19.0, 27.0, 17.0, 30.0, 37.0, 58.0, 59.0, 66.0, 74.0, 77.0, 80.0, 87.0, 60.0, 59.0, 40.0, 29.0, 20.0, 14.0, 21.0, 18.0, 13.0, 6.0, 11.0, 3.0, 10.0, 1.0, 6.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.0030040740966796875, -0.002924621105194092, -0.002845168113708496, -0.0027657151222229004, -0.0026862621307373047, -0.002606809139251709, -0.0025273561477661133, -0.0024479031562805176, -0.002368450164794922, -0.002288997173309326, -0.0022095441818237305, -0.0021300911903381348, -0.002050638198852539, -0.0019711852073669434, -0.0018917322158813477, -0.001812279224395752, -0.0017328262329101562, -0.0016533732414245605, -0.0015739202499389648, -0.0014944672584533691, -0.0014150142669677734, -0.0013355612754821777, -0.001256108283996582, -0.0011766552925109863, -0.0010972023010253906, -0.001017749309539795, -0.0009382963180541992, -0.0008588433265686035, -0.0007793903350830078, -0.0006999373435974121, -0.0006204843521118164, -0.0005410313606262207, -0.000461578369140625, -0.0003821253776550293, -0.0003026723861694336, -0.0002232193946838379, -0.0001437664031982422, -6.431341171264648e-05, 1.5139579772949219e-05, 9.459257125854492e-05, 0.00017404556274414062, 0.00025349855422973633, 0.00033295154571533203, 0.00041240453720092773, 0.0004918575286865234, 0.0005713105201721191, 0.0006507635116577148, 0.0007302165031433105, 0.0008096694946289062, 0.000889122486114502, 0.0009685754776000977, 0.0010480284690856934, 0.001127481460571289, 0.0012069344520568848, 0.0012863874435424805, 0.0013658404350280762, 0.0014452934265136719, 0.0015247464179992676, 0.0016041994094848633, 0.001683652400970459, 0.0017631053924560547, 0.0018425583839416504, 0.001922011375427246, 0.002001464366912842, 0.0020809173583984375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 7.0, 9.0, 4.0, 11.0, 14.0, 20.0, 20.0, 48.0, 45.0, 54.0, 92.0, 135.0, 246.0, 368.0, 692.0, 1432.0, 3556.0, 11108.0, 43637.0, 245876.0, 552097.0, 147490.0, 28343.0, 7791.0, 2757.0, 1159.0, 619.0, 302.0, 197.0, 130.0, 79.0, 64.0, 38.0, 31.0, 23.0, 8.0, 21.0, 17.0, 3.0, 9.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01285552978515625, -0.012402176856994629, -0.011948823928833008, -0.011495471000671387, -0.011042118072509766, -0.010588765144348145, -0.010135412216186523, -0.009682059288024902, -0.009228706359863281, -0.00877535343170166, -0.008322000503540039, -0.007868647575378418, -0.007415294647216797, -0.006961941719055176, -0.006508588790893555, -0.006055235862731934, -0.0056018829345703125, -0.005148530006408691, -0.00469517707824707, -0.004241824150085449, -0.003788471221923828, -0.003335118293762207, -0.002881765365600586, -0.002428412437438965, -0.0019750595092773438, -0.0015217065811157227, -0.0010683536529541016, -0.0006150007247924805, -0.00016164779663085938, 0.0002917051315307617, 0.0007450580596923828, 0.001198410987854004, 0.001651763916015625, 0.002105116844177246, 0.002558469772338867, 0.0030118227005004883, 0.0034651756286621094, 0.0039185285568237305, 0.0043718814849853516, 0.004825234413146973, 0.005278587341308594, 0.005731940269470215, 0.006185293197631836, 0.006638646125793457, 0.007091999053955078, 0.007545351982116699, 0.00799870491027832, 0.008452057838439941, 0.008905410766601562, 0.009358763694763184, 0.009812116622924805, 0.010265469551086426, 0.010718822479248047, 0.011172175407409668, 0.011625528335571289, 0.01207888126373291, 0.012532234191894531, 0.012985587120056152, 0.013438940048217773, 0.013892292976379395, 0.014345645904541016, 0.014798998832702637, 0.015252351760864258, 0.01570570468902588, 0.0161590576171875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 7.0, 19.0, 37.0, 70.0, 99.0, 142.0, 177.0, 145.0, 126.0, 70.0, 50.0, 18.0, 19.0, 10.0, 9.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012861154973506927, -0.0011907619191333652, -0.0010954084573313594, -0.0010000548791140318, -0.000904701417312026, -0.0008093478390946984, -0.0007139943190850317, -0.0006186407990753651, -0.0005232872790656984, -0.0004279337590560317, -0.000332580239046365, -0.00023722668993286788, -0.0001418731699232012, -4.651964991353452e-05, 4.8833899199962616e-05, 0.0001441874192096293, 0.00023954093921929598, 0.00033489445922896266, 0.00043024797923862934, 0.0005256015574559569, 0.0006209550192579627, 0.0007163085974752903, 0.000811662117484957, 0.0009070156374946237, 0.0010023692157119513, 0.0010977227939292789, 0.0011930762557312846, 0.0012884298339486122, 0.001383783295750618, 0.0014791368739679456, 0.0015744904521852732, 0.001669843913987279, 0.0017651973757892847, 0.0018605509540066123, 0.00195590453222394, 0.0020512579940259457, 0.0021466114558279514, 0.002241964917629957, 0.0023373186122626066, 0.0024326720740646124, 0.002528025535866618, 0.002623378997668624, 0.0027187326923012733, 0.002814086154103279, 0.002909439615905285, 0.0030047930777072906, 0.00310014677233994, 0.003195500234141946, 0.0032908539287745953, 0.003386207390576601, 0.0034815610852092505, 0.0035769145470112562, 0.003672268008813262, 0.0037676214706152678, 0.003862975165247917, 0.003958328627049923, 0.004053682088851929, 0.0041490355506539345, 0.00424438901245594, 0.004339742474257946, 0.004435096401721239, 0.004530449863523245, 0.004625803325325251, 0.004721156787127256, 0.004816510248929262]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 11.0, 16.0, 9.0, 18.0, 17.0, 28.0, 26.0, 23.0, 26.0, 30.0, 38.0, 34.0, 49.0, 58.0, 48.0, 39.0, 36.0, 33.0, 53.0, 41.0, 40.0, 35.0, 32.0, 30.0, 36.0, 30.0, 29.0, 27.0, 26.0, 15.0, 17.0, 12.0, 5.0, 6.0, 4.0, 4.0, 6.0, 7.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011513829231262207, -0.0011114394292235374, -0.0010714959353208542, -0.001031552441418171, -0.0009916089475154877, -0.0009516654536128044, -0.0009117219597101212, -0.0008717784658074379, -0.0008318349719047546, -0.0007918914780020714, -0.0007519479840993881, -0.0007120044901967049, -0.0006720609962940216, -0.0006321175023913383, -0.0005921740084886551, -0.0005522305145859718, -0.0005122870206832886, -0.0004723435267806053, -0.00043240003287792206, -0.0003924565389752388, -0.00035251304507255554, -0.0003125695511698723, -0.000272626057267189, -0.00023268256336450577, -0.0001927390694618225, -0.00015279557555913925, -0.000112852081656456, -7.290858775377274e-05, -3.296509385108948e-05, 6.9784000515937805e-06, 4.692189395427704e-05, 8.68653878569603e-05, 0.00012680888175964355, 0.0001667523756623268, 0.00020669586956501007, 0.00024663936346769333, 0.0002865828573703766, 0.00032652635127305984, 0.0003664698451757431, 0.00040641333907842636, 0.0004463568329811096, 0.0004863003268837929, 0.0005262438207864761, 0.0005661873146891594, 0.0006061308085918427, 0.0006460743024945259, 0.0006860177963972092, 0.0007259612902998924, 0.0007659047842025757, 0.0008058482781052589, 0.0008457917720079422, 0.0008857352659106255, 0.0009256787598133087, 0.000965622253715992, 0.0010055657476186752, 0.0010455092415213585, 0.0010854527354240417, 0.001125396229326725, 0.0011653397232294083, 0.0012052832171320915, 0.0012452267110347748, 0.001285170204937458, 0.0013251136988401413, 0.0013650571927428246, 0.0014050006866455078]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 11.0, 10.0, 12.0, 14.0, 17.0, 9.0, 19.0, 24.0, 17.0, 33.0, 28.0, 39.0, 35.0, 38.0, 43.0, 44.0, 45.0, 44.0, 51.0, 51.0, 46.0, 43.0, 36.0, 39.0, 33.0, 26.0, 24.0, 26.0, 25.0, 24.0, 18.0, 13.0, 16.0, 8.0, 7.0, 9.0, 4.0, 11.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.03125, -38.6982421875, -37.365234375, -36.0322265625, -34.69921875, -33.3662109375, -32.033203125, -30.7001953125, -29.3671875, -28.0341796875, -26.701171875, -25.3681640625, -24.03515625, -22.7021484375, -21.369140625, -20.0361328125, -18.703125, -17.3701171875, -16.037109375, -14.7041015625, -13.37109375, -12.0380859375, -10.705078125, -9.3720703125, -8.0390625, -6.7060546875, -5.373046875, -4.0400390625, -2.70703125, -1.3740234375, -0.041015625, 1.2919921875, 2.625, 3.9580078125, 5.291015625, 6.6240234375, 7.95703125, 9.2900390625, 10.623046875, 11.9560546875, 13.2890625, 14.6220703125, 15.955078125, 17.2880859375, 18.62109375, 19.9541015625, 21.287109375, 22.6201171875, 23.953125, 25.2861328125, 26.619140625, 27.9521484375, 29.28515625, 30.6181640625, 31.951171875, 33.2841796875, 34.6171875, 35.9501953125, 37.283203125, 38.6162109375, 39.94921875, 41.2822265625, 42.615234375, 43.9482421875, 45.28125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 9.0, 6.0, 6.0, 20.0, 22.0, 25.0, 52.0, 52.0, 98.0, 142.0, 239.0, 398.0, 684.0, 1265.0, 2582.0, 6308.0, 19585.0, 83851.0, 404437.0, 410750.0, 86228.0, 19923.0, 6230.0, 2633.0, 1224.0, 648.0, 398.0, 241.0, 150.0, 101.0, 74.0, 49.0, 27.0, 40.0, 12.0, 11.0, 13.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-9.109375, -8.86322021484375, -8.6170654296875, -8.37091064453125, -8.124755859375, -7.87860107421875, -7.6324462890625, -7.38629150390625, -7.14013671875, -6.89398193359375, -6.6478271484375, -6.40167236328125, -6.155517578125, -5.90936279296875, -5.6632080078125, -5.41705322265625, -5.1708984375, -4.92474365234375, -4.6785888671875, -4.43243408203125, -4.186279296875, -3.94012451171875, -3.6939697265625, -3.44781494140625, -3.20166015625, -2.95550537109375, -2.7093505859375, -2.46319580078125, -2.217041015625, -1.97088623046875, -1.7247314453125, -1.47857666015625, -1.232421875, -0.98626708984375, -0.7401123046875, -0.49395751953125, -0.247802734375, -0.00164794921875, 0.2445068359375, 0.49066162109375, 0.73681640625, 0.98297119140625, 1.2291259765625, 1.47528076171875, 1.721435546875, 1.96759033203125, 2.2137451171875, 2.45989990234375, 2.7060546875, 2.95220947265625, 3.1983642578125, 3.44451904296875, 3.690673828125, 3.93682861328125, 4.1829833984375, 4.42913818359375, 4.67529296875, 4.92144775390625, 5.1676025390625, 5.41375732421875, 5.659912109375, 5.90606689453125, 6.1522216796875, 6.39837646484375, 6.64453125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 7.0, 4.0, 5.0, 13.0, 17.0, 16.0, 25.0, 27.0, 35.0, 38.0, 32.0, 48.0, 59.0, 52.0, 66.0, 2113.0, 64.0, 60.0, 57.0, 63.0, 50.0, 37.0, 37.0, 27.0, 22.0, 19.0, 10.0, 14.0, 12.0, 9.0, 8.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.625, -73.0703125, -70.515625, -67.9609375, -65.40625, -62.8515625, -60.296875, -57.7421875, -55.1875, -52.6328125, -50.078125, -47.5234375, -44.96875, -42.4140625, -39.859375, -37.3046875, -34.75, -32.1953125, -29.640625, -27.0859375, -24.53125, -21.9765625, -19.421875, -16.8671875, -14.3125, -11.7578125, -9.203125, -6.6484375, -4.09375, -1.5390625, 1.015625, 3.5703125, 6.125, 8.6796875, 11.234375, 13.7890625, 16.34375, 18.8984375, 21.453125, 24.0078125, 26.5625, 29.1171875, 31.671875, 34.2265625, 36.78125, 39.3359375, 41.890625, 44.4453125, 47.0, 49.5546875, 52.109375, 54.6640625, 57.21875, 59.7734375, 62.328125, 64.8828125, 67.4375, 69.9921875, 72.546875, 75.1015625, 77.65625, 80.2109375, 82.765625, 85.3203125, 87.875]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 5.0, 4.0, 9.0, 8.0, 20.0, 29.0, 35.0, 66.0, 87.0, 121.0, 171.0, 264.0, 347.0, 582.0, 949.0, 2060.0, 5759.0, 38899.0, 2370507.0, 681233.0, 34807.0, 5205.0, 1840.0, 955.0, 560.0, 376.0, 228.0, 167.0, 127.0, 74.0, 59.0, 40.0, 26.0, 17.0, 8.0, 8.0, 9.0, 8.0, 3.0, 2.0, 10.0, 1.0, 7.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0], "bins": [-12.6875, -12.302734375, -11.91796875, -11.533203125, -11.1484375, -10.763671875, -10.37890625, -9.994140625, -9.609375, -9.224609375, -8.83984375, -8.455078125, -8.0703125, -7.685546875, -7.30078125, -6.916015625, -6.53125, -6.146484375, -5.76171875, -5.376953125, -4.9921875, -4.607421875, -4.22265625, -3.837890625, -3.453125, -3.068359375, -2.68359375, -2.298828125, -1.9140625, -1.529296875, -1.14453125, -0.759765625, -0.375, 0.009765625, 0.39453125, 0.779296875, 1.1640625, 1.548828125, 1.93359375, 2.318359375, 2.703125, 3.087890625, 3.47265625, 3.857421875, 4.2421875, 4.626953125, 5.01171875, 5.396484375, 5.78125, 6.166015625, 6.55078125, 6.935546875, 7.3203125, 7.705078125, 8.08984375, 8.474609375, 8.859375, 9.244140625, 9.62890625, 10.013671875, 10.3984375, 10.783203125, 11.16796875, 11.552734375, 11.9375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 13.0, 8.0, 20.0, 27.0, 56.0, 81.0, 108.0, 156.0, 154.0, 127.0, 92.0, 55.0, 34.0, 18.0, 11.0, 7.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-111.04193878173828, -107.97674560546875, -104.91155242919922, -101.84636688232422, -98.78117370605469, -95.71598052978516, -92.65078735351562, -89.58560180664062, -86.5204086303711, -83.45521545410156, -80.39002227783203, -77.32483673095703, -74.2596435546875, -71.19445037841797, -68.12925720214844, -65.06407165527344, -61.99887466430664, -58.93368148803711, -55.868492126464844, -52.80329895019531, -49.73810958862305, -46.672916412353516, -43.60772705078125, -40.54253387451172, -37.47734069824219, -34.412147521972656, -31.34695816040039, -28.28176498413086, -25.216575622558594, -22.151382446289062, -19.086191177368164, -16.020999908447266, -12.955810546875, -9.890619277954102, -6.825427532196045, -3.7602357864379883, -0.6950445175170898, 2.3701467514038086, 5.435338973999023, 8.500530242919922, 11.56572151184082, 14.630912780761719, 17.696104049682617, 20.761295318603516, 23.826488494873047, 26.891677856445312, 29.956871032714844, 33.022064208984375, 36.08725357055664, 39.15244674682617, 42.21763610839844, 45.28282928466797, 48.348018646240234, 51.413211822509766, 54.47840118408203, 57.54359436035156, 60.608787536621094, 63.673980712890625, 66.73917388916016, 69.80435943603516, 72.86955261230469, 75.93474578857422, 78.99993896484375, 82.06512451171875, 85.13031768798828]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 6.0, 8.0, 3.0, 4.0, 8.0, 5.0, 8.0, 16.0, 13.0, 22.0, 34.0, 27.0, 29.0, 33.0, 31.0, 34.0, 55.0, 55.0, 56.0, 51.0, 59.0, 51.0, 55.0, 51.0, 40.0, 41.0, 35.0, 27.0, 29.0, 24.0, 20.0, 18.0, 9.0, 7.0, 11.0, 7.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.08335876464844, -81.07108306884766, -78.05879974365234, -75.04652404785156, -72.03424072265625, -69.02196502685547, -66.00968933105469, -62.99740982055664, -59.985130310058594, -56.97285079956055, -53.9605712890625, -50.94829559326172, -47.93601608276367, -44.923736572265625, -41.911460876464844, -38.8991813659668, -35.88690185546875, -32.8746223449707, -29.86234474182129, -26.850067138671875, -23.837787628173828, -20.82550811767578, -17.813230514526367, -14.800952911376953, -11.788673400878906, -8.776394844055176, -5.764116287231445, -2.751837730407715, 0.2604408264160156, 3.272719383239746, 6.284997940063477, 9.29727554321289, 12.309555053710938, 15.321833610534668, 18.3341121673584, 21.346389770507812, 24.35866928100586, 27.370948791503906, 30.38322639465332, 33.395503997802734, 36.40778350830078, 39.42006301879883, 42.432342529296875, 45.444618225097656, 48.4568977355957, 51.46917724609375, 54.48145294189453, 57.49373245239258, 60.506011962890625, 63.51829147338867, 66.53057098388672, 69.5428466796875, 72.55513000488281, 75.5674057006836, 78.57968139648438, 81.59196472167969, 84.60424041748047, 87.61651611328125, 90.62879943847656, 93.64107513427734, 96.65335083007812, 99.66563415527344, 102.67790985107422, 105.690185546875, 108.70246887207031]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 9.0, 18.0, 13.0, 15.0, 30.0, 33.0, 62.0, 79.0, 128.0, 216.0, 364.0, 578.0, 1003.0, 1629.0, 2505.0, 4026.0, 6529.0, 1014182.0, 6573.0, 3903.0, 2553.0, 1560.0, 973.0, 572.0, 330.0, 214.0, 150.0, 105.0, 69.0, 38.0, 37.0, 14.0, 20.0, 10.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.47530746459961, -21.875869750976562, -21.276432037353516, -20.67699432373047, -20.077556610107422, -19.478118896484375, -18.878681182861328, -18.27924346923828, -17.679805755615234, -17.080368041992188, -16.48093032836914, -15.881492614746094, -15.282054901123047, -14.6826171875, -14.083179473876953, -13.483741760253906, -12.884303092956543, -12.284865379333496, -11.68542766571045, -11.085989952087402, -10.486552238464355, -9.887114524841309, -9.287675857543945, -8.688238143920898, -8.088800430297852, -7.489362716674805, -6.889925003051758, -6.290487289428711, -5.691049575805664, -5.091611862182617, -4.492173671722412, -3.8927359580993652, -3.2932987213134766, -2.6938610076904297, -2.094423294067383, -1.4949853420257568, -0.89554762840271, -0.2961099147796631, 0.3033280372619629, 0.9027657508850098, 1.5022034645080566, 2.1016411781311035, 2.7010788917541504, 3.3005168437957764, 3.8999545574188232, 4.499392509460449, 5.098830223083496, 5.698267936706543, 6.29770565032959, 6.897143363952637, 7.496581077575684, 8.09601879119873, 8.695456504821777, 9.294894218444824, 9.894332885742188, 10.493770599365234, 11.093208312988281, 11.692646026611328, 12.292083740234375, 12.891521453857422, 13.490959167480469, 14.090396881103516, 14.689834594726562, 15.28927230834961, 15.888710021972656]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 11.0, 19.0, 23.0, 44.0, 56.0, 61.0, 141.0, 3677.0, 51458920.0, 193.0, 74.0, 31.0, 25.0, 21.0, 29.0, 21.0, 16.0, 18.0, 11.0, 6.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2878.673095703125, -2727.9326171875, -2577.192138671875, -2426.45166015625, -2275.71142578125, -2124.970703125, -1974.23046875, -1823.489990234375, -1672.74951171875, -1522.009033203125, -1371.2685546875, -1220.5281982421875, -1069.7877197265625, -919.0472412109375, -768.3068237304688, -617.56640625, -466.825927734375, -316.0854797363281, -165.34503173828125, -14.604583740234375, 136.1358642578125, 286.8763427734375, 437.61676025390625, 588.357177734375, 739.09765625, 889.838134765625, 1040.57861328125, 1191.3189697265625, 1342.0594482421875, 1492.7999267578125, 1643.540283203125, 1794.28076171875, 1945.02099609375, 2095.761474609375, 2246.501953125, 2397.242431640625, 2547.98291015625, 2698.72314453125, 2849.463623046875, 3000.2041015625, 3150.944580078125, 3301.68505859375, 3452.425537109375, 3603.166015625, 3753.90625, 3904.64697265625, 4055.38720703125, 4206.1279296875, 4356.8681640625, 4507.6083984375, 4658.34912109375, 4809.08935546875, 4959.830078125, 5110.5703125, 5261.31103515625, 5412.05126953125, 5562.7919921875, 5713.5322265625, 5864.27294921875, 6015.01318359375, 6165.75390625, 6316.494140625, 6467.23486328125, 6617.97509765625, 6768.71533203125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [5.0, 4.0, 3.0, 3.0, 8.0, 9.0, 17.0, 18.0, 45.0, 66.0, 105.0, 147.0, 197.0, 290.0, 412.0, 640.0, 950.0, 1282.0, 1937.0, 2784.0, 4204.0, 6218.0, 9463.0, 14161.0, 21730.0, 33251.0, 52523.0, 85826.0, 145477.0, 268958.0, 670255.0, 3980681.0, 449581.0, 218233.0, 120667.0, 71686.0, 44560.0, 28543.0, 18471.0, 12185.0, 8070.0, 5657.0, 3669.0, 2647.0, 1753.0, 1293.0, 881.0, 541.0, 471.0, 238.0, 226.0, 104.0, 100.0, 68.0, 43.0, 20.0, 27.0, 19.0, 3.0, 16.0, 6.0, 3.0, 0.0, 6.0], "bins": [-3.53515625, -3.422332763671875, -3.30950927734375, -3.196685791015625, -3.0838623046875, -2.971038818359375, -2.85821533203125, -2.745391845703125, -2.632568359375, -2.519744873046875, -2.40692138671875, -2.294097900390625, -2.1812744140625, -2.068450927734375, -1.95562744140625, -1.842803955078125, -1.72998046875, -1.617156982421875, -1.50433349609375, -1.391510009765625, -1.2786865234375, -1.165863037109375, -1.05303955078125, -0.940216064453125, -0.827392578125, -0.714569091796875, -0.60174560546875, -0.488922119140625, -0.3760986328125, -0.263275146484375, -0.15045166015625, -0.037628173828125, 0.0751953125, 0.188018798828125, 0.30084228515625, 0.413665771484375, 0.5264892578125, 0.639312744140625, 0.75213623046875, 0.864959716796875, 0.977783203125, 1.090606689453125, 1.20343017578125, 1.316253662109375, 1.4290771484375, 1.541900634765625, 1.65472412109375, 1.767547607421875, 1.88037109375, 1.993194580078125, 2.10601806640625, 2.218841552734375, 2.3316650390625, 2.444488525390625, 2.55731201171875, 2.670135498046875, 2.782958984375, 2.895782470703125, 3.00860595703125, 3.121429443359375, 3.2342529296875, 3.347076416015625, 3.45989990234375, 3.572723388671875, 3.685546875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [4.0, 6.0, 1.0, 4.0, 6.0, 4.0, 2.0, 10.0, 10.0, 14.0, 11.0, 8.0, 13.0, 17.0, 16.0, 24.0, 34.0, 27.0, 43.0, 25.0, 34.0, 38.0, 31.0, 52.0, 71.0, 224.0, 702.0, 158.0, 47.0, 41.0, 41.0, 45.0, 32.0, 28.0, 26.0, 24.0, 20.0, 25.0, 23.0, 11.0, 13.0, 14.0, 10.0, 10.0, 6.0, 9.0, 3.0, 7.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.1484375, -6.877685546875, -6.60693359375, -6.336181640625, -6.0654296875, -5.794677734375, -5.52392578125, -5.253173828125, -4.982421875, -4.711669921875, -4.44091796875, -4.170166015625, -3.8994140625, -3.628662109375, -3.35791015625, -3.087158203125, -2.81640625, -2.545654296875, -2.27490234375, -2.004150390625, -1.7333984375, -1.462646484375, -1.19189453125, -0.921142578125, -0.650390625, -0.379638671875, -0.10888671875, 0.161865234375, 0.4326171875, 0.703369140625, 0.97412109375, 1.244873046875, 1.515625, 1.786376953125, 2.05712890625, 2.327880859375, 2.5986328125, 2.869384765625, 3.14013671875, 3.410888671875, 3.681640625, 3.952392578125, 4.22314453125, 4.493896484375, 4.7646484375, 5.035400390625, 5.30615234375, 5.576904296875, 5.84765625, 6.118408203125, 6.38916015625, 6.659912109375, 6.9306640625, 7.201416015625, 7.47216796875, 7.742919921875, 8.013671875, 8.284423828125, 8.55517578125, 8.825927734375, 9.0966796875, 9.367431640625, 9.63818359375, 9.908935546875, 10.1796875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 6.0, 0.0, 1.0, 9.0, 14.0, 9.0, 6.0, 26.0, 31.0, 32.0, 71.0, 85.0, 131.0, 185.0, 327.0, 462.0, 733.0, 1179.0, 1789.0, 2884.0, 4955.0, 8276.0, 14839.0, 25292.0, 45872.0, 87943.0, 175064.0, 413169.0, 4056166.0, 903253.0, 274324.0, 126114.0, 64995.0, 34977.0, 19790.0, 11287.0, 6506.0, 3972.0, 2333.0, 1562.0, 943.0, 644.0, 409.0, 229.0, 177.0, 117.0, 76.0, 67.0, 38.0, 25.0, 11.0, 14.0, 9.0, 7.0, 1.0, 8.0, 3.0, 0.0, 0.0, 3.0], "bins": [-6.0234375, -5.83966064453125, -5.6558837890625, -5.47210693359375, -5.288330078125, -5.10455322265625, -4.9207763671875, -4.73699951171875, -4.55322265625, -4.36944580078125, -4.1856689453125, -4.00189208984375, -3.818115234375, -3.63433837890625, -3.4505615234375, -3.26678466796875, -3.0830078125, -2.89923095703125, -2.7154541015625, -2.53167724609375, -2.347900390625, -2.16412353515625, -1.9803466796875, -1.79656982421875, -1.61279296875, -1.42901611328125, -1.2452392578125, -1.06146240234375, -0.877685546875, -0.69390869140625, -0.5101318359375, -0.32635498046875, -0.142578125, 0.04119873046875, 0.2249755859375, 0.40875244140625, 0.592529296875, 0.77630615234375, 0.9600830078125, 1.14385986328125, 1.32763671875, 1.51141357421875, 1.6951904296875, 1.87896728515625, 2.062744140625, 2.24652099609375, 2.4302978515625, 2.61407470703125, 2.7978515625, 2.98162841796875, 3.1654052734375, 3.34918212890625, 3.532958984375, 3.71673583984375, 3.9005126953125, 4.08428955078125, 4.26806640625, 4.45184326171875, 4.6356201171875, 4.81939697265625, 5.003173828125, 5.18695068359375, 5.3707275390625, 5.55450439453125, 5.73828125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 5.0, 13.0, 16.0, 7.0, 14.0, 27.0, 20.0, 38.0, 27.0, 26.0, 39.0, 50.0, 59.0, 79.0, 144.0, 560.0, 388.0, 101.0, 61.0, 46.0, 40.0, 40.0, 36.0, 36.0, 33.0, 20.0, 21.0, 19.0, 11.0, 10.0, 12.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.71875, -8.4537353515625, -8.188720703125, -7.9237060546875, -7.65869140625, -7.3936767578125, -7.128662109375, -6.8636474609375, -6.5986328125, -6.3336181640625, -6.068603515625, -5.8035888671875, -5.53857421875, -5.2735595703125, -5.008544921875, -4.7435302734375, -4.478515625, -4.2135009765625, -3.948486328125, -3.6834716796875, -3.41845703125, -3.1534423828125, -2.888427734375, -2.6234130859375, -2.3583984375, -2.0933837890625, -1.828369140625, -1.5633544921875, -1.29833984375, -1.0333251953125, -0.768310546875, -0.5032958984375, -0.23828125, 0.0267333984375, 0.291748046875, 0.5567626953125, 0.82177734375, 1.0867919921875, 1.351806640625, 1.6168212890625, 1.8818359375, 2.1468505859375, 2.411865234375, 2.6768798828125, 2.94189453125, 3.2069091796875, 3.471923828125, 3.7369384765625, 4.001953125, 4.2669677734375, 4.531982421875, 4.7969970703125, 5.06201171875, 5.3270263671875, 5.592041015625, 5.8570556640625, 6.1220703125, 6.3870849609375, 6.652099609375, 6.9171142578125, 7.18212890625, 7.4471435546875, 7.712158203125, 7.9771728515625, 8.2421875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 7.0, 0.0, 22.0, 32.0, 27.0, 23.0, 37.0, 36.0, 52.0, 110.0, 139.0, 207.0, 201.0, 197.0, 350.0, 550.0, 713.0, 900.0, 1481.0, 2248.0, 3271.0, 6101.0, 11756.0, 26628.0, 86872.0, 5900256.0, 174958.0, 38521.0, 15504.0, 7640.0, 4237.0, 2670.0, 1566.0, 1210.0, 785.0, 505.0, 387.0, 313.0, 244.0, 130.0, 136.0, 88.0, 83.0, 85.0, 39.0, 47.0, 8.0, 12.0, 4.0, 10.0, 23.0, 12.0, 0.0, 0.0, 3.0, 6.0], "bins": [-14.4296875, -14.0013427734375, -13.572998046875, -13.1446533203125, -12.71630859375, -12.2879638671875, -11.859619140625, -11.4312744140625, -11.0029296875, -10.5745849609375, -10.146240234375, -9.7178955078125, -9.28955078125, -8.8612060546875, -8.432861328125, -8.0045166015625, -7.576171875, -7.1478271484375, -6.719482421875, -6.2911376953125, -5.86279296875, -5.4344482421875, -5.006103515625, -4.5777587890625, -4.1494140625, -3.7210693359375, -3.292724609375, -2.8643798828125, -2.43603515625, -2.0076904296875, -1.579345703125, -1.1510009765625, -0.72265625, -0.2943115234375, 0.134033203125, 0.5623779296875, 0.99072265625, 1.4190673828125, 1.847412109375, 2.2757568359375, 2.7041015625, 3.1324462890625, 3.560791015625, 3.9891357421875, 4.41748046875, 4.8458251953125, 5.274169921875, 5.7025146484375, 6.130859375, 6.5592041015625, 6.987548828125, 7.4158935546875, 7.84423828125, 8.2725830078125, 8.700927734375, 9.1292724609375, 9.5576171875, 9.9859619140625, 10.414306640625, 10.8426513671875, 11.27099609375, 11.6993408203125, 12.127685546875, 12.5560302734375, 12.984375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 8.0, 5.0, 3.0, 10.0, 7.0, 12.0, 17.0, 16.0, 21.0, 16.0, 22.0, 22.0, 23.0, 35.0, 45.0, 41.0, 50.0, 71.0, 103.0, 190.0, 460.0, 251.0, 126.0, 68.0, 50.0, 44.0, 44.0, 37.0, 30.0, 25.0, 21.0, 23.0, 26.0, 21.0, 8.0, 11.0, 13.0, 16.0, 12.0, 9.0, 5.0, 1.0, 5.0, 0.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0], "bins": [-5.18359375, -5.0343017578125, -4.885009765625, -4.7357177734375, -4.58642578125, -4.4371337890625, -4.287841796875, -4.1385498046875, -3.9892578125, -3.8399658203125, -3.690673828125, -3.5413818359375, -3.39208984375, -3.2427978515625, -3.093505859375, -2.9442138671875, -2.794921875, -2.6456298828125, -2.496337890625, -2.3470458984375, -2.19775390625, -2.0484619140625, -1.899169921875, -1.7498779296875, -1.6005859375, -1.4512939453125, -1.302001953125, -1.1527099609375, -1.00341796875, -0.8541259765625, -0.704833984375, -0.5555419921875, -0.40625, -0.2569580078125, -0.107666015625, 0.0416259765625, 0.19091796875, 0.3402099609375, 0.489501953125, 0.6387939453125, 0.7880859375, 0.9373779296875, 1.086669921875, 1.2359619140625, 1.38525390625, 1.5345458984375, 1.683837890625, 1.8331298828125, 1.982421875, 2.1317138671875, 2.281005859375, 2.4302978515625, 2.57958984375, 2.7288818359375, 2.878173828125, 3.0274658203125, 3.1767578125, 3.3260498046875, 3.475341796875, 3.6246337890625, 3.77392578125, 3.9232177734375, 4.072509765625, 4.2218017578125, 4.37109375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 4.0, 16.0, 29.0, 50.0, 69.0, 131.0, 364.0, 170.0, 68.0, 53.0, 20.0, 4.0, 8.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.03418731689453, -19.437789916992188, -18.84139060974121, -18.244993209838867, -17.648595809936523, -17.052196502685547, -16.455799102783203, -15.85940170288086, -15.2630033493042, -14.666604995727539, -14.070207595825195, -13.473809242248535, -12.877410888671875, -12.281013488769531, -11.684615135192871, -11.088216781616211, -10.491819381713867, -9.895421028137207, -9.299023628234863, -8.702625274658203, -8.10622787475586, -7.509829521179199, -6.913431167602539, -6.317033290863037, -5.720635414123535, -5.124237537384033, -4.527839660644531, -3.931441307067871, -3.335043430328369, -2.738645553588867, -2.142247438430786, -1.545849323272705, -0.9494514465332031, -0.3530534505844116, 0.24334454536437988, 0.8397425413131714, 1.436140537261963, 2.032538414001465, 2.628936529159546, 3.225334644317627, 3.821732521057129, 4.418130397796631, 5.014528274536133, 5.610926628112793, 6.207324504852295, 6.803722381591797, 7.400120735168457, 7.996518611907959, 8.592916488647461, 9.189314842224121, 9.785712242126465, 10.382110595703125, 10.978507995605469, 11.574906349182129, 12.171304702758789, 12.767702102661133, 13.364100456237793, 13.960498809814453, 14.556896209716797, 15.153294563293457, 15.749692916870117, 16.34609031677246, 16.942487716674805, 17.53888702392578, 18.135284423828125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 9.0, 6.0, 8.0, 16.0, 20.0, 19.0, 21.0, 22.0, 26.0, 23.0, 30.0, 41.0, 36.0, 42.0, 48.0, 48.0, 42.0, 49.0, 43.0, 32.0, 37.0, 39.0, 40.0, 29.0, 40.0, 24.0, 34.0, 22.0, 26.0, 19.0, 16.0, 20.0, 17.0, 13.0, 13.0, 3.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.480586051940918, -6.259017467498779, -6.037448406219482, -5.815879821777344, -5.594310760498047, -5.372742176055908, -5.151173114776611, -4.929604530334473, -4.708035469055176, -4.486466884613037, -4.26489782333374, -4.043329238891602, -3.8217601776123047, -3.600191593170166, -3.378622531890869, -3.1570539474487305, -2.9354851245880127, -2.713916301727295, -2.492347478866577, -2.2707786560058594, -2.0492098331451416, -1.8276411294937134, -1.6060723066329956, -1.3845034837722778, -1.16293466091156, -0.9413658380508423, -0.7197970151901245, -0.4982282519340515, -0.27665942907333374, -0.05509066581726074, 0.16647815704345703, 0.3880469799041748, 0.6096158027648926, 0.8311846256256104, 1.0527534484863281, 1.274322271347046, 1.4958910942077637, 1.717459797859192, 1.9390286207199097, 2.160597324371338, 2.3821663856506348, 2.6037352085113525, 2.8253040313720703, 3.046872854232788, 3.268441677093506, 3.4900102615356445, 3.7115793228149414, 3.93314790725708, 4.154716491699219, 4.376285076141357, 4.597854137420654, 4.819422721862793, 5.04099178314209, 5.2625603675842285, 5.484129428863525, 5.705698013305664, 5.927267074584961, 6.1488356590271, 6.3704047203063965, 6.591973304748535, 6.813542366027832, 7.035110950469971, 7.256680011749268, 7.478248596191406, 7.699817657470703]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 5.0, 6.0, 15.0, 9.0, 17.0, 23.0, 26.0, 25.0, 42.0, 84.0, 80.0, 113.0, 164.0, 264.0, 376.0, 535.0, 871.0, 1559.0, 3267.0, 8737.0, 32905.0, 3847217.0, 263781.0, 22978.0, 5919.0, 2298.0, 1127.0, 632.0, 369.0, 265.0, 167.0, 100.0, 83.0, 63.0, 42.0, 26.0, 14.0, 28.0, 12.0, 6.0, 7.0, 4.0, 7.0, 5.0, 5.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0196533203125, -0.01894974708557129, -0.018246173858642578, -0.017542600631713867, -0.016839027404785156, -0.016135454177856445, -0.015431880950927734, -0.014728307723999023, -0.014024734497070312, -0.013321161270141602, -0.01261758804321289, -0.01191401481628418, -0.011210441589355469, -0.010506868362426758, -0.009803295135498047, -0.009099721908569336, -0.008396148681640625, -0.007692575454711914, -0.006989002227783203, -0.006285429000854492, -0.005581855773925781, -0.00487828254699707, -0.004174709320068359, -0.0034711360931396484, -0.0027675628662109375, -0.0020639896392822266, -0.0013604164123535156, -0.0006568431854248047, 4.673004150390625e-05, 0.0007503032684326172, 0.0014538764953613281, 0.002157449722290039, 0.00286102294921875, 0.003564596176147461, 0.004268169403076172, 0.004971742630004883, 0.005675315856933594, 0.006378889083862305, 0.007082462310791016, 0.0077860355377197266, 0.008489608764648438, 0.009193181991577148, 0.00989675521850586, 0.01060032844543457, 0.011303901672363281, 0.012007474899291992, 0.012711048126220703, 0.013414621353149414, 0.014118194580078125, 0.014821767807006836, 0.015525341033935547, 0.016228914260864258, 0.01693248748779297, 0.01763606071472168, 0.01833963394165039, 0.0190432071685791, 0.019746780395507812, 0.020450353622436523, 0.021153926849365234, 0.021857500076293945, 0.022561073303222656, 0.023264646530151367, 0.023968219757080078, 0.02467179298400879, 0.0253753662109375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 4.0, 6.0, 3.0, 8.0, 10.0, 7.0, 12.0, 10.0, 15.0, 13.0, 31.0, 753.0, 22.0, 12.0, 7.0, 14.0, 10.0, 4.0, 6.0, 7.0, 5.0, 4.0, 4.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0014944076538085938, -0.0014466643333435059, -0.001398921012878418, -0.00135117769241333, -0.0013034343719482422, -0.0012556910514831543, -0.0012079477310180664, -0.0011602044105529785, -0.0011124610900878906, -0.0010647177696228027, -0.0010169744491577148, -0.000969231128692627, -0.0009214878082275391, -0.0008737444877624512, -0.0008260011672973633, -0.0007782578468322754, -0.0007305145263671875, -0.0006827712059020996, -0.0006350278854370117, -0.0005872845649719238, -0.0005395412445068359, -0.000491797924041748, -0.00044405460357666016, -0.00039631128311157227, -0.0003485679626464844, -0.0003008246421813965, -0.0002530813217163086, -0.0002053380012512207, -0.0001575946807861328, -0.00010985136032104492, -6.210803985595703e-05, -1.436471939086914e-05, 3.337860107421875e-05, 8.112192153930664e-05, 0.00012886524200439453, 0.00017660856246948242, 0.0002243518829345703, 0.0002720952033996582, 0.0003198385238647461, 0.000367581844329834, 0.0004153251647949219, 0.00046306848526000977, 0.0005108118057250977, 0.0005585551261901855, 0.0006062984466552734, 0.0006540417671203613, 0.0007017850875854492, 0.0007495284080505371, 0.000797271728515625, 0.0008450150489807129, 0.0008927583694458008, 0.0009405016899108887, 0.0009882450103759766, 0.0010359883308410645, 0.0010837316513061523, 0.0011314749717712402, 0.0011792182922363281, 0.001226961612701416, 0.001274704933166504, 0.0013224482536315918, 0.0013701915740966797, 0.0014179348945617676, 0.0014656782150268555, 0.0015134215354919434, 0.0015611648559570312]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 10.0, 6.0, 11.0, 14.0, 21.0, 26.0, 38.0, 49.0, 58.0, 73.0, 118.0, 179.0, 275.0, 421.0, 762.0, 1422.0, 3273.0, 11801.0, 133313.0, 3877668.0, 145607.0, 12274.0, 3382.0, 1412.0, 754.0, 423.0, 252.0, 188.0, 127.0, 91.0, 68.0, 34.0, 30.0, 25.0, 21.0, 14.0, 9.0, 9.0, 3.0, 3.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.024169921875, -0.023448705673217773, -0.022727489471435547, -0.02200627326965332, -0.021285057067871094, -0.020563840866088867, -0.01984262466430664, -0.019121408462524414, -0.018400192260742188, -0.01767897605895996, -0.016957759857177734, -0.016236543655395508, -0.015515327453613281, -0.014794111251831055, -0.014072895050048828, -0.013351678848266602, -0.012630462646484375, -0.011909246444702148, -0.011188030242919922, -0.010466814041137695, -0.009745597839355469, -0.009024381637573242, -0.008303165435791016, -0.007581949234008789, -0.0068607330322265625, -0.006139516830444336, -0.005418300628662109, -0.004697084426879883, -0.003975868225097656, -0.0032546520233154297, -0.002533435821533203, -0.0018122196197509766, -0.00109100341796875, -0.00036978721618652344, 0.0003514289855957031, 0.0010726451873779297, 0.0017938613891601562, 0.002515077590942383, 0.0032362937927246094, 0.003957509994506836, 0.0046787261962890625, 0.005399942398071289, 0.006121158599853516, 0.006842374801635742, 0.007563591003417969, 0.008284807205200195, 0.009006023406982422, 0.009727239608764648, 0.010448455810546875, 0.011169672012329102, 0.011890888214111328, 0.012612104415893555, 0.013333320617675781, 0.014054536819458008, 0.014775753021240234, 0.015496969223022461, 0.016218185424804688, 0.016939401626586914, 0.01766061782836914, 0.018381834030151367, 0.019103050231933594, 0.01982426643371582, 0.020545482635498047, 0.021266698837280273, 0.0219879150390625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 9.0, 9.0, 15.0, 12.0, 22.0, 21.0, 36.0, 32.0, 51.0, 66.0, 104.0, 120.0, 167.0, 193.0, 302.0, 570.0, 967.0, 401.0, 239.0, 183.0, 144.0, 79.0, 69.0, 55.0, 51.0, 29.0, 40.0, 22.0, 10.0, 8.0, 9.0, 10.0, 8.0, 2.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0025920867919921875, -0.0025163888931274414, -0.0024406909942626953, -0.0023649930953979492, -0.002289295196533203, -0.002213597297668457, -0.002137899398803711, -0.002062201499938965, -0.0019865036010742188, -0.0019108057022094727, -0.0018351078033447266, -0.0017594099044799805, -0.0016837120056152344, -0.0016080141067504883, -0.0015323162078857422, -0.001456618309020996, -0.00138092041015625, -0.001305222511291504, -0.0012295246124267578, -0.0011538267135620117, -0.0010781288146972656, -0.0010024309158325195, -0.0009267330169677734, -0.0008510351181030273, -0.0007753372192382812, -0.0006996393203735352, -0.0006239414215087891, -0.000548243522644043, -0.0004725456237792969, -0.0003968477249145508, -0.0003211498260498047, -0.0002454519271850586, -0.0001697540283203125, -9.40561294555664e-05, -1.8358230590820312e-05, 5.733966827392578e-05, 0.00013303756713867188, 0.00020873546600341797, 0.00028443336486816406, 0.00036013126373291016, 0.00043582916259765625, 0.0005115270614624023, 0.0005872249603271484, 0.0006629228591918945, 0.0007386207580566406, 0.0008143186569213867, 0.0008900165557861328, 0.0009657144546508789, 0.001041412353515625, 0.001117110252380371, 0.0011928081512451172, 0.0012685060501098633, 0.0013442039489746094, 0.0014199018478393555, 0.0014955997467041016, 0.0015712976455688477, 0.0016469955444335938, 0.0017226934432983398, 0.001798391342163086, 0.001874089241027832, 0.0019497871398925781, 0.0020254850387573242, 0.0021011829376220703, 0.0021768808364868164, 0.0022525787353515625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 21.0, 24.0, 56.0, 145.0, 251.0, 268.0, 123.0, 55.0, 23.0, 12.0, 5.0, 4.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03887498751282692, -0.03776520863175392, -0.036655426025390625, -0.03554564714431763, -0.03443586453795433, -0.03332608565688133, -0.032216303050518036, -0.031106524169445038, -0.02999674342572689, -0.028886962682008743, -0.027777181938290596, -0.02666740119457245, -0.02555762231349945, -0.024447839707136154, -0.023338060826063156, -0.02222828008234501, -0.02111849933862686, -0.020008718594908714, -0.018898937851190567, -0.01778915710747242, -0.016679376363754272, -0.0155695965513587, -0.014459816738963127, -0.01335003599524498, -0.012240255251526833, -0.011130474507808685, -0.010020693764090538, -0.008910913951694965, -0.007801133207976818, -0.006691352464258671, -0.005581572186201811, -0.004471791908144951, -0.003362007439136505, -0.0022522269282490015, -0.0011424464173614979, -3.2665906473994255e-05, 0.0010771146044135094, 0.0021868953481316566, 0.0032966756261885166, 0.004406455904245377, 0.005516236647963524, 0.006626017391681671, 0.007735797669738531, 0.008845577947795391, 0.009955358691513538, 0.011065139435231686, 0.012174919247627258, 0.013284699991345406, 0.014394480735063553, 0.0155042614787817, 0.016614042222499847, 0.017723822966217995, 0.018833603709936142, 0.01994338259100914, 0.021053163334727287, 0.022162944078445435, 0.023272724822163582, 0.02438250556588173, 0.025492286309599876, 0.026602067053318024, 0.02771184593439102, 0.028821628540754318, 0.029931407421827316, 0.031041188165545464, 0.03215096890926361]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 7.0, 5.0, 4.0, 5.0, 7.0, 5.0, 12.0, 14.0, 10.0, 13.0, 12.0, 40.0, 28.0, 28.0, 47.0, 31.0, 49.0, 45.0, 33.0, 45.0, 54.0, 56.0, 47.0, 56.0, 46.0, 38.0, 39.0, 43.0, 29.0, 24.0, 26.0, 25.0, 17.0, 12.0, 8.0, 7.0, 4.0, 14.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010569870471954346, -0.010247211903333664, -0.009924553334712982, -0.0096018947660923, -0.009279236197471619, -0.008956577628850937, -0.008633919060230255, -0.008311260491609573, -0.007988601922988892, -0.00766594335436821, -0.007343284785747528, -0.007020626217126846, -0.0066979676485061646, -0.006375309079885483, -0.006052650511264801, -0.005729991942644119, -0.0054073333740234375, -0.005084674805402756, -0.004762016236782074, -0.004439357668161392, -0.0041166990995407104, -0.0037940405309200287, -0.003471381962299347, -0.003148723393678665, -0.0028260648250579834, -0.0025034062564373016, -0.00218074768781662, -0.0018580891191959381, -0.0015354305505752563, -0.0012127719819545746, -0.0008901134133338928, -0.0005674548447132111, -0.0002447962760925293, 7.786229252815247e-05, 0.00040052086114883423, 0.000723179429769516, 0.0010458379983901978, 0.0013684965670108795, 0.0016911551356315613, 0.002013813704252243, 0.002336472272872925, 0.0026591308414936066, 0.0029817894101142883, 0.00330444797873497, 0.003627106547355652, 0.003949765115976334, 0.004272423684597015, 0.004595082253217697, 0.004917740821838379, 0.005240399390459061, 0.005563057959079742, 0.005885716527700424, 0.006208375096321106, 0.006531033664941788, 0.0068536922335624695, 0.007176350802183151, 0.007499009370803833, 0.007821667939424515, 0.008144326508045197, 0.008466985076665878, 0.00878964364528656, 0.009112302213907242, 0.009434960782527924, 0.009757619351148605, 0.010080277919769287]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 3.0, 7.0, 12.0, 17.0, 14.0, 24.0, 34.0, 38.0, 58.0, 90.0, 117.0, 147.0, 204.0, 290.0, 390.0, 628.0, 902.0, 1330.0, 2223.0, 3608.0, 6576.0, 13349.0, 35932.0, 873521.0, 71017.0, 17790.0, 8226.0, 4489.0, 2699.0, 1569.0, 988.0, 684.0, 476.0, 319.0, 210.0, 131.0, 112.0, 87.0, 64.0, 45.0, 28.0, 27.0, 23.0, 14.0, 12.0, 7.0, 15.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0169677734375, -0.01643204689025879, -0.015896320343017578, -0.015360593795776367, -0.014824867248535156, -0.014289140701293945, -0.013753414154052734, -0.013217687606811523, -0.012681961059570312, -0.012146234512329102, -0.01161050796508789, -0.01107478141784668, -0.010539054870605469, -0.010003328323364258, -0.009467601776123047, -0.008931875228881836, -0.008396148681640625, -0.007860422134399414, -0.007324695587158203, -0.006788969039916992, -0.006253242492675781, -0.00571751594543457, -0.005181789398193359, -0.0046460628509521484, -0.0041103363037109375, -0.0035746097564697266, -0.0030388832092285156, -0.0025031566619873047, -0.0019674301147460938, -0.0014317035675048828, -0.0008959770202636719, -0.00036025047302246094, 0.00017547607421875, 0.0007112026214599609, 0.0012469291687011719, 0.0017826557159423828, 0.0023183822631835938, 0.0028541088104248047, 0.0033898353576660156, 0.0039255619049072266, 0.0044612884521484375, 0.0049970149993896484, 0.005532741546630859, 0.00606846809387207, 0.006604194641113281, 0.007139921188354492, 0.007675647735595703, 0.008211374282836914, 0.008747100830078125, 0.009282827377319336, 0.009818553924560547, 0.010354280471801758, 0.010890007019042969, 0.01142573356628418, 0.01196146011352539, 0.012497186660766602, 0.013032913208007812, 0.013568639755249023, 0.014104366302490234, 0.014640092849731445, 0.015175819396972656, 0.015711545944213867, 0.016247272491455078, 0.01678299903869629, 0.0173187255859375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 0.0, 7.0, 4.0, 6.0, 8.0, 4.0, 7.0, 7.0, 12.0, 16.0, 29.0, 131.0, 377.0, 245.0, 45.0, 21.0, 14.0, 7.0, 9.0, 5.0, 2.0, 9.0, 4.0, 1.0, 7.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015516281127929688, -0.0015009045600891113, -0.001450181007385254, -0.0013994574546813965, -0.001348733901977539, -0.0012980103492736816, -0.0012472867965698242, -0.0011965632438659668, -0.0011458396911621094, -0.001095116138458252, -0.0010443925857543945, -0.0009936690330505371, -0.0009429454803466797, -0.0008922219276428223, -0.0008414983749389648, -0.0007907748222351074, -0.00074005126953125, -0.0006893277168273926, -0.0006386041641235352, -0.0005878806114196777, -0.0005371570587158203, -0.0004864335060119629, -0.00043570995330810547, -0.00038498640060424805, -0.0003342628479003906, -0.0002835392951965332, -0.00023281574249267578, -0.00018209218978881836, -0.00013136863708496094, -8.064508438110352e-05, -2.9921531677246094e-05, 2.0802021026611328e-05, 7.152557373046875e-05, 0.00012224912643432617, 0.0001729726791381836, 0.00022369623184204102, 0.00027441978454589844, 0.00032514333724975586, 0.0003758668899536133, 0.0004265904426574707, 0.0004773139953613281, 0.0005280375480651855, 0.000578761100769043, 0.0006294846534729004, 0.0006802082061767578, 0.0007309317588806152, 0.0007816553115844727, 0.0008323788642883301, 0.0008831024169921875, 0.0009338259696960449, 0.0009845495223999023, 0.0010352730751037598, 0.0010859966278076172, 0.0011367201805114746, 0.001187443733215332, 0.0012381672859191895, 0.0012888908386230469, 0.0013396143913269043, 0.0013903379440307617, 0.0014410614967346191, 0.0014917850494384766, 0.001542508602142334, 0.0015932321548461914, 0.0016439557075500488, 0.0016946792602539062]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 3.0, 8.0, 9.0, 15.0, 17.0, 18.0, 34.0, 50.0, 48.0, 88.0, 93.0, 164.0, 252.0, 342.0, 531.0, 761.0, 1231.0, 2167.0, 4180.0, 10363.0, 50879.0, 840122.0, 110396.0, 14726.0, 5235.0, 2656.0, 1446.0, 863.0, 535.0, 386.0, 271.0, 187.0, 141.0, 92.0, 67.0, 48.0, 41.0, 25.0, 17.0, 14.0, 10.0, 7.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0266876220703125, -0.025870084762573242, -0.025052547454833984, -0.024235010147094727, -0.02341747283935547, -0.02259993553161621, -0.021782398223876953, -0.020964860916137695, -0.020147323608398438, -0.01932978630065918, -0.018512248992919922, -0.017694711685180664, -0.016877174377441406, -0.01605963706970215, -0.01524209976196289, -0.014424562454223633, -0.013607025146484375, -0.012789487838745117, -0.01197195053100586, -0.011154413223266602, -0.010336875915527344, -0.009519338607788086, -0.008701801300048828, -0.00788426399230957, -0.0070667266845703125, -0.006249189376831055, -0.005431652069091797, -0.004614114761352539, -0.0037965774536132812, -0.0029790401458740234, -0.0021615028381347656, -0.0013439655303955078, -0.00052642822265625, 0.0002911090850830078, 0.0011086463928222656, 0.0019261837005615234, 0.0027437210083007812, 0.003561258316040039, 0.004378795623779297, 0.005196332931518555, 0.0060138702392578125, 0.00683140754699707, 0.007648944854736328, 0.008466482162475586, 0.009284019470214844, 0.010101556777954102, 0.01091909408569336, 0.011736631393432617, 0.012554168701171875, 0.013371706008911133, 0.01418924331665039, 0.015006780624389648, 0.015824317932128906, 0.016641855239868164, 0.017459392547607422, 0.01827692985534668, 0.019094467163085938, 0.019912004470825195, 0.020729541778564453, 0.02154707908630371, 0.02236461639404297, 0.023182153701782227, 0.023999691009521484, 0.024817228317260742, 0.025634765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 6.0, 2.0, 6.0, 11.0, 24.0, 17.0, 24.0, 20.0, 17.0, 35.0, 29.0, 30.0, 35.0, 37.0, 41.0, 40.0, 32.0, 44.0, 27.0, 46.0, 43.0, 45.0, 48.0, 50.0, 37.0, 31.0, 32.0, 27.0, 26.0, 20.0, 10.0, 25.0, 15.0, 11.0, 11.0, 4.0, 7.0, 3.0, 7.0, 1.0, 4.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.006847381591796875, -0.006637156009674072, -0.0064269304275512695, -0.006216704845428467, -0.006006479263305664, -0.005796253681182861, -0.005586028099060059, -0.005375802516937256, -0.005165576934814453, -0.00495535135269165, -0.004745125770568848, -0.004534900188446045, -0.004324674606323242, -0.0041144490242004395, -0.0039042234420776367, -0.003693997859954834, -0.0034837722778320312, -0.0032735466957092285, -0.0030633211135864258, -0.002853095531463623, -0.0026428699493408203, -0.0024326443672180176, -0.002222418785095215, -0.002012193202972412, -0.0018019676208496094, -0.0015917420387268066, -0.001381516456604004, -0.0011712908744812012, -0.0009610652923583984, -0.0007508397102355957, -0.000540614128112793, -0.00033038854598999023, -0.0001201629638671875, 9.006261825561523e-05, 0.00030028820037841797, 0.0005105137825012207, 0.0007207393646240234, 0.0009309649467468262, 0.001141190528869629, 0.0013514161109924316, 0.0015616416931152344, 0.0017718672752380371, 0.00198209285736084, 0.0021923184394836426, 0.0024025440216064453, 0.002612769603729248, 0.0028229951858520508, 0.0030332207679748535, 0.0032434463500976562, 0.003453671932220459, 0.0036638975143432617, 0.0038741230964660645, 0.004084348678588867, 0.00429457426071167, 0.004504799842834473, 0.004715025424957275, 0.004925251007080078, 0.005135476589202881, 0.005345702171325684, 0.005555927753448486, 0.005766153335571289, 0.005976378917694092, 0.0061866044998168945, 0.006396830081939697, 0.0066070556640625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 11.0, 21.0, 33.0, 49.0, 82.0, 126.0, 235.0, 591.0, 1517.0, 6355.0, 153795.0, 872177.0, 10137.0, 2012.0, 735.0, 309.0, 154.0, 78.0, 45.0, 25.0, 27.0, 11.0, 7.0, 7.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038330078125, -0.03720664978027344, -0.036083221435546875, -0.03495979309082031, -0.03383636474609375, -0.03271293640136719, -0.031589508056640625, -0.030466079711914062, -0.0293426513671875, -0.028219223022460938, -0.027095794677734375, -0.025972366333007812, -0.02484893798828125, -0.023725509643554688, -0.022602081298828125, -0.021478652954101562, -0.020355224609375, -0.019231796264648438, -0.018108367919921875, -0.016984939575195312, -0.01586151123046875, -0.014738082885742188, -0.013614654541015625, -0.012491226196289062, -0.0113677978515625, -0.010244369506835938, -0.009120941162109375, -0.007997512817382812, -0.00687408447265625, -0.0057506561279296875, -0.004627227783203125, -0.0035037994384765625, -0.00238037109375, -0.0012569427490234375, -0.000133514404296875, 0.0009899139404296875, 0.00211334228515625, 0.0032367706298828125, 0.004360198974609375, 0.0054836273193359375, 0.0066070556640625, 0.0077304840087890625, 0.008853912353515625, 0.009977340698242188, 0.01110076904296875, 0.012224197387695312, 0.013347625732421875, 0.014471054077148438, 0.015594482421875, 0.016717910766601562, 0.017841339111328125, 0.018964767456054688, 0.02008819580078125, 0.021211624145507812, 0.022335052490234375, 0.023458480834960938, 0.0245819091796875, 0.025705337524414062, 0.026828765869140625, 0.027952194213867188, 0.02907562255859375, 0.030199050903320312, 0.031322479248046875, 0.03244590759277344, 0.0335693359375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 4.0, 8.0, 2.0, 9.0, 6.0, 18.0, 15.0, 30.0, 24.0, 34.0, 38.0, 54.0, 80.0, 148.0, 154.0, 83.0, 63.0, 50.0, 45.0, 30.0, 21.0, 21.0, 8.0, 15.0, 9.0, 4.0, 7.0, 0.0, 3.0, 5.0, 3.0, 1.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003353118896484375, -0.0032486021518707275, -0.00314408540725708, -0.0030395686626434326, -0.002935051918029785, -0.0028305351734161377, -0.0027260184288024902, -0.0026215016841888428, -0.0025169849395751953, -0.002412468194961548, -0.0023079514503479004, -0.002203434705734253, -0.0020989179611206055, -0.001994401216506958, -0.0018898844718933105, -0.001785367727279663, -0.0016808509826660156, -0.0015763342380523682, -0.0014718174934387207, -0.0013673007488250732, -0.0012627840042114258, -0.0011582672595977783, -0.0010537505149841309, -0.0009492337703704834, -0.0008447170257568359, -0.0007402002811431885, -0.000635683536529541, -0.0005311667919158936, -0.0004266500473022461, -0.00032213330268859863, -0.00021761655807495117, -0.00011309981346130371, -8.58306884765625e-06, 9.593367576599121e-05, 0.00020045042037963867, 0.00030496716499328613, 0.0004094839096069336, 0.0005140006542205811, 0.0006185173988342285, 0.000723034143447876, 0.0008275508880615234, 0.0009320676326751709, 0.0010365843772888184, 0.0011411011219024658, 0.0012456178665161133, 0.0013501346111297607, 0.0014546513557434082, 0.0015591681003570557, 0.0016636848449707031, 0.0017682015895843506, 0.001872718334197998, 0.0019772350788116455, 0.002081751823425293, 0.0021862685680389404, 0.002290785312652588, 0.0023953020572662354, 0.002499818801879883, 0.0026043355464935303, 0.0027088522911071777, 0.002813369035720825, 0.0029178857803344727, 0.00302240252494812, 0.0031269192695617676, 0.003231436014175415, 0.0033359527587890625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 13.0, 25.0, 28.0, 35.0, 58.0, 83.0, 104.0, 178.0, 455.0, 806.0, 2521.0, 12330.0, 904569.0, 116749.0, 7190.0, 1893.0, 641.0, 331.0, 179.0, 119.0, 78.0, 38.0, 24.0, 14.0, 19.0, 15.0, 21.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.039581298828125, -0.03805065155029297, -0.03652000427246094, -0.034989356994628906, -0.033458709716796875, -0.031928062438964844, -0.030397415161132812, -0.02886676788330078, -0.02733612060546875, -0.02580547332763672, -0.024274826049804688, -0.022744178771972656, -0.021213531494140625, -0.019682884216308594, -0.018152236938476562, -0.01662158966064453, -0.0150909423828125, -0.013560295104980469, -0.012029647827148438, -0.010499000549316406, -0.008968353271484375, -0.007437705993652344, -0.0059070587158203125, -0.004376411437988281, -0.00284576416015625, -0.0013151168823242188, 0.0002155303955078125, 0.0017461776733398438, 0.003276824951171875, 0.004807472229003906, 0.0063381195068359375, 0.007868766784667969, 0.0093994140625, 0.010930061340332031, 0.012460708618164062, 0.013991355895996094, 0.015522003173828125, 0.017052650451660156, 0.018583297729492188, 0.02011394500732422, 0.02164459228515625, 0.02317523956298828, 0.024705886840820312, 0.026236534118652344, 0.027767181396484375, 0.029297828674316406, 0.030828475952148438, 0.03235912322998047, 0.0338897705078125, 0.03542041778564453, 0.03695106506347656, 0.038481712341308594, 0.040012359619140625, 0.041543006896972656, 0.04307365417480469, 0.04460430145263672, 0.04613494873046875, 0.04766559600830078, 0.04919624328613281, 0.050726890563964844, 0.052257537841796875, 0.053788185119628906, 0.05531883239746094, 0.05684947967529297, 0.058380126953125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 5.0, 8.0, 8.0, 9.0, 18.0, 20.0, 42.0, 152.0, 334.0, 206.0, 78.0, 29.0, 22.0, 16.0, 13.0, 14.0, 5.0, 8.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0271453857421875, -0.026406288146972656, -0.025667190551757812, -0.02492809295654297, -0.024188995361328125, -0.02344989776611328, -0.022710800170898438, -0.021971702575683594, -0.02123260498046875, -0.020493507385253906, -0.019754409790039062, -0.01901531219482422, -0.018276214599609375, -0.01753711700439453, -0.016798019409179688, -0.016058921813964844, -0.01531982421875, -0.014580726623535156, -0.013841629028320312, -0.013102531433105469, -0.012363433837890625, -0.011624336242675781, -0.010885238647460938, -0.010146141052246094, -0.00940704345703125, -0.008667945861816406, -0.007928848266601562, -0.007189750671386719, -0.006450653076171875, -0.005711555480957031, -0.0049724578857421875, -0.004233360290527344, -0.0034942626953125, -0.0027551651000976562, -0.0020160675048828125, -0.0012769699096679688, -0.000537872314453125, 0.00020122528076171875, 0.0009403228759765625, 0.0016794204711914062, 0.00241851806640625, 0.0031576156616210938, 0.0038967132568359375, 0.004635810852050781, 0.005374908447265625, 0.006114006042480469, 0.0068531036376953125, 0.007592201232910156, 0.008331298828125, 0.009070396423339844, 0.009809494018554688, 0.010548591613769531, 0.011287689208984375, 0.012026786804199219, 0.012765884399414062, 0.013504981994628906, 0.01424407958984375, 0.014983177185058594, 0.015722274780273438, 0.01646137237548828, 0.017200469970703125, 0.01793956756591797, 0.018678665161132812, 0.019417762756347656, 0.0201568603515625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 26.0, 59.0, 207.0, 542.0, 93.0, 22.0, 12.0, 5.0, 4.0, 0.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.38651442527770996, -0.3774142563343048, -0.36831408739089966, -0.3592139184474945, -0.35011374950408936, -0.3410135805606842, -0.33191341161727905, -0.3228132426738739, -0.31371307373046875, -0.3046129047870636, -0.29551273584365845, -0.2864125669002533, -0.27731239795684814, -0.268212229013443, -0.25911206007003784, -0.2500118911266327, -0.24091173708438873, -0.23181156814098358, -0.22271139919757843, -0.21361123025417328, -0.20451106131076813, -0.19541089236736298, -0.18631073832511902, -0.17721056938171387, -0.16811040043830872, -0.15901023149490356, -0.1499100625514984, -0.14080989360809326, -0.1317097246646881, -0.12260955572128296, -0.1135093942284584, -0.10440922528505325, -0.0953090488910675, -0.08620887994766235, -0.0771087110042572, -0.06800854206085205, -0.0589083768427372, -0.049808207899332047, -0.040708042681217194, -0.03160787373781204, -0.02250770479440689, -0.013407536782324314, -0.004307368770241737, 0.004792798310518265, 0.013892967253923416, 0.022993136197328568, 0.03209330141544342, 0.04119347035884857, 0.05029363930225372, 0.059393808245658875, 0.06849397718906403, 0.07759414613246918, 0.08669431507587433, 0.09579448401927948, 0.10489464551210403, 0.11399481445550919, 0.12309498339891434, 0.1321951448917389, 0.14129531383514404, 0.1503954827785492, 0.15949565172195435, 0.1685958206653595, 0.17769598960876465, 0.1867961585521698, 0.19589632749557495]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 9.0, 2.0, 4.0, 7.0, 9.0, 7.0, 17.0, 21.0, 33.0, 59.0, 73.0, 107.0, 105.0, 139.0, 118.0, 65.0, 72.0, 20.0, 38.0, 17.0, 11.0, 9.0, 12.0, 4.0, 9.0, 9.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.12486505508422852, -0.12102162837982178, -0.11717820912599564, -0.1133347824215889, -0.10949136316776276, -0.10564793646335602, -0.10180450975894928, -0.09796108305454254, -0.0941176638007164, -0.09027423709630966, -0.08643081784248352, -0.08258739113807678, -0.07874396443367004, -0.0749005451798439, -0.07105711847543716, -0.06721369922161102, -0.06337027251720428, -0.059526849538087845, -0.055683426558971405, -0.05183999985456467, -0.04799657687544823, -0.04415315389633179, -0.04030972719192505, -0.03646630421280861, -0.03262288123369217, -0.02877945825457573, -0.02493603341281414, -0.02109260857105255, -0.01724918559193611, -0.013405762612819672, -0.009562337771058083, -0.0057189129292964935, -0.0018754899501800537, 0.0019679339602589607, 0.005811357870697975, 0.00965478178113699, 0.013498205691576004, 0.017341628670692444, 0.021185053512454033, 0.025028478354215622, 0.028871901333332062, 0.0327153243124485, 0.03655874729156494, 0.04040217399597168, 0.04424559697508812, 0.04808901995420456, 0.0519324466586113, 0.05577586963772774, 0.05961929261684418, 0.06346271932125092, 0.06730613857507706, 0.0711495652794838, 0.07499298453330994, 0.07883641123771667, 0.08267983794212341, 0.08652326464653015, 0.09036668390035629, 0.09421011060476303, 0.09805352985858917, 0.10189695656299591, 0.10574038326740265, 0.10958380252122879, 0.11342722922563553, 0.11727064847946167, 0.12111407518386841]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 8.0, 7.0, 9.0, 10.0, 17.0, 19.0, 21.0, 26.0, 47.0, 169.0, 2220.0, 4129894.0, 60744.0, 791.0, 112.0, 47.0, 37.0, 17.0, 18.0, 21.0, 8.0, 3.0, 5.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03515625, -1.962127685546875, -1.88909912109375, -1.816070556640625, -1.7430419921875, -1.670013427734375, -1.59698486328125, -1.523956298828125, -1.450927734375, -1.377899169921875, -1.30487060546875, -1.231842041015625, -1.1588134765625, -1.085784912109375, -1.01275634765625, -0.939727783203125, -0.86669921875, -0.793670654296875, -0.72064208984375, -0.647613525390625, -0.5745849609375, -0.501556396484375, -0.42852783203125, -0.355499267578125, -0.282470703125, -0.209442138671875, -0.13641357421875, -0.063385009765625, 0.0096435546875, 0.082672119140625, 0.15570068359375, 0.228729248046875, 0.3017578125, 0.374786376953125, 0.44781494140625, 0.520843505859375, 0.5938720703125, 0.666900634765625, 0.73992919921875, 0.812957763671875, 0.885986328125, 0.959014892578125, 1.03204345703125, 1.105072021484375, 1.1781005859375, 1.251129150390625, 1.32415771484375, 1.397186279296875, 1.47021484375, 1.543243408203125, 1.61627197265625, 1.689300537109375, 1.7623291015625, 1.835357666015625, 1.90838623046875, 1.981414794921875, 2.054443359375, 2.127471923828125, 2.20050048828125, 2.273529052734375, 2.3465576171875, 2.419586181640625, 2.49261474609375, 2.565643310546875, 2.638671875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 5.0, 5.0, 2.0, 0.0, 6.0, 6.0, 7.0, 5.0, 4.0, 15.0, 17.0, 30.0, 54.0, 124.0, 178.0, 217.0, 109.0, 71.0, 46.0, 18.0, 17.0, 5.0, 7.0, 7.0, 3.0, 4.0, 6.0, 2.0, 4.0, 3.0, 2.0, 6.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010204315185546875, -0.0009855031967163086, -0.0009505748748779297, -0.0009156465530395508, -0.0008807182312011719, -0.000845789909362793, -0.0008108615875244141, -0.0007759332656860352, -0.0007410049438476562, -0.0007060766220092773, -0.0006711483001708984, -0.0006362199783325195, -0.0006012916564941406, -0.0005663633346557617, -0.0005314350128173828, -0.0004965066909790039, -0.000461578369140625, -0.0004266500473022461, -0.0003917217254638672, -0.0003567934036254883, -0.0003218650817871094, -0.00028693675994873047, -0.00025200843811035156, -0.00021708011627197266, -0.00018215179443359375, -0.00014722347259521484, -0.00011229515075683594, -7.736682891845703e-05, -4.2438507080078125e-05, -7.510185241699219e-06, 2.7418136596679688e-05, 6.23464584350586e-05, 9.72747802734375e-05, 0.0001322031021118164, 0.0001671314239501953, 0.00020205974578857422, 0.00023698806762695312, 0.00027191638946533203, 0.00030684471130371094, 0.00034177303314208984, 0.00037670135498046875, 0.00041162967681884766, 0.00044655799865722656, 0.00048148632049560547, 0.0005164146423339844, 0.0005513429641723633, 0.0005862712860107422, 0.0006211996078491211, 0.0006561279296875, 0.0006910562515258789, 0.0007259845733642578, 0.0007609128952026367, 0.0007958412170410156, 0.0008307695388793945, 0.0008656978607177734, 0.0009006261825561523, 0.0009355545043945312, 0.0009704828262329102, 0.001005411148071289, 0.001040339469909668, 0.0010752677917480469, 0.0011101961135864258, 0.0011451244354248047, 0.0011800527572631836, 0.0012149810791015625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 9.0, 8.0, 16.0, 21.0, 22.0, 29.0, 42.0, 54.0, 72.0, 85.0, 133.0, 201.0, 2060.0, 4170460.0, 19588.0, 565.0, 182.0, 139.0, 124.0, 86.0, 78.0, 63.0, 55.0, 46.0, 36.0, 28.0, 19.0, 17.0, 9.0, 4.0, 9.0, 5.0, 3.0, 1.0, 6.0, 1.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3271484375, -0.31390380859375, -0.3006591796875, -0.28741455078125, -0.274169921875, -0.26092529296875, -0.2476806640625, -0.23443603515625, -0.22119140625, -0.20794677734375, -0.1947021484375, -0.18145751953125, -0.168212890625, -0.15496826171875, -0.1417236328125, -0.12847900390625, -0.115234375, -0.10198974609375, -0.0887451171875, -0.07550048828125, -0.062255859375, -0.04901123046875, -0.0357666015625, -0.02252197265625, -0.00927734375, 0.00396728515625, 0.0172119140625, 0.03045654296875, 0.043701171875, 0.05694580078125, 0.0701904296875, 0.08343505859375, 0.0966796875, 0.10992431640625, 0.1231689453125, 0.13641357421875, 0.149658203125, 0.16290283203125, 0.1761474609375, 0.18939208984375, 0.20263671875, 0.21588134765625, 0.2291259765625, 0.24237060546875, 0.255615234375, 0.26885986328125, 0.2821044921875, 0.29534912109375, 0.30859375, 0.32183837890625, 0.3350830078125, 0.34832763671875, 0.361572265625, 0.37481689453125, 0.3880615234375, 0.40130615234375, 0.41455078125, 0.42779541015625, 0.4410400390625, 0.45428466796875, 0.467529296875, 0.48077392578125, 0.4940185546875, 0.50726318359375, 0.5205078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 11.0, 13.0, 19.0, 28.0, 30.0, 45.0, 72.0, 81.0, 106.0, 150.0, 220.0, 289.0, 1346.0, 479.0, 242.0, 168.0, 143.0, 118.0, 97.0, 78.0, 68.0, 59.0, 47.0, 37.0, 29.0, 25.0, 12.0, 9.0, 8.0, 9.0, 5.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002529144287109375, -0.0024268031120300293, -0.0023244619369506836, -0.002222120761871338, -0.002119779586791992, -0.0020174384117126465, -0.0019150972366333008, -0.001812756061553955, -0.0017104148864746094, -0.0016080737113952637, -0.001505732536315918, -0.0014033913612365723, -0.0013010501861572266, -0.0011987090110778809, -0.0010963678359985352, -0.0009940266609191895, -0.0008916854858398438, -0.000789344310760498, -0.0006870031356811523, -0.0005846619606018066, -0.00048232078552246094, -0.00037997961044311523, -0.00027763843536376953, -0.00017529726028442383, -7.295608520507812e-05, 2.9385089874267578e-05, 0.00013172626495361328, 0.00023406744003295898, 0.0003364086151123047, 0.0004387497901916504, 0.0005410909652709961, 0.0006434321403503418, 0.0007457733154296875, 0.0008481144905090332, 0.0009504556655883789, 0.0010527968406677246, 0.0011551380157470703, 0.001257479190826416, 0.0013598203659057617, 0.0014621615409851074, 0.0015645027160644531, 0.0016668438911437988, 0.0017691850662231445, 0.0018715262413024902, 0.001973867416381836, 0.0020762085914611816, 0.0021785497665405273, 0.002280890941619873, 0.0023832321166992188, 0.0024855732917785645, 0.00258791446685791, 0.002690255641937256, 0.0027925968170166016, 0.0028949379920959473, 0.002997279167175293, 0.0030996203422546387, 0.0032019615173339844, 0.00330430269241333, 0.0034066438674926758, 0.0035089850425720215, 0.003611326217651367, 0.003713667392730713, 0.0038160085678100586, 0.003918349742889404, 0.00402069091796875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 4.0, 734.0, 249.0, 25.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09924425184726715, -0.06409721076488495, -0.028950177133083344, 0.006196856498718262, 0.041343897581100464, 0.07649093866348267, 0.11163796484470367, 0.14678500592708588, 0.18193204700946808, 0.21707908809185028, 0.2522261142730713, 0.2873731553554535, 0.3225201964378357, 0.3576672375202179, 0.3928142786026001, 0.4279612898826599, 0.4631083607673645, 0.4982554018497467, 0.5334024429321289, 0.5685494542121887, 0.6036965250968933, 0.6388435363769531, 0.6739906072616577, 0.7091376185417175, 0.7442846298217773, 0.7794316411018372, 0.8145787119865417, 0.8497257232666016, 0.8848727941513062, 0.920019805431366, 0.9551668167114258, 0.9903138875961304, 1.0254608392715454, 1.06060791015625, 1.095754861831665, 1.1309019327163696, 1.1660490036010742, 1.2011960744857788, 1.2363430261611938, 1.2714900970458984, 1.306637167930603, 1.3417842388153076, 1.3769311904907227, 1.4120782613754272, 1.4472253322601318, 1.4823724031448364, 1.5175193548202515, 1.552666425704956, 1.587813377380371, 1.6229604482650757, 1.6581073999404907, 1.6932544708251953, 1.7284015417099, 1.7635486125946045, 1.7986955642700195, 1.8338426351547241, 1.8689897060394287, 1.9041367769241333, 1.9392837285995483, 1.974430799484253, 2.009577751159668, 2.044724941253662, 2.079871892929077, 2.115018844604492, 2.1501660346984863]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 4.0, 11.0, 12.0, 16.0, 14.0, 36.0, 46.0, 65.0, 84.0, 106.0, 100.0, 121.0, 92.0, 82.0, 69.0, 56.0, 39.0, 17.0, 11.0, 5.0, 11.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0771322250366211, -0.07387250661849976, -0.07061278820037842, -0.06735306978225708, -0.06409335136413574, -0.060833629220724106, -0.05757390707731247, -0.05431418865919113, -0.051054470241069794, -0.047794751822948456, -0.04453503340482712, -0.04127531126141548, -0.038015592843294144, -0.034755874425172806, -0.03149615228176117, -0.02823643386363983, -0.024976715445518494, -0.021716997027397156, -0.01845727674663067, -0.015197557397186756, -0.011937838047742844, -0.008678119629621506, -0.005418399348855019, -0.0021586790680885315, 0.0011010393500328064, 0.004360758699476719, 0.007620478048920631, 0.010880197398364544, 0.014139916747808456, 0.017399635165929794, 0.02065935544669628, 0.02391907572746277, 0.027178794145584106, 0.030438512563705444, 0.03369823098182678, 0.03695795312523842, 0.040217671543359756, 0.043477389961481094, 0.04673711210489273, 0.04999683052301407, 0.053256548941135406, 0.056516267359256744, 0.05977598577737808, 0.06303570419549942, 0.06629543006420135, 0.06955514848232269, 0.07281486690044403, 0.07607458531856537, 0.0793343037366867, 0.08259402215480804, 0.08585374057292938, 0.08911345899105072, 0.09237317740917206, 0.0956328958272934, 0.09889262169599533, 0.10215234011411667, 0.105412058532238, 0.10867177695035934, 0.11193149536848068, 0.11519121378660202, 0.11845093965530396, 0.12171065807342529, 0.12497037649154663, 0.12823009490966797, 0.1314898133277893]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 2.0, 9.0, 8.0, 13.0, 14.0, 27.0, 28.0, 28.0, 52.0, 76.0, 92.0, 107.0, 196.0, 235.0, 315.0, 458.0, 673.0, 990.0, 1485.0, 2446.0, 4091.0, 7072.0, 14600.0, 48956.0, 818299.0, 106689.0, 19515.0, 8881.0, 4802.0, 2794.0, 1767.0, 1146.0, 750.0, 505.0, 413.0, 253.0, 192.0, 155.0, 113.0, 67.0, 70.0, 51.0, 31.0, 18.0, 17.0, 22.0, 10.0, 9.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0219268798828125, -0.0212554931640625, -0.0205841064453125, -0.0199127197265625, -0.0192413330078125, -0.0185699462890625, -0.0178985595703125, -0.0172271728515625, -0.0165557861328125, -0.0158843994140625, -0.0152130126953125, -0.0145416259765625, -0.0138702392578125, -0.0131988525390625, -0.0125274658203125, -0.0118560791015625, -0.0111846923828125, -0.0105133056640625, -0.0098419189453125, -0.0091705322265625, -0.0084991455078125, -0.0078277587890625, -0.0071563720703125, -0.0064849853515625, -0.0058135986328125, -0.0051422119140625, -0.0044708251953125, -0.0037994384765625, -0.0031280517578125, -0.0024566650390625, -0.0017852783203125, -0.0011138916015625, -0.0004425048828125, 0.0002288818359375, 0.0009002685546875, 0.0015716552734375, 0.0022430419921875, 0.0029144287109375, 0.0035858154296875, 0.0042572021484375, 0.0049285888671875, 0.0055999755859375, 0.0062713623046875, 0.0069427490234375, 0.0076141357421875, 0.0082855224609375, 0.0089569091796875, 0.0096282958984375, 0.0102996826171875, 0.0109710693359375, 0.0116424560546875, 0.0123138427734375, 0.0129852294921875, 0.0136566162109375, 0.0143280029296875, 0.0149993896484375, 0.0156707763671875, 0.0163421630859375, 0.0170135498046875, 0.0176849365234375, 0.0183563232421875, 0.0190277099609375, 0.0196990966796875, 0.0203704833984375, 0.0210418701171875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 3.0, 5.0, 7.0, 8.0, 8.0, 8.0, 11.0, 18.0, 33.0, 67.0, 130.0, 213.0, 200.0, 114.0, 55.0, 25.0, 11.0, 10.0, 6.0, 10.0, 5.0, 5.0, 4.0, 5.0, 6.0, 4.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011262893676757812, -0.0010872185230255127, -0.0010481476783752441, -0.0010090768337249756, -0.000970005989074707, -0.0009309351444244385, -0.0008918642997741699, -0.0008527934551239014, -0.0008137226104736328, -0.0007746517658233643, -0.0007355809211730957, -0.0006965100765228271, -0.0006574392318725586, -0.00061836838722229, -0.0005792975425720215, -0.0005402266979217529, -0.0005011558532714844, -0.0004620850086212158, -0.00042301416397094727, -0.0003839433193206787, -0.00034487247467041016, -0.0003058016300201416, -0.00026673078536987305, -0.0002276599407196045, -0.00018858909606933594, -0.00014951825141906738, -0.00011044740676879883, -7.137656211853027e-05, -3.230571746826172e-05, 6.765127182006836e-06, 4.583597183227539e-05, 8.490681648254395e-05, 0.0001239776611328125, 0.00016304850578308105, 0.0002021193504333496, 0.00024119019508361816, 0.0002802610397338867, 0.0003193318843841553, 0.00035840272903442383, 0.0003974735736846924, 0.00043654441833496094, 0.0004756152629852295, 0.000514686107635498, 0.0005537569522857666, 0.0005928277969360352, 0.0006318986415863037, 0.0006709694862365723, 0.0007100403308868408, 0.0007491111755371094, 0.0007881820201873779, 0.0008272528648376465, 0.000866323709487915, 0.0009053945541381836, 0.0009444653987884521, 0.0009835362434387207, 0.0010226070880889893, 0.0010616779327392578, 0.0011007487773895264, 0.001139819622039795, 0.0011788904666900635, 0.001217961311340332, 0.0012570321559906006, 0.0012961030006408691, 0.0013351738452911377, 0.0013742446899414062]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 1.0, 5.0, 1.0, 5.0, 2.0, 5.0, 2.0, 4.0, 6.0, 9.0, 6.0, 12.0, 16.0, 16.0, 16.0, 11.0, 13.0, 23.0, 24.0, 30.0, 35.0, 39.0, 40.0, 122.0, 627.0, 4079.0, 196423.0, 838584.0, 7055.0, 855.0, 176.0, 59.0, 34.0, 33.0, 25.0, 20.0, 17.0, 24.0, 11.0, 17.0, 13.0, 8.0, 12.0, 6.0, 8.0, 5.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.05023193359375, -0.04856395721435547, -0.04689598083496094, -0.045228004455566406, -0.043560028076171875, -0.041892051696777344, -0.04022407531738281, -0.03855609893798828, -0.03688812255859375, -0.03522014617919922, -0.03355216979980469, -0.031884193420410156, -0.030216217041015625, -0.028548240661621094, -0.026880264282226562, -0.02521228790283203, -0.0235443115234375, -0.02187633514404297, -0.020208358764648438, -0.018540382385253906, -0.016872406005859375, -0.015204429626464844, -0.013536453247070312, -0.011868476867675781, -0.01020050048828125, -0.008532524108886719, -0.0068645477294921875, -0.005196571350097656, -0.003528594970703125, -0.0018606185913085938, -0.0001926422119140625, 0.0014753341674804688, 0.003143310546875, 0.004811286926269531, 0.0064792633056640625, 0.008147239685058594, 0.009815216064453125, 0.011483192443847656, 0.013151168823242188, 0.014819145202636719, 0.01648712158203125, 0.01815509796142578, 0.019823074340820312, 0.021491050720214844, 0.023159027099609375, 0.024827003479003906, 0.026494979858398438, 0.02816295623779297, 0.0298309326171875, 0.03149890899658203, 0.03316688537597656, 0.034834861755371094, 0.036502838134765625, 0.038170814514160156, 0.03983879089355469, 0.04150676727294922, 0.04317474365234375, 0.04484272003173828, 0.04651069641113281, 0.048178672790527344, 0.049846649169921875, 0.051514625549316406, 0.05318260192871094, 0.05485057830810547, 0.0565185546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 6.0, 8.0, 11.0, 11.0, 11.0, 18.0, 20.0, 15.0, 19.0, 28.0, 31.0, 24.0, 20.0, 27.0, 29.0, 31.0, 38.0, 36.0, 36.0, 35.0, 42.0, 32.0, 41.0, 38.0, 41.0, 49.0, 34.0, 30.0, 30.0, 22.0, 30.0, 22.0, 22.0, 18.0, 21.0, 4.0, 9.0, 9.0, 8.0, 13.0, 7.0, 9.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.004161834716796875, -0.004039019346237183, -0.00391620397567749, -0.003793388605117798, -0.0036705732345581055, -0.003547757863998413, -0.0034249424934387207, -0.0033021271228790283, -0.003179311752319336, -0.0030564963817596436, -0.002933681011199951, -0.002810865640640259, -0.0026880502700805664, -0.002565234899520874, -0.0024424195289611816, -0.0023196041584014893, -0.002196788787841797, -0.0020739734172821045, -0.0019511580467224121, -0.0018283426761627197, -0.0017055273056030273, -0.001582711935043335, -0.0014598965644836426, -0.0013370811939239502, -0.0012142658233642578, -0.0010914504528045654, -0.000968635082244873, -0.0008458197116851807, -0.0007230043411254883, -0.0006001889705657959, -0.0004773736000061035, -0.00035455822944641113, -0.00023174285888671875, -0.00010892748832702637, 1.3887882232666016e-05, 0.0001367032527923584, 0.0002595186233520508, 0.00038233399391174316, 0.0005051493644714355, 0.0006279647350311279, 0.0007507801055908203, 0.0008735954761505127, 0.000996410846710205, 0.0011192262172698975, 0.0012420415878295898, 0.0013648569583892822, 0.0014876723289489746, 0.001610487699508667, 0.0017333030700683594, 0.0018561184406280518, 0.001978933811187744, 0.0021017491817474365, 0.002224564552307129, 0.0023473799228668213, 0.0024701952934265137, 0.002593010663986206, 0.0027158260345458984, 0.002838641405105591, 0.002961456775665283, 0.0030842721462249756, 0.003207087516784668, 0.0033299028873443604, 0.0034527182579040527, 0.003575533628463745, 0.0036983489990234375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 10.0, 10.0, 17.0, 30.0, 29.0, 59.0, 140.0, 508.0, 2911.0, 123239.0, 915083.0, 5427.0, 684.0, 215.0, 77.0, 35.0, 22.0, 10.0, 15.0, 9.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038360595703125, -0.03694629669189453, -0.03553199768066406, -0.034117698669433594, -0.032703399658203125, -0.031289100646972656, -0.029874801635742188, -0.02846050262451172, -0.02704620361328125, -0.02563190460205078, -0.024217605590820312, -0.022803306579589844, -0.021389007568359375, -0.019974708557128906, -0.018560409545898438, -0.01714611053466797, -0.0157318115234375, -0.014317512512207031, -0.012903213500976562, -0.011488914489746094, -0.010074615478515625, -0.008660316467285156, -0.0072460174560546875, -0.005831718444824219, -0.00441741943359375, -0.0030031204223632812, -0.0015888214111328125, -0.00017452239990234375, 0.001239776611328125, 0.0026540756225585938, 0.0040683746337890625, 0.005482673645019531, 0.00689697265625, 0.008311271667480469, 0.009725570678710938, 0.011139869689941406, 0.012554168701171875, 0.013968467712402344, 0.015382766723632812, 0.01679706573486328, 0.01821136474609375, 0.01962566375732422, 0.021039962768554688, 0.022454261779785156, 0.023868560791015625, 0.025282859802246094, 0.026697158813476562, 0.02811145782470703, 0.0295257568359375, 0.03094005584716797, 0.03235435485839844, 0.033768653869628906, 0.035182952880859375, 0.036597251892089844, 0.03801155090332031, 0.03942584991455078, 0.04084014892578125, 0.04225444793701172, 0.04366874694824219, 0.045083045959472656, 0.046497344970703125, 0.047911643981933594, 0.04932594299316406, 0.05074024200439453, 0.052154541015625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 5.0, 4.0, 6.0, 5.0, 4.0, 6.0, 3.0, 4.0, 10.0, 8.0, 18.0, 16.0, 27.0, 56.0, 158.0, 359.0, 162.0, 52.0, 18.0, 16.0, 11.0, 14.0, 8.0, 11.0, 2.0, 5.0, 3.0, 3.0, 5.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009007453918457031, -0.0008607730269432068, -0.0008208006620407104, -0.0007808282971382141, -0.0007408559322357178, -0.0007008835673332214, -0.0006609112024307251, -0.0006209388375282288, -0.0005809664726257324, -0.0005409941077232361, -0.0005010217428207397, -0.0004610493779182434, -0.00042107701301574707, -0.00038110464811325073, -0.0003411322832107544, -0.00030115991830825806, -0.0002611875534057617, -0.00022121518850326538, -0.00018124282360076904, -0.0001412704586982727, -0.00010129809379577637, -6.132572889328003e-05, -2.135336399078369e-05, 1.8619000911712646e-05, 5.8591365814208984e-05, 9.856373071670532e-05, 0.00013853609561920166, 0.000178508460521698, 0.00021848082542419434, 0.0002584531903266907, 0.000298425555229187, 0.00033839792013168335, 0.0003783702850341797, 0.000418342649936676, 0.00045831501483917236, 0.0004982873797416687, 0.000538259744644165, 0.0005782321095466614, 0.0006182044744491577, 0.000658176839351654, 0.0006981492042541504, 0.0007381215691566467, 0.0007780939340591431, 0.0008180662989616394, 0.0008580386638641357, 0.0008980110287666321, 0.0009379833936691284, 0.0009779557585716248, 0.001017928123474121, 0.0010579004883766174, 0.0010978728532791138, 0.00113784521818161, 0.0011778175830841064, 0.0012177899479866028, 0.0012577623128890991, 0.0012977346777915955, 0.0013377070426940918, 0.0013776794075965881, 0.0014176517724990845, 0.0014576241374015808, 0.0014975965023040771, 0.0015375688672065735, 0.0015775412321090698, 0.0016175135970115662, 0.0016574859619140625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 3.0, 8.0, 13.0, 9.0, 23.0, 24.0, 51.0, 126.0, 473.0, 3267.0, 823387.0, 218284.0, 2304.0, 339.0, 117.0, 50.0, 27.0, 22.0, 7.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031158447265625, -0.02973794937133789, -0.02831745147705078, -0.026896953582763672, -0.025476455688476562, -0.024055957794189453, -0.022635459899902344, -0.021214962005615234, -0.019794464111328125, -0.018373966217041016, -0.016953468322753906, -0.015532970428466797, -0.014112472534179688, -0.012691974639892578, -0.011271476745605469, -0.00985097885131836, -0.00843048095703125, -0.007009983062744141, -0.005589485168457031, -0.004168987274169922, -0.0027484893798828125, -0.0013279914855957031, 9.250640869140625e-05, 0.0015130043029785156, 0.002933502197265625, 0.004354000091552734, 0.005774497985839844, 0.007194995880126953, 0.008615493774414062, 0.010035991668701172, 0.011456489562988281, 0.01287698745727539, 0.0142974853515625, 0.01571798324584961, 0.01713848114013672, 0.018558979034423828, 0.019979476928710938, 0.021399974822998047, 0.022820472717285156, 0.024240970611572266, 0.025661468505859375, 0.027081966400146484, 0.028502464294433594, 0.029922962188720703, 0.03134346008300781, 0.03276395797729492, 0.03418445587158203, 0.03560495376586914, 0.03702545166015625, 0.03844594955444336, 0.03986644744873047, 0.04128694534301758, 0.04270744323730469, 0.0441279411315918, 0.045548439025878906, 0.046968936920166016, 0.048389434814453125, 0.049809932708740234, 0.051230430603027344, 0.05265092849731445, 0.05407142639160156, 0.05549192428588867, 0.05691242218017578, 0.05833292007446289, 0.05975341796875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 8.0, 16.0, 18.0, 18.0, 34.0, 36.0, 68.0, 71.0, 121.0, 164.0, 124.0, 102.0, 54.0, 37.0, 26.0, 22.0, 20.0, 8.0, 6.0, 9.0, 4.0, 2.0, 8.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00431060791015625, -0.004147708415985107, -0.003984808921813965, -0.0038219094276428223, -0.0036590099334716797, -0.003496110439300537, -0.0033332109451293945, -0.003170311450958252, -0.0030074119567871094, -0.002844512462615967, -0.0026816129684448242, -0.0025187134742736816, -0.002355813980102539, -0.0021929144859313965, -0.002030014991760254, -0.0018671154975891113, -0.0017042160034179688, -0.0015413165092468262, -0.0013784170150756836, -0.001215517520904541, -0.0010526180267333984, -0.0008897185325622559, -0.0007268190383911133, -0.0005639195442199707, -0.0004010200500488281, -0.00023812055587768555, -7.522106170654297e-05, 8.767843246459961e-05, 0.0002505779266357422, 0.00041347742080688477, 0.0005763769149780273, 0.0007392764091491699, 0.0009021759033203125, 0.001065075397491455, 0.0012279748916625977, 0.0013908743858337402, 0.0015537738800048828, 0.0017166733741760254, 0.001879572868347168, 0.0020424723625183105, 0.002205371856689453, 0.0023682713508605957, 0.0025311708450317383, 0.002694070339202881, 0.0028569698333740234, 0.003019869327545166, 0.0031827688217163086, 0.003345668315887451, 0.0035085678100585938, 0.0036714673042297363, 0.003834366798400879, 0.0039972662925720215, 0.004160165786743164, 0.004323065280914307, 0.004485964775085449, 0.004648864269256592, 0.004811763763427734, 0.004974663257598877, 0.0051375627517700195, 0.005300462245941162, 0.005463361740112305, 0.005626261234283447, 0.00578916072845459, 0.005952060222625732, 0.006114959716796875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 10.0, 3.0, 7.0, 12.0, 37.0, 190.0, 404.0, 219.0, 64.0, 25.0, 11.0, 5.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.14002105593681335, -0.1365664303302765, -0.13311180472373962, -0.12965716421604156, -0.1262025386095047, -0.12274791300296783, -0.11929328739643097, -0.1158386617898941, -0.11238402873277664, -0.10892940312623978, -0.10547477006912231, -0.10202014446258545, -0.09856551885604858, -0.09511088579893112, -0.09165626019239426, -0.0882016271352768, -0.08474700152873993, -0.08129237592220306, -0.0778377428650856, -0.07438311725854874, -0.07092848420143127, -0.06747385859489441, -0.06401923298835754, -0.06056460365653038, -0.05710997432470322, -0.05365534499287605, -0.05020071566104889, -0.046746090054512024, -0.04329146072268486, -0.0398368313908577, -0.03638220578432083, -0.03292757645249367, -0.029472939670085907, -0.026018310338258743, -0.02256368286907673, -0.019109055399894714, -0.01565442606806755, -0.012199796736240387, -0.008745169267058372, -0.005290541797876358, -0.0018359124660491943, 0.0016187159344553947, 0.005073344334959984, 0.008527972735464573, 0.011982601135969162, 0.015437230467796326, 0.01889185793697834, 0.022346485406160355, 0.02580111473798752, 0.029255744069814682, 0.032710373401641846, 0.03616499900817871, 0.039619628340005875, 0.04307425767183304, 0.046528883278369904, 0.04998351261019707, 0.05343814194202423, 0.056892771273851395, 0.06034740060567856, 0.06380202621221542, 0.06725665926933289, 0.07071128487586975, 0.07416591048240662, 0.07762053608894348, 0.08107516914606094]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 11.0, 10.0, 12.0, 11.0, 27.0, 25.0, 44.0, 45.0, 54.0, 57.0, 85.0, 69.0, 80.0, 76.0, 73.0, 57.0, 48.0, 36.0, 35.0, 28.0, 21.0, 20.0, 16.0, 5.0, 8.0, 9.0, 8.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.04657745361328125, -0.0452071912586689, -0.04383692890405655, -0.0424666702747345, -0.04109640792012215, -0.039726145565509796, -0.038355886936187744, -0.036985624581575394, -0.03561536222696304, -0.03424509987235069, -0.03287483751773834, -0.03150457888841629, -0.03013431653380394, -0.02876405417919159, -0.027393793687224388, -0.026023533195257187, -0.024653270840644836, -0.023283008486032486, -0.021912747994065285, -0.020542487502098083, -0.019172225147485733, -0.017801962792873383, -0.01643170230090618, -0.015061440877616405, -0.01369117945432663, -0.012320918031036854, -0.010950656607747078, -0.009580395184457302, -0.008210133761167526, -0.00683987233787775, -0.0054696109145879745, -0.004099349491298199, -0.002729088068008423, -0.001358826644718647, 1.1434778571128845e-05, 0.0013816962018609047, 0.0027519576251506805, 0.004122219048440456, 0.005492480471730232, 0.006862741895020008, 0.008233003318309784, 0.00960326474159956, 0.010973526164889336, 0.012343787588179111, 0.013714049011468887, 0.015084310434758663, 0.01645457185804844, 0.01782483235001564, 0.01919509470462799, 0.02056535705924034, 0.021935617551207542, 0.023305878043174744, 0.024676140397787094, 0.026046402752399445, 0.027416663244366646, 0.028786923736333847, 0.030157186090946198, 0.03152744844555855, 0.0328977108001709, 0.03426796942949295, 0.0356382317841053, 0.03700849413871765, 0.0383787527680397, 0.039749015122652054, 0.041119277477264404]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 4.0, 8.0, 0.0, 6.0, 5.0, 3.0, 4.0, 4.0, 0.0, 6.0, 14.0, 13.0, 7.0, 8.0, 16.0, 14.0, 18.0, 32.0, 64.0, 322.0, 4193249.0, 263.0, 54.0, 22.0, 17.0, 33.0, 12.0, 20.0, 16.0, 8.0, 8.0, 14.0, 2.0, 6.0, 4.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.8828125, -0.8495025634765625, -0.816192626953125, -0.7828826904296875, -0.74957275390625, -0.7162628173828125, -0.682952880859375, -0.6496429443359375, -0.6163330078125, -0.5830230712890625, -0.549713134765625, -0.5164031982421875, -0.48309326171875, -0.4497833251953125, -0.416473388671875, -0.3831634521484375, -0.349853515625, -0.3165435791015625, -0.283233642578125, -0.2499237060546875, -0.21661376953125, -0.1833038330078125, -0.149993896484375, -0.1166839599609375, -0.0833740234375, -0.0500640869140625, -0.016754150390625, 0.0165557861328125, 0.04986572265625, 0.0831756591796875, 0.116485595703125, 0.1497955322265625, 0.18310546875, 0.2164154052734375, 0.249725341796875, 0.2830352783203125, 0.31634521484375, 0.3496551513671875, 0.382965087890625, 0.4162750244140625, 0.4495849609375, 0.4828948974609375, 0.516204833984375, 0.5495147705078125, 0.58282470703125, 0.6161346435546875, 0.649444580078125, 0.6827545166015625, 0.716064453125, 0.7493743896484375, 0.782684326171875, 0.8159942626953125, 0.84930419921875, 0.8826141357421875, 0.915924072265625, 0.9492340087890625, 0.9825439453125, 1.0158538818359375, 1.049163818359375, 1.0824737548828125, 1.11578369140625, 1.1490936279296875, 1.182403564453125, 1.2157135009765625, 1.2490234375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 9.0, 1.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 8.0, 12.0, 13.0, 22.0, 25.0, 33.0, 83.0, 122.0, 171.0, 148.0, 107.0, 88.0, 43.0, 26.0, 12.0, 9.0, 7.0, 6.0, 12.0, 6.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00107574462890625, -0.0010420680046081543, -0.0010083913803100586, -0.0009747147560119629, -0.0009410381317138672, -0.0009073615074157715, -0.0008736848831176758, -0.0008400082588195801, -0.0008063316345214844, -0.0007726550102233887, -0.000738978385925293, -0.0007053017616271973, -0.0006716251373291016, -0.0006379485130310059, -0.0006042718887329102, -0.0005705952644348145, -0.0005369186401367188, -0.000503242015838623, -0.00046956539154052734, -0.00043588876724243164, -0.00040221214294433594, -0.00036853551864624023, -0.00033485889434814453, -0.00030118227005004883, -0.0002675056457519531, -0.00023382902145385742, -0.00020015239715576172, -0.00016647577285766602, -0.0001327991485595703, -9.912252426147461e-05, -6.54458999633789e-05, -3.17692756652832e-05, 1.9073486328125e-06, 3.55839729309082e-05, 6.92605972290039e-05, 0.00010293722152709961, 0.0001366138458251953, 0.00017029047012329102, 0.00020396709442138672, 0.00023764371871948242, 0.0002713203430175781, 0.00030499696731567383, 0.00033867359161376953, 0.00037235021591186523, 0.00040602684020996094, 0.00043970346450805664, 0.00047338008880615234, 0.000507056713104248, 0.0005407333374023438, 0.0005744099617004395, 0.0006080865859985352, 0.0006417632102966309, 0.0006754398345947266, 0.0007091164588928223, 0.000742793083190918, 0.0007764697074890137, 0.0008101463317871094, 0.0008438229560852051, 0.0008774995803833008, 0.0009111762046813965, 0.0009448528289794922, 0.0009785294532775879, 0.0010122060775756836, 0.0010458827018737793, 0.001079559326171875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 17.0, 39.0, 138.0, 23876.0, 4170048.0, 122.0, 24.0, 7.0, 7.0, 3.0, 1.0, 4.0], "bins": [-1.498046875, -1.4713134765625, -1.444580078125, -1.4178466796875, -1.39111328125, -1.3643798828125, -1.337646484375, -1.3109130859375, -1.2841796875, -1.2574462890625, -1.230712890625, -1.2039794921875, -1.17724609375, -1.1505126953125, -1.123779296875, -1.0970458984375, -1.0703125, -1.0435791015625, -1.016845703125, -0.9901123046875, -0.96337890625, -0.9366455078125, -0.909912109375, -0.8831787109375, -0.8564453125, -0.8297119140625, -0.802978515625, -0.7762451171875, -0.74951171875, -0.7227783203125, -0.696044921875, -0.6693115234375, -0.642578125, -0.6158447265625, -0.589111328125, -0.5623779296875, -0.53564453125, -0.5089111328125, -0.482177734375, -0.4554443359375, -0.4287109375, -0.4019775390625, -0.375244140625, -0.3485107421875, -0.32177734375, -0.2950439453125, -0.268310546875, -0.2415771484375, -0.21484375, -0.1881103515625, -0.161376953125, -0.1346435546875, -0.10791015625, -0.0811767578125, -0.054443359375, -0.0277099609375, -0.0009765625, 0.0257568359375, 0.052490234375, 0.0792236328125, 0.10595703125, 0.1326904296875, 0.159423828125, 0.1861572265625, 0.212890625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 11.0, 32.0, 108.0, 412.0, 2929.0, 461.0, 83.0, 20.0, 9.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0138397216796875, -0.013581395149230957, -0.013323068618774414, -0.013064742088317871, -0.012806415557861328, -0.012548089027404785, -0.012289762496948242, -0.0120314359664917, -0.011773109436035156, -0.011514782905578613, -0.01125645637512207, -0.010998129844665527, -0.010739803314208984, -0.010481476783752441, -0.010223150253295898, -0.009964823722839355, -0.009706497192382812, -0.00944817066192627, -0.009189844131469727, -0.008931517601013184, -0.00867319107055664, -0.008414864540100098, -0.008156538009643555, -0.007898211479187012, -0.007639884948730469, -0.007381558418273926, -0.007123231887817383, -0.00686490535736084, -0.006606578826904297, -0.006348252296447754, -0.006089925765991211, -0.005831599235534668, -0.005573272705078125, -0.005314946174621582, -0.005056619644165039, -0.004798293113708496, -0.004539966583251953, -0.00428164005279541, -0.004023313522338867, -0.0037649869918823242, -0.0035066604614257812, -0.0032483339309692383, -0.0029900074005126953, -0.0027316808700561523, -0.0024733543395996094, -0.0022150278091430664, -0.0019567012786865234, -0.0016983747482299805, -0.0014400482177734375, -0.0011817216873168945, -0.0009233951568603516, -0.0006650686264038086, -0.0004067420959472656, -0.00014841556549072266, 0.00010991096496582031, 0.0003682374954223633, 0.0006265640258789062, 0.0008848905563354492, 0.0011432170867919922, 0.0014015436172485352, 0.0016598701477050781, 0.001918196678161621, 0.002176523208618164, 0.002434849739074707, 0.00269317626953125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1002.0, 18.0, 1.0], "bins": [-3.636082410812378, -3.577230930328369, -3.5183792114257812, -3.4595277309417725, -3.4006762504577637, -3.341824531555176, -3.282973051071167, -3.224121332168579, -3.1652698516845703, -3.1064183712005615, -3.0475666522979736, -2.988715171813965, -2.929863452911377, -2.871011972427368, -2.8121604919433594, -2.7533087730407715, -2.6944572925567627, -2.635605812072754, -2.576754093170166, -2.5179026126861572, -2.4590511322021484, -2.4001994132995605, -2.3413479328155518, -2.282496213912964, -2.223644733428955, -2.1647932529449463, -2.1059415340423584, -2.0470900535583496, -1.9882384538650513, -1.929386854171753, -1.8705353736877441, -1.8116837739944458, -1.7528321743011475, -1.6939805746078491, -1.6351289749145508, -1.576277494430542, -1.5174258947372437, -1.4585742950439453, -1.3997228145599365, -1.3408712148666382, -1.2820196151733398, -1.2231680154800415, -1.1643164157867432, -1.1054649353027344, -1.046613335609436, -0.9877617359161377, -0.9289101958274841, -0.8700586557388306, -0.811207115650177, -0.7523555755615234, -0.6935039758682251, -0.6346523761749268, -0.5758008360862732, -0.5169492959976196, -0.4580976963043213, -0.39924612641334534, -0.3403945565223694, -0.28154298663139343, -0.22269141674041748, -0.16383984684944153, -0.10498827695846558, -0.046136707067489624, 0.012714862823486328, 0.07156643271446228, 0.13041800260543823]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 11.0, 25.0, 66.0, 151.0, 254.0, 238.0, 161.0, 69.0, 28.0, 9.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.28930211067199707, -0.28349003195762634, -0.2776779532432556, -0.2718658745288849, -0.26605379581451416, -0.26024168729782104, -0.2544296383857727, -0.24861754477024078, -0.24280545115470886, -0.23699337244033813, -0.2311812937259674, -0.22536921501159668, -0.21955712139606476, -0.21374504268169403, -0.2079329639673233, -0.20212088525295258, -0.19630880653858185, -0.19049672782421112, -0.1846846491098404, -0.17887255549430847, -0.17306047677993774, -0.16724839806556702, -0.1614363193511963, -0.15562424063682556, -0.14981216192245483, -0.1440000832080841, -0.13818800449371338, -0.13237592577934265, -0.12656383216381073, -0.12075175344944, -0.11493967473506927, -0.10912759602069855, -0.10331550240516663, -0.0975034236907959, -0.09169133752584457, -0.08587925881147385, -0.08006717264652252, -0.0742550939321518, -0.06844301521778107, -0.06263093650341034, -0.056818850338459015, -0.05100676789879799, -0.04519468545913696, -0.039382606744766235, -0.03357052430510521, -0.027758441865444183, -0.021946363151073456, -0.01613428071141243, -0.010322198271751404, -0.004510116763412952, 0.001301964744925499, 0.007114045321941376, 0.012926127761602402, 0.018738210201263428, 0.024550288915634155, 0.03036237135529518, 0.03617445379495621, 0.04198653623461723, 0.04779861867427826, 0.05361069738864899, 0.05942277982831001, 0.06523486226797104, 0.07104694098234177, 0.07685902714729309, 0.08267110586166382]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 9.0, 6.0, 14.0, 18.0, 14.0, 21.0, 26.0, 39.0, 43.0, 39.0, 36.0, 59.0, 44.0, 73.0, 3148.0, 1043755.0, 780.0, 58.0, 55.0, 43.0, 49.0, 44.0, 30.0, 35.0, 16.0, 15.0, 17.0, 14.0, 9.0, 10.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.274658203125, -0.26618194580078125, -0.2577056884765625, -0.24922943115234375, -0.240753173828125, -0.23227691650390625, -0.2238006591796875, -0.21532440185546875, -0.20684814453125, -0.19837188720703125, -0.1898956298828125, -0.18141937255859375, -0.172943115234375, -0.16446685791015625, -0.1559906005859375, -0.14751434326171875, -0.1390380859375, -0.13056182861328125, -0.1220855712890625, -0.11360931396484375, -0.105133056640625, -0.09665679931640625, -0.0881805419921875, -0.07970428466796875, -0.07122802734375, -0.06275177001953125, -0.0542755126953125, -0.04579925537109375, -0.037322998046875, -0.02884674072265625, -0.0203704833984375, -0.01189422607421875, -0.00341796875, 0.00505828857421875, 0.0135345458984375, 0.02201080322265625, 0.030487060546875, 0.03896331787109375, 0.0474395751953125, 0.05591583251953125, 0.06439208984375, 0.07286834716796875, 0.0813446044921875, 0.08982086181640625, 0.098297119140625, 0.10677337646484375, 0.1152496337890625, 0.12372589111328125, 0.1322021484375, 0.14067840576171875, 0.1491546630859375, 0.15763092041015625, 0.166107177734375, 0.17458343505859375, 0.1830596923828125, 0.19153594970703125, 0.20001220703125, 0.20848846435546875, 0.2169647216796875, 0.22544097900390625, 0.233917236328125, 0.24239349365234375, 0.2508697509765625, 0.25934600830078125, 0.267822265625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 118.0, 565.0, 306.0, 24.0, 3.0], "bins": [-0.07366943359375, -0.07245504856109619, -0.07124066352844238, -0.07002627849578857, -0.06881189346313477, -0.06759750843048096, -0.06638312339782715, -0.06516873836517334, -0.06395435333251953, -0.06273996829986572, -0.061525583267211914, -0.060311198234558105, -0.0590968132019043, -0.05788242816925049, -0.05666804313659668, -0.05545365810394287, -0.05423927307128906, -0.053024888038635254, -0.051810503005981445, -0.05059611797332764, -0.04938173294067383, -0.04816734790802002, -0.04695296287536621, -0.0457385778427124, -0.044524192810058594, -0.043309807777404785, -0.04209542274475098, -0.04088103771209717, -0.03966665267944336, -0.03845226764678955, -0.03723788261413574, -0.036023497581481934, -0.034809112548828125, -0.033594727516174316, -0.03238034248352051, -0.0311659574508667, -0.02995157241821289, -0.028737187385559082, -0.027522802352905273, -0.026308417320251465, -0.025094032287597656, -0.023879647254943848, -0.02266526222229004, -0.02145087718963623, -0.020236492156982422, -0.019022107124328613, -0.017807722091674805, -0.016593337059020996, -0.015378952026367188, -0.014164566993713379, -0.01295018196105957, -0.011735796928405762, -0.010521411895751953, -0.009307026863098145, -0.008092641830444336, -0.006878256797790527, -0.005663871765136719, -0.00444948673248291, -0.0032351016998291016, -0.002020716667175293, -0.0008063316345214844, 0.0004080533981323242, 0.0016224384307861328, 0.0028368234634399414, 0.00405120849609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 1.0, 6.0, 2.0, 8.0, 10.0, 13.0, 14.0, 17.0, 27.0, 35.0, 39.0, 45.0, 79.0, 110.0, 176.0, 269.0, 861.0, 4597.0, 67812.0, 922823.0, 46351.0, 3672.0, 750.0, 283.0, 163.0, 111.0, 76.0, 47.0, 36.0, 23.0, 30.0, 16.0, 12.0, 9.0, 8.0, 7.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11181640625, -0.10801887512207031, -0.10422134399414062, -0.10042381286621094, -0.09662628173828125, -0.09282875061035156, -0.08903121948242188, -0.08523368835449219, -0.0814361572265625, -0.07763862609863281, -0.07384109497070312, -0.07004356384277344, -0.06624603271484375, -0.06244850158691406, -0.058650970458984375, -0.05485343933105469, -0.051055908203125, -0.04725837707519531, -0.043460845947265625, -0.03966331481933594, -0.03586578369140625, -0.03206825256347656, -0.028270721435546875, -0.024473190307617188, -0.0206756591796875, -0.016878128051757812, -0.013080596923828125, -0.009283065795898438, -0.00548553466796875, -0.0016880035400390625, 0.002109527587890625, 0.0059070587158203125, 0.00970458984375, 0.013502120971679688, 0.017299652099609375, 0.021097183227539062, 0.02489471435546875, 0.028692245483398438, 0.032489776611328125, 0.03628730773925781, 0.0400848388671875, 0.04388236999511719, 0.047679901123046875, 0.05147743225097656, 0.05527496337890625, 0.05907249450683594, 0.06287002563476562, 0.06666755676269531, 0.070465087890625, 0.07426261901855469, 0.07806015014648438, 0.08185768127441406, 0.08565521240234375, 0.08945274353027344, 0.09325027465820312, 0.09704780578613281, 0.1008453369140625, 0.10464286804199219, 0.10844039916992188, 0.11223793029785156, 0.11603546142578125, 0.11983299255371094, 0.12363052368164062, 0.1274280548095703, 0.1312255859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 2.0, 3.0, 7.0, 13.0, 21.0, 14.0, 17.0, 23.0, 24.0, 40.0, 40.0, 54.0, 54.0, 60.0, 73.0, 59.0, 59.0, 65.0, 73.0, 46.0, 41.0, 49.0, 39.0, 29.0, 19.0, 18.0, 12.0, 12.0, 8.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0494384765625, -0.04771757125854492, -0.045996665954589844, -0.044275760650634766, -0.04255485534667969, -0.04083395004272461, -0.03911304473876953, -0.03739213943481445, -0.035671234130859375, -0.0339503288269043, -0.03222942352294922, -0.03050851821899414, -0.028787612915039062, -0.027066707611083984, -0.025345802307128906, -0.023624897003173828, -0.02190399169921875, -0.020183086395263672, -0.018462181091308594, -0.016741275787353516, -0.015020370483398438, -0.01329946517944336, -0.011578559875488281, -0.009857654571533203, -0.008136749267578125, -0.006415843963623047, -0.004694938659667969, -0.0029740333557128906, -0.0012531280517578125, 0.0004677772521972656, 0.0021886825561523438, 0.003909587860107422, 0.0056304931640625, 0.007351398468017578, 0.009072303771972656, 0.010793209075927734, 0.012514114379882812, 0.01423501968383789, 0.01595592498779297, 0.017676830291748047, 0.019397735595703125, 0.021118640899658203, 0.02283954620361328, 0.02456045150756836, 0.026281356811523438, 0.028002262115478516, 0.029723167419433594, 0.03144407272338867, 0.03316497802734375, 0.03488588333129883, 0.036606788635253906, 0.038327693939208984, 0.04004859924316406, 0.04176950454711914, 0.04349040985107422, 0.0452113151550293, 0.046932220458984375, 0.04865312576293945, 0.05037403106689453, 0.05209493637084961, 0.05381584167480469, 0.055536746978759766, 0.057257652282714844, 0.05897855758666992, 0.060699462890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 7.0, 9.0, 9.0, 6.0, 4.0, 12.0, 10.0, 18.0, 22.0, 24.0, 34.0, 43.0, 97.0, 181.0, 523.0, 2548.0, 27013.0, 1006834.0, 9064.0, 1322.0, 361.0, 147.0, 72.0, 32.0, 33.0, 23.0, 20.0, 19.0, 5.0, 8.0, 12.0, 4.0, 7.0, 6.0, 8.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.41650390625, -0.4040031433105469, -0.39150238037109375, -0.3790016174316406, -0.3665008544921875, -0.3540000915527344, -0.34149932861328125, -0.3289985656738281, -0.316497802734375, -0.3039970397949219, -0.29149627685546875, -0.2789955139160156, -0.2664947509765625, -0.2539939880371094, -0.24149322509765625, -0.22899246215820312, -0.21649169921875, -0.20399093627929688, -0.19149017333984375, -0.17898941040039062, -0.1664886474609375, -0.15398788452148438, -0.14148712158203125, -0.12898635864257812, -0.116485595703125, -0.10398483276367188, -0.09148406982421875, -0.07898330688476562, -0.0664825439453125, -0.053981781005859375, -0.04148101806640625, -0.028980255126953125, -0.0164794921875, -0.003978729248046875, 0.00852203369140625, 0.021022796630859375, 0.0335235595703125, 0.046024322509765625, 0.05852508544921875, 0.07102584838867188, 0.083526611328125, 0.09602737426757812, 0.10852813720703125, 0.12102890014648438, 0.1335296630859375, 0.14603042602539062, 0.15853118896484375, 0.17103195190429688, 0.18353271484375, 0.19603347778320312, 0.20853424072265625, 0.22103500366210938, 0.2335357666015625, 0.24603652954101562, 0.25853729248046875, 0.2710380554199219, 0.283538818359375, 0.2960395812988281, 0.30854034423828125, 0.3210411071777344, 0.3335418701171875, 0.3460426330566406, 0.35854339599609375, 0.3710441589355469, 0.383544921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 13.0, 14.0, 10.0, 8.0, 11.0, 10.0, 21.0, 19.0, 31.0, 51.0, 63.0, 74.0, 111.0, 165.0, 92.0, 78.0, 55.0, 41.0, 20.0, 27.0, 18.0, 9.0, 12.0, 5.0, 8.0, 5.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003249645233154297, -0.00031453371047973633, -0.00030410289764404297, -0.0002936720848083496, -0.00028324127197265625, -0.0002728104591369629, -0.00026237964630126953, -0.00025194883346557617, -0.0002415180206298828, -0.00023108720779418945, -0.0002206563949584961, -0.00021022558212280273, -0.00019979476928710938, -0.00018936395645141602, -0.00017893314361572266, -0.0001685023307800293, -0.00015807151794433594, -0.00014764070510864258, -0.00013720989227294922, -0.00012677907943725586, -0.0001163482666015625, -0.00010591745376586914, -9.548664093017578e-05, -8.505582809448242e-05, -7.462501525878906e-05, -6.41942024230957e-05, -5.3763389587402344e-05, -4.3332576751708984e-05, -3.2901763916015625e-05, -2.2470951080322266e-05, -1.2040138244628906e-05, -1.6093254089355469e-06, 8.821487426757812e-06, 1.9252300262451172e-05, 2.968311309814453e-05, 4.011392593383789e-05, 5.054473876953125e-05, 6.097555160522461e-05, 7.140636444091797e-05, 8.183717727661133e-05, 9.226799011230469e-05, 0.00010269880294799805, 0.0001131296157836914, 0.00012356042861938477, 0.00013399124145507812, 0.00014442205429077148, 0.00015485286712646484, 0.0001652836799621582, 0.00017571449279785156, 0.00018614530563354492, 0.00019657611846923828, 0.00020700693130493164, 0.000217437744140625, 0.00022786855697631836, 0.00023829936981201172, 0.0002487301826477051, 0.00025916099548339844, 0.0002695918083190918, 0.00028002262115478516, 0.0002904534339904785, 0.0003008842468261719, 0.00031131505966186523, 0.0003217458724975586, 0.00033217668533325195, 0.0003426074981689453]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 3.0, 5.0, 2.0, 6.0, 8.0, 10.0, 12.0, 31.0, 78.0, 282.0, 1410.0, 10726.0, 981798.0, 49198.0, 3969.0, 687.0, 185.0, 52.0, 20.0, 19.0, 14.0, 4.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47314453125, -0.4586982727050781, -0.44425201416015625, -0.4298057556152344, -0.4153594970703125, -0.4009132385253906, -0.38646697998046875, -0.3720207214355469, -0.357574462890625, -0.3431282043457031, -0.32868194580078125, -0.3142356872558594, -0.2997894287109375, -0.2853431701660156, -0.27089691162109375, -0.2564506530761719, -0.24200439453125, -0.22755813598632812, -0.21311187744140625, -0.19866561889648438, -0.1842193603515625, -0.16977310180664062, -0.15532684326171875, -0.14088058471679688, -0.126434326171875, -0.11198806762695312, -0.09754180908203125, -0.08309555053710938, -0.0686492919921875, -0.054203033447265625, -0.03975677490234375, -0.025310516357421875, -0.0108642578125, 0.003582000732421875, 0.01802825927734375, 0.032474517822265625, 0.0469207763671875, 0.061367034912109375, 0.07581329345703125, 0.09025955200195312, 0.104705810546875, 0.11915206909179688, 0.13359832763671875, 0.14804458618164062, 0.1624908447265625, 0.17693710327148438, 0.19138336181640625, 0.20582962036132812, 0.22027587890625, 0.23472213745117188, 0.24916839599609375, 0.2636146545410156, 0.2780609130859375, 0.2925071716308594, 0.30695343017578125, 0.3213996887207031, 0.335845947265625, 0.3502922058105469, 0.36473846435546875, 0.3791847229003906, 0.3936309814453125, 0.4080772399902344, 0.42252349853515625, 0.4369697570800781, 0.451416015625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 8.0, 7.0, 13.0, 16.0, 32.0, 39.0, 124.0, 455.0, 142.0, 45.0, 28.0, 18.0, 14.0, 2.0, 9.0, 7.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1689453125, -0.1637554168701172, -0.15856552124023438, -0.15337562561035156, -0.14818572998046875, -0.14299583435058594, -0.13780593872070312, -0.1326160430908203, -0.1274261474609375, -0.12223625183105469, -0.11704635620117188, -0.11185646057128906, -0.10666656494140625, -0.10147666931152344, -0.09628677368164062, -0.09109687805175781, -0.085906982421875, -0.08071708679199219, -0.07552719116210938, -0.07033729553222656, -0.06514739990234375, -0.05995750427246094, -0.054767608642578125, -0.04957771301269531, -0.0443878173828125, -0.03919792175292969, -0.034008026123046875, -0.028818130493164062, -0.02362823486328125, -0.018438339233398438, -0.013248443603515625, -0.008058547973632812, -0.00286865234375, 0.0023212432861328125, 0.007511138916015625, 0.012701034545898438, 0.01789093017578125, 0.023080825805664062, 0.028270721435546875, 0.03346061706542969, 0.0386505126953125, 0.04384040832519531, 0.049030303955078125, 0.05422019958496094, 0.05941009521484375, 0.06459999084472656, 0.06978988647460938, 0.07497978210449219, 0.080169677734375, 0.08535957336425781, 0.09054946899414062, 0.09573936462402344, 0.10092926025390625, 0.10611915588378906, 0.11130905151367188, 0.11649894714355469, 0.1216888427734375, 0.1268787384033203, 0.13206863403320312, 0.13725852966308594, 0.14244842529296875, 0.14763832092285156, 0.15282821655273438, 0.1580181121826172, 0.1632080078125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 984.0, 28.0, 4.0, 1.0], "bins": [-35.275917053222656, -34.69390106201172, -34.11188888549805, -33.52987289428711, -32.94785690307617, -32.3658447265625, -31.783828735351562, -31.201814651489258, -30.619800567626953, -30.03778648376465, -29.45577049255371, -28.873756408691406, -28.2917423248291, -27.709728240966797, -27.12771224975586, -26.545698165893555, -25.96368408203125, -25.381669998168945, -24.799654006958008, -24.217639923095703, -23.6356258392334, -23.053611755371094, -22.471595764160156, -21.88958168029785, -21.307565689086914, -20.72555160522461, -20.143535614013672, -19.561521530151367, -18.979507446289062, -18.397493362426758, -17.81547737121582, -17.233463287353516, -16.65144920349121, -16.069435119628906, -15.487420082092285, -14.905405044555664, -14.32339096069336, -13.741375923156738, -13.159360885620117, -12.577346801757812, -11.995332717895508, -11.413317680358887, -10.831303596496582, -10.249288558959961, -9.667274475097656, -9.085259437561035, -8.503244400024414, -7.921230316162109, -7.339215278625488, -6.757200717926025, -6.1751861572265625, -5.593171119689941, -5.011157035827637, -4.429141998291016, -3.8471274375915527, -3.26511287689209, -2.683098316192627, -2.101083755493164, -1.5190690755844116, -0.9370543956756592, -0.3550398349761963, 0.2269747257232666, 0.8089895248413086, 1.3910040855407715, 1.9730185270309448]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 25.0, 50.0, 115.0, 184.0, 179.0, 199.0, 131.0, 77.0, 33.0, 12.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.587221622467041, -2.5386786460876465, -2.490135431289673, -2.4415924549102783, -2.3930492401123047, -2.34450626373291, -2.2959632873535156, -2.247420072555542, -2.1988770961761475, -2.150334119796753, -2.1017909049987793, -2.0532479286193848, -2.004704713821411, -1.9561617374420166, -1.9076186418533325, -1.8590755462646484, -1.8105324506759644, -1.7619893550872803, -1.7134462594985962, -1.664903163909912, -1.6163601875305176, -1.5678170919418335, -1.5192739963531494, -1.4707309007644653, -1.4221878051757812, -1.3736447095870972, -1.325101613998413, -1.2765586376190186, -1.2280155420303345, -1.1794724464416504, -1.1309293508529663, -1.0823862552642822, -1.0338433980941772, -0.9853003025054932, -0.9367572665214539, -0.8882141709327698, -0.8396711349487305, -0.7911280393600464, -0.7425849437713623, -0.6940418481826782, -0.6454988121986389, -0.5969557166099548, -0.5484126806259155, -0.49986958503723145, -0.45132651925086975, -0.40278345346450806, -0.354240357875824, -0.3056972920894623, -0.2571542263031006, -0.2086111605167389, -0.160068079829216, -0.11152499914169312, -0.06298193335533142, -0.014438867568969727, 0.034104228019714355, 0.08264729380607605, 0.13119035959243774, 0.17973342537879944, 0.22827650606632233, 0.2768195867538452, 0.3253626525402069, 0.3739057183265686, 0.4224488139152527, 0.4709918797016144, 0.5195349454879761]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 9.0, 18.0, 38.0, 75.0, 150.0, 498.0, 42257.0, 4150998.0, 205.0, 41.0, 6.0, 1.0], "bins": [-3.6875, -3.625072479248047, -3.5626449584960938, -3.5002174377441406, -3.4377899169921875, -3.3753623962402344, -3.3129348754882812, -3.250507354736328, -3.188079833984375, -3.125652313232422, -3.0632247924804688, -3.0007972717285156, -2.9383697509765625, -2.8759422302246094, -2.8135147094726562, -2.751087188720703, -2.68865966796875, -2.626232147216797, -2.5638046264648438, -2.5013771057128906, -2.4389495849609375, -2.3765220642089844, -2.3140945434570312, -2.251667022705078, -2.189239501953125, -2.126811981201172, -2.0643844604492188, -2.0019569396972656, -1.9395294189453125, -1.8771018981933594, -1.8146743774414062, -1.7522468566894531, -1.6898193359375, -1.6273918151855469, -1.5649642944335938, -1.5025367736816406, -1.4401092529296875, -1.3776817321777344, -1.3152542114257812, -1.2528266906738281, -1.190399169921875, -1.1279716491699219, -1.0655441284179688, -1.0031166076660156, -0.9406890869140625, -0.8782615661621094, -0.8158340454101562, -0.7534065246582031, -0.69097900390625, -0.6285514831542969, -0.5661239624023438, -0.5036964416503906, -0.4412689208984375, -0.3788414001464844, -0.31641387939453125, -0.2539863586425781, -0.191558837890625, -0.12913131713867188, -0.06670379638671875, -0.004276275634765625, 0.0581512451171875, 0.12057876586914062, 0.18300628662109375, 0.24543380737304688, 0.307861328125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 58.0, 247.0, 377.0, 234.0, 76.0, 14.0, 3.0, 1.0], "bins": [-0.0992431640625, -0.09754598140716553, -0.09584879875183105, -0.09415161609649658, -0.09245443344116211, -0.09075725078582764, -0.08906006813049316, -0.08736288547515869, -0.08566570281982422, -0.08396852016448975, -0.08227133750915527, -0.0805741548538208, -0.07887697219848633, -0.07717978954315186, -0.07548260688781738, -0.07378542423248291, -0.07208824157714844, -0.07039105892181396, -0.06869387626647949, -0.06699669361114502, -0.06529951095581055, -0.06360232830047607, -0.0619051456451416, -0.06020796298980713, -0.058510780334472656, -0.056813597679138184, -0.05511641502380371, -0.05341923236846924, -0.051722049713134766, -0.05002486705780029, -0.04832768440246582, -0.04663050174713135, -0.044933319091796875, -0.0432361364364624, -0.04153895378112793, -0.03984177112579346, -0.038144588470458984, -0.03644740581512451, -0.03475022315979004, -0.033053040504455566, -0.031355857849121094, -0.02965867519378662, -0.02796149253845215, -0.026264309883117676, -0.024567127227783203, -0.02286994457244873, -0.021172761917114258, -0.019475579261779785, -0.017778396606445312, -0.01608121395111084, -0.014384031295776367, -0.012686848640441895, -0.010989665985107422, -0.00929248332977295, -0.0075953006744384766, -0.005898118019104004, -0.004200935363769531, -0.0025037527084350586, -0.0008065700531005859, 0.0008906126022338867, 0.0025877952575683594, 0.004284977912902832, 0.005982160568237305, 0.007679343223571777, 0.00937652587890625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 18.0, 38.0, 79.0, 202.0, 237.0, 382.0, 4186524.0, 6212.0, 304.0, 154.0, 85.0, 37.0, 5.0, 1.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.015625, -4.91497802734375, -4.8143310546875, -4.71368408203125, -4.613037109375, -4.51239013671875, -4.4117431640625, -4.31109619140625, -4.21044921875, -4.10980224609375, -4.0091552734375, -3.90850830078125, -3.807861328125, -3.70721435546875, -3.6065673828125, -3.50592041015625, -3.4052734375, -3.30462646484375, -3.2039794921875, -3.10333251953125, -3.002685546875, -2.90203857421875, -2.8013916015625, -2.70074462890625, -2.60009765625, -2.49945068359375, -2.3988037109375, -2.29815673828125, -2.197509765625, -2.09686279296875, -1.9962158203125, -1.89556884765625, -1.794921875, -1.69427490234375, -1.5936279296875, -1.49298095703125, -1.392333984375, -1.29168701171875, -1.1910400390625, -1.09039306640625, -0.98974609375, -0.88909912109375, -0.7884521484375, -0.68780517578125, -0.587158203125, -0.48651123046875, -0.3858642578125, -0.28521728515625, -0.1845703125, -0.08392333984375, 0.0167236328125, 0.11737060546875, 0.218017578125, 0.31866455078125, 0.4193115234375, 0.51995849609375, 0.62060546875, 0.72125244140625, 0.8218994140625, 0.92254638671875, 1.023193359375, 1.12384033203125, 1.2244873046875, 1.32513427734375, 1.42578125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 112.0, 3858.0, 88.0, 14.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47607421875, -0.46661949157714844, -0.4571647644042969, -0.4477100372314453, -0.43825531005859375, -0.4288005828857422, -0.4193458557128906, -0.40989112854003906, -0.4004364013671875, -0.39098167419433594, -0.3815269470214844, -0.3720722198486328, -0.36261749267578125, -0.3531627655029297, -0.3437080383300781, -0.33425331115722656, -0.324798583984375, -0.31534385681152344, -0.3058891296386719, -0.2964344024658203, -0.28697967529296875, -0.2775249481201172, -0.2680702209472656, -0.25861549377441406, -0.2491607666015625, -0.23970603942871094, -0.23025131225585938, -0.2207965850830078, -0.21134185791015625, -0.2018871307373047, -0.19243240356445312, -0.18297767639160156, -0.17352294921875, -0.16406822204589844, -0.15461349487304688, -0.1451587677001953, -0.13570404052734375, -0.1262493133544922, -0.11679458618164062, -0.10733985900878906, -0.0978851318359375, -0.08843040466308594, -0.07897567749023438, -0.06952095031738281, -0.06006622314453125, -0.05061149597167969, -0.041156768798828125, -0.03170204162597656, -0.022247314453125, -0.012792587280273438, -0.003337860107421875, 0.0061168670654296875, 0.01557159423828125, 0.025026321411132812, 0.034481048583984375, 0.04393577575683594, 0.0533905029296875, 0.06284523010253906, 0.07229995727539062, 0.08175468444824219, 0.09120941162109375, 0.10066413879394531, 0.11011886596679688, 0.11957359313964844, 0.1290283203125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 15.0, 38.0, 736.0, 185.0, 27.0, 8.0, 3.0, 2.0], "bins": [-5.6812028884887695, -5.584517002105713, -5.487830638885498, -5.391144752502441, -5.294458389282227, -5.19777250289917, -5.101086139678955, -5.004400253295898, -4.907713890075684, -4.811028003692627, -4.714341640472412, -4.6176557540893555, -4.520969390869141, -4.424283504486084, -4.327597141265869, -4.2309112548828125, -4.134225368499756, -4.037539482116699, -3.9408531188964844, -3.8441669940948486, -3.747480869293213, -3.6507949829101562, -3.5541088581085205, -3.4574227333068848, -3.360736608505249, -3.2640504837036133, -3.1673643589019775, -3.070678234100342, -2.973992347717285, -2.8773062229156494, -2.7806200981140137, -2.683933973312378, -2.587247848510742, -2.4905617237091064, -2.3938755989074707, -2.297189474105835, -2.200503349304199, -2.1038174629211426, -2.007131338119507, -1.910445213317871, -1.8137590885162354, -1.7170729637145996, -1.6203868389129639, -1.5237008333206177, -1.427014708518982, -1.3303285837173462, -1.233642578125, -1.1369564533233643, -1.0402703285217285, -0.9435842037200928, -0.8468981385231018, -0.7502120733261108, -0.6535259485244751, -0.5568398237228394, -0.4601537585258484, -0.3634676933288574, -0.2667815685272217, -0.17009547352790833, -0.07340937852859497, 0.023276716470718384, 0.11996281147003174, 0.2166489064693451, 0.31333500146865845, 0.4100210666656494, 0.5067071914672852]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 9.0, 21.0, 38.0, 58.0, 122.0, 144.0, 158.0, 164.0, 108.0, 82.0, 57.0, 19.0, 11.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.633592128753662, -1.581588864326477, -1.5295854806900024, -1.4775822162628174, -1.4255788326263428, -1.3735755681991577, -1.3215723037719727, -1.269568920135498, -1.217565655708313, -1.165562391281128, -1.1135590076446533, -1.0615557432174683, -1.0095523595809937, -0.9575490951538086, -0.9055457711219788, -0.8535424470901489, -0.8015391230583191, -0.7495357990264893, -0.6975324749946594, -0.6455291509628296, -0.5935258865356445, -0.5415225625038147, -0.48951923847198486, -0.4375159442424774, -0.3855126202106476, -0.33350929617881775, -0.2815060019493103, -0.22950267791748047, -0.17749936878681183, -0.1254960596561432, -0.07349273562431335, -0.021489441394805908, 0.030513882637023926, 0.08251719176769257, 0.1345205008983612, 0.18652382493019104, 0.23852713406085968, 0.2905304431915283, 0.34253376722335815, 0.3945370614528656, 0.44654038548469543, 0.49854370951652527, 0.5505470037460327, 0.6025503277778625, 0.6545536518096924, 0.7065569162368774, 0.758560299873352, 0.8105635643005371, 0.8625668883323669, 0.9145702123641968, 0.9665735363960266, 1.0185768604278564, 1.0705801248550415, 1.1225833892822266, 1.1745867729187012, 1.2265900373458862, 1.2785934209823608, 1.330596685409546, 1.3826000690460205, 1.4346033334732056, 1.4866067171096802, 1.5386099815368652, 1.5906133651733398, 1.642616629600525, 1.69461989402771]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 9.0, 14.0, 15.0, 28.0, 27.0, 49.0, 85.0, 202.0, 603.0, 2058.0, 23305.0, 974635.0, 43625.0, 2660.0, 740.0, 248.0, 83.0, 52.0, 39.0, 30.0, 16.0, 9.0, 10.0, 9.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8212890625, -0.7975387573242188, -0.7737884521484375, -0.7500381469726562, -0.726287841796875, -0.7025375366210938, -0.6787872314453125, -0.6550369262695312, -0.63128662109375, -0.6075363159179688, -0.5837860107421875, -0.5600357055664062, -0.536285400390625, -0.5125350952148438, -0.4887847900390625, -0.46503448486328125, -0.4412841796875, -0.41753387451171875, -0.3937835693359375, -0.37003326416015625, -0.346282958984375, -0.32253265380859375, -0.2987823486328125, -0.27503204345703125, -0.25128173828125, -0.22753143310546875, -0.2037811279296875, -0.18003082275390625, -0.156280517578125, -0.13253021240234375, -0.1087799072265625, -0.08502960205078125, -0.061279296875, -0.03752899169921875, -0.0137786865234375, 0.00997161865234375, 0.033721923828125, 0.05747222900390625, 0.0812225341796875, 0.10497283935546875, 0.12872314453125, 0.15247344970703125, 0.1762237548828125, 0.19997406005859375, 0.223724365234375, 0.24747467041015625, 0.2712249755859375, 0.29497528076171875, 0.3187255859375, 0.34247589111328125, 0.3662261962890625, 0.38997650146484375, 0.413726806640625, 0.43747711181640625, 0.4612274169921875, 0.48497772216796875, 0.50872802734375, 0.5324783325195312, 0.5562286376953125, 0.5799789428710938, 0.603729248046875, 0.6274795532226562, 0.6512298583984375, 0.6749801635742188, 0.69873046875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 6.0, 25.0, 41.0, 75.0, 139.0, 174.0, 188.0, 151.0, 87.0, 71.0, 27.0, 14.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.142578125, -0.1394186019897461, -0.1362590789794922, -0.13309955596923828, -0.12994003295898438, -0.12678050994873047, -0.12362098693847656, -0.12046146392822266, -0.11730194091796875, -0.11414241790771484, -0.11098289489746094, -0.10782337188720703, -0.10466384887695312, -0.10150432586669922, -0.09834480285644531, -0.0951852798461914, -0.0920257568359375, -0.0888662338256836, -0.08570671081542969, -0.08254718780517578, -0.07938766479492188, -0.07622814178466797, -0.07306861877441406, -0.06990909576416016, -0.06674957275390625, -0.06359004974365234, -0.06043052673339844, -0.05727100372314453, -0.054111480712890625, -0.05095195770263672, -0.04779243469238281, -0.044632911682128906, -0.041473388671875, -0.038313865661621094, -0.03515434265136719, -0.03199481964111328, -0.028835296630859375, -0.02567577362060547, -0.022516250610351562, -0.019356727600097656, -0.01619720458984375, -0.013037681579589844, -0.009878158569335938, -0.006718635559082031, -0.003559112548828125, -0.00039958953857421875, 0.0027599334716796875, 0.005919456481933594, 0.0090789794921875, 0.012238502502441406, 0.015398025512695312, 0.01855754852294922, 0.021717071533203125, 0.02487659454345703, 0.028036117553710938, 0.031195640563964844, 0.03435516357421875, 0.037514686584472656, 0.04067420959472656, 0.04383373260498047, 0.046993255615234375, 0.05015277862548828, 0.05331230163574219, 0.056471824645996094, 0.05963134765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 2.0, 5.0, 7.0, 7.0, 19.0, 15.0, 22.0, 34.0, 35.0, 46.0, 87.0, 180.0, 420.0, 2552.0, 62169.0, 961949.0, 19033.0, 1308.0, 283.0, 109.0, 67.0, 50.0, 39.0, 17.0, 25.0, 18.0, 8.0, 13.0, 8.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44482421875, -0.4306373596191406, -0.41645050048828125, -0.4022636413574219, -0.3880767822265625, -0.3738899230957031, -0.35970306396484375, -0.3455162048339844, -0.331329345703125, -0.3171424865722656, -0.30295562744140625, -0.2887687683105469, -0.2745819091796875, -0.2603950500488281, -0.24620819091796875, -0.23202133178710938, -0.21783447265625, -0.20364761352539062, -0.18946075439453125, -0.17527389526367188, -0.1610870361328125, -0.14690017700195312, -0.13271331787109375, -0.11852645874023438, -0.104339599609375, -0.09015274047851562, -0.07596588134765625, -0.061779022216796875, -0.0475921630859375, -0.033405303955078125, -0.01921844482421875, -0.005031585693359375, 0.0091552734375, 0.023342132568359375, 0.03752899169921875, 0.051715850830078125, 0.0659027099609375, 0.08008956909179688, 0.09427642822265625, 0.10846328735351562, 0.122650146484375, 0.13683700561523438, 0.15102386474609375, 0.16521072387695312, 0.1793975830078125, 0.19358444213867188, 0.20777130126953125, 0.22195816040039062, 0.23614501953125, 0.2503318786621094, 0.26451873779296875, 0.2787055969238281, 0.2928924560546875, 0.3070793151855469, 0.32126617431640625, 0.3354530334472656, 0.349639892578125, 0.3638267517089844, 0.37801361083984375, 0.3922004699707031, 0.4063873291015625, 0.4205741882324219, 0.43476104736328125, 0.4489479064941406, 0.463134765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 5.0, 4.0, 10.0, 12.0, 15.0, 26.0, 24.0, 36.0, 26.0, 39.0, 48.0, 61.0, 58.0, 63.0, 56.0, 69.0, 67.0, 49.0, 58.0, 41.0, 40.0, 34.0, 31.0, 25.0, 29.0, 11.0, 11.0, 13.0, 11.0, 3.0, 5.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1689453125, -0.1636638641357422, -0.15838241577148438, -0.15310096740722656, -0.14781951904296875, -0.14253807067871094, -0.13725662231445312, -0.1319751739501953, -0.1266937255859375, -0.12141227722167969, -0.11613082885742188, -0.11084938049316406, -0.10556793212890625, -0.10028648376464844, -0.09500503540039062, -0.08972358703613281, -0.084442138671875, -0.07916069030761719, -0.07387924194335938, -0.06859779357910156, -0.06331634521484375, -0.05803489685058594, -0.052753448486328125, -0.04747200012207031, -0.0421905517578125, -0.03690910339355469, -0.031627655029296875, -0.026346206665039062, -0.02106475830078125, -0.015783309936523438, -0.010501861572265625, -0.0052204132080078125, 6.103515625e-05, 0.0053424835205078125, 0.010623931884765625, 0.015905380249023438, 0.02118682861328125, 0.026468276977539062, 0.031749725341796875, 0.03703117370605469, 0.0423126220703125, 0.04759407043457031, 0.052875518798828125, 0.05815696716308594, 0.06343841552734375, 0.06871986389160156, 0.07400131225585938, 0.07928276062011719, 0.084564208984375, 0.08984565734863281, 0.09512710571289062, 0.10040855407714844, 0.10569000244140625, 0.11097145080566406, 0.11625289916992188, 0.12153434753417969, 0.1268157958984375, 0.1320972442626953, 0.13737869262695312, 0.14266014099121094, 0.14794158935546875, 0.15322303771972656, 0.15850448608398438, 0.1637859344482422, 0.1690673828125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 12.0, 18.0, 34.0, 46.0, 121.0, 237.0, 489.0, 1250.0, 5862.0, 152218.0, 873167.0, 11871.0, 1927.0, 638.0, 296.0, 140.0, 86.0, 41.0, 22.0, 16.0, 15.0, 9.0, 8.0, 6.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24560546875, -0.23917007446289062, -0.23273468017578125, -0.22629928588867188, -0.2198638916015625, -0.21342849731445312, -0.20699310302734375, -0.20055770874023438, -0.194122314453125, -0.18768692016601562, -0.18125152587890625, -0.17481613159179688, -0.1683807373046875, -0.16194534301757812, -0.15550994873046875, -0.14907455444335938, -0.14263916015625, -0.13620376586914062, -0.12976837158203125, -0.12333297729492188, -0.1168975830078125, -0.11046218872070312, -0.10402679443359375, -0.09759140014648438, -0.091156005859375, -0.08472061157226562, -0.07828521728515625, -0.07184982299804688, -0.0654144287109375, -0.058979034423828125, -0.05254364013671875, -0.046108245849609375, -0.0396728515625, -0.033237457275390625, -0.02680206298828125, -0.020366668701171875, -0.0139312744140625, -0.007495880126953125, -0.00106048583984375, 0.005374908447265625, 0.011810302734375, 0.018245697021484375, 0.02468109130859375, 0.031116485595703125, 0.0375518798828125, 0.043987274169921875, 0.05042266845703125, 0.056858062744140625, 0.06329345703125, 0.06972885131835938, 0.07616424560546875, 0.08259963989257812, 0.0890350341796875, 0.09547042846679688, 0.10190582275390625, 0.10834121704101562, 0.114776611328125, 0.12121200561523438, 0.12764739990234375, 0.13408279418945312, 0.1405181884765625, 0.14695358276367188, 0.15338897705078125, 0.15982437133789062, 0.166259765625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 8.0, 1.0, 3.0, 6.0, 8.0, 8.0, 17.0, 14.0, 12.0, 16.0, 29.0, 34.0, 60.0, 66.0, 95.0, 132.0, 113.0, 73.0, 71.0, 41.0, 39.0, 28.0, 32.0, 16.0, 13.0, 20.0, 6.0, 8.0, 11.0, 2.0, 3.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002493858337402344, -0.00024043768644332886, -0.00023148953914642334, -0.00022254139184951782, -0.0002135932445526123, -0.0002046450972557068, -0.00019569694995880127, -0.00018674880266189575, -0.00017780065536499023, -0.00016885250806808472, -0.0001599043607711792, -0.00015095621347427368, -0.00014200806617736816, -0.00013305991888046265, -0.00012411177158355713, -0.00011516362428665161, -0.0001062154769897461, -9.726732969284058e-05, -8.831918239593506e-05, -7.937103509902954e-05, -7.042288780212402e-05, -6.14747405052185e-05, -5.252659320831299e-05, -4.357844591140747e-05, -3.463029861450195e-05, -2.5682151317596436e-05, -1.6734004020690918e-05, -7.7858567237854e-06, 1.1622905731201172e-06, 1.0110437870025635e-05, 1.9058585166931152e-05, 2.800673246383667e-05, 3.695487976074219e-05, 4.5903027057647705e-05, 5.485117435455322e-05, 6.379932165145874e-05, 7.274746894836426e-05, 8.169561624526978e-05, 9.064376354217529e-05, 9.959191083908081e-05, 0.00010854005813598633, 0.00011748820543289185, 0.00012643635272979736, 0.00013538450002670288, 0.0001443326473236084, 0.00015328079462051392, 0.00016222894191741943, 0.00017117708921432495, 0.00018012523651123047, 0.00018907338380813599, 0.0001980215311050415, 0.00020696967840194702, 0.00021591782569885254, 0.00022486597299575806, 0.00023381412029266357, 0.0002427622675895691, 0.0002517104148864746, 0.0002606585621833801, 0.00026960670948028564, 0.00027855485677719116, 0.0002875030040740967, 0.0002964511513710022, 0.0003053992986679077, 0.00031434744596481323, 0.00032329559326171875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 9.0, 10.0, 16.0, 20.0, 38.0, 54.0, 147.0, 380.0, 1668.0, 20007.0, 1003969.0, 19747.0, 1692.0, 419.0, 172.0, 75.0, 41.0, 18.0, 21.0, 13.0, 13.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.28125, -0.2723197937011719, -0.26338958740234375, -0.2544593811035156, -0.2455291748046875, -0.23659896850585938, -0.22766876220703125, -0.21873855590820312, -0.209808349609375, -0.20087814331054688, -0.19194793701171875, -0.18301773071289062, -0.1740875244140625, -0.16515731811523438, -0.15622711181640625, -0.14729690551757812, -0.13836669921875, -0.12943649291992188, -0.12050628662109375, -0.11157608032226562, -0.1026458740234375, -0.09371566772460938, -0.08478546142578125, -0.07585525512695312, -0.066925048828125, -0.057994842529296875, -0.04906463623046875, -0.040134429931640625, -0.0312042236328125, -0.022274017333984375, -0.01334381103515625, -0.004413604736328125, 0.0045166015625, 0.013446807861328125, 0.02237701416015625, 0.031307220458984375, 0.0402374267578125, 0.049167633056640625, 0.05809783935546875, 0.06702804565429688, 0.075958251953125, 0.08488845825195312, 0.09381866455078125, 0.10274887084960938, 0.1116790771484375, 0.12060928344726562, 0.12953948974609375, 0.13846969604492188, 0.14739990234375, 0.15633010864257812, 0.16526031494140625, 0.17419052124023438, 0.1831207275390625, 0.19205093383789062, 0.20098114013671875, 0.20991134643554688, 0.218841552734375, 0.22777175903320312, 0.23670196533203125, 0.24563217163085938, 0.2545623779296875, 0.2634925842285156, 0.27242279052734375, 0.2813529968261719, 0.290283203125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 16.0, 22.0, 19.0, 39.0, 59.0, 122.0, 169.0, 190.0, 131.0, 78.0, 39.0, 32.0, 21.0, 12.0, 8.0, 9.0, 8.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1055908203125, -0.10196685791015625, -0.0983428955078125, -0.09471893310546875, -0.091094970703125, -0.08747100830078125, -0.0838470458984375, -0.08022308349609375, -0.07659912109375, -0.07297515869140625, -0.0693511962890625, -0.06572723388671875, -0.062103271484375, -0.05847930908203125, -0.0548553466796875, -0.05123138427734375, -0.047607421875, -0.04398345947265625, -0.0403594970703125, -0.03673553466796875, -0.033111572265625, -0.02948760986328125, -0.0258636474609375, -0.02223968505859375, -0.01861572265625, -0.01499176025390625, -0.0113677978515625, -0.00774383544921875, -0.004119873046875, -0.00049591064453125, 0.0031280517578125, 0.00675201416015625, 0.0103759765625, 0.01399993896484375, 0.0176239013671875, 0.02124786376953125, 0.024871826171875, 0.02849578857421875, 0.0321197509765625, 0.03574371337890625, 0.03936767578125, 0.04299163818359375, 0.0466156005859375, 0.05023956298828125, 0.053863525390625, 0.05748748779296875, 0.0611114501953125, 0.06473541259765625, 0.068359375, 0.07198333740234375, 0.0756072998046875, 0.07923126220703125, 0.082855224609375, 0.08647918701171875, 0.0901031494140625, 0.09372711181640625, 0.09735107421875, 0.10097503662109375, 0.1045989990234375, 0.10822296142578125, 0.111846923828125, 0.11547088623046875, 0.1190948486328125, 0.12271881103515625, 0.1263427734375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 84.0, 755.0, 124.0, 27.0, 10.0, 7.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.53749942779541, -5.410022258758545, -5.28254508972168, -5.155067443847656, -5.027590274810791, -4.900113105773926, -4.772635459899902, -4.645158290863037, -4.517681121826172, -4.390203952789307, -4.262726783752441, -4.135249137878418, -4.007771968841553, -3.8802947998046875, -3.752817392349243, -3.625339984893799, -3.4978628158569336, -3.3703856468200684, -3.242908239364624, -3.1154308319091797, -2.9879536628723145, -2.860476493835449, -2.732999086380005, -2.6055216789245605, -2.4780445098876953, -2.35056734085083, -2.2230899333953857, -2.0956125259399414, -1.9681353569030762, -1.8406580686569214, -1.7131807804107666, -1.5857034921646118, -1.458226203918457, -1.3307489156723022, -1.2032716274261475, -1.0757943391799927, -0.9483170509338379, -0.8208397626876831, -0.6933624744415283, -0.5658851861953735, -0.43840789794921875, -0.31093060970306396, -0.18345332145690918, -0.055976033210754395, 0.07150125503540039, 0.19897854328155518, 0.32645583152770996, 0.45393311977386475, 0.5814104080200195, 0.7088876962661743, 0.8363649845123291, 0.9638422727584839, 1.0913195610046387, 1.2187968492507935, 1.3462741374969482, 1.473751425743103, 1.6012287139892578, 1.7287060022354126, 1.8561832904815674, 1.9836605787277222, 2.111137866973877, 2.238615036010742, 2.3660924434661865, 2.493569850921631, 2.621047019958496]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 13.0, 7.0, 17.0, 18.0, 22.0, 19.0, 33.0, 38.0, 48.0, 42.0, 49.0, 66.0, 74.0, 69.0, 55.0, 69.0, 49.0, 48.0, 50.0, 37.0, 32.0, 28.0, 26.0, 20.0, 19.0, 14.0, 9.0, 12.0, 6.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9222455024719238, -0.8873699307441711, -0.8524943590164185, -0.8176187872886658, -0.7827432155609131, -0.7478677034378052, -0.7129921317100525, -0.6781165599822998, -0.6432409882545471, -0.6083654165267944, -0.5734898447990417, -0.5386142730712891, -0.5037387609481812, -0.4688631594181061, -0.4339876174926758, -0.3991120457649231, -0.3642364740371704, -0.3293609023094177, -0.29448533058166504, -0.25960978865623474, -0.22473421692848206, -0.18985864520072937, -0.15498308837413788, -0.12010753154754639, -0.0852319598197937, -0.05035639554262161, -0.015480831265449524, 0.019394733011722565, 0.05427029728889465, 0.08914586901664734, 0.12402142584323883, 0.15889698266983032, 0.19377243518829346, 0.22864800691604614, 0.26352357864379883, 0.2983991205692291, 0.3332746922969818, 0.3681502640247345, 0.4030258059501648, 0.4379013776779175, 0.47277694940567017, 0.5076525211334229, 0.5425280928611755, 0.5774036645889282, 0.6122791767120361, 0.6471548080444336, 0.6820303201675415, 0.7169058918952942, 0.7517814636230469, 0.7866570353507996, 0.8215326070785522, 0.8564081788063049, 0.8912837505340576, 0.9261592626571655, 0.9610348343849182, 0.9959104061126709, 1.0307860374450684, 1.0656615495681763, 1.1005371809005737, 1.1354126930236816, 1.170288324356079, 1.205163836479187, 1.2400394678115845, 1.2749149799346924, 1.3097904920578003]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 0.0, 2.0, 3.0, 3.0, 6.0, 12.0, 7.0, 8.0, 11.0, 17.0, 22.0, 19.0, 23.0, 30.0, 48.0, 56.0, 79.0, 125.0, 152.0, 268.0, 535.0, 1258.0, 4077.0, 25681.0, 3612346.0, 526275.0, 18891.0, 3099.0, 787.0, 280.0, 94.0, 34.0, 20.0, 13.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.9873046875, -0.9679145812988281, -0.9485244750976562, -0.9291343688964844, -0.9097442626953125, -0.8903541564941406, -0.8709640502929688, -0.8515739440917969, -0.832183837890625, -0.8127937316894531, -0.7934036254882812, -0.7740135192871094, -0.7546234130859375, -0.7352333068847656, -0.7158432006835938, -0.6964530944824219, -0.67706298828125, -0.6576728820800781, -0.6382827758789062, -0.6188926696777344, -0.5995025634765625, -0.5801124572753906, -0.5607223510742188, -0.5413322448730469, -0.521942138671875, -0.5025520324707031, -0.48316192626953125, -0.4637718200683594, -0.4443817138671875, -0.4249916076660156, -0.40560150146484375, -0.3862113952636719, -0.3668212890625, -0.3474311828613281, -0.32804107666015625, -0.3086509704589844, -0.2892608642578125, -0.2698707580566406, -0.25048065185546875, -0.23109054565429688, -0.211700439453125, -0.19231033325195312, -0.17292022705078125, -0.15353012084960938, -0.1341400146484375, -0.11474990844726562, -0.09535980224609375, -0.07596969604492188, -0.05657958984375, -0.037189483642578125, -0.01779937744140625, 0.001590728759765625, 0.0209808349609375, 0.040370941162109375, 0.05976104736328125, 0.07915115356445312, 0.098541259765625, 0.11793136596679688, 0.13732147216796875, 0.15671157836914062, 0.1761016845703125, 0.19549179077148438, 0.21488189697265625, 0.23427200317382812, 0.253662109375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 8.0, 13.0, 33.0, 61.0, 102.0, 123.0, 178.0, 157.0, 132.0, 79.0, 50.0, 34.0, 19.0, 8.0, 6.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.149658203125, -0.14671659469604492, -0.14377498626708984, -0.14083337783813477, -0.1378917694091797, -0.1349501609802246, -0.13200855255126953, -0.12906694412231445, -0.12612533569335938, -0.1231837272644043, -0.12024211883544922, -0.11730051040649414, -0.11435890197753906, -0.11141729354858398, -0.1084756851196289, -0.10553407669067383, -0.10259246826171875, -0.09965085983276367, -0.0967092514038086, -0.09376764297485352, -0.09082603454589844, -0.08788442611694336, -0.08494281768798828, -0.0820012092590332, -0.07905960083007812, -0.07611799240112305, -0.07317638397216797, -0.07023477554321289, -0.06729316711425781, -0.06435155868530273, -0.061409950256347656, -0.05846834182739258, -0.0555267333984375, -0.05258512496948242, -0.049643516540527344, -0.046701908111572266, -0.04376029968261719, -0.04081869125366211, -0.03787708282470703, -0.03493547439575195, -0.031993865966796875, -0.029052257537841797, -0.02611064910888672, -0.02316904067993164, -0.020227432250976562, -0.017285823822021484, -0.014344215393066406, -0.011402606964111328, -0.00846099853515625, -0.005519390106201172, -0.0025777816772460938, 0.0003638267517089844, 0.0033054351806640625, 0.006247043609619141, 0.009188652038574219, 0.012130260467529297, 0.015071868896484375, 0.018013477325439453, 0.02095508575439453, 0.02389669418334961, 0.026838302612304688, 0.029779911041259766, 0.032721519470214844, 0.03566312789916992, 0.038604736328125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 8.0, 22.0, 70.0, 151.0, 544.0, 105600.0, 4087409.0, 346.0, 89.0, 34.0, 10.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.76953125, -6.6368865966796875, -6.504241943359375, -6.3715972900390625, -6.23895263671875, -6.1063079833984375, -5.973663330078125, -5.8410186767578125, -5.7083740234375, -5.5757293701171875, -5.443084716796875, -5.3104400634765625, -5.17779541015625, -5.0451507568359375, -4.912506103515625, -4.7798614501953125, -4.647216796875, -4.5145721435546875, -4.381927490234375, -4.2492828369140625, -4.11663818359375, -3.9839935302734375, -3.851348876953125, -3.7187042236328125, -3.5860595703125, -3.4534149169921875, -3.320770263671875, -3.1881256103515625, -3.05548095703125, -2.9228363037109375, -2.790191650390625, -2.6575469970703125, -2.52490234375, -2.3922576904296875, -2.259613037109375, -2.1269683837890625, -1.99432373046875, -1.8616790771484375, -1.729034423828125, -1.5963897705078125, -1.4637451171875, -1.3311004638671875, -1.198455810546875, -1.0658111572265625, -0.93316650390625, -0.8005218505859375, -0.667877197265625, -0.5352325439453125, -0.402587890625, -0.2699432373046875, -0.137298583984375, -0.0046539306640625, 0.12799072265625, 0.2606353759765625, 0.393280029296875, 0.5259246826171875, 0.6585693359375, 0.7912139892578125, 0.923858642578125, 1.0565032958984375, 1.18914794921875, 1.3217926025390625, 1.454437255859375, 1.5870819091796875, 1.7197265625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 16.0, 53.0, 467.0, 3381.0, 112.0, 31.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.62646484375, -0.6151199340820312, -0.6037750244140625, -0.5924301147460938, -0.581085205078125, -0.5697402954101562, -0.5583953857421875, -0.5470504760742188, -0.53570556640625, -0.5243606567382812, -0.5130157470703125, -0.5016708374023438, -0.490325927734375, -0.47898101806640625, -0.4676361083984375, -0.45629119873046875, -0.4449462890625, -0.43360137939453125, -0.4222564697265625, -0.41091156005859375, -0.399566650390625, -0.38822174072265625, -0.3768768310546875, -0.36553192138671875, -0.35418701171875, -0.34284210205078125, -0.3314971923828125, -0.32015228271484375, -0.308807373046875, -0.29746246337890625, -0.2861175537109375, -0.27477264404296875, -0.263427734375, -0.25208282470703125, -0.2407379150390625, -0.22939300537109375, -0.218048095703125, -0.20670318603515625, -0.1953582763671875, -0.18401336669921875, -0.17266845703125, -0.16132354736328125, -0.1499786376953125, -0.13863372802734375, -0.127288818359375, -0.11594390869140625, -0.1045989990234375, -0.09325408935546875, -0.0819091796875, -0.07056427001953125, -0.0592193603515625, -0.04787445068359375, -0.036529541015625, -0.02518463134765625, -0.0138397216796875, -0.00249481201171875, 0.00885009765625, 0.02019500732421875, 0.0315399169921875, 0.04288482666015625, 0.054229736328125, 0.06557464599609375, 0.0769195556640625, 0.08826446533203125, 0.099609375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 2.0, 6.0, 24.0, 128.0, 780.0, 60.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.548156499862671, -3.4421892166137695, -3.3362221717834473, -3.230254888534546, -3.1242876052856445, -3.0183205604553223, -2.912353277206421, -2.8063859939575195, -2.7004189491271973, -2.594451665878296, -2.4884846210479736, -2.3825173377990723, -2.27655029296875, -2.1705830097198486, -2.0646157264709473, -1.9586485624313354, -1.8526813983917236, -1.7467142343521118, -1.6407470703125, -1.5347797870635986, -1.4288126230239868, -1.322845458984375, -1.2168781757354736, -1.1109110116958618, -1.00494384765625, -0.8989766836166382, -0.7930094599723816, -0.687042236328125, -0.5810750722885132, -0.47510790824890137, -0.3691406846046448, -0.2631734609603882, -0.15720605850219727, -0.05123886466026306, 0.05472832918167114, 0.16069552302360535, 0.26666271686553955, 0.37262988090515137, 0.47859710454940796, 0.5845643281936646, 0.6905314922332764, 0.7964986562728882, 0.9024658799171448, 1.0084331035614014, 1.1144002676010132, 1.220367431640625, 1.3263347148895264, 1.4323018789291382, 1.53826904296875, 1.6442362070083618, 1.7502033710479736, 1.856170654296875, 1.9621378183364868, 2.0681049823760986, 2.174072265625, 2.2800393104553223, 2.3860065937042236, 2.491973876953125, 2.5979409217834473, 2.7039082050323486, 2.80987548828125, 2.9158425331115723, 3.0218098163604736, 3.127777099609375, 3.2337441444396973]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 8.0, 13.0, 28.0, 41.0, 53.0, 78.0, 95.0, 106.0, 129.0, 100.0, 96.0, 94.0, 70.0, 35.0, 19.0, 21.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.502690315246582, -1.4595664739608765, -1.4164427518844604, -1.3733189105987549, -1.3301951885223389, -1.2870713472366333, -1.2439475059509277, -1.2008237838745117, -1.1576999425888062, -1.1145761013031006, -1.0714523792266846, -1.028328537940979, -0.9852047562599182, -0.9420809745788574, -0.8989571928977966, -0.8558334112167358, -0.812709629535675, -0.7695858478546143, -0.7264620661735535, -0.6833382844924927, -0.6402144432067871, -0.5970906615257263, -0.5539668798446655, -0.51084303855896, -0.46771928668022156, -0.42459550499916077, -0.3814716935157776, -0.3383479118347168, -0.295224130153656, -0.2521003186702728, -0.20897653698921204, -0.16585272550582886, -0.12272894382476807, -0.07960514724254608, -0.036481358110904694, 0.006642431020736694, 0.04976622760295868, 0.09289002418518066, 0.13601380586624146, 0.17913761734962463, 0.22226139903068542, 0.2653851807117462, 0.3085089921951294, 0.3516327738761902, 0.394756555557251, 0.43788036704063416, 0.48100414872169495, 0.5241279602050781, 0.5672517418861389, 0.6103755235671997, 0.6534993052482605, 0.6966230869293213, 0.7397469282150269, 0.7828707098960876, 0.8259944915771484, 0.869118332862854, 0.91224205493927, 0.9553658366203308, 0.9984896183013916, 1.0416134595870972, 1.0847371816635132, 1.1278610229492188, 1.1709847450256348, 1.2141085863113403, 1.257232427597046]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 6.0, 7.0, 11.0, 12.0, 18.0, 20.0, 23.0, 40.0, 40.0, 53.0, 90.0, 102.0, 178.0, 303.0, 487.0, 975.0, 2264.0, 6958.0, 27766.0, 171432.0, 717394.0, 93601.0, 18000.0, 4936.0, 1749.0, 762.0, 403.0, 274.0, 177.0, 142.0, 90.0, 67.0, 38.0, 40.0, 28.0, 23.0, 11.0, 8.0, 11.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.34521484375, -0.33516693115234375, -0.3251190185546875, -0.31507110595703125, -0.305023193359375, -0.29497528076171875, -0.2849273681640625, -0.27487945556640625, -0.26483154296875, -0.25478363037109375, -0.2447357177734375, -0.23468780517578125, -0.224639892578125, -0.21459197998046875, -0.2045440673828125, -0.19449615478515625, -0.1844482421875, -0.17440032958984375, -0.1643524169921875, -0.15430450439453125, -0.144256591796875, -0.13420867919921875, -0.1241607666015625, -0.11411285400390625, -0.10406494140625, -0.09401702880859375, -0.0839691162109375, -0.07392120361328125, -0.063873291015625, -0.05382537841796875, -0.0437774658203125, -0.03372955322265625, -0.023681640625, -0.01363372802734375, -0.0035858154296875, 0.00646209716796875, 0.016510009765625, 0.02655792236328125, 0.0366058349609375, 0.04665374755859375, 0.05670166015625, 0.06674957275390625, 0.0767974853515625, 0.08684539794921875, 0.096893310546875, 0.10694122314453125, 0.1169891357421875, 0.12703704833984375, 0.1370849609375, 0.14713287353515625, 0.1571807861328125, 0.16722869873046875, 0.177276611328125, 0.18732452392578125, 0.1973724365234375, 0.20742034912109375, 0.21746826171875, 0.22751617431640625, 0.2375640869140625, 0.24761199951171875, 0.257659912109375, 0.26770782470703125, 0.2777557373046875, 0.28780364990234375, 0.2978515625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 9.0, 8.0, 17.0, 28.0, 38.0, 57.0, 83.0, 80.0, 95.0, 124.0, 112.0, 93.0, 84.0, 52.0, 45.0, 37.0, 22.0, 7.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.14599609375, -0.14256668090820312, -0.13913726806640625, -0.13570785522460938, -0.1322784423828125, -0.12884902954101562, -0.12541961669921875, -0.12199020385742188, -0.118560791015625, -0.11513137817382812, -0.11170196533203125, -0.10827255249023438, -0.1048431396484375, -0.10141372680664062, -0.09798431396484375, -0.09455490112304688, -0.09112548828125, -0.08769607543945312, -0.08426666259765625, -0.08083724975585938, -0.0774078369140625, -0.07397842407226562, -0.07054901123046875, -0.06711959838867188, -0.063690185546875, -0.060260772705078125, -0.05683135986328125, -0.053401947021484375, -0.0499725341796875, -0.046543121337890625, -0.04311370849609375, -0.039684295654296875, -0.0362548828125, -0.032825469970703125, -0.02939605712890625, -0.025966644287109375, -0.0225372314453125, -0.019107818603515625, -0.01567840576171875, -0.012248992919921875, -0.008819580078125, -0.005390167236328125, -0.00196075439453125, 0.001468658447265625, 0.0048980712890625, 0.008327484130859375, 0.01175689697265625, 0.015186309814453125, 0.01861572265625, 0.022045135498046875, 0.02547454833984375, 0.028903961181640625, 0.0323333740234375, 0.035762786865234375, 0.03919219970703125, 0.042621612548828125, 0.046051025390625, 0.049480438232421875, 0.05290985107421875, 0.056339263916015625, 0.0597686767578125, 0.06319808959960938, 0.06662750244140625, 0.07005691528320312, 0.073486328125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 2.0, 5.0, 2.0, 13.0, 14.0, 8.0, 13.0, 31.0, 35.0, 32.0, 57.0, 89.0, 178.0, 338.0, 1403.0, 8092.0, 109582.0, 876361.0, 46058.0, 4629.0, 899.0, 292.0, 122.0, 81.0, 51.0, 47.0, 30.0, 19.0, 17.0, 19.0, 9.0, 8.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.399658203125, -0.3864936828613281, -0.37332916259765625, -0.3601646423339844, -0.3470001220703125, -0.3338356018066406, -0.32067108154296875, -0.3075065612792969, -0.294342041015625, -0.2811775207519531, -0.26801300048828125, -0.2548484802246094, -0.2416839599609375, -0.22851943969726562, -0.21535491943359375, -0.20219039916992188, -0.18902587890625, -0.17586135864257812, -0.16269683837890625, -0.14953231811523438, -0.1363677978515625, -0.12320327758789062, -0.11003875732421875, -0.09687423706054688, -0.083709716796875, -0.07054519653320312, -0.05738067626953125, -0.044216156005859375, -0.0310516357421875, -0.017887115478515625, -0.00472259521484375, 0.008441925048828125, 0.0216064453125, 0.034770965576171875, 0.04793548583984375, 0.061100006103515625, 0.0742645263671875, 0.08742904663085938, 0.10059356689453125, 0.11375808715820312, 0.126922607421875, 0.14008712768554688, 0.15325164794921875, 0.16641616821289062, 0.1795806884765625, 0.19274520874023438, 0.20590972900390625, 0.21907424926757812, 0.23223876953125, 0.24540328979492188, 0.25856781005859375, 0.2717323303222656, 0.2848968505859375, 0.2980613708496094, 0.31122589111328125, 0.3243904113769531, 0.337554931640625, 0.3507194519042969, 0.36388397216796875, 0.3770484924316406, 0.3902130126953125, 0.4033775329589844, 0.41654205322265625, 0.4297065734863281, 0.44287109375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 12.0, 10.0, 14.0, 18.0, 24.0, 21.0, 28.0, 41.0, 47.0, 44.0, 64.0, 65.0, 58.0, 64.0, 69.0, 51.0, 63.0, 57.0, 37.0, 38.0, 28.0, 29.0, 24.0, 21.0, 11.0, 14.0, 10.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2578125, -0.24934005737304688, -0.24086761474609375, -0.23239517211914062, -0.2239227294921875, -0.21545028686523438, -0.20697784423828125, -0.19850540161132812, -0.190032958984375, -0.18156051635742188, -0.17308807373046875, -0.16461563110351562, -0.1561431884765625, -0.14767074584960938, -0.13919830322265625, -0.13072586059570312, -0.12225341796875, -0.11378097534179688, -0.10530853271484375, -0.09683609008789062, -0.0883636474609375, -0.07989120483398438, -0.07141876220703125, -0.06294631958007812, -0.054473876953125, -0.046001434326171875, -0.03752899169921875, -0.029056549072265625, -0.0205841064453125, -0.012111663818359375, -0.00363922119140625, 0.004833221435546875, 0.0133056640625, 0.021778106689453125, 0.03025054931640625, 0.038722991943359375, 0.0471954345703125, 0.055667877197265625, 0.06414031982421875, 0.07261276245117188, 0.081085205078125, 0.08955764770507812, 0.09803009033203125, 0.10650253295898438, 0.1149749755859375, 0.12344741821289062, 0.13191986083984375, 0.14039230346679688, 0.14886474609375, 0.15733718872070312, 0.16580963134765625, 0.17428207397460938, 0.1827545166015625, 0.19122695922851562, 0.19969940185546875, 0.20817184448242188, 0.216644287109375, 0.22511672973632812, 0.23358917236328125, 0.24206161499023438, 0.2505340576171875, 0.2590065002441406, 0.26747894287109375, 0.2759513854980469, 0.284423828125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 3.0, 2.0, 5.0, 5.0, 3.0, 4.0, 8.0, 8.0, 9.0, 15.0, 27.0, 41.0, 75.0, 133.0, 370.0, 992.0, 3711.0, 27125.0, 937379.0, 70653.0, 5676.0, 1451.0, 464.0, 158.0, 76.0, 50.0, 35.0, 10.0, 17.0, 7.0, 6.0, 11.0, 4.0, 9.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1434326171875, -0.13916778564453125, -0.1349029541015625, -0.13063812255859375, -0.126373291015625, -0.12210845947265625, -0.1178436279296875, -0.11357879638671875, -0.10931396484375, -0.10504913330078125, -0.1007843017578125, -0.09651947021484375, -0.092254638671875, -0.08798980712890625, -0.0837249755859375, -0.07946014404296875, -0.0751953125, -0.07093048095703125, -0.0666656494140625, -0.06240081787109375, -0.058135986328125, -0.05387115478515625, -0.0496063232421875, -0.04534149169921875, -0.04107666015625, -0.03681182861328125, -0.0325469970703125, -0.02828216552734375, -0.024017333984375, -0.01975250244140625, -0.0154876708984375, -0.01122283935546875, -0.0069580078125, -0.00269317626953125, 0.0015716552734375, 0.00583648681640625, 0.010101318359375, 0.01436614990234375, 0.0186309814453125, 0.02289581298828125, 0.02716064453125, 0.03142547607421875, 0.0356903076171875, 0.03995513916015625, 0.044219970703125, 0.04848480224609375, 0.0527496337890625, 0.05701446533203125, 0.061279296875, 0.06554412841796875, 0.0698089599609375, 0.07407379150390625, 0.078338623046875, 0.08260345458984375, 0.0868682861328125, 0.09113311767578125, 0.09539794921875, 0.09966278076171875, 0.1039276123046875, 0.10819244384765625, 0.112457275390625, 0.11672210693359375, 0.1209869384765625, 0.12525177001953125, 0.1295166015625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 10.0, 10.0, 11.0, 24.0, 29.0, 37.0, 50.0, 54.0, 68.0, 96.0, 102.0, 89.0, 85.0, 77.0, 56.0, 50.0, 30.0, 23.0, 35.0, 12.0, 9.0, 7.0, 5.0, 4.0, 2.0, 8.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.733438491821289e-05, -9.361002594232559e-05, -8.98856669664383e-05, -8.6161307990551e-05, -8.24369490146637e-05, -7.87125900387764e-05, -7.49882310628891e-05, -7.12638720870018e-05, -6.75395131111145e-05, -6.38151541352272e-05, -6.0090795159339905e-05, -5.6366436183452606e-05, -5.264207720756531e-05, -4.891771823167801e-05, -4.519335925579071e-05, -4.146900027990341e-05, -3.774464130401611e-05, -3.4020282328128815e-05, -3.0295923352241516e-05, -2.6571564376354218e-05, -2.284720540046692e-05, -1.912284642457962e-05, -1.5398487448692322e-05, -1.1674128472805023e-05, -7.949769496917725e-06, -4.225410521030426e-06, -5.010515451431274e-07, 3.223307430744171e-06, 6.94766640663147e-06, 1.0672025382518768e-05, 1.4396384358406067e-05, 1.8120743334293365e-05, 2.1845102310180664e-05, 2.5569461286067963e-05, 2.929382026195526e-05, 3.301817923784256e-05, 3.674253821372986e-05, 4.046689718961716e-05, 4.4191256165504456e-05, 4.7915615141391754e-05, 5.163997411727905e-05, 5.536433309316635e-05, 5.908869206905365e-05, 6.281305104494095e-05, 6.653741002082825e-05, 7.026176899671555e-05, 7.398612797260284e-05, 7.771048694849014e-05, 8.143484592437744e-05, 8.515920490026474e-05, 8.888356387615204e-05, 9.260792285203934e-05, 9.633228182792664e-05, 0.00010005664080381393, 0.00010378099977970123, 0.00010750535875558853, 0.00011122971773147583, 0.00011495407670736313, 0.00011867843568325043, 0.00012240279465913773, 0.00012612715363502502, 0.00012985151261091232, 0.00013357587158679962, 0.00013730023056268692, 0.00014102458953857422]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 6.0, 3.0, 10.0, 12.0, 28.0, 47.0, 86.0, 139.0, 281.0, 809.0, 3284.0, 21482.0, 757184.0, 251412.0, 10706.0, 1973.0, 537.0, 249.0, 110.0, 73.0, 40.0, 21.0, 13.0, 16.0, 7.0, 8.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11639404296875, -0.1130533218383789, -0.10971260070800781, -0.10637187957763672, -0.10303115844726562, -0.09969043731689453, -0.09634971618652344, -0.09300899505615234, -0.08966827392578125, -0.08632755279541016, -0.08298683166503906, -0.07964611053466797, -0.07630538940429688, -0.07296466827392578, -0.06962394714355469, -0.0662832260131836, -0.0629425048828125, -0.059601783752441406, -0.05626106262207031, -0.05292034149169922, -0.049579620361328125, -0.04623889923095703, -0.04289817810058594, -0.039557456970214844, -0.03621673583984375, -0.032876014709472656, -0.029535293579101562, -0.02619457244873047, -0.022853851318359375, -0.01951313018798828, -0.016172409057617188, -0.012831687927246094, -0.009490966796875, -0.006150245666503906, -0.0028095245361328125, 0.0005311965942382812, 0.003871917724609375, 0.007212638854980469, 0.010553359985351562, 0.013894081115722656, 0.01723480224609375, 0.020575523376464844, 0.023916244506835938, 0.02725696563720703, 0.030597686767578125, 0.03393840789794922, 0.03727912902832031, 0.040619850158691406, 0.0439605712890625, 0.047301292419433594, 0.05064201354980469, 0.05398273468017578, 0.057323455810546875, 0.06066417694091797, 0.06400489807128906, 0.06734561920166016, 0.07068634033203125, 0.07402706146240234, 0.07736778259277344, 0.08070850372314453, 0.08404922485351562, 0.08738994598388672, 0.09073066711425781, 0.0940713882446289, 0.097412109375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 6.0, 8.0, 7.0, 18.0, 25.0, 31.0, 59.0, 85.0, 123.0, 142.0, 137.0, 123.0, 78.0, 48.0, 34.0, 16.0, 17.0, 8.0, 6.0, 8.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07537841796875, -0.07315254211425781, -0.07092666625976562, -0.06870079040527344, -0.06647491455078125, -0.06424903869628906, -0.062023162841796875, -0.05979728698730469, -0.0575714111328125, -0.05534553527832031, -0.053119659423828125, -0.05089378356933594, -0.04866790771484375, -0.04644203186035156, -0.044216156005859375, -0.04199028015136719, -0.039764404296875, -0.03753852844238281, -0.035312652587890625, -0.03308677673339844, -0.03086090087890625, -0.028635025024414062, -0.026409149169921875, -0.024183273315429688, -0.0219573974609375, -0.019731521606445312, -0.017505645751953125, -0.015279769897460938, -0.01305389404296875, -0.010828018188476562, -0.008602142333984375, -0.0063762664794921875, -0.004150390625, -0.0019245147705078125, 0.000301361083984375, 0.0025272369384765625, 0.00475311279296875, 0.0069789886474609375, 0.009204864501953125, 0.011430740356445312, 0.0136566162109375, 0.015882492065429688, 0.018108367919921875, 0.020334243774414062, 0.02256011962890625, 0.024785995483398438, 0.027011871337890625, 0.029237747192382812, 0.031463623046875, 0.03368949890136719, 0.035915374755859375, 0.03814125061035156, 0.04036712646484375, 0.04259300231933594, 0.044818878173828125, 0.04704475402832031, 0.0492706298828125, 0.05149650573730469, 0.053722381591796875, 0.05594825744628906, 0.05817413330078125, 0.06040000915527344, 0.06262588500976562, 0.06485176086425781, 0.06707763671875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 13.0, 31.0, 74.0, 333.0, 378.0, 108.0, 36.0, 20.0, 7.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3696460723876953, -3.2929718494415283, -3.2162978649139404, -3.1396236419677734, -3.0629496574401855, -2.9862754344940186, -2.9096014499664307, -2.8329272270202637, -2.756253242492676, -2.679579019546509, -2.602905035018921, -2.526230812072754, -2.449556827545166, -2.372882604598999, -2.296208620071411, -2.219534397125244, -2.142860174179077, -2.06618595123291, -1.9895119667053223, -1.9128378629684448, -1.8361637592315674, -1.7594895362854004, -1.682815432548523, -1.6061413288116455, -1.529467225074768, -1.4527931213378906, -1.3761190176010132, -1.2994449138641357, -1.2227706909179688, -1.1460967063903809, -1.0694224834442139, -0.9927483797073364, -0.9160740375518799, -0.8393999338150024, -0.762725830078125, -0.6860516667366028, -0.6093775629997253, -0.5327034592628479, -0.45602932572364807, -0.37935519218444824, -0.3026810884475708, -0.22600696980953217, -0.14933285117149353, -0.0726587325334549, 0.00401538610458374, 0.08068948984146118, 0.157363623380661, 0.23403775691986084, 0.3107118606567383, 0.3873859643936157, 0.46406009793281555, 0.5407342314720154, 0.6174083352088928, 0.6940824389457703, 0.7707566022872925, 0.8474307060241699, 0.9241048097610474, 1.0007789134979248, 1.0774530172348022, 1.1541271209716797, 1.2308013439178467, 1.3074753284454346, 1.3841495513916016, 1.460823655128479, 1.5374977588653564]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 7.0, 8.0, 9.0, 14.0, 7.0, 15.0, 25.0, 17.0, 27.0, 27.0, 26.0, 32.0, 43.0, 52.0, 40.0, 56.0, 59.0, 45.0, 73.0, 59.0, 60.0, 42.0, 44.0, 37.0, 35.0, 23.0, 22.0, 20.0, 14.0, 18.0, 6.0, 16.0, 6.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.36531400680542, -1.323684573173523, -1.282055139541626, -1.2404258251190186, -1.1987963914871216, -1.1571669578552246, -1.1155375242233276, -1.0739080905914307, -1.0322786569595337, -0.9906492233276367, -0.9490198493003845, -0.9073904156684875, -0.8657609820365906, -0.8241316080093384, -0.7825021743774414, -0.7408727407455444, -0.6992433667182922, -0.6576139330863953, -0.6159845590591431, -0.5743551254272461, -0.5327256917953491, -0.49109628796577454, -0.44946688413619995, -0.407837450504303, -0.3662080466747284, -0.3245786428451538, -0.28294920921325684, -0.24131980538368225, -0.19969038665294647, -0.1580609679222107, -0.11643156409263611, -0.07480213046073914, -0.03317272663116455, 0.00845668837428093, 0.05008610337972641, 0.09171551465988159, 0.13334493339061737, 0.17497435212135315, 0.21660375595092773, 0.2582331895828247, 0.2998625934123993, 0.3414919972419739, 0.38312143087387085, 0.42475083470344543, 0.46638023853302, 0.508009672164917, 0.549639105796814, 0.5912685394287109, 0.6328979134559631, 0.6745273470878601, 0.7161567211151123, 0.7577861547470093, 0.7994155883789062, 0.8410450220108032, 0.8826743960380554, 0.9243038296699524, 0.9659332036972046, 1.0075626373291016, 1.0491920709609985, 1.0908215045928955, 1.132450819015503, 1.1740802526474, 1.2157096862792969, 1.2573391199111938, 1.2989685535430908]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 6.0, 4.0, 10.0, 14.0, 21.0, 26.0, 24.0, 39.0, 51.0, 65.0, 81.0, 115.0, 165.0, 265.0, 403.0, 747.0, 1616.0, 4115.0, 13727.0, 88205.0, 3905189.0, 153854.0, 18077.0, 4543.0, 1523.0, 671.0, 337.0, 172.0, 85.0, 46.0, 29.0, 13.0, 13.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.548828125, -0.5362358093261719, -0.5236434936523438, -0.5110511779785156, -0.4984588623046875, -0.4858665466308594, -0.47327423095703125, -0.4606819152832031, -0.448089599609375, -0.4354972839355469, -0.42290496826171875, -0.4103126525878906, -0.3977203369140625, -0.3851280212402344, -0.37253570556640625, -0.3599433898925781, -0.34735107421875, -0.3347587585449219, -0.32216644287109375, -0.3095741271972656, -0.2969818115234375, -0.2843894958496094, -0.27179718017578125, -0.2592048645019531, -0.246612548828125, -0.23402023315429688, -0.22142791748046875, -0.20883560180664062, -0.1962432861328125, -0.18365097045898438, -0.17105865478515625, -0.15846633911132812, -0.1458740234375, -0.13328170776367188, -0.12068939208984375, -0.10809707641601562, -0.0955047607421875, -0.08291244506835938, -0.07032012939453125, -0.057727813720703125, -0.045135498046875, -0.032543182373046875, -0.01995086669921875, -0.007358551025390625, 0.0052337646484375, 0.017826080322265625, 0.03041839599609375, 0.043010711669921875, 0.05560302734375, 0.06819534301757812, 0.08078765869140625, 0.09337997436523438, 0.1059722900390625, 0.11856460571289062, 0.13115692138671875, 0.14374923706054688, 0.156341552734375, 0.16893386840820312, 0.18152618408203125, 0.19411849975585938, 0.2067108154296875, 0.21930313110351562, 0.23189544677734375, 0.24448776245117188, 0.257080078125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 3.0, 10.0, 23.0, 21.0, 50.0, 63.0, 70.0, 99.0, 97.0, 113.0, 89.0, 80.0, 79.0, 77.0, 46.0, 32.0, 16.0, 13.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1478271484375, -0.1444253921508789, -0.1410236358642578, -0.13762187957763672, -0.13422012329101562, -0.13081836700439453, -0.12741661071777344, -0.12401485443115234, -0.12061309814453125, -0.11721134185791016, -0.11380958557128906, -0.11040782928466797, -0.10700607299804688, -0.10360431671142578, -0.10020256042480469, -0.0968008041381836, -0.0933990478515625, -0.0899972915649414, -0.08659553527832031, -0.08319377899169922, -0.07979202270507812, -0.07639026641845703, -0.07298851013183594, -0.06958675384521484, -0.06618499755859375, -0.06278324127197266, -0.05938148498535156, -0.05597972869873047, -0.052577972412109375, -0.04917621612548828, -0.04577445983886719, -0.042372703552246094, -0.038970947265625, -0.035569190979003906, -0.03216743469238281, -0.02876567840576172, -0.025363922119140625, -0.02196216583251953, -0.018560409545898438, -0.015158653259277344, -0.01175689697265625, -0.008355140686035156, -0.0049533843994140625, -0.0015516281127929688, 0.001850128173828125, 0.005251884460449219, 0.008653640747070312, 0.012055397033691406, 0.0154571533203125, 0.018858909606933594, 0.022260665893554688, 0.02566242218017578, 0.029064178466796875, 0.03246593475341797, 0.03586769104003906, 0.039269447326660156, 0.04267120361328125, 0.046072959899902344, 0.04947471618652344, 0.05287647247314453, 0.056278228759765625, 0.05967998504638672, 0.06308174133300781, 0.0664834976196289, 0.06988525390625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 17.0, 61.0, 107.0, 275.0, 898.0, 4101483.0, 90266.0, 759.0, 271.0, 92.0, 26.0, 13.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.005859375, -1.9515228271484375, -1.897186279296875, -1.8428497314453125, -1.78851318359375, -1.7341766357421875, -1.679840087890625, -1.6255035400390625, -1.5711669921875, -1.5168304443359375, -1.462493896484375, -1.4081573486328125, -1.35382080078125, -1.2994842529296875, -1.245147705078125, -1.1908111572265625, -1.136474609375, -1.0821380615234375, -1.027801513671875, -0.9734649658203125, -0.91912841796875, -0.8647918701171875, -0.810455322265625, -0.7561187744140625, -0.7017822265625, -0.6474456787109375, -0.593109130859375, -0.5387725830078125, -0.48443603515625, -0.4300994873046875, -0.375762939453125, -0.3214263916015625, -0.26708984375, -0.2127532958984375, -0.158416748046875, -0.1040802001953125, -0.04974365234375, 0.0045928955078125, 0.058929443359375, 0.1132659912109375, 0.1676025390625, 0.2219390869140625, 0.276275634765625, 0.3306121826171875, 0.38494873046875, 0.4392852783203125, 0.493621826171875, 0.5479583740234375, 0.602294921875, 0.6566314697265625, 0.710968017578125, 0.7653045654296875, 0.81964111328125, 0.8739776611328125, 0.928314208984375, 0.9826507568359375, 1.0369873046875, 1.0913238525390625, 1.145660400390625, 1.1999969482421875, 1.25433349609375, 1.3086700439453125, 1.363006591796875, 1.4173431396484375, 1.4716796875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 9.0, 22.0, 77.0, 735.0, 3081.0, 125.0, 23.0, 5.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33056640625, -0.32141876220703125, -0.3122711181640625, -0.30312347412109375, -0.293975830078125, -0.28482818603515625, -0.2756805419921875, -0.26653289794921875, -0.25738525390625, -0.24823760986328125, -0.2390899658203125, -0.22994232177734375, -0.220794677734375, -0.21164703369140625, -0.2024993896484375, -0.19335174560546875, -0.1842041015625, -0.17505645751953125, -0.1659088134765625, -0.15676116943359375, -0.147613525390625, -0.13846588134765625, -0.1293182373046875, -0.12017059326171875, -0.11102294921875, -0.10187530517578125, -0.0927276611328125, -0.08358001708984375, -0.074432373046875, -0.06528472900390625, -0.0561370849609375, -0.04698944091796875, -0.037841796875, -0.02869415283203125, -0.0195465087890625, -0.01039886474609375, -0.001251220703125, 0.00789642333984375, 0.0170440673828125, 0.02619171142578125, 0.03533935546875, 0.04448699951171875, 0.0536346435546875, 0.06278228759765625, 0.071929931640625, 0.08107757568359375, 0.0902252197265625, 0.09937286376953125, 0.1085205078125, 0.11766815185546875, 0.1268157958984375, 0.13596343994140625, 0.145111083984375, 0.15425872802734375, 0.1634063720703125, 0.17255401611328125, 0.18170166015625, 0.19084930419921875, 0.1999969482421875, 0.20914459228515625, 0.218292236328125, 0.22743988037109375, 0.2365875244140625, 0.24573516845703125, 0.2548828125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 26.0, 779.0, 192.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.393536329269409, -3.316080093383789, -3.23862361907959, -3.1611673831939697, -3.0837111473083496, -3.0062546730041504, -2.9287984371185303, -2.85134220123291, -2.773885726928711, -2.696429491043091, -2.6189730167388916, -2.5415167808532715, -2.4640605449676514, -2.3866043090820312, -2.309147834777832, -2.231691598892212, -2.154235363006592, -2.0767791271209717, -1.999322772026062, -1.9218664169311523, -1.8444101810455322, -1.7669538259506226, -1.689497470855713, -1.6120412349700928, -1.534584879875183, -1.4571285247802734, -1.3796722888946533, -1.3022159337997437, -1.224759578704834, -1.1473033428192139, -1.0698469877243042, -0.9923906922340393, -0.9149341583251953, -0.8374778628349304, -0.7600215673446655, -0.6825652122497559, -0.605108916759491, -0.5276526212692261, -0.4501962959766388, -0.3727399706840515, -0.2952836751937866, -0.21782736480236053, -0.14037105441093445, -0.06291474401950836, 0.014541566371917725, 0.09199786186218262, 0.1694541871547699, 0.24691051244735718, 0.32436680793762207, 0.40182310342788696, 0.47927942872047424, 0.5567357540130615, 0.6341920495033264, 0.7116483449935913, 0.789104700088501, 0.8665609955787659, 0.9440172910690308, 1.0214736461639404, 1.0989298820495605, 1.1763862371444702, 1.2538425922393799, 1.331298828125, 1.4087551832199097, 1.4862115383148193, 1.5636677742004395]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 4.0, 6.0, 9.0, 4.0, 17.0, 20.0, 28.0, 30.0, 42.0, 61.0, 59.0, 81.0, 74.0, 91.0, 79.0, 81.0, 63.0, 47.0, 41.0, 31.0, 48.0, 29.0, 16.0, 8.0, 9.0, 4.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4426233172416687, -0.4294520616531372, -0.4162808060646057, -0.4031095504760742, -0.3899383246898651, -0.3767670691013336, -0.3635958135128021, -0.35042455792427063, -0.3372533321380615, -0.32408207654953003, -0.31091082096099854, -0.29773956537246704, -0.28456833958625793, -0.27139708399772644, -0.25822582840919495, -0.24505457282066345, -0.23188331723213196, -0.21871206164360046, -0.20554082095623016, -0.19236956536769867, -0.17919832468032837, -0.16602706909179688, -0.15285581350326538, -0.1396845579147339, -0.1265133172273636, -0.11334206908941269, -0.10017082095146179, -0.0869995653629303, -0.0738283172249794, -0.0606570690870285, -0.04748581349849701, -0.03431456536054611, -0.021143317222595215, -0.007972067221999168, 0.005199182778596878, 0.018370434641838074, 0.03154168277978897, 0.04471293091773987, 0.05788418650627136, 0.07105543464422226, 0.08422668278217316, 0.09739793092012405, 0.11056917905807495, 0.12374043464660645, 0.13691169023513794, 0.15008293092250824, 0.16325418651103973, 0.17642542719841003, 0.18959668278694153, 0.20276793837547302, 0.21593917906284332, 0.22911043465137482, 0.24228167533874512, 0.2554529309272766, 0.2686241865158081, 0.2817954421043396, 0.2949666976928711, 0.3081379532814026, 0.3213092088699341, 0.3344804644584656, 0.3476516902446747, 0.3608229458332062, 0.37399420142173767, 0.38716545701026917, 0.40033668279647827]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 12.0, 7.0, 14.0, 15.0, 20.0, 40.0, 64.0, 87.0, 136.0, 163.0, 290.0, 463.0, 783.0, 1835.0, 5165.0, 20206.0, 120450.0, 722843.0, 143078.0, 23003.0, 5635.0, 2030.0, 902.0, 472.0, 261.0, 184.0, 113.0, 74.0, 64.0, 26.0, 32.0, 16.0, 22.0, 16.0, 8.0, 5.0, 8.0, 5.0, 3.0, 0.0, 4.0, 2.0], "bins": [-0.37255859375, -0.36313629150390625, -0.3537139892578125, -0.34429168701171875, -0.334869384765625, -0.32544708251953125, -0.3160247802734375, -0.30660247802734375, -0.29718017578125, -0.28775787353515625, -0.2783355712890625, -0.26891326904296875, -0.259490966796875, -0.25006866455078125, -0.2406463623046875, -0.23122406005859375, -0.2218017578125, -0.21237945556640625, -0.2029571533203125, -0.19353485107421875, -0.184112548828125, -0.17469024658203125, -0.1652679443359375, -0.15584564208984375, -0.14642333984375, -0.13700103759765625, -0.1275787353515625, -0.11815643310546875, -0.108734130859375, -0.09931182861328125, -0.0898895263671875, -0.08046722412109375, -0.071044921875, -0.06162261962890625, -0.0522003173828125, -0.04277801513671875, -0.033355712890625, -0.02393341064453125, -0.0145111083984375, -0.00508880615234375, 0.00433349609375, 0.01375579833984375, 0.0231781005859375, 0.03260040283203125, 0.042022705078125, 0.05144500732421875, 0.0608673095703125, 0.07028961181640625, 0.0797119140625, 0.08913421630859375, 0.0985565185546875, 0.10797882080078125, 0.117401123046875, 0.12682342529296875, 0.1362457275390625, 0.14566802978515625, 0.15509033203125, 0.16451263427734375, 0.1739349365234375, 0.18335723876953125, 0.192779541015625, 0.20220184326171875, 0.2116241455078125, 0.22104644775390625, 0.23046875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 9.0, 8.0, 15.0, 25.0, 43.0, 41.0, 56.0, 74.0, 86.0, 86.0, 95.0, 95.0, 68.0, 66.0, 73.0, 54.0, 32.0, 30.0, 17.0, 17.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.1339111328125, -0.13083744049072266, -0.1277637481689453, -0.12469005584716797, -0.12161636352539062, -0.11854267120361328, -0.11546897888183594, -0.1123952865600586, -0.10932159423828125, -0.1062479019165039, -0.10317420959472656, -0.10010051727294922, -0.09702682495117188, -0.09395313262939453, -0.09087944030761719, -0.08780574798583984, -0.0847320556640625, -0.08165836334228516, -0.07858467102050781, -0.07551097869873047, -0.07243728637695312, -0.06936359405517578, -0.06628990173339844, -0.0632162094116211, -0.06014251708984375, -0.057068824768066406, -0.05399513244628906, -0.05092144012451172, -0.047847747802734375, -0.04477405548095703, -0.04170036315917969, -0.038626670837402344, -0.035552978515625, -0.032479286193847656, -0.029405593872070312, -0.02633190155029297, -0.023258209228515625, -0.02018451690673828, -0.017110824584960938, -0.014037132263183594, -0.01096343994140625, -0.007889747619628906, -0.0048160552978515625, -0.0017423629760742188, 0.001331329345703125, 0.004405021667480469, 0.0074787139892578125, 0.010552406311035156, 0.0136260986328125, 0.016699790954589844, 0.019773483276367188, 0.02284717559814453, 0.025920867919921875, 0.02899456024169922, 0.03206825256347656, 0.035141944885253906, 0.03821563720703125, 0.041289329528808594, 0.04436302185058594, 0.04743671417236328, 0.050510406494140625, 0.05358409881591797, 0.05665779113769531, 0.059731483459472656, 0.06280517578125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 6.0, 5.0, 10.0, 13.0, 26.0, 41.0, 52.0, 101.0, 212.0, 493.0, 1785.0, 10293.0, 232058.0, 778949.0, 20526.0, 2649.0, 745.0, 265.0, 126.0, 59.0, 45.0, 28.0, 12.0, 12.0, 10.0, 8.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.65625, -0.6394844055175781, -0.6227188110351562, -0.6059532165527344, -0.5891876220703125, -0.5724220275878906, -0.5556564331054688, -0.5388908386230469, -0.522125244140625, -0.5053596496582031, -0.48859405517578125, -0.4718284606933594, -0.4550628662109375, -0.4382972717285156, -0.42153167724609375, -0.4047660827636719, -0.38800048828125, -0.3712348937988281, -0.35446929931640625, -0.3377037048339844, -0.3209381103515625, -0.3041725158691406, -0.28740692138671875, -0.2706413269042969, -0.253875732421875, -0.23711013793945312, -0.22034454345703125, -0.20357894897460938, -0.1868133544921875, -0.17004776000976562, -0.15328216552734375, -0.13651657104492188, -0.1197509765625, -0.10298538208007812, -0.08621978759765625, -0.06945419311523438, -0.0526885986328125, -0.035923004150390625, -0.01915740966796875, -0.002391815185546875, 0.014373779296875, 0.031139373779296875, 0.04790496826171875, 0.06467056274414062, 0.0814361572265625, 0.09820175170898438, 0.11496734619140625, 0.13173294067382812, 0.14849853515625, 0.16526412963867188, 0.18202972412109375, 0.19879531860351562, 0.2155609130859375, 0.23232650756835938, 0.24909210205078125, 0.2658576965332031, 0.282623291015625, 0.2993888854980469, 0.31615447998046875, 0.3329200744628906, 0.3496856689453125, 0.3664512634277344, 0.38321685791015625, 0.3999824523925781, 0.416748046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 6.0, 4.0, 7.0, 5.0, 12.0, 21.0, 30.0, 36.0, 36.0, 53.0, 67.0, 85.0, 95.0, 102.0, 81.0, 74.0, 69.0, 60.0, 42.0, 21.0, 30.0, 19.0, 9.0, 7.0, 9.0, 3.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5166015625, -0.5034751892089844, -0.49034881591796875, -0.4772224426269531, -0.4640960693359375, -0.4509696960449219, -0.43784332275390625, -0.4247169494628906, -0.411590576171875, -0.3984642028808594, -0.38533782958984375, -0.3722114562988281, -0.3590850830078125, -0.3459587097167969, -0.33283233642578125, -0.3197059631347656, -0.30657958984375, -0.2934532165527344, -0.28032684326171875, -0.2672004699707031, -0.2540740966796875, -0.24094772338867188, -0.22782135009765625, -0.21469497680664062, -0.201568603515625, -0.18844223022460938, -0.17531585693359375, -0.16218948364257812, -0.1490631103515625, -0.13593673706054688, -0.12281036376953125, -0.10968399047851562, -0.0965576171875, -0.08343124389648438, -0.07030487060546875, -0.057178497314453125, -0.0440521240234375, -0.030925750732421875, -0.01779937744140625, -0.004673004150390625, 0.008453369140625, 0.021579742431640625, 0.03470611572265625, 0.047832489013671875, 0.0609588623046875, 0.07408523559570312, 0.08721160888671875, 0.10033798217773438, 0.11346435546875, 0.12659072875976562, 0.13971710205078125, 0.15284347534179688, 0.1659698486328125, 0.17909622192382812, 0.19222259521484375, 0.20534896850585938, 0.218475341796875, 0.23160171508789062, 0.24472808837890625, 0.2578544616699219, 0.2709808349609375, 0.2841072082519531, 0.29723358154296875, 0.3103599548339844, 0.323486328125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 12.0, 8.0, 11.0, 27.0, 32.0, 45.0, 86.0, 145.0, 272.0, 579.0, 1224.0, 3774.0, 22868.0, 785909.0, 219029.0, 10277.0, 2364.0, 861.0, 429.0, 213.0, 132.0, 81.0, 57.0, 26.0, 21.0, 11.0, 8.0, 6.0, 7.0, 9.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1031494140625, -0.0994415283203125, -0.095733642578125, -0.0920257568359375, -0.08831787109375, -0.0846099853515625, -0.080902099609375, -0.0771942138671875, -0.073486328125, -0.0697784423828125, -0.066070556640625, -0.0623626708984375, -0.05865478515625, -0.0549468994140625, -0.051239013671875, -0.0475311279296875, -0.0438232421875, -0.0401153564453125, -0.036407470703125, -0.0326995849609375, -0.02899169921875, -0.0252838134765625, -0.021575927734375, -0.0178680419921875, -0.01416015625, -0.0104522705078125, -0.006744384765625, -0.0030364990234375, 0.00067138671875, 0.0043792724609375, 0.008087158203125, 0.0117950439453125, 0.0155029296875, 0.0192108154296875, 0.022918701171875, 0.0266265869140625, 0.03033447265625, 0.0340423583984375, 0.037750244140625, 0.0414581298828125, 0.045166015625, 0.0488739013671875, 0.052581787109375, 0.0562896728515625, 0.05999755859375, 0.0637054443359375, 0.067413330078125, 0.0711212158203125, 0.0748291015625, 0.0785369873046875, 0.082244873046875, 0.0859527587890625, 0.08966064453125, 0.0933685302734375, 0.097076416015625, 0.1007843017578125, 0.1044921875, 0.1082000732421875, 0.111907958984375, 0.1156158447265625, 0.11932373046875, 0.1230316162109375, 0.126739501953125, 0.1304473876953125, 0.1341552734375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 6.0, 13.0, 17.0, 29.0, 40.0, 50.0, 75.0, 97.0, 95.0, 146.0, 111.0, 93.0, 69.0, 54.0, 39.0, 20.0, 17.0, 9.0, 9.0, 5.0, 2.0, 4.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001747608184814453, -0.00017011724412441254, -0.00016547366976737976, -0.00016083009541034698, -0.0001561865210533142, -0.00015154294669628143, -0.00014689937233924866, -0.00014225579798221588, -0.0001376122236251831, -0.00013296864926815033, -0.00012832507491111755, -0.00012368150055408478, -0.000119037926197052, -0.00011439435184001923, -0.00010975077748298645, -0.00010510720312595367, -0.0001004636287689209, -9.582005441188812e-05, -9.117648005485535e-05, -8.653290569782257e-05, -8.18893313407898e-05, -7.724575698375702e-05, -7.260218262672424e-05, -6.795860826969147e-05, -6.331503391265869e-05, -5.8671459555625916e-05, -5.402788519859314e-05, -4.9384310841560364e-05, -4.474073648452759e-05, -4.009716212749481e-05, -3.5453587770462036e-05, -3.081001341342926e-05, -2.6166439056396484e-05, -2.152286469936371e-05, -1.6879290342330933e-05, -1.2235715985298157e-05, -7.592141628265381e-06, -2.948567271232605e-06, 1.695007085800171e-06, 6.338581442832947e-06, 1.0982155799865723e-05, 1.56257301568985e-05, 2.0269304513931274e-05, 2.491287887096405e-05, 2.9556453227996826e-05, 3.42000275850296e-05, 3.884360194206238e-05, 4.3487176299095154e-05, 4.813075065612793e-05, 5.2774325013160706e-05, 5.741789937019348e-05, 6.206147372722626e-05, 6.670504808425903e-05, 7.134862244129181e-05, 7.599219679832458e-05, 8.063577115535736e-05, 8.527934551239014e-05, 8.992291986942291e-05, 9.456649422645569e-05, 9.921006858348846e-05, 0.00010385364294052124, 0.00010849721729755402, 0.00011314079165458679, 0.00011778436601161957, 0.00012242794036865234]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 10.0, 16.0, 33.0, 68.0, 160.0, 449.0, 1396.0, 10040.0, 781470.0, 248022.0, 5270.0, 982.0, 353.0, 131.0, 61.0, 29.0, 20.0, 13.0, 11.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0999755859375, -0.09494590759277344, -0.08991622924804688, -0.08488655090332031, -0.07985687255859375, -0.07482719421386719, -0.06979751586914062, -0.06476783752441406, -0.0597381591796875, -0.05470848083496094, -0.049678802490234375, -0.04464912414550781, -0.03961944580078125, -0.03458976745605469, -0.029560089111328125, -0.024530410766601562, -0.019500732421875, -0.014471054077148438, -0.009441375732421875, -0.0044116973876953125, 0.00061798095703125, 0.0056476593017578125, 0.010677337646484375, 0.015707015991210938, 0.0207366943359375, 0.025766372680664062, 0.030796051025390625, 0.03582572937011719, 0.04085540771484375, 0.04588508605957031, 0.050914764404296875, 0.05594444274902344, 0.06097412109375, 0.06600379943847656, 0.07103347778320312, 0.07606315612792969, 0.08109283447265625, 0.08612251281738281, 0.09115219116210938, 0.09618186950683594, 0.1012115478515625, 0.10624122619628906, 0.11127090454101562, 0.11630058288574219, 0.12133026123046875, 0.1263599395751953, 0.13138961791992188, 0.13641929626464844, 0.141448974609375, 0.14647865295410156, 0.15150833129882812, 0.1565380096435547, 0.16156768798828125, 0.1665973663330078, 0.17162704467773438, 0.17665672302246094, 0.1816864013671875, 0.18671607971191406, 0.19174575805664062, 0.1967754364013672, 0.20180511474609375, 0.2068347930908203, 0.21186447143554688, 0.21689414978027344, 0.221923828125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 9.0, 10.0, 31.0, 49.0, 107.0, 148.0, 222.0, 180.0, 105.0, 51.0, 32.0, 18.0, 11.0, 10.0, 4.0, 7.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08544921875, -0.08183860778808594, -0.07822799682617188, -0.07461738586425781, -0.07100677490234375, -0.06739616394042969, -0.06378555297851562, -0.06017494201660156, -0.0565643310546875, -0.05295372009277344, -0.049343109130859375, -0.04573249816894531, -0.04212188720703125, -0.03851127624511719, -0.034900665283203125, -0.03129005432128906, -0.027679443359375, -0.024068832397460938, -0.020458221435546875, -0.016847610473632812, -0.01323699951171875, -0.009626388549804688, -0.006015777587890625, -0.0024051666259765625, 0.0012054443359375, 0.0048160552978515625, 0.008426666259765625, 0.012037277221679688, 0.01564788818359375, 0.019258499145507812, 0.022869110107421875, 0.026479721069335938, 0.03009033203125, 0.03370094299316406, 0.037311553955078125, 0.04092216491699219, 0.04453277587890625, 0.04814338684082031, 0.051753997802734375, 0.05536460876464844, 0.0589752197265625, 0.06258583068847656, 0.06619644165039062, 0.06980705261230469, 0.07341766357421875, 0.07702827453613281, 0.08063888549804688, 0.08424949645996094, 0.087860107421875, 0.09147071838378906, 0.09508132934570312, 0.09869194030761719, 0.10230255126953125, 0.10591316223144531, 0.10952377319335938, 0.11313438415527344, 0.1167449951171875, 0.12035560607910156, 0.12396621704101562, 0.1275768280029297, 0.13118743896484375, 0.1347980499267578, 0.13840866088867188, 0.14201927185058594, 0.1456298828125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 10.0, 32.0, 129.0, 630.0, 181.0, 25.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.594270706176758, -8.424546241760254, -8.254822731018066, -8.085098266601562, -7.915374755859375, -7.745650768280029, -7.575926780700684, -7.406202793121338, -7.236478805541992, -7.0667548179626465, -6.897030830383301, -6.727306842803955, -6.557582855224609, -6.387858867645264, -6.218134880065918, -6.048410892486572, -5.878686904907227, -5.708962917327881, -5.539238929748535, -5.3695149421691895, -5.199790954589844, -5.030066967010498, -4.860342979431152, -4.690618991851807, -4.520894527435303, -4.351170539855957, -4.181446552276611, -4.011722564697266, -3.84199857711792, -3.672274589538574, -3.5025506019592285, -3.332826614379883, -3.163102388381958, -2.9933784008026123, -2.8236544132232666, -2.653930425643921, -2.484206438064575, -2.3144824504852295, -2.1447582244873047, -1.9750343561172485, -1.8053103685379028, -1.6355863809585571, -1.4658623933792114, -1.2961382865905762, -1.1264142990112305, -0.9566903710365295, -0.7869663238525391, -0.6172423362731934, -0.44751834869384766, -0.27779436111450195, -0.10807034373283386, 0.06165367364883423, 0.23137766122817993, 0.40110164880752563, 0.5708256959915161, 0.7405496835708618, 0.9102736711502075, 1.0799976587295532, 1.249721646308899, 1.4194457530975342, 1.5891697406768799, 1.7588937282562256, 1.9286177158355713, 2.098341703414917, 2.2680656909942627]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 6.0, 5.0, 6.0, 9.0, 9.0, 10.0, 18.0, 24.0, 18.0, 24.0, 27.0, 29.0, 35.0, 36.0, 34.0, 45.0, 39.0, 44.0, 61.0, 56.0, 37.0, 52.0, 44.0, 44.0, 35.0, 28.0, 33.0, 32.0, 22.0, 31.0, 19.0, 23.0, 9.0, 14.0, 4.0, 8.0, 5.0, 7.0, 4.0, 3.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4786643981933594, -1.433106541633606, -1.3875486850738525, -1.3419908285140991, -1.2964329719543457, -1.2508751153945923, -1.2053172588348389, -1.1597594022750854, -1.114201545715332, -1.0686436891555786, -1.0230858325958252, -0.9775279760360718, -0.9319701194763184, -0.8864122629165649, -0.8408544063568115, -0.7952965497970581, -0.7497387528419495, -0.704180896282196, -0.6586230397224426, -0.6130651831626892, -0.5675073266029358, -0.5219494700431824, -0.47639164328575134, -0.4308337867259979, -0.3852759301662445, -0.3397180736064911, -0.29416021704673767, -0.24860237538814545, -0.20304451882839203, -0.1574866622686386, -0.11192882061004639, -0.06637096405029297, -0.02081310749053955, 0.02474474534392357, 0.07030259817838669, 0.11586044728755951, 0.16141830384731293, 0.20697616040706635, 0.25253400206565857, 0.298091858625412, 0.3436497151851654, 0.3892075717449188, 0.43476542830467224, 0.48032325506210327, 0.5258811116218567, 0.5714389681816101, 0.6169968247413635, 0.6625546813011169, 0.7081125378608704, 0.7536703944206238, 0.7992282509803772, 0.8447861075401306, 0.890343964099884, 0.9359018206596375, 0.9814596176147461, 1.0270174741744995, 1.072575330734253, 1.1181331872940063, 1.1636910438537598, 1.2092489004135132, 1.2548067569732666, 1.30036461353302, 1.3459224700927734, 1.3914803266525269, 1.4370381832122803]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 6.0, 1.0, 9.0, 9.0, 5.0, 6.0, 8.0, 10.0, 13.0, 24.0, 25.0, 36.0, 64.0, 85.0, 122.0, 209.0, 347.0, 615.0, 1304.0, 2743.0, 7491.0, 36287.0, 3054392.0, 1047091.0, 32023.0, 6908.0, 2353.0, 1023.0, 479.0, 274.0, 132.0, 63.0, 52.0, 22.0, 17.0, 19.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.72998046875, -0.7133750915527344, -0.6967697143554688, -0.6801643371582031, -0.6635589599609375, -0.6469535827636719, -0.6303482055664062, -0.6137428283691406, -0.597137451171875, -0.5805320739746094, -0.5639266967773438, -0.5473213195800781, -0.5307159423828125, -0.5141105651855469, -0.49750518798828125, -0.4808998107910156, -0.46429443359375, -0.4476890563964844, -0.43108367919921875, -0.4144783020019531, -0.3978729248046875, -0.3812675476074219, -0.36466217041015625, -0.3480567932128906, -0.331451416015625, -0.3148460388183594, -0.29824066162109375, -0.2816352844238281, -0.2650299072265625, -0.24842453002929688, -0.23181915283203125, -0.21521377563476562, -0.1986083984375, -0.18200302124023438, -0.16539764404296875, -0.14879226684570312, -0.1321868896484375, -0.11558151245117188, -0.09897613525390625, -0.08237075805664062, -0.065765380859375, -0.049160003662109375, -0.03255462646484375, -0.015949249267578125, 0.0006561279296875, 0.017261505126953125, 0.03386688232421875, 0.050472259521484375, 0.06707763671875, 0.08368301391601562, 0.10028839111328125, 0.11689376831054688, 0.1334991455078125, 0.15010452270507812, 0.16670989990234375, 0.18331527709960938, 0.199920654296875, 0.21652603149414062, 0.23313140869140625, 0.24973678588867188, 0.2663421630859375, 0.2829475402832031, 0.29955291748046875, 0.3161582946777344, 0.332763671875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 9.0, 9.0, 21.0, 26.0, 47.0, 45.0, 46.0, 69.0, 95.0, 94.0, 91.0, 79.0, 90.0, 68.0, 58.0, 44.0, 41.0, 19.0, 15.0, 14.0, 11.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.1396484375, -0.13650083541870117, -0.13335323333740234, -0.13020563125610352, -0.1270580291748047, -0.12391042709350586, -0.12076282501220703, -0.1176152229309082, -0.11446762084960938, -0.11132001876831055, -0.10817241668701172, -0.10502481460571289, -0.10187721252441406, -0.09872961044311523, -0.0955820083618164, -0.09243440628051758, -0.08928680419921875, -0.08613920211791992, -0.0829916000366211, -0.07984399795532227, -0.07669639587402344, -0.07354879379272461, -0.07040119171142578, -0.06725358963012695, -0.06410598754882812, -0.0609583854675293, -0.05781078338623047, -0.05466318130493164, -0.05151557922363281, -0.048367977142333984, -0.045220375061035156, -0.04207277297973633, -0.0389251708984375, -0.03577756881713867, -0.032629966735839844, -0.029482364654541016, -0.026334762573242188, -0.02318716049194336, -0.02003955841064453, -0.016891956329345703, -0.013744354248046875, -0.010596752166748047, -0.007449150085449219, -0.004301548004150391, -0.0011539459228515625, 0.0019936561584472656, 0.005141258239746094, 0.008288860321044922, 0.01143646240234375, 0.014584064483642578, 0.017731666564941406, 0.020879268646240234, 0.024026870727539062, 0.02717447280883789, 0.03032207489013672, 0.03346967697143555, 0.036617279052734375, 0.0397648811340332, 0.04291248321533203, 0.04606008529663086, 0.04920768737792969, 0.052355289459228516, 0.055502891540527344, 0.05865049362182617, 0.061798095703125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 1.0, 13.0, 19.0, 28.0, 37.0, 72.0, 125.0, 275.0, 1075.0, 10511.0, 4162900.0, 17565.0, 1213.0, 241.0, 103.0, 47.0, 20.0, 15.0, 9.0, 10.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.052734375, -2.0066909790039062, -1.9606475830078125, -1.9146041870117188, -1.868560791015625, -1.8225173950195312, -1.7764739990234375, -1.7304306030273438, -1.68438720703125, -1.6383438110351562, -1.5923004150390625, -1.5462570190429688, -1.500213623046875, -1.4541702270507812, -1.4081268310546875, -1.3620834350585938, -1.3160400390625, -1.2699966430664062, -1.2239532470703125, -1.1779098510742188, -1.131866455078125, -1.0858230590820312, -1.0397796630859375, -0.9937362670898438, -0.94769287109375, -0.9016494750976562, -0.8556060791015625, -0.8095626831054688, -0.763519287109375, -0.7174758911132812, -0.6714324951171875, -0.6253890991210938, -0.579345703125, -0.5333023071289062, -0.4872589111328125, -0.44121551513671875, -0.395172119140625, -0.34912872314453125, -0.3030853271484375, -0.25704193115234375, -0.21099853515625, -0.16495513916015625, -0.1189117431640625, -0.07286834716796875, -0.026824951171875, 0.01921844482421875, 0.0652618408203125, 0.11130523681640625, 0.1573486328125, 0.20339202880859375, 0.2494354248046875, 0.29547882080078125, 0.341522216796875, 0.38756561279296875, 0.4336090087890625, 0.47965240478515625, 0.52569580078125, 0.5717391967773438, 0.6177825927734375, 0.6638259887695312, 0.709869384765625, 0.7559127807617188, 0.8019561767578125, 0.8479995727539062, 0.89404296875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 9.0, 11.0, 13.0, 40.0, 151.0, 2782.0, 907.0, 84.0, 38.0, 13.0, 8.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.646484375, -0.6329746246337891, -0.6194648742675781, -0.6059551239013672, -0.5924453735351562, -0.5789356231689453, -0.5654258728027344, -0.5519161224365234, -0.5384063720703125, -0.5248966217041016, -0.5113868713378906, -0.4978771209716797, -0.48436737060546875, -0.4708576202392578, -0.4573478698730469, -0.44383811950683594, -0.430328369140625, -0.41681861877441406, -0.4033088684082031, -0.3897991180419922, -0.37628936767578125, -0.3627796173095703, -0.3492698669433594, -0.33576011657714844, -0.3222503662109375, -0.30874061584472656, -0.2952308654785156, -0.2817211151123047, -0.26821136474609375, -0.2547016143798828, -0.24119186401367188, -0.22768211364746094, -0.21417236328125, -0.20066261291503906, -0.18715286254882812, -0.1736431121826172, -0.16013336181640625, -0.1466236114501953, -0.13311386108398438, -0.11960411071777344, -0.1060943603515625, -0.09258460998535156, -0.07907485961914062, -0.06556510925292969, -0.05205535888671875, -0.03854560852050781, -0.025035858154296875, -0.011526107788085938, 0.001983642578125, 0.015493392944335938, 0.029003143310546875, 0.04251289367675781, 0.05602264404296875, 0.06953239440917969, 0.08304214477539062, 0.09655189514160156, 0.1100616455078125, 0.12357139587402344, 0.13708114624023438, 0.1505908966064453, 0.16410064697265625, 0.1776103973388672, 0.19112014770507812, 0.20462989807128906, 0.2181396484375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 12.0, 35.0, 179.0, 538.0, 179.0, 31.0, 9.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-3.164594888687134, -3.105350971221924, -3.046107292175293, -2.986863613128662, -2.927619695663452, -2.868375778198242, -2.8091320991516113, -2.7498884201049805, -2.6906445026397705, -2.6314005851745605, -2.5721569061279297, -2.512913227081299, -2.453669309616089, -2.394425392150879, -2.335181713104248, -2.275938034057617, -2.2166941165924072, -2.1574501991271973, -2.0982065200805664, -2.0389628410339355, -1.9797189235687256, -1.9204751253128052, -1.8612313270568848, -1.8019875288009644, -1.742743730545044, -1.6834999322891235, -1.6242561340332031, -1.5650123357772827, -1.5057685375213623, -1.446524739265442, -1.3872809410095215, -1.328037142753601, -1.2687932252883911, -1.2095494270324707, -1.1503056287765503, -1.0910618305206299, -1.0318180322647095, -0.9725742340087891, -0.9133304357528687, -0.8540866374969482, -0.7948428392410278, -0.7355990409851074, -0.676355242729187, -0.6171114444732666, -0.5578676462173462, -0.4986238479614258, -0.43938004970550537, -0.38013625144958496, -0.32089245319366455, -0.26164865493774414, -0.20240485668182373, -0.14316105842590332, -0.08391726016998291, -0.0246734619140625, 0.03457033634185791, 0.09381413459777832, 0.15305793285369873, 0.21230173110961914, 0.27154552936553955, 0.33078932762145996, 0.39003312587738037, 0.4492769241333008, 0.5085207223892212, 0.5677645206451416, 0.627008318901062]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 10.0, 16.0, 31.0, 43.0, 70.0, 103.0, 131.0, 129.0, 111.0, 112.0, 85.0, 56.0, 54.0, 19.0, 18.0, 6.0, 8.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5089569091796875, -1.4624419212341309, -1.4159269332885742, -1.3694119453430176, -1.322896957397461, -1.2763819694519043, -1.2298669815063477, -1.183351993560791, -1.1368370056152344, -1.0903220176696777, -1.043807029724121, -0.9972920417785645, -0.9507770538330078, -0.9042620658874512, -0.8577470183372498, -0.8112320303916931, -0.7647169828414917, -0.7182019948959351, -0.6716870069503784, -0.6251720190048218, -0.5786570310592651, -0.5321420431137085, -0.4856269955635071, -0.43911200761795044, -0.3925970196723938, -0.34608203172683716, -0.2995670437812805, -0.2530520260334015, -0.20653703808784485, -0.1600220501422882, -0.11350703239440918, -0.06699204444885254, -0.020476937294006348, 0.02603805810213089, 0.07255305349826813, 0.11906805634498596, 0.1655830442905426, 0.21209803223609924, 0.25861304998397827, 0.3051280379295349, 0.35164302587509155, 0.3981580138206482, 0.44467300176620483, 0.49118801951408386, 0.5377030372619629, 0.5842180252075195, 0.6307330131530762, 0.6772480010986328, 0.7237629890441895, 0.7702779769897461, 0.8167929649353027, 0.8633079528808594, 0.909822940826416, 0.9563379287719727, 1.0028529167175293, 1.049367904663086, 1.0958828926086426, 1.1423978805541992, 1.1889128684997559, 1.2354278564453125, 1.2819428443908691, 1.3284578323364258, 1.3749728202819824, 1.421487808227539, 1.4680029153823853]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 10.0, 10.0, 15.0, 22.0, 24.0, 51.0, 66.0, 106.0, 172.0, 314.0, 604.0, 1590.0, 5636.0, 43905.0, 757039.0, 217950.0, 16196.0, 2872.0, 953.0, 408.0, 223.0, 110.0, 82.0, 65.0, 24.0, 33.0, 18.0, 10.0, 13.0, 8.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51904296875, -0.5045356750488281, -0.49002838134765625, -0.4755210876464844, -0.4610137939453125, -0.4465065002441406, -0.43199920654296875, -0.4174919128417969, -0.402984619140625, -0.3884773254394531, -0.37397003173828125, -0.3594627380371094, -0.3449554443359375, -0.3304481506347656, -0.31594085693359375, -0.3014335632324219, -0.28692626953125, -0.2724189758300781, -0.25791168212890625, -0.24340438842773438, -0.2288970947265625, -0.21438980102539062, -0.19988250732421875, -0.18537521362304688, -0.170867919921875, -0.15636062622070312, -0.14185333251953125, -0.12734603881835938, -0.1128387451171875, -0.09833145141601562, -0.08382415771484375, -0.06931686401367188, -0.0548095703125, -0.040302276611328125, -0.02579498291015625, -0.011287689208984375, 0.0032196044921875, 0.017726898193359375, 0.03223419189453125, 0.046741485595703125, 0.061248779296875, 0.07575607299804688, 0.09026336669921875, 0.10477066040039062, 0.1192779541015625, 0.13378524780273438, 0.14829254150390625, 0.16279983520507812, 0.17730712890625, 0.19181442260742188, 0.20632171630859375, 0.22082901000976562, 0.2353363037109375, 0.24984359741210938, 0.26435089111328125, 0.2788581848144531, 0.293365478515625, 0.3078727722167969, 0.32238006591796875, 0.3368873596191406, 0.3513946533203125, 0.3659019470214844, 0.38040924072265625, 0.3949165344238281, 0.409423828125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 10.0, 8.0, 22.0, 43.0, 65.0, 100.0, 107.0, 129.0, 137.0, 122.0, 106.0, 65.0, 45.0, 25.0, 11.0, 5.0, 6.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2049560546875, -0.20030498504638672, -0.19565391540527344, -0.19100284576416016, -0.18635177612304688, -0.1817007064819336, -0.1770496368408203, -0.17239856719970703, -0.16774749755859375, -0.16309642791748047, -0.1584453582763672, -0.1537942886352539, -0.14914321899414062, -0.14449214935302734, -0.13984107971191406, -0.13519001007080078, -0.1305389404296875, -0.12588787078857422, -0.12123680114746094, -0.11658573150634766, -0.11193466186523438, -0.1072835922241211, -0.10263252258300781, -0.09798145294189453, -0.09333038330078125, -0.08867931365966797, -0.08402824401855469, -0.0793771743774414, -0.07472610473632812, -0.07007503509521484, -0.06542396545410156, -0.06077289581298828, -0.056121826171875, -0.05147075653076172, -0.04681968688964844, -0.042168617248535156, -0.037517547607421875, -0.032866477966308594, -0.028215408325195312, -0.02356433868408203, -0.01891326904296875, -0.014262199401855469, -0.009611129760742188, -0.004960060119628906, -0.000308990478515625, 0.004342079162597656, 0.008993148803710938, 0.013644218444824219, 0.0182952880859375, 0.02294635772705078, 0.027597427368164062, 0.032248497009277344, 0.036899566650390625, 0.041550636291503906, 0.04620170593261719, 0.05085277557373047, 0.05550384521484375, 0.06015491485595703, 0.06480598449707031, 0.0694570541381836, 0.07410812377929688, 0.07875919342041016, 0.08341026306152344, 0.08806133270263672, 0.09271240234375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 10.0, 20.0, 20.0, 37.0, 40.0, 66.0, 96.0, 149.0, 283.0, 481.0, 1049.0, 2470.0, 6880.0, 23034.0, 93815.0, 537750.0, 304715.0, 54966.0, 14380.0, 4669.0, 1773.0, 781.0, 397.0, 254.0, 132.0, 91.0, 46.0, 31.0, 27.0, 24.0, 7.0, 14.0, 11.0, 8.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1915283203125, -0.18551063537597656, -0.17949295043945312, -0.1734752655029297, -0.16745758056640625, -0.1614398956298828, -0.15542221069335938, -0.14940452575683594, -0.1433868408203125, -0.13736915588378906, -0.13135147094726562, -0.1253337860107422, -0.11931610107421875, -0.11329841613769531, -0.10728073120117188, -0.10126304626464844, -0.095245361328125, -0.08922767639160156, -0.08320999145507812, -0.07719230651855469, -0.07117462158203125, -0.06515693664550781, -0.059139251708984375, -0.05312156677246094, -0.0471038818359375, -0.04108619689941406, -0.035068511962890625, -0.029050827026367188, -0.02303314208984375, -0.017015457153320312, -0.010997772216796875, -0.0049800872802734375, 0.00103759765625, 0.0070552825927734375, 0.013072967529296875, 0.019090652465820312, 0.02510833740234375, 0.031126022338867188, 0.037143707275390625, 0.04316139221191406, 0.0491790771484375, 0.05519676208496094, 0.061214447021484375, 0.06723213195800781, 0.07324981689453125, 0.07926750183105469, 0.08528518676757812, 0.09130287170410156, 0.097320556640625, 0.10333824157714844, 0.10935592651367188, 0.11537361145019531, 0.12139129638671875, 0.1274089813232422, 0.13342666625976562, 0.13944435119628906, 0.1454620361328125, 0.15147972106933594, 0.15749740600585938, 0.1635150909423828, 0.16953277587890625, 0.1755504608154297, 0.18156814575195312, 0.18758583068847656, 0.193603515625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 9.0, 10.0, 17.0, 19.0, 23.0, 17.0, 22.0, 34.0, 41.0, 31.0, 46.0, 51.0, 41.0, 53.0, 55.0, 42.0, 46.0, 52.0, 46.0, 43.0, 43.0, 29.0, 47.0, 32.0, 27.0, 34.0, 21.0, 14.0, 17.0, 11.0, 8.0, 2.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.210693359375, -0.20326614379882812, -0.19583892822265625, -0.18841171264648438, -0.1809844970703125, -0.17355728149414062, -0.16613006591796875, -0.15870285034179688, -0.151275634765625, -0.14384841918945312, -0.13642120361328125, -0.12899398803710938, -0.1215667724609375, -0.11413955688476562, -0.10671234130859375, -0.09928512573242188, -0.09185791015625, -0.08443069458007812, -0.07700347900390625, -0.06957626342773438, -0.0621490478515625, -0.054721832275390625, -0.04729461669921875, -0.039867401123046875, -0.032440185546875, -0.025012969970703125, -0.01758575439453125, -0.010158538818359375, -0.0027313232421875, 0.004695892333984375, 0.01212310791015625, 0.019550323486328125, 0.0269775390625, 0.034404754638671875, 0.04183197021484375, 0.049259185791015625, 0.0566864013671875, 0.06411361694335938, 0.07154083251953125, 0.07896804809570312, 0.086395263671875, 0.09382247924804688, 0.10124969482421875, 0.10867691040039062, 0.1161041259765625, 0.12353134155273438, 0.13095855712890625, 0.13838577270507812, 0.14581298828125, 0.15324020385742188, 0.16066741943359375, 0.16809463500976562, 0.1755218505859375, 0.18294906616210938, 0.19037628173828125, 0.19780349731445312, 0.205230712890625, 0.21265792846679688, 0.22008514404296875, 0.22751235961914062, 0.2349395751953125, 0.24236679077148438, 0.24979400634765625, 0.2572212219238281, 0.2646484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 8.0, 7.0, 11.0, 21.0, 16.0, 17.0, 21.0, 26.0, 34.0, 51.0, 68.0, 94.0, 173.0, 310.0, 706.0, 1747.0, 5656.0, 37510.0, 752021.0, 231332.0, 13307.0, 3211.0, 1062.0, 472.0, 222.0, 119.0, 82.0, 52.0, 29.0, 26.0, 41.0, 16.0, 18.0, 14.0, 7.0, 6.0, 9.0, 9.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08026123046875, -0.07726287841796875, -0.0742645263671875, -0.07126617431640625, -0.068267822265625, -0.06526947021484375, -0.0622711181640625, -0.05927276611328125, -0.0562744140625, -0.05327606201171875, -0.0502777099609375, -0.04727935791015625, -0.044281005859375, -0.04128265380859375, -0.0382843017578125, -0.03528594970703125, -0.03228759765625, -0.02928924560546875, -0.0262908935546875, -0.02329254150390625, -0.020294189453125, -0.01729583740234375, -0.0142974853515625, -0.01129913330078125, -0.00830078125, -0.00530242919921875, -0.0023040771484375, 0.00069427490234375, 0.003692626953125, 0.00669097900390625, 0.0096893310546875, 0.01268768310546875, 0.01568603515625, 0.01868438720703125, 0.0216827392578125, 0.02468109130859375, 0.027679443359375, 0.03067779541015625, 0.0336761474609375, 0.03667449951171875, 0.0396728515625, 0.04267120361328125, 0.0456695556640625, 0.04866790771484375, 0.051666259765625, 0.05466461181640625, 0.0576629638671875, 0.06066131591796875, 0.06365966796875, 0.06665802001953125, 0.0696563720703125, 0.07265472412109375, 0.075653076171875, 0.07865142822265625, 0.0816497802734375, 0.08464813232421875, 0.087646484375, 0.09064483642578125, 0.0936431884765625, 0.09664154052734375, 0.099639892578125, 0.10263824462890625, 0.1056365966796875, 0.10863494873046875, 0.11163330078125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 14.0, 13.0, 24.0, 34.0, 66.0, 141.0, 245.0, 207.0, 129.0, 59.0, 33.0, 17.0, 17.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00043272972106933594, -0.0004240460693836212, -0.0004153624176979065, -0.00040667876601219177, -0.00039799511432647705, -0.00038931146264076233, -0.0003806278109550476, -0.0003719441592693329, -0.00036326050758361816, -0.00035457685589790344, -0.0003458932042121887, -0.000337209552526474, -0.0003285259008407593, -0.00031984224915504456, -0.00031115859746932983, -0.0003024749457836151, -0.0002937912940979004, -0.00028510764241218567, -0.00027642399072647095, -0.0002677403390407562, -0.0002590566873550415, -0.0002503730356693268, -0.00024168938398361206, -0.00023300573229789734, -0.00022432208061218262, -0.0002156384289264679, -0.00020695477724075317, -0.00019827112555503845, -0.00018958747386932373, -0.000180903822183609, -0.0001722201704978943, -0.00016353651881217957, -0.00015485286712646484, -0.00014616921544075012, -0.0001374855637550354, -0.00012880191206932068, -0.00012011826038360596, -0.00011143460869789124, -0.00010275095701217651, -9.406730532646179e-05, -8.538365364074707e-05, -7.670000195503235e-05, -6.801635026931763e-05, -5.9332698583602905e-05, -5.0649046897888184e-05, -4.196539521217346e-05, -3.328174352645874e-05, -2.459809184074402e-05, -1.5914440155029297e-05, -7.230788469314575e-06, 1.4528632164001465e-06, 1.0136514902114868e-05, 1.882016658782959e-05, 2.750381827354431e-05, 3.618746995925903e-05, 4.4871121644973755e-05, 5.3554773330688477e-05, 6.22384250164032e-05, 7.092207670211792e-05, 7.960572838783264e-05, 8.828938007354736e-05, 9.697303175926208e-05, 0.0001056566834449768, 0.00011434033513069153, 0.00012302398681640625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 14.0, 19.0, 35.0, 86.0, 187.0, 958.0, 88151.0, 954967.0, 3542.0, 319.0, 123.0, 71.0, 41.0, 25.0, 7.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.354736328125, -0.346710205078125, -0.33868408203125, -0.330657958984375, -0.3226318359375, -0.314605712890625, -0.30657958984375, -0.298553466796875, -0.29052734375, -0.282501220703125, -0.27447509765625, -0.266448974609375, -0.2584228515625, -0.250396728515625, -0.24237060546875, -0.234344482421875, -0.226318359375, -0.218292236328125, -0.21026611328125, -0.202239990234375, -0.1942138671875, -0.186187744140625, -0.17816162109375, -0.170135498046875, -0.162109375, -0.154083251953125, -0.14605712890625, -0.138031005859375, -0.1300048828125, -0.121978759765625, -0.11395263671875, -0.105926513671875, -0.097900390625, -0.089874267578125, -0.08184814453125, -0.073822021484375, -0.0657958984375, -0.057769775390625, -0.04974365234375, -0.041717529296875, -0.03369140625, -0.025665283203125, -0.01763916015625, -0.009613037109375, -0.0015869140625, 0.006439208984375, 0.01446533203125, 0.022491455078125, 0.030517578125, 0.038543701171875, 0.04656982421875, 0.054595947265625, 0.0626220703125, 0.070648193359375, 0.07867431640625, 0.086700439453125, 0.0947265625, 0.102752685546875, 0.11077880859375, 0.118804931640625, 0.1268310546875, 0.134857177734375, 0.14288330078125, 0.150909423828125, 0.158935546875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 9.0, 13.0, 21.0, 20.0, 75.0, 175.0, 263.0, 222.0, 114.0, 49.0, 20.0, 15.0, 5.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.290771484375, -0.2851533889770508, -0.27953529357910156, -0.27391719818115234, -0.2682991027832031, -0.2626810073852539, -0.2570629119873047, -0.25144481658935547, -0.24582672119140625, -0.24020862579345703, -0.2345905303955078, -0.2289724349975586, -0.22335433959960938, -0.21773624420166016, -0.21211814880371094, -0.20650005340576172, -0.2008819580078125, -0.19526386260986328, -0.18964576721191406, -0.18402767181396484, -0.17840957641601562, -0.1727914810180664, -0.1671733856201172, -0.16155529022216797, -0.15593719482421875, -0.15031909942626953, -0.1447010040283203, -0.1390829086303711, -0.13346481323242188, -0.12784671783447266, -0.12222862243652344, -0.11661052703857422, -0.110992431640625, -0.10537433624267578, -0.09975624084472656, -0.09413814544677734, -0.08852005004882812, -0.0829019546508789, -0.07728385925292969, -0.07166576385498047, -0.06604766845703125, -0.06042957305908203, -0.05481147766113281, -0.049193382263183594, -0.043575286865234375, -0.037957191467285156, -0.03233909606933594, -0.02672100067138672, -0.0211029052734375, -0.015484809875488281, -0.009866714477539062, -0.004248619079589844, 0.001369476318359375, 0.006987571716308594, 0.012605667114257812, 0.01822376251220703, 0.02384185791015625, 0.02945995330810547, 0.03507804870605469, 0.040696144104003906, 0.046314239501953125, 0.051932334899902344, 0.05755043029785156, 0.06316852569580078, 0.06878662109375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 16.0, 51.0, 289.0, 497.0, 109.0, 36.0, 9.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4458900690078735, -1.3271595239639282, -1.2084288597106934, -1.089698314666748, -0.9709676504135132, -0.8522371053695679, -0.7335065007209778, -0.6147758960723877, -0.4960452914237976, -0.3773146867752075, -0.25858408212661743, -0.13985350728034973, -0.021122902631759644, 0.09760767221450806, 0.21633827686309814, 0.33506888151168823, 0.4537994861602783, 0.5725300908088684, 0.6912606954574585, 0.8099912405014038, 0.9287219047546387, 1.047452449798584, 1.1661829948425293, 1.2849136590957642, 1.403644323348999, 1.5223748683929443, 1.6411055326461792, 1.7598360776901245, 1.8785667419433594, 1.9972972869873047, 2.11602783203125, 2.2347583770751953, 2.3534891605377197, 2.472219705581665, 2.5909502506256104, 2.7096810340881348, 2.82841157913208, 2.9471421241760254, 3.0658726692199707, 3.184603214263916, 3.3033339977264404, 3.4220645427703857, 3.540795087814331, 3.6595258712768555, 3.778256416320801, 3.896986961364746, 4.015717506408691, 4.134448051452637, 4.253178596496582, 4.371909141540527, 4.490639686584473, 4.609370231628418, 4.728100776672363, 4.846831321716309, 4.965562343597412, 5.084292888641357, 5.203023433685303, 5.321753978729248, 5.440484523773193, 5.559215068817139, 5.677945613861084, 5.7966766357421875, 5.915407180786133, 6.034137725830078, 6.152868270874023]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 5.0, 4.0, 14.0, 9.0, 20.0, 21.0, 29.0, 30.0, 29.0, 22.0, 23.0, 37.0, 40.0, 37.0, 35.0, 34.0, 51.0, 57.0, 39.0, 52.0, 58.0, 38.0, 41.0, 49.0, 35.0, 37.0, 27.0, 28.0, 21.0, 10.0, 12.0, 9.0, 8.0, 7.0, 6.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.4333292245864868, -1.3927112817764282, -1.3520934581756592, -1.3114755153656006, -1.270857572555542, -1.2302396297454834, -1.1896216869354248, -1.1490038633346558, -1.1083859205245972, -1.0677679777145386, -1.0271501541137695, -0.9865322113037109, -0.9459142684936523, -0.9052963256835938, -0.8646784424781799, -0.8240605592727661, -0.7834426164627075, -0.7428246736526489, -0.7022067904472351, -0.6615889072418213, -0.6209709644317627, -0.5803530216217041, -0.5397351384162903, -0.4991172254085541, -0.45849931240081787, -0.41788139939308167, -0.37726348638534546, -0.33664557337760925, -0.29602766036987305, -0.25540974736213684, -0.21479183435440063, -0.17417392134666443, -0.13355612754821777, -0.09293821454048157, -0.05232030153274536, -0.011702388525009155, 0.02891552448272705, 0.06953343749046326, 0.11015135049819946, 0.15076926350593567, 0.19138717651367188, 0.23200508952140808, 0.2726230025291443, 0.3132409155368805, 0.3538588285446167, 0.3944767415523529, 0.4350946545600891, 0.4757125675678253, 0.5163304805755615, 0.5569484233856201, 0.5975663065910339, 0.6381841897964478, 0.6788021326065063, 0.7194200754165649, 0.7600379586219788, 0.8006558418273926, 0.8412737846374512, 0.8818917274475098, 0.9225096106529236, 0.9631274938583374, 1.003745436668396, 1.0443633794784546, 1.0849812030792236, 1.1255991458892822, 1.1662170886993408]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 2.0, 7.0, 0.0, 1.0, 8.0, 2.0, 4.0, 3.0, 9.0, 7.0, 14.0, 9.0, 15.0, 17.0, 21.0, 32.0, 40.0, 55.0, 72.0, 86.0, 142.0, 178.0, 336.0, 493.0, 1107.0, 2482.0, 7372.0, 31182.0, 627146.0, 3462332.0, 46805.0, 9338.0, 2823.0, 1070.0, 482.0, 275.0, 131.0, 79.0, 33.0, 35.0, 13.0, 13.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.35498046875, -0.3471088409423828, -0.3392372131347656, -0.33136558532714844, -0.32349395751953125, -0.31562232971191406, -0.3077507019042969, -0.2998790740966797, -0.2920074462890625, -0.2841358184814453, -0.2762641906738281, -0.26839256286621094, -0.26052093505859375, -0.25264930725097656, -0.24477767944335938, -0.2369060516357422, -0.229034423828125, -0.2211627960205078, -0.21329116821289062, -0.20541954040527344, -0.19754791259765625, -0.18967628479003906, -0.18180465698242188, -0.1739330291748047, -0.1660614013671875, -0.1581897735595703, -0.15031814575195312, -0.14244651794433594, -0.13457489013671875, -0.12670326232910156, -0.11883163452148438, -0.11096000671386719, -0.10308837890625, -0.09521675109863281, -0.08734512329101562, -0.07947349548339844, -0.07160186767578125, -0.06373023986816406, -0.055858612060546875, -0.04798698425292969, -0.0401153564453125, -0.03224372863769531, -0.024372100830078125, -0.016500473022460938, -0.00862884521484375, -0.0007572174072265625, 0.007114410400390625, 0.014986038208007812, 0.022857666015625, 0.030729293823242188, 0.038600921630859375, 0.04647254943847656, 0.05434417724609375, 0.06221580505371094, 0.07008743286132812, 0.07795906066894531, 0.0858306884765625, 0.09370231628417969, 0.10157394409179688, 0.10944557189941406, 0.11731719970703125, 0.12518882751464844, 0.13306045532226562, 0.1409320831298828, 0.1488037109375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 6.0, 8.0, 12.0, 29.0, 47.0, 78.0, 80.0, 100.0, 123.0, 121.0, 120.0, 110.0, 65.0, 53.0, 26.0, 10.0, 6.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2015380859375, -0.1969614028930664, -0.1923847198486328, -0.18780803680419922, -0.18323135375976562, -0.17865467071533203, -0.17407798767089844, -0.16950130462646484, -0.16492462158203125, -0.16034793853759766, -0.15577125549316406, -0.15119457244873047, -0.14661788940429688, -0.14204120635986328, -0.1374645233154297, -0.1328878402709961, -0.1283111572265625, -0.1237344741821289, -0.11915779113769531, -0.11458110809326172, -0.11000442504882812, -0.10542774200439453, -0.10085105895996094, -0.09627437591552734, -0.09169769287109375, -0.08712100982666016, -0.08254432678222656, -0.07796764373779297, -0.07339096069335938, -0.06881427764892578, -0.06423759460449219, -0.059660911560058594, -0.055084228515625, -0.050507545471191406, -0.04593086242675781, -0.04135417938232422, -0.036777496337890625, -0.03220081329345703, -0.027624130249023438, -0.023047447204589844, -0.01847076416015625, -0.013894081115722656, -0.009317398071289062, -0.004740715026855469, -0.000164031982421875, 0.004412651062011719, 0.008989334106445312, 0.013566017150878906, 0.0181427001953125, 0.022719383239746094, 0.027296066284179688, 0.03187274932861328, 0.036449432373046875, 0.04102611541748047, 0.04560279846191406, 0.050179481506347656, 0.05475616455078125, 0.059332847595214844, 0.06390953063964844, 0.06848621368408203, 0.07306289672851562, 0.07763957977294922, 0.08221626281738281, 0.0867929458618164, 0.09136962890625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 5.0, 2.0, 2.0, 4.0, 12.0, 8.0, 23.0, 24.0, 31.0, 71.0, 156.0, 339.0, 877.0, 2361.0, 7894.0, 52221.0, 3983862.0, 129421.0, 11767.0, 3139.0, 1112.0, 506.0, 206.0, 118.0, 43.0, 28.0, 16.0, 11.0, 4.0, 8.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2364501953125, -0.2284717559814453, -0.22049331665039062, -0.21251487731933594, -0.20453643798828125, -0.19655799865722656, -0.18857955932617188, -0.1806011199951172, -0.1726226806640625, -0.1646442413330078, -0.15666580200195312, -0.14868736267089844, -0.14070892333984375, -0.13273048400878906, -0.12475204467773438, -0.11677360534667969, -0.108795166015625, -0.10081672668457031, -0.09283828735351562, -0.08485984802246094, -0.07688140869140625, -0.06890296936035156, -0.060924530029296875, -0.05294609069824219, -0.0449676513671875, -0.03698921203613281, -0.029010772705078125, -0.021032333374023438, -0.01305389404296875, -0.0050754547119140625, 0.002902984619140625, 0.010881423950195312, 0.01885986328125, 0.026838302612304688, 0.034816741943359375, 0.04279518127441406, 0.05077362060546875, 0.05875205993652344, 0.06673049926757812, 0.07470893859863281, 0.0826873779296875, 0.09066581726074219, 0.09864425659179688, 0.10662269592285156, 0.11460113525390625, 0.12257957458496094, 0.13055801391601562, 0.1385364532470703, 0.146514892578125, 0.1544933319091797, 0.16247177124023438, 0.17045021057128906, 0.17842864990234375, 0.18640708923339844, 0.19438552856445312, 0.2023639678955078, 0.2103424072265625, 0.2183208465576172, 0.22629928588867188, 0.23427772521972656, 0.24225616455078125, 0.25023460388183594, 0.2582130432128906, 0.2661914825439453, 0.274169921875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 6.0, 7.0, 12.0, 13.0, 15.0, 25.0, 42.0, 81.0, 137.0, 648.0, 2427.0, 360.0, 134.0, 64.0, 25.0, 26.0, 11.0, 10.0, 4.0, 7.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0902099609375, -0.0873250961303711, -0.08444023132324219, -0.08155536651611328, -0.07867050170898438, -0.07578563690185547, -0.07290077209472656, -0.07001590728759766, -0.06713104248046875, -0.06424617767333984, -0.06136131286621094, -0.05847644805908203, -0.055591583251953125, -0.05270671844482422, -0.04982185363769531, -0.046936988830566406, -0.0440521240234375, -0.041167259216308594, -0.03828239440917969, -0.03539752960205078, -0.032512664794921875, -0.02962779998779297, -0.026742935180664062, -0.023858070373535156, -0.02097320556640625, -0.018088340759277344, -0.015203475952148438, -0.012318611145019531, -0.009433746337890625, -0.006548881530761719, -0.0036640167236328125, -0.0007791519165039062, 0.002105712890625, 0.004990577697753906, 0.007875442504882812, 0.010760307312011719, 0.013645172119140625, 0.01653003692626953, 0.019414901733398438, 0.022299766540527344, 0.02518463134765625, 0.028069496154785156, 0.030954360961914062, 0.03383922576904297, 0.036724090576171875, 0.03960895538330078, 0.04249382019042969, 0.045378684997558594, 0.0482635498046875, 0.051148414611816406, 0.05403327941894531, 0.05691814422607422, 0.059803009033203125, 0.06268787384033203, 0.06557273864746094, 0.06845760345458984, 0.07134246826171875, 0.07422733306884766, 0.07711219787597656, 0.07999706268310547, 0.08288192749023438, 0.08576679229736328, 0.08865165710449219, 0.0915365219116211, 0.09442138671875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 55.0, 261.0, 459.0, 167.0, 33.0, 12.0, 8.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32473528385162354, -0.29798340797424316, -0.2712315618991852, -0.244479700922966, -0.21772783994674683, -0.19097597897052765, -0.16422411799430847, -0.1374722570180893, -0.11072039604187012, -0.08396853506565094, -0.05721667408943176, -0.030464813113212585, -0.003712952136993408, 0.02303890883922577, 0.049790769815444946, 0.07654263079166412, 0.1032944917678833, 0.13004635274410248, 0.15679821372032166, 0.18355007469654083, 0.21030193567276, 0.2370537966489792, 0.26380565762519836, 0.29055750370025635, 0.3173093795776367, 0.3440612554550171, 0.3708131015300751, 0.39756494760513306, 0.4243168234825134, 0.4510686993598938, 0.4778205454349518, 0.5045723915100098, 0.5313242673873901, 0.5580761432647705, 0.5848280191421509, 0.6115798354148865, 0.6383317112922668, 0.6650835871696472, 0.6918354034423828, 0.7185872793197632, 0.7453391551971436, 0.7720910310745239, 0.7988429069519043, 0.8255947232246399, 0.8523465991020203, 0.8790984749794006, 0.9058502912521362, 0.9326021671295166, 0.959354043006897, 0.9861059188842773, 1.0128577947616577, 1.039609670639038, 1.066361427307129, 1.0931133031845093, 1.1198651790618896, 1.14661705493927, 1.1733689308166504, 1.2001208066940308, 1.2268726825714111, 1.2536245584487915, 1.2803764343261719, 1.3071281909942627, 1.333880066871643, 1.3606319427490234, 1.3873838186264038]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 1.0, 3.0, 9.0, 4.0, 6.0, 9.0, 13.0, 9.0, 20.0, 23.0, 29.0, 29.0, 20.0, 44.0, 35.0, 44.0, 46.0, 47.0, 56.0, 48.0, 44.0, 42.0, 41.0, 54.0, 29.0, 46.0, 40.0, 30.0, 25.0, 22.0, 21.0, 13.0, 23.0, 15.0, 7.0, 8.0, 9.0, 8.0, 6.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.21170544624328613, -0.20439811050891876, -0.1970907747745514, -0.18978342413902283, -0.18247608840465546, -0.17516875267028809, -0.16786141693592072, -0.16055408120155334, -0.15324673056602478, -0.1459393948316574, -0.13863205909729004, -0.13132470846176147, -0.1240173727273941, -0.11671003699302673, -0.10940270125865936, -0.10209536552429199, -0.09478802978992462, -0.08748069405555725, -0.08017335087060928, -0.07286601513624191, -0.06555867195129395, -0.058251336216926575, -0.050944000482559204, -0.043636661022901535, -0.036329321563243866, -0.029021982103586197, -0.021714644506573677, -0.014407306909561157, -0.007099967449903488, 0.0002073720097541809, 0.0075147077441215515, 0.01482204720377922, 0.02212938666343689, 0.02943672612309456, 0.03674406558275223, 0.0440514013171196, 0.05135874077677727, 0.058666080236434937, 0.06597341597080231, 0.07328075170516968, 0.08058809489011765, 0.08789543062448502, 0.09520277380943298, 0.10251010954380035, 0.10981744527816772, 0.11712478846311569, 0.12443212419748306, 0.13173946738243103, 0.1390468031167984, 0.14635413885116577, 0.15366147458553314, 0.1609688103199005, 0.16827616095542908, 0.17558349668979645, 0.18289083242416382, 0.1901981681585312, 0.19750550389289856, 0.20481283962726593, 0.2121201753616333, 0.21942752599716187, 0.22673486173152924, 0.2340421974658966, 0.24134953320026398, 0.24865686893463135, 0.2559642195701599]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 5.0, 12.0, 27.0, 13.0, 15.0, 25.0, 34.0, 76.0, 74.0, 121.0, 216.0, 342.0, 711.0, 1839.0, 6566.0, 34943.0, 345368.0, 588396.0, 55990.0, 9270.0, 2515.0, 913.0, 426.0, 217.0, 145.0, 84.0, 56.0, 34.0, 33.0, 28.0, 9.0, 9.0, 9.0, 6.0, 11.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24072265625, -0.23150634765625, -0.2222900390625, -0.21307373046875, -0.203857421875, -0.19464111328125, -0.1854248046875, -0.17620849609375, -0.1669921875, -0.15777587890625, -0.1485595703125, -0.13934326171875, -0.130126953125, -0.12091064453125, -0.1116943359375, -0.10247802734375, -0.09326171875, -0.08404541015625, -0.0748291015625, -0.06561279296875, -0.056396484375, -0.04718017578125, -0.0379638671875, -0.02874755859375, -0.01953125, -0.01031494140625, -0.0010986328125, 0.00811767578125, 0.017333984375, 0.02655029296875, 0.0357666015625, 0.04498291015625, 0.05419921875, 0.06341552734375, 0.0726318359375, 0.08184814453125, 0.091064453125, 0.10028076171875, 0.1094970703125, 0.11871337890625, 0.1279296875, 0.13714599609375, 0.1463623046875, 0.15557861328125, 0.164794921875, 0.17401123046875, 0.1832275390625, 0.19244384765625, 0.20166015625, 0.21087646484375, 0.2200927734375, 0.22930908203125, 0.238525390625, 0.24774169921875, 0.2569580078125, 0.26617431640625, 0.275390625, 0.28460693359375, 0.2938232421875, 0.30303955078125, 0.312255859375, 0.32147216796875, 0.3306884765625, 0.33990478515625, 0.34912109375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 17.0, 37.0, 37.0, 67.0, 81.0, 98.0, 115.0, 139.0, 111.0, 105.0, 73.0, 51.0, 35.0, 12.0, 7.0, 7.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.191162109375, -0.18673419952392578, -0.18230628967285156, -0.17787837982177734, -0.17345046997070312, -0.1690225601196289, -0.1645946502685547, -0.16016674041748047, -0.15573883056640625, -0.15131092071533203, -0.1468830108642578, -0.1424551010131836, -0.13802719116210938, -0.13359928131103516, -0.12917137145996094, -0.12474346160888672, -0.1203155517578125, -0.11588764190673828, -0.11145973205566406, -0.10703182220458984, -0.10260391235351562, -0.0981760025024414, -0.09374809265136719, -0.08932018280029297, -0.08489227294921875, -0.08046436309814453, -0.07603645324707031, -0.0716085433959961, -0.06718063354492188, -0.06275272369384766, -0.05832481384277344, -0.05389690399169922, -0.049468994140625, -0.04504108428955078, -0.04061317443847656, -0.036185264587402344, -0.031757354736328125, -0.027329444885253906, -0.022901535034179688, -0.01847362518310547, -0.01404571533203125, -0.009617805480957031, -0.0051898956298828125, -0.0007619857788085938, 0.003665924072265625, 0.008093833923339844, 0.012521743774414062, 0.01694965362548828, 0.0213775634765625, 0.02580547332763672, 0.030233383178710938, 0.034661293029785156, 0.039089202880859375, 0.043517112731933594, 0.04794502258300781, 0.05237293243408203, 0.05680084228515625, 0.06122875213623047, 0.06565666198730469, 0.0700845718383789, 0.07451248168945312, 0.07894039154052734, 0.08336830139160156, 0.08779621124267578, 0.09222412109375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 1.0, 3.0, 0.0, 2.0, 8.0, 5.0, 12.0, 8.0, 20.0, 22.0, 29.0, 34.0, 37.0, 56.0, 70.0, 82.0, 106.0, 131.0, 201.0, 318.0, 574.0, 1164.0, 2380.0, 5627.0, 13819.0, 37207.0, 115464.0, 426185.0, 314018.0, 83049.0, 28068.0, 10952.0, 4478.0, 1939.0, 943.0, 527.0, 311.0, 180.0, 106.0, 83.0, 78.0, 57.0, 42.0, 45.0, 25.0, 25.0, 25.0, 11.0, 6.0, 8.0, 8.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.127197265625, -0.12320518493652344, -0.11921310424804688, -0.11522102355957031, -0.11122894287109375, -0.10723686218261719, -0.10324478149414062, -0.09925270080566406, -0.0952606201171875, -0.09126853942871094, -0.08727645874023438, -0.08328437805175781, -0.07929229736328125, -0.07530021667480469, -0.07130813598632812, -0.06731605529785156, -0.063323974609375, -0.05933189392089844, -0.055339813232421875, -0.05134773254394531, -0.04735565185546875, -0.04336357116699219, -0.039371490478515625, -0.03537940979003906, -0.0313873291015625, -0.027395248413085938, -0.023403167724609375, -0.019411087036132812, -0.01541900634765625, -0.011426925659179688, -0.007434844970703125, -0.0034427642822265625, 0.00054931640625, 0.0045413970947265625, 0.008533477783203125, 0.012525558471679688, 0.01651763916015625, 0.020509719848632812, 0.024501800537109375, 0.028493881225585938, 0.0324859619140625, 0.03647804260253906, 0.040470123291015625, 0.04446220397949219, 0.04845428466796875, 0.05244636535644531, 0.056438446044921875, 0.06043052673339844, 0.064422607421875, 0.06841468811035156, 0.07240676879882812, 0.07639884948730469, 0.08039093017578125, 0.08438301086425781, 0.08837509155273438, 0.09236717224121094, 0.0963592529296875, 0.10035133361816406, 0.10434341430664062, 0.10833549499511719, 0.11232757568359375, 0.11631965637207031, 0.12031173706054688, 0.12430381774902344, 0.1282958984375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 5.0, 7.0, 5.0, 13.0, 6.0, 16.0, 21.0, 20.0, 17.0, 16.0, 30.0, 37.0, 20.0, 30.0, 24.0, 48.0, 35.0, 34.0, 28.0, 41.0, 33.0, 40.0, 39.0, 36.0, 38.0, 35.0, 28.0, 37.0, 30.0, 32.0, 27.0, 23.0, 11.0, 23.0, 14.0, 12.0, 13.0, 10.0, 2.0, 12.0, 13.0, 7.0, 4.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.193115234375, -0.18722152709960938, -0.18132781982421875, -0.17543411254882812, -0.1695404052734375, -0.16364669799804688, -0.15775299072265625, -0.15185928344726562, -0.145965576171875, -0.14007186889648438, -0.13417816162109375, -0.12828445434570312, -0.1223907470703125, -0.11649703979492188, -0.11060333251953125, -0.10470962524414062, -0.09881591796875, -0.09292221069335938, -0.08702850341796875, -0.08113479614257812, -0.0752410888671875, -0.06934738159179688, -0.06345367431640625, -0.057559967041015625, -0.051666259765625, -0.045772552490234375, -0.03987884521484375, -0.033985137939453125, -0.0280914306640625, -0.022197723388671875, -0.01630401611328125, -0.010410308837890625, -0.0045166015625, 0.001377105712890625, 0.00727081298828125, 0.013164520263671875, 0.0190582275390625, 0.024951934814453125, 0.03084564208984375, 0.036739349365234375, 0.042633056640625, 0.048526763916015625, 0.05442047119140625, 0.060314178466796875, 0.0662078857421875, 0.07210159301757812, 0.07799530029296875, 0.08388900756835938, 0.08978271484375, 0.09567642211914062, 0.10157012939453125, 0.10746383666992188, 0.1133575439453125, 0.11925125122070312, 0.12514495849609375, 0.13103866577148438, 0.136932373046875, 0.14282608032226562, 0.14871978759765625, 0.15461349487304688, 0.1605072021484375, 0.16640090942382812, 0.17229461669921875, 0.17818832397460938, 0.18408203125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 15.0, 23.0, 25.0, 32.0, 71.0, 106.0, 206.0, 394.0, 769.0, 1757.0, 4843.0, 20293.0, 244252.0, 703290.0, 58143.0, 9139.0, 2803.0, 1160.0, 549.0, 275.0, 168.0, 89.0, 38.0, 38.0, 17.0, 10.0, 15.0, 2.0, 5.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0733642578125, -0.07085609436035156, -0.06834793090820312, -0.06583976745605469, -0.06333160400390625, -0.06082344055175781, -0.058315277099609375, -0.05580711364746094, -0.0532989501953125, -0.05079078674316406, -0.048282623291015625, -0.04577445983886719, -0.04326629638671875, -0.04075813293457031, -0.038249969482421875, -0.03574180603027344, -0.033233642578125, -0.030725479125976562, -0.028217315673828125, -0.025709152221679688, -0.02320098876953125, -0.020692825317382812, -0.018184661865234375, -0.015676498413085938, -0.0131683349609375, -0.010660171508789062, -0.008152008056640625, -0.0056438446044921875, -0.00313568115234375, -0.0006275177001953125, 0.001880645751953125, 0.0043888092041015625, 0.00689697265625, 0.009405136108398438, 0.011913299560546875, 0.014421463012695312, 0.01692962646484375, 0.019437789916992188, 0.021945953369140625, 0.024454116821289062, 0.0269622802734375, 0.029470443725585938, 0.031978607177734375, 0.03448677062988281, 0.03699493408203125, 0.03950309753417969, 0.042011260986328125, 0.04451942443847656, 0.047027587890625, 0.04953575134277344, 0.052043914794921875, 0.05455207824707031, 0.05706024169921875, 0.05956840515136719, 0.062076568603515625, 0.06458473205566406, 0.0670928955078125, 0.06960105895996094, 0.07210922241210938, 0.07461738586425781, 0.07712554931640625, 0.07963371276855469, 0.08214187622070312, 0.08465003967285156, 0.087158203125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 5.0, 7.0, 7.0, 6.0, 20.0, 14.0, 15.0, 19.0, 35.0, 37.0, 68.0, 70.0, 108.0, 107.0, 104.0, 75.0, 71.0, 43.0, 40.0, 26.0, 22.0, 16.0, 22.0, 8.0, 8.0, 11.0, 7.0, 4.0, 4.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00011348724365234375, -0.00011000689119100571, -0.00010652653872966766, -0.00010304618626832962, -9.956583380699158e-05, -9.608548134565353e-05, -9.260512888431549e-05, -8.912477642297745e-05, -8.56444239616394e-05, -8.216407150030136e-05, -7.868371903896332e-05, -7.520336657762527e-05, -7.172301411628723e-05, -6.824266165494919e-05, -6.476230919361115e-05, -6.12819567322731e-05, -5.780160427093506e-05, -5.4321251809597015e-05, -5.084089934825897e-05, -4.736054688692093e-05, -4.3880194425582886e-05, -4.039984196424484e-05, -3.69194895029068e-05, -3.3439137041568756e-05, -2.9958784580230713e-05, -2.647843211889267e-05, -2.2998079657554626e-05, -1.9517727196216583e-05, -1.603737473487854e-05, -1.2557022273540497e-05, -9.076669812202454e-06, -5.59631735086441e-06, -2.115964889526367e-06, 1.364387571811676e-06, 4.844740033149719e-06, 8.325092494487762e-06, 1.1805444955825806e-05, 1.528579741716385e-05, 1.8766149878501892e-05, 2.2246502339839935e-05, 2.572685480117798e-05, 2.9207207262516022e-05, 3.2687559723854065e-05, 3.616791218519211e-05, 3.964826464653015e-05, 4.3128617107868195e-05, 4.660896956920624e-05, 5.008932203054428e-05, 5.3569674491882324e-05, 5.705002695322037e-05, 6.053037941455841e-05, 6.401073187589645e-05, 6.74910843372345e-05, 7.097143679857254e-05, 7.445178925991058e-05, 7.793214172124863e-05, 8.141249418258667e-05, 8.489284664392471e-05, 8.837319910526276e-05, 9.18535515666008e-05, 9.533390402793884e-05, 9.881425648927689e-05, 0.00010229460895061493, 0.00010577496141195297, 0.00010925531387329102]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 6.0, 9.0, 14.0, 24.0, 14.0, 43.0, 55.0, 81.0, 149.0, 266.0, 531.0, 1192.0, 2987.0, 10243.0, 60028.0, 552983.0, 370827.0, 37256.0, 7405.0, 2415.0, 962.0, 450.0, 226.0, 135.0, 76.0, 36.0, 38.0, 23.0, 25.0, 20.0, 9.0, 8.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0819091796875, -0.07968854904174805, -0.0774679183959961, -0.07524728775024414, -0.07302665710449219, -0.07080602645874023, -0.06858539581298828, -0.06636476516723633, -0.06414413452148438, -0.06192350387573242, -0.05970287322998047, -0.057482242584228516, -0.05526161193847656, -0.05304098129272461, -0.050820350646972656, -0.0485997200012207, -0.04637908935546875, -0.0441584587097168, -0.041937828063964844, -0.03971719741821289, -0.03749656677246094, -0.035275936126708984, -0.03305530548095703, -0.030834674835205078, -0.028614044189453125, -0.026393413543701172, -0.02417278289794922, -0.021952152252197266, -0.019731521606445312, -0.01751089096069336, -0.015290260314941406, -0.013069629669189453, -0.0108489990234375, -0.008628368377685547, -0.006407737731933594, -0.004187107086181641, -0.0019664764404296875, 0.0002541542053222656, 0.0024747848510742188, 0.004695415496826172, 0.006916046142578125, 0.009136676788330078, 0.011357307434082031, 0.013577938079833984, 0.015798568725585938, 0.01801919937133789, 0.020239830017089844, 0.022460460662841797, 0.02468109130859375, 0.026901721954345703, 0.029122352600097656, 0.03134298324584961, 0.03356361389160156, 0.035784244537353516, 0.03800487518310547, 0.04022550582885742, 0.042446136474609375, 0.04466676712036133, 0.04688739776611328, 0.049108028411865234, 0.05132865905761719, 0.05354928970336914, 0.055769920349121094, 0.05799055099487305, 0.060211181640625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 14.0, 13.0, 34.0, 37.0, 50.0, 91.0, 99.0, 96.0, 119.0, 107.0, 95.0, 66.0, 41.0, 26.0, 33.0, 28.0, 9.0, 9.0, 9.0, 3.0, 3.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.09991455078125, -0.09750843048095703, -0.09510231018066406, -0.0926961898803711, -0.09029006958007812, -0.08788394927978516, -0.08547782897949219, -0.08307170867919922, -0.08066558837890625, -0.07825946807861328, -0.07585334777832031, -0.07344722747802734, -0.07104110717773438, -0.0686349868774414, -0.06622886657714844, -0.06382274627685547, -0.0614166259765625, -0.05901050567626953, -0.05660438537597656, -0.054198265075683594, -0.051792144775390625, -0.049386024475097656, -0.04697990417480469, -0.04457378387451172, -0.04216766357421875, -0.03976154327392578, -0.03735542297363281, -0.034949302673339844, -0.032543182373046875, -0.030137062072753906, -0.027730941772460938, -0.02532482147216797, -0.022918701171875, -0.02051258087158203, -0.018106460571289062, -0.015700340270996094, -0.013294219970703125, -0.010888099670410156, -0.008481979370117188, -0.006075859069824219, -0.00366973876953125, -0.0012636184692382812, 0.0011425018310546875, 0.0035486221313476562, 0.005954742431640625, 0.008360862731933594, 0.010766983032226562, 0.013173103332519531, 0.0155792236328125, 0.01798534393310547, 0.020391464233398438, 0.022797584533691406, 0.025203704833984375, 0.027609825134277344, 0.030015945434570312, 0.03242206573486328, 0.03482818603515625, 0.03723430633544922, 0.03964042663574219, 0.042046546936035156, 0.044452667236328125, 0.046858787536621094, 0.04926490783691406, 0.05167102813720703, 0.0540771484375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 9.0, 29.0, 245.0, 570.0, 125.0, 26.0, 9.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.828999996185303, -6.695713043212891, -6.56242561340332, -6.429138660430908, -6.295851230621338, -6.162564277648926, -6.0292768478393555, -5.895989894866943, -5.762702941894531, -5.629415988922119, -5.496128559112549, -5.362841606140137, -5.229554176330566, -5.096267223358154, -4.962980270385742, -4.829692840576172, -4.696405410766602, -4.5631184577941895, -4.429831027984619, -4.296544075012207, -4.163256645202637, -4.029969692230225, -3.8966825008392334, -3.763395309448242, -3.63010835647583, -3.496821165084839, -3.3635339736938477, -3.2302470207214355, -3.0969598293304443, -2.963672637939453, -2.830385446548462, -2.6970982551574707, -2.5638108253479004, -2.430523633956909, -2.297236442565918, -2.163949489593506, -2.0306622982025146, -1.8973751068115234, -1.7640879154205322, -1.630800724029541, -1.497513771057129, -1.3642265796661377, -1.230939507484436, -1.0976523160934448, -0.9643651843070984, -0.831078052520752, -0.6977908611297607, -0.5645037293434143, -0.43121659755706787, -0.29792946577072144, -0.1646423041820526, -0.03135514259338379, 0.10193198919296265, 0.23521912097930908, 0.3685063123703003, 0.5017934441566467, 0.6350805759429932, 0.7683677077293396, 0.901654839515686, 1.0349420309066772, 1.168229103088379, 1.3015162944793701, 1.4348034858703613, 1.5680906772613525, 1.7013777494430542]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 7.0, 8.0, 6.0, 9.0, 10.0, 14.0, 18.0, 21.0, 24.0, 21.0, 35.0, 34.0, 34.0, 38.0, 33.0, 33.0, 35.0, 42.0, 49.0, 43.0, 50.0, 45.0, 42.0, 38.0, 36.0, 32.0, 29.0, 18.0, 25.0, 27.0, 20.0, 19.0, 23.0, 14.0, 16.0, 8.0, 11.0, 8.0, 4.0, 4.0, 1.0, 5.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.0462589263916016, -1.0107876062393188, -0.9753163456916809, -0.939845085144043, -0.9043737649917603, -0.8689024448394775, -0.8334311842918396, -0.7979599237442017, -0.762488603591919, -0.7270172834396362, -0.6915460228919983, -0.6560747623443604, -0.6206034421920776, -0.5851321220397949, -0.549660861492157, -0.514189600944519, -0.47871828079223633, -0.443246990442276, -0.4077757000923157, -0.37230440974235535, -0.336833119392395, -0.3013618290424347, -0.26589053869247437, -0.23041924834251404, -0.1949479579925537, -0.15947666764259338, -0.12400537729263306, -0.08853408694267273, -0.0530627965927124, -0.017591506242752075, 0.017879784107208252, 0.05335107445716858, 0.08882224559783936, 0.12429353594779968, 0.15976482629776, 0.19523611664772034, 0.23070740699768066, 0.266178697347641, 0.3016499876976013, 0.33712127804756165, 0.372592568397522, 0.4080638587474823, 0.4435351490974426, 0.47900643944740295, 0.5144777297973633, 0.549949049949646, 0.5854203104972839, 0.6208915710449219, 0.6563628911972046, 0.6918342113494873, 0.7273054718971252, 0.7627767324447632, 0.7982480525970459, 0.8337193727493286, 0.8691906332969666, 0.9046618938446045, 0.9401332139968872, 0.9756045341491699, 1.011075735092163, 1.0465470552444458, 1.0820183753967285, 1.1174896955490112, 1.152961015701294, 1.188432216644287, 1.2239035367965698]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 12.0, 10.0, 10.0, 22.0, 23.0, 28.0, 40.0, 52.0, 79.0, 146.0, 242.0, 518.0, 1190.0, 3286.0, 12614.0, 96002.0, 3967201.0, 95484.0, 12129.0, 3224.0, 1097.0, 448.0, 204.0, 94.0, 60.0, 22.0, 18.0, 11.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44091796875, -0.4305419921875, -0.420166015625, -0.4097900390625, -0.3994140625, -0.3890380859375, -0.378662109375, -0.3682861328125, -0.35791015625, -0.3475341796875, -0.337158203125, -0.3267822265625, -0.31640625, -0.3060302734375, -0.295654296875, -0.2852783203125, -0.27490234375, -0.2645263671875, -0.254150390625, -0.2437744140625, -0.2333984375, -0.2230224609375, -0.212646484375, -0.2022705078125, -0.19189453125, -0.1815185546875, -0.171142578125, -0.1607666015625, -0.150390625, -0.1400146484375, -0.129638671875, -0.1192626953125, -0.10888671875, -0.0985107421875, -0.088134765625, -0.0777587890625, -0.0673828125, -0.0570068359375, -0.046630859375, -0.0362548828125, -0.02587890625, -0.0155029296875, -0.005126953125, 0.0052490234375, 0.015625, 0.0260009765625, 0.036376953125, 0.0467529296875, 0.05712890625, 0.0675048828125, 0.077880859375, 0.0882568359375, 0.0986328125, 0.1090087890625, 0.119384765625, 0.1297607421875, 0.14013671875, 0.1505126953125, 0.160888671875, 0.1712646484375, 0.181640625, 0.1920166015625, 0.202392578125, 0.2127685546875, 0.22314453125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 14.0, 18.0, 35.0, 49.0, 63.0, 80.0, 78.0, 114.0, 107.0, 90.0, 87.0, 94.0, 57.0, 44.0, 26.0, 17.0, 7.0, 6.0, 6.0, 2.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.182373046875, -0.1780719757080078, -0.17377090454101562, -0.16946983337402344, -0.16516876220703125, -0.16086769104003906, -0.15656661987304688, -0.1522655487060547, -0.1479644775390625, -0.1436634063720703, -0.13936233520507812, -0.13506126403808594, -0.13076019287109375, -0.12645912170410156, -0.12215805053710938, -0.11785697937011719, -0.113555908203125, -0.10925483703613281, -0.10495376586914062, -0.10065269470214844, -0.09635162353515625, -0.09205055236816406, -0.08774948120117188, -0.08344841003417969, -0.0791473388671875, -0.07484626770019531, -0.07054519653320312, -0.06624412536621094, -0.06194305419921875, -0.05764198303222656, -0.053340911865234375, -0.04903984069824219, -0.04473876953125, -0.04043769836425781, -0.036136627197265625, -0.03183555603027344, -0.02753448486328125, -0.023233413696289062, -0.018932342529296875, -0.014631271362304688, -0.0103302001953125, -0.0060291290283203125, -0.001728057861328125, 0.0025730133056640625, 0.00687408447265625, 0.011175155639648438, 0.015476226806640625, 0.019777297973632812, 0.024078369140625, 0.028379440307617188, 0.032680511474609375, 0.03698158264160156, 0.04128265380859375, 0.04558372497558594, 0.049884796142578125, 0.05418586730957031, 0.0584869384765625, 0.06278800964355469, 0.06708908081054688, 0.07139015197753906, 0.07569122314453125, 0.07999229431152344, 0.08429336547851562, 0.08859443664550781, 0.0928955078125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 8.0, 5.0, 20.0, 21.0, 33.0, 56.0, 87.0, 183.0, 388.0, 1158.0, 4386.0, 21449.0, 587428.0, 3539031.0, 31787.0, 5737.0, 1552.0, 468.0, 187.0, 101.0, 63.0, 42.0, 33.0, 17.0, 15.0, 12.0, 3.0, 8.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.256591796875, -0.24746322631835938, -0.23833465576171875, -0.22920608520507812, -0.2200775146484375, -0.21094894409179688, -0.20182037353515625, -0.19269180297851562, -0.183563232421875, -0.17443466186523438, -0.16530609130859375, -0.15617752075195312, -0.1470489501953125, -0.13792037963867188, -0.12879180908203125, -0.11966323852539062, -0.11053466796875, -0.10140609741210938, -0.09227752685546875, -0.08314895629882812, -0.0740203857421875, -0.06489181518554688, -0.05576324462890625, -0.046634674072265625, -0.037506103515625, -0.028377532958984375, -0.01924896240234375, -0.010120391845703125, -0.0009918212890625, 0.008136749267578125, 0.01726531982421875, 0.026393890380859375, 0.0355224609375, 0.044651031494140625, 0.05377960205078125, 0.06290817260742188, 0.0720367431640625, 0.08116531372070312, 0.09029388427734375, 0.09942245483398438, 0.108551025390625, 0.11767959594726562, 0.12680816650390625, 0.13593673706054688, 0.1450653076171875, 0.15419387817382812, 0.16332244873046875, 0.17245101928710938, 0.18157958984375, 0.19070816040039062, 0.19983673095703125, 0.20896530151367188, 0.2180938720703125, 0.22722244262695312, 0.23635101318359375, 0.24547958374023438, 0.254608154296875, 0.2637367248535156, 0.27286529541015625, 0.2819938659667969, 0.2911224365234375, 0.3002510070800781, 0.30937957763671875, 0.3185081481933594, 0.32763671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 2.0, 6.0, 8.0, 12.0, 29.0, 48.0, 67.0, 145.0, 400.0, 2549.0, 540.0, 129.0, 56.0, 26.0, 21.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09259033203125, -0.0878610610961914, -0.08313179016113281, -0.07840251922607422, -0.07367324829101562, -0.06894397735595703, -0.06421470642089844, -0.059485435485839844, -0.05475616455078125, -0.050026893615722656, -0.04529762268066406, -0.04056835174560547, -0.035839080810546875, -0.03110980987548828, -0.026380538940429688, -0.021651268005371094, -0.0169219970703125, -0.012192726135253906, -0.0074634552001953125, -0.0027341842651367188, 0.001995086669921875, 0.006724357604980469, 0.011453628540039062, 0.016182899475097656, 0.02091217041015625, 0.025641441345214844, 0.030370712280273438, 0.03509998321533203, 0.039829254150390625, 0.04455852508544922, 0.04928779602050781, 0.054017066955566406, 0.058746337890625, 0.0634756088256836, 0.06820487976074219, 0.07293415069580078, 0.07766342163085938, 0.08239269256591797, 0.08712196350097656, 0.09185123443603516, 0.09658050537109375, 0.10130977630615234, 0.10603904724121094, 0.11076831817626953, 0.11549758911132812, 0.12022686004638672, 0.12495613098144531, 0.1296854019165039, 0.1344146728515625, 0.1391439437866211, 0.1438732147216797, 0.14860248565673828, 0.15333175659179688, 0.15806102752685547, 0.16279029846191406, 0.16751956939697266, 0.17224884033203125, 0.17697811126708984, 0.18170738220214844, 0.18643665313720703, 0.19116592407226562, 0.19589519500732422, 0.2006244659423828, 0.2053537368774414, 0.2100830078125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 7.0, 22.0, 110.0, 476.0, 316.0, 55.0, 8.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0404784679412842, -0.9969796538352966, -0.9534808397293091, -0.9099820852279663, -0.866483211517334, -0.8229844570159912, -0.7794856429100037, -0.7359868288040161, -0.6924880146980286, -0.648989200592041, -0.6054903864860535, -0.5619915723800659, -0.5184928178787231, -0.4749939739704132, -0.43149518966674805, -0.3879963755607605, -0.34449756145477295, -0.3009987473487854, -0.25749993324279785, -0.2140011489391327, -0.17050233483314514, -0.1270035207271576, -0.08350473642349243, -0.04000592231750488, 0.003492891788482666, 0.04699169844388962, 0.09049050509929657, 0.13398930430412292, 0.17748811841011047, 0.22098693251609802, 0.2644857168197632, 0.30798453092575073, 0.3514833450317383, 0.39498215913772583, 0.4384809732437134, 0.48197975754737854, 0.5254786014556885, 0.5689773559570312, 0.6124761700630188, 0.6559749841690063, 0.6994737982749939, 0.7429726123809814, 0.786471426486969, 0.8299702405929565, 0.8734689950942993, 0.9169678688049316, 0.9604666233062744, 1.0039653778076172, 1.0474642515182495, 1.0909630060195923, 1.1344618797302246, 1.1779606342315674, 1.2214595079421997, 1.2649582624435425, 1.3084571361541748, 1.3519558906555176, 1.3954546451568604, 1.4389533996582031, 1.4824522733688354, 1.5259510278701782, 1.5694499015808105, 1.6129486560821533, 1.656447410583496, 1.6999462842941284, 1.7434451580047607]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 11.0, 15.0, 9.0, 13.0, 18.0, 27.0, 20.0, 19.0, 27.0, 41.0, 40.0, 49.0, 31.0, 44.0, 58.0, 51.0, 48.0, 55.0, 47.0, 55.0, 36.0, 46.0, 44.0, 28.0, 26.0, 20.0, 27.0, 15.0, 15.0, 18.0, 13.0, 10.0, 7.0, 8.0, 4.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.301017701625824, -0.29016268253326416, -0.27930769324302673, -0.2684526741504669, -0.2575976550579071, -0.24674266576766968, -0.23588764667510986, -0.22503264248371124, -0.21417763829231262, -0.203322634100914, -0.1924676150083542, -0.18161261081695557, -0.17075760662555695, -0.15990260243415833, -0.1490475833415985, -0.1381925791501999, -0.12733756005764008, -0.11648254841566086, -0.10562754422426224, -0.09477253258228302, -0.0839175283908844, -0.07306251674890518, -0.062207505106925964, -0.051352500915527344, -0.040497489273548126, -0.029642481356859207, -0.01878747157752514, -0.00793246179819107, 0.0029225461184978485, 0.013777554035186768, 0.024632565677165985, 0.035487569868564606, 0.04634258151054382, 0.05719758942723274, 0.06805259734392166, 0.07890760898590088, 0.0897626131772995, 0.10061762481927872, 0.11147263646125793, 0.12232764065265656, 0.13318264484405518, 0.1440376490354538, 0.1548926681280136, 0.16574767231941223, 0.17660267651081085, 0.18745768070220947, 0.1983126997947693, 0.2091677039861679, 0.22002272307872772, 0.23087772727012634, 0.24173274636268616, 0.2525877356529236, 0.2634427547454834, 0.2742977738380432, 0.285152792930603, 0.29600778222084045, 0.30686280131340027, 0.3177178204059601, 0.3285728096961975, 0.3394278287887573, 0.35028284788131714, 0.36113783717155457, 0.3719928562641144, 0.3828478455543518, 0.3937028646469116]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 6.0, 4.0, 1.0, 10.0, 11.0, 17.0, 12.0, 31.0, 44.0, 64.0, 99.0, 189.0, 399.0, 791.0, 1879.0, 5812.0, 25884.0, 272724.0, 674975.0, 51667.0, 9031.0, 2822.0, 1006.0, 481.0, 218.0, 151.0, 61.0, 54.0, 31.0, 31.0, 15.0, 6.0, 5.0, 3.0, 7.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.466796875, -0.4535255432128906, -0.44025421142578125, -0.4269828796386719, -0.4137115478515625, -0.4004402160644531, -0.38716888427734375, -0.3738975524902344, -0.360626220703125, -0.3473548889160156, -0.33408355712890625, -0.3208122253417969, -0.3075408935546875, -0.2942695617675781, -0.28099822998046875, -0.2677268981933594, -0.25445556640625, -0.24118423461914062, -0.22791290283203125, -0.21464157104492188, -0.2013702392578125, -0.18809890747070312, -0.17482757568359375, -0.16155624389648438, -0.148284912109375, -0.13501358032226562, -0.12174224853515625, -0.10847091674804688, -0.0951995849609375, -0.08192825317382812, -0.06865692138671875, -0.055385589599609375, -0.0421142578125, -0.028842926025390625, -0.01557159423828125, -0.002300262451171875, 0.0109710693359375, 0.024242401123046875, 0.03751373291015625, 0.050785064697265625, 0.064056396484375, 0.07732772827148438, 0.09059906005859375, 0.10387039184570312, 0.1171417236328125, 0.13041305541992188, 0.14368438720703125, 0.15695571899414062, 0.17022705078125, 0.18349838256835938, 0.19676971435546875, 0.21004104614257812, 0.2233123779296875, 0.23658370971679688, 0.24985504150390625, 0.2631263732910156, 0.276397705078125, 0.2896690368652344, 0.30294036865234375, 0.3162117004394531, 0.3294830322265625, 0.3427543640136719, 0.35602569580078125, 0.3692970275878906, 0.382568359375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 10.0, 37.0, 36.0, 54.0, 62.0, 91.0, 93.0, 113.0, 103.0, 99.0, 82.0, 74.0, 46.0, 45.0, 18.0, 8.0, 9.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.183837890625, -0.17944908142089844, -0.17506027221679688, -0.1706714630126953, -0.16628265380859375, -0.1618938446044922, -0.15750503540039062, -0.15311622619628906, -0.1487274169921875, -0.14433860778808594, -0.13994979858398438, -0.1355609893798828, -0.13117218017578125, -0.1267833709716797, -0.12239456176757812, -0.11800575256347656, -0.113616943359375, -0.10922813415527344, -0.10483932495117188, -0.10045051574707031, -0.09606170654296875, -0.09167289733886719, -0.08728408813476562, -0.08289527893066406, -0.0785064697265625, -0.07411766052246094, -0.06972885131835938, -0.06534004211425781, -0.06095123291015625, -0.05656242370605469, -0.052173614501953125, -0.04778480529785156, -0.04339599609375, -0.03900718688964844, -0.034618377685546875, -0.030229568481445312, -0.02584075927734375, -0.021451950073242188, -0.017063140869140625, -0.012674331665039062, -0.0082855224609375, -0.0038967132568359375, 0.000492095947265625, 0.0048809051513671875, 0.00926971435546875, 0.013658523559570312, 0.018047332763671875, 0.022436141967773438, 0.026824951171875, 0.031213760375976562, 0.035602569580078125, 0.03999137878417969, 0.04438018798828125, 0.04876899719238281, 0.053157806396484375, 0.05754661560058594, 0.0619354248046875, 0.06632423400878906, 0.07071304321289062, 0.07510185241699219, 0.07949066162109375, 0.08387947082519531, 0.08826828002929688, 0.09265708923339844, 0.0970458984375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 4.0, 5.0, 4.0, 6.0, 17.0, 17.0, 32.0, 55.0, 75.0, 126.0, 199.0, 349.0, 617.0, 1257.0, 2511.0, 6265.0, 20116.0, 98876.0, 675917.0, 194776.0, 32014.0, 8711.0, 3275.0, 1477.0, 759.0, 403.0, 252.0, 137.0, 97.0, 58.0, 35.0, 37.0, 24.0, 16.0, 7.0, 4.0, 9.0, 5.0, 7.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.223388671875, -0.21531295776367188, -0.20723724365234375, -0.19916152954101562, -0.1910858154296875, -0.18301010131835938, -0.17493438720703125, -0.16685867309570312, -0.158782958984375, -0.15070724487304688, -0.14263153076171875, -0.13455581665039062, -0.1264801025390625, -0.11840438842773438, -0.11032867431640625, -0.10225296020507812, -0.09417724609375, -0.08610153198242188, -0.07802581787109375, -0.06995010375976562, -0.0618743896484375, -0.053798675537109375, -0.04572296142578125, -0.037647247314453125, -0.029571533203125, -0.021495819091796875, -0.01342010498046875, -0.005344390869140625, 0.0027313232421875, 0.010807037353515625, 0.01888275146484375, 0.026958465576171875, 0.0350341796875, 0.043109893798828125, 0.05118560791015625, 0.059261322021484375, 0.0673370361328125, 0.07541275024414062, 0.08348846435546875, 0.09156417846679688, 0.099639892578125, 0.10771560668945312, 0.11579132080078125, 0.12386703491210938, 0.1319427490234375, 0.14001846313476562, 0.14809417724609375, 0.15616989135742188, 0.16424560546875, 0.17232131958007812, 0.18039703369140625, 0.18847274780273438, 0.1965484619140625, 0.20462417602539062, 0.21269989013671875, 0.22077560424804688, 0.228851318359375, 0.23692703247070312, 0.24500274658203125, 0.2530784606933594, 0.2611541748046875, 0.2692298889160156, 0.27730560302734375, 0.2853813171386719, 0.29345703125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 9.0, 7.0, 10.0, 6.0, 17.0, 14.0, 18.0, 23.0, 27.0, 25.0, 33.0, 36.0, 24.0, 35.0, 32.0, 48.0, 54.0, 59.0, 44.0, 55.0, 48.0, 52.0, 43.0, 34.0, 32.0, 26.0, 22.0, 26.0, 24.0, 16.0, 17.0, 13.0, 11.0, 11.0, 5.0, 6.0, 8.0, 3.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.280029296875, -0.27203369140625, -0.2640380859375, -0.25604248046875, -0.248046875, -0.24005126953125, -0.2320556640625, -0.22406005859375, -0.216064453125, -0.20806884765625, -0.2000732421875, -0.19207763671875, -0.18408203125, -0.17608642578125, -0.1680908203125, -0.16009521484375, -0.152099609375, -0.14410400390625, -0.1361083984375, -0.12811279296875, -0.1201171875, -0.11212158203125, -0.1041259765625, -0.09613037109375, -0.088134765625, -0.08013916015625, -0.0721435546875, -0.06414794921875, -0.05615234375, -0.04815673828125, -0.0401611328125, -0.03216552734375, -0.024169921875, -0.01617431640625, -0.0081787109375, -0.00018310546875, 0.0078125, 0.01580810546875, 0.0238037109375, 0.03179931640625, 0.039794921875, 0.04779052734375, 0.0557861328125, 0.06378173828125, 0.07177734375, 0.07977294921875, 0.0877685546875, 0.09576416015625, 0.103759765625, 0.11175537109375, 0.1197509765625, 0.12774658203125, 0.1357421875, 0.14373779296875, 0.1517333984375, 0.15972900390625, 0.167724609375, 0.17572021484375, 0.1837158203125, 0.19171142578125, 0.19970703125, 0.20770263671875, 0.2156982421875, 0.22369384765625, 0.231689453125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 9.0, 19.0, 46.0, 71.0, 139.0, 334.0, 961.0, 7452.0, 1008083.0, 29138.0, 1487.0, 445.0, 191.0, 88.0, 40.0, 33.0, 13.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2347412109375, -0.22625160217285156, -0.21776199340820312, -0.2092723846435547, -0.20078277587890625, -0.1922931671142578, -0.18380355834960938, -0.17531394958496094, -0.1668243408203125, -0.15833473205566406, -0.14984512329101562, -0.1413555145263672, -0.13286590576171875, -0.12437629699707031, -0.11588668823242188, -0.10739707946777344, -0.098907470703125, -0.09041786193847656, -0.08192825317382812, -0.07343864440917969, -0.06494903564453125, -0.05645942687988281, -0.047969818115234375, -0.03948020935058594, -0.0309906005859375, -0.022500991821289062, -0.014011383056640625, -0.0055217742919921875, 0.00296783447265625, 0.011457443237304688, 0.019947052001953125, 0.028436660766601562, 0.03692626953125, 0.04541587829589844, 0.053905487060546875, 0.06239509582519531, 0.07088470458984375, 0.07937431335449219, 0.08786392211914062, 0.09635353088378906, 0.1048431396484375, 0.11333274841308594, 0.12182235717773438, 0.1303119659423828, 0.13880157470703125, 0.1472911834716797, 0.15578079223632812, 0.16427040100097656, 0.172760009765625, 0.18124961853027344, 0.18973922729492188, 0.1982288360595703, 0.20671844482421875, 0.2152080535888672, 0.22369766235351562, 0.23218727111816406, 0.2406768798828125, 0.24916648864746094, 0.2576560974121094, 0.2661457061767578, 0.27463531494140625, 0.2831249237060547, 0.2916145324707031, 0.30010414123535156, 0.30859375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 8.0, 23.0, 30.0, 58.0, 117.0, 218.0, 247.0, 131.0, 76.0, 47.0, 16.0, 12.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004241466522216797, -0.00041430629789829254, -0.0004044659435749054, -0.00039462558925151825, -0.0003847852349281311, -0.00037494488060474396, -0.0003651045262813568, -0.00035526417195796967, -0.0003454238176345825, -0.0003355834633111954, -0.00032574310898780823, -0.0003159027546644211, -0.00030606240034103394, -0.0002962220460176468, -0.00028638169169425964, -0.0002765413373708725, -0.00026670098304748535, -0.0002568606287240982, -0.00024702027440071106, -0.00023717992007732391, -0.00022733956575393677, -0.00021749921143054962, -0.00020765885710716248, -0.00019781850278377533, -0.00018797814846038818, -0.00017813779413700104, -0.0001682974398136139, -0.00015845708549022675, -0.0001486167311668396, -0.00013877637684345245, -0.0001289360225200653, -0.00011909566819667816, -0.00010925531387329102, -9.941495954990387e-05, -8.957460522651672e-05, -7.973425090312958e-05, -6.989389657974243e-05, -6.0053542256355286e-05, -5.021318793296814e-05, -4.0372833609580994e-05, -3.053247928619385e-05, -2.06921249628067e-05, -1.0851770639419556e-05, -1.0114163160324097e-06, 8.828938007354736e-06, 1.8669292330741882e-05, 2.850964665412903e-05, 3.8350000977516174e-05, 4.819035530090332e-05, 5.8030709624290466e-05, 6.787106394767761e-05, 7.771141827106476e-05, 8.75517725944519e-05, 9.739212691783905e-05, 0.0001072324812412262, 0.00011707283556461334, 0.0001269131898880005, 0.00013675354421138763, 0.00014659389853477478, 0.00015643425285816193, 0.00016627460718154907, 0.00017611496150493622, 0.00018595531582832336, 0.0001957956701517105, 0.00020563602447509766]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 6.0, 4.0, 11.0, 39.0, 65.0, 135.0, 386.0, 1537.0, 241195.0, 802309.0, 2206.0, 383.0, 140.0, 78.0, 36.0, 15.0, 13.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.316650390625, -0.3083362579345703, -0.3000221252441406, -0.29170799255371094, -0.28339385986328125, -0.27507972717285156, -0.2667655944824219, -0.2584514617919922, -0.2501373291015625, -0.2418231964111328, -0.23350906372070312, -0.22519493103027344, -0.21688079833984375, -0.20856666564941406, -0.20025253295898438, -0.1919384002685547, -0.183624267578125, -0.1753101348876953, -0.16699600219726562, -0.15868186950683594, -0.15036773681640625, -0.14205360412597656, -0.13373947143554688, -0.1254253387451172, -0.1171112060546875, -0.10879707336425781, -0.10048294067382812, -0.09216880798339844, -0.08385467529296875, -0.07554054260253906, -0.06722640991210938, -0.05891227722167969, -0.05059814453125, -0.04228401184082031, -0.033969879150390625, -0.025655746459960938, -0.01734161376953125, -0.009027481079101562, -0.000713348388671875, 0.0076007843017578125, 0.0159149169921875, 0.024229049682617188, 0.032543182373046875, 0.04085731506347656, 0.04917144775390625, 0.05748558044433594, 0.06579971313476562, 0.07411384582519531, 0.082427978515625, 0.09074211120605469, 0.09905624389648438, 0.10737037658691406, 0.11568450927734375, 0.12399864196777344, 0.13231277465820312, 0.1406269073486328, 0.1489410400390625, 0.1572551727294922, 0.16556930541992188, 0.17388343811035156, 0.18219757080078125, 0.19051170349121094, 0.19882583618164062, 0.2071399688720703, 0.2154541015625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 13.0, 10.0, 51.0, 127.0, 253.0, 305.0, 136.0, 69.0, 22.0, 15.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.31689453125, -0.31017398834228516, -0.3034534454345703, -0.29673290252685547, -0.2900123596191406, -0.2832918167114258, -0.27657127380371094, -0.2698507308959961, -0.26313018798828125, -0.2564096450805664, -0.24968910217285156, -0.24296855926513672, -0.23624801635742188, -0.22952747344970703, -0.2228069305419922, -0.21608638763427734, -0.2093658447265625, -0.20264530181884766, -0.1959247589111328, -0.18920421600341797, -0.18248367309570312, -0.17576313018798828, -0.16904258728027344, -0.1623220443725586, -0.15560150146484375, -0.1488809585571289, -0.14216041564941406, -0.13543987274169922, -0.12871932983398438, -0.12199878692626953, -0.11527824401855469, -0.10855770111083984, -0.101837158203125, -0.09511661529541016, -0.08839607238769531, -0.08167552947998047, -0.07495498657226562, -0.06823444366455078, -0.06151390075683594, -0.054793357849121094, -0.04807281494140625, -0.041352272033691406, -0.03463172912597656, -0.02791118621826172, -0.021190643310546875, -0.014470100402832031, -0.0077495574951171875, -0.0010290145874023438, 0.0056915283203125, 0.012412071228027344, 0.019132614135742188, 0.02585315704345703, 0.032573699951171875, 0.03929424285888672, 0.04601478576660156, 0.052735328674316406, 0.05945587158203125, 0.0661764144897461, 0.07289695739746094, 0.07961750030517578, 0.08633804321289062, 0.09305858612060547, 0.09977912902832031, 0.10649967193603516, 0.11322021484375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 12.0, 59.0, 330.0, 473.0, 115.0, 16.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.055200576782227, -9.869478225708008, -9.683755874633789, -9.49803352355957, -9.312312126159668, -9.12658977508545, -8.94086742401123, -8.755145072937012, -8.569422721862793, -8.383700370788574, -8.197978019714355, -8.012255668640137, -7.826533794403076, -7.640811443328857, -7.455089569091797, -7.269367218017578, -7.083644866943359, -6.897922515869141, -6.71220064163208, -6.526478290557861, -6.340755939483643, -6.155033588409424, -5.969311714172363, -5.7835893630981445, -5.597867488861084, -5.412145137786865, -5.226423263549805, -5.040700912475586, -4.854978561401367, -4.669256210327148, -4.483534336090088, -4.297811985015869, -4.112089157104492, -3.9263670444488525, -3.740644693374634, -3.554922580718994, -3.3692002296447754, -3.1834781169891357, -2.997756004333496, -2.8120336532592773, -2.626311779022217, -2.440589666366577, -2.2548673152923584, -2.0691452026367188, -1.8834228515625, -1.6977007389068604, -1.5119785070419312, -1.326256275177002, -1.1405339241027832, -0.954811692237854, -0.7690894603729248, -0.5833672881126404, -0.3976450562477112, -0.21192282438278198, -0.02620065212249756, 0.15952157974243164, 0.34524381160736084, 0.53096604347229, 0.7166882753372192, 0.9024104475975037, 1.088132619857788, 1.2738549709320068, 1.4595770835876465, 1.6452993154525757, 1.8310215473175049]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 9.0, 9.0, 6.0, 7.0, 9.0, 9.0, 13.0, 13.0, 26.0, 23.0, 27.0, 24.0, 20.0, 34.0, 35.0, 40.0, 32.0, 27.0, 33.0, 37.0, 46.0, 44.0, 46.0, 34.0, 37.0, 39.0, 33.0, 20.0, 31.0, 27.0, 25.0, 26.0, 18.0, 24.0, 12.0, 21.0, 19.0, 12.0, 6.0, 9.0, 6.0, 6.0, 2.0, 5.0, 3.0, 2.0, 1.0, 4.0, 7.0, 2.0, 1.0, 2.0], "bins": [-1.1482033729553223, -1.113869547843933, -1.079535722732544, -1.0452018976211548, -1.0108680725097656, -0.9765341877937317, -0.9422003626823425, -0.9078665375709534, -0.8735326528549194, -0.8391988277435303, -0.8048650026321411, -0.770531177520752, -0.736197292804718, -0.7018634676933289, -0.6675296425819397, -0.6331958174705505, -0.5988619923591614, -0.5645281672477722, -0.5301943421363831, -0.4958604872226715, -0.46152663230895996, -0.4271928071975708, -0.39285898208618164, -0.3585251569747925, -0.32419130206108093, -0.2898574769496918, -0.2555236220359802, -0.22118979692459106, -0.1868559569120407, -0.15252211689949036, -0.1181882917881012, -0.08385445177555084, -0.04952061176300049, -0.015186775475740433, 0.019147060811519623, 0.05348089337348938, 0.08781473338603973, 0.12214857339859009, 0.15648239850997925, 0.1908162385225296, 0.22515007853507996, 0.2594839036464691, 0.29381775856018066, 0.3281515836715698, 0.362485408782959, 0.39681926369667053, 0.4311530888080597, 0.46548694372177124, 0.4998207688331604, 0.5341545939445496, 0.5684884190559387, 0.6028223037719727, 0.6371561288833618, 0.671489953994751, 0.7058237791061401, 0.7401576042175293, 0.7744914293289185, 0.8088252544403076, 0.8431590795516968, 0.8774929046630859, 0.9118267893791199, 0.946160614490509, 0.9804944396018982, 1.0148283243179321, 1.0491621494293213]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 3.0, 6.0, 9.0, 6.0, 15.0, 18.0, 21.0, 36.0, 36.0, 50.0, 60.0, 61.0, 98.0, 102.0, 165.0, 217.0, 316.0, 595.0, 1275.0, 2955.0, 9457.0, 47426.0, 3599948.0, 490952.0, 28807.0, 6702.0, 2362.0, 1037.0, 515.0, 332.0, 178.0, 114.0, 98.0, 66.0, 54.0, 40.0, 36.0, 27.0, 12.0, 16.0, 10.0, 14.0, 7.0, 6.0, 6.0, 3.0, 4.0, 6.0, 3.0, 2.0, 1.0], "bins": [-0.275390625, -0.2677116394042969, -0.26003265380859375, -0.2523536682128906, -0.2446746826171875, -0.23699569702148438, -0.22931671142578125, -0.22163772583007812, -0.213958740234375, -0.20627975463867188, -0.19860076904296875, -0.19092178344726562, -0.1832427978515625, -0.17556381225585938, -0.16788482666015625, -0.16020584106445312, -0.15252685546875, -0.14484786987304688, -0.13716888427734375, -0.12948989868164062, -0.1218109130859375, -0.11413192749023438, -0.10645294189453125, -0.09877395629882812, -0.091094970703125, -0.08341598510742188, -0.07573699951171875, -0.06805801391601562, -0.0603790283203125, -0.052700042724609375, -0.04502105712890625, -0.037342071533203125, -0.0296630859375, -0.021984100341796875, -0.01430511474609375, -0.006626129150390625, 0.0010528564453125, 0.008731842041015625, 0.01641082763671875, 0.024089813232421875, 0.031768798828125, 0.039447784423828125, 0.04712677001953125, 0.054805755615234375, 0.0624847412109375, 0.07016372680664062, 0.07784271240234375, 0.08552169799804688, 0.09320068359375, 0.10087966918945312, 0.10855865478515625, 0.11623764038085938, 0.1239166259765625, 0.13159561157226562, 0.13927459716796875, 0.14695358276367188, 0.154632568359375, 0.16231155395507812, 0.16999053955078125, 0.17766952514648438, 0.1853485107421875, 0.19302749633789062, 0.20070648193359375, 0.20838546752929688, 0.216064453125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 14.0, 21.0, 20.0, 37.0, 48.0, 71.0, 80.0, 88.0, 106.0, 103.0, 85.0, 79.0, 83.0, 57.0, 32.0, 28.0, 18.0, 11.0, 4.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.197021484375, -0.1923351287841797, -0.18764877319335938, -0.18296241760253906, -0.17827606201171875, -0.17358970642089844, -0.16890335083007812, -0.1642169952392578, -0.1595306396484375, -0.1548442840576172, -0.15015792846679688, -0.14547157287597656, -0.14078521728515625, -0.13609886169433594, -0.13141250610351562, -0.1267261505126953, -0.122039794921875, -0.11735343933105469, -0.11266708374023438, -0.10798072814941406, -0.10329437255859375, -0.09860801696777344, -0.09392166137695312, -0.08923530578613281, -0.0845489501953125, -0.07986259460449219, -0.07517623901367188, -0.07048988342285156, -0.06580352783203125, -0.06111717224121094, -0.056430816650390625, -0.05174446105957031, -0.04705810546875, -0.04237174987792969, -0.037685394287109375, -0.03299903869628906, -0.02831268310546875, -0.023626327514648438, -0.018939971923828125, -0.014253616333007812, -0.0095672607421875, -0.0048809051513671875, -0.000194549560546875, 0.0044918060302734375, 0.00917816162109375, 0.013864517211914062, 0.018550872802734375, 0.023237228393554688, 0.027923583984375, 0.03260993957519531, 0.037296295166015625, 0.04198265075683594, 0.04666900634765625, 0.05135536193847656, 0.056041717529296875, 0.06072807312011719, 0.0654144287109375, 0.07010078430175781, 0.07478713989257812, 0.07947349548339844, 0.08415985107421875, 0.08884620666503906, 0.09353256225585938, 0.09821891784667969, 0.1029052734375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 10.0, 16.0, 20.0, 28.0, 39.0, 64.0, 90.0, 147.0, 240.0, 358.0, 626.0, 1063.0, 2009.0, 4623.0, 14166.0, 83679.0, 3892036.0, 163224.0, 20183.0, 5893.0, 2499.0, 1326.0, 734.0, 430.0, 275.0, 160.0, 117.0, 80.0, 36.0, 26.0, 23.0, 21.0, 6.0, 12.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.201904296875, -0.19402313232421875, -0.1861419677734375, -0.17826080322265625, -0.170379638671875, -0.16249847412109375, -0.1546173095703125, -0.14673614501953125, -0.13885498046875, -0.13097381591796875, -0.1230926513671875, -0.11521148681640625, -0.107330322265625, -0.09944915771484375, -0.0915679931640625, -0.08368682861328125, -0.0758056640625, -0.06792449951171875, -0.0600433349609375, -0.05216217041015625, -0.044281005859375, -0.03639984130859375, -0.0285186767578125, -0.02063751220703125, -0.01275634765625, -0.00487518310546875, 0.0030059814453125, 0.01088714599609375, 0.018768310546875, 0.02664947509765625, 0.0345306396484375, 0.04241180419921875, 0.05029296875, 0.05817413330078125, 0.0660552978515625, 0.07393646240234375, 0.081817626953125, 0.08969879150390625, 0.0975799560546875, 0.10546112060546875, 0.11334228515625, 0.12122344970703125, 0.1291046142578125, 0.13698577880859375, 0.144866943359375, 0.15274810791015625, 0.1606292724609375, 0.16851043701171875, 0.1763916015625, 0.18427276611328125, 0.1921539306640625, 0.20003509521484375, 0.207916259765625, 0.21579742431640625, 0.2236785888671875, 0.23155975341796875, 0.23944091796875, 0.24732208251953125, 0.2552032470703125, 0.26308441162109375, 0.270965576171875, 0.27884674072265625, 0.2867279052734375, 0.29460906982421875, 0.302490234375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 4.0, 9.0, 8.0, 28.0, 49.0, 74.0, 188.0, 980.0, 2304.0, 214.0, 90.0, 49.0, 32.0, 10.0, 7.0, 7.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09869384765625, -0.09460735321044922, -0.09052085876464844, -0.08643436431884766, -0.08234786987304688, -0.0782613754272461, -0.07417488098144531, -0.07008838653564453, -0.06600189208984375, -0.06191539764404297, -0.05782890319824219, -0.053742408752441406, -0.049655914306640625, -0.045569419860839844, -0.04148292541503906, -0.03739643096923828, -0.0333099365234375, -0.02922344207763672, -0.025136947631835938, -0.021050453186035156, -0.016963958740234375, -0.012877464294433594, -0.008790969848632812, -0.004704475402832031, -0.00061798095703125, 0.0034685134887695312, 0.0075550079345703125, 0.011641502380371094, 0.015727996826171875, 0.019814491271972656, 0.023900985717773438, 0.02798748016357422, 0.032073974609375, 0.03616046905517578, 0.04024696350097656, 0.044333457946777344, 0.048419952392578125, 0.052506446838378906, 0.05659294128417969, 0.06067943572998047, 0.06476593017578125, 0.06885242462158203, 0.07293891906738281, 0.0770254135131836, 0.08111190795898438, 0.08519840240478516, 0.08928489685058594, 0.09337139129638672, 0.0974578857421875, 0.10154438018798828, 0.10563087463378906, 0.10971736907958984, 0.11380386352539062, 0.1178903579711914, 0.12197685241699219, 0.12606334686279297, 0.13014984130859375, 0.13423633575439453, 0.1383228302001953, 0.1424093246459961, 0.14649581909179688, 0.15058231353759766, 0.15466880798339844, 0.15875530242919922, 0.162841796875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 10.0, 18.0, 65.0, 200.0, 427.0, 212.0, 53.0, 11.0, 6.0, 2.0, 2.0, 0.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2805880308151245, -0.24361862242221832, -0.20664921402931213, -0.16967980563640594, -0.13271039724349976, -0.09574098885059357, -0.05877158045768738, -0.021802186965942383, 0.015167236328125, 0.05213664472103119, 0.08910605311393738, 0.12607546150684357, 0.16304486989974976, 0.20001427829265594, 0.23698368668556213, 0.27395308017730713, 0.3109225034713745, 0.3478919267654419, 0.3848613202571869, 0.4218307137489319, 0.45880013704299927, 0.49576956033706665, 0.5327389240264893, 0.5697083473205566, 0.606677770614624, 0.6436471939086914, 0.6806166172027588, 0.7175859808921814, 0.7545554041862488, 0.7915248274803162, 0.8284941911697388, 0.8654636144638062, 0.902432918548584, 0.9394023418426514, 0.9763717651367188, 1.0133411884307861, 1.0503106117248535, 1.0872799158096313, 1.1242493391036987, 1.1612187623977661, 1.1981881856918335, 1.2351576089859009, 1.2721270322799683, 1.3090964555740356, 1.3460657596588135, 1.3830351829528809, 1.4200046062469482, 1.4569740295410156, 1.493943452835083, 1.5309128761291504, 1.5678822994232178, 1.6048517227172852, 1.6418211460113525, 1.6787904500961304, 1.7157598733901978, 1.7527292966842651, 1.7896987199783325, 1.8266681432724, 1.8636375665664673, 1.9006069898605347, 1.9375762939453125, 1.9745457172393799, 2.0115151405334473, 2.0484845638275146, 2.085453987121582]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 10.0, 10.0, 11.0, 20.0, 25.0, 29.0, 35.0, 52.0, 59.0, 62.0, 74.0, 85.0, 85.0, 77.0, 84.0, 61.0, 42.0, 47.0, 43.0, 25.0, 20.0, 16.0, 12.0, 10.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4367576241493225, -0.42403900623321533, -0.41132041811943054, -0.39860180020332336, -0.3858831822872162, -0.3731645941734314, -0.3604459762573242, -0.34772735834121704, -0.33500877022743225, -0.3222901523113251, -0.3095715641975403, -0.2968529462814331, -0.2841343283653259, -0.27141574025154114, -0.25869712233543396, -0.24597851932048798, -0.2332599014043808, -0.22054129838943481, -0.20782268047332764, -0.19510407745838165, -0.18238547444343567, -0.1696668565273285, -0.1569482535123825, -0.14422965049743652, -0.13151103258132935, -0.11879242211580276, -0.10607381910085678, -0.0933552086353302, -0.08063660562038422, -0.06791799515485764, -0.055199384689331055, -0.04248078167438507, -0.029762178659439087, -0.017043571919202805, -0.004324963316321373, 0.008393645286560059, 0.02111225202679634, 0.03383085876703262, 0.046549469232559204, 0.05926807224750519, 0.07198668271303177, 0.08470529317855835, 0.09742389619350433, 0.11014250665903091, 0.1228611171245575, 0.13557972013950348, 0.14829832315444946, 0.16101694107055664, 0.17373554408550262, 0.1864541471004486, 0.1991727650165558, 0.21189136803150177, 0.22460997104644775, 0.23732858896255493, 0.2500472068786621, 0.2627657949924469, 0.2754844129085541, 0.28820303082466125, 0.30092161893844604, 0.3136402368545532, 0.3263588547706604, 0.3390774428844452, 0.35179606080055237, 0.36451464891433716, 0.37723326683044434]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 7.0, 14.0, 21.0, 30.0, 51.0, 116.0, 226.0, 557.0, 1371.0, 4812.0, 21550.0, 181307.0, 722858.0, 96116.0, 14257.0, 3374.0, 1078.0, 397.0, 188.0, 88.0, 55.0, 27.0, 17.0, 6.0, 10.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.49365234375, -0.481719970703125, -0.46978759765625, -0.457855224609375, -0.4459228515625, -0.433990478515625, -0.42205810546875, -0.410125732421875, -0.398193359375, -0.386260986328125, -0.37432861328125, -0.362396240234375, -0.3504638671875, -0.338531494140625, -0.32659912109375, -0.314666748046875, -0.302734375, -0.290802001953125, -0.27886962890625, -0.266937255859375, -0.2550048828125, -0.243072509765625, -0.23114013671875, -0.219207763671875, -0.207275390625, -0.195343017578125, -0.18341064453125, -0.171478271484375, -0.1595458984375, -0.147613525390625, -0.13568115234375, -0.123748779296875, -0.11181640625, -0.099884033203125, -0.08795166015625, -0.076019287109375, -0.0640869140625, -0.052154541015625, -0.04022216796875, -0.028289794921875, -0.016357421875, -0.004425048828125, 0.00750732421875, 0.019439697265625, 0.0313720703125, 0.043304443359375, 0.05523681640625, 0.067169189453125, 0.0791015625, 0.091033935546875, 0.10296630859375, 0.114898681640625, 0.1268310546875, 0.138763427734375, 0.15069580078125, 0.162628173828125, 0.174560546875, 0.186492919921875, 0.19842529296875, 0.210357666015625, 0.2222900390625, 0.234222412109375, 0.24615478515625, 0.258087158203125, 0.27001953125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 19.0, 13.0, 23.0, 35.0, 38.0, 63.0, 72.0, 85.0, 94.0, 100.0, 86.0, 82.0, 80.0, 58.0, 53.0, 29.0, 29.0, 13.0, 6.0, 10.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.193115234375, -0.188568115234375, -0.18402099609375, -0.179473876953125, -0.1749267578125, -0.170379638671875, -0.16583251953125, -0.161285400390625, -0.15673828125, -0.152191162109375, -0.14764404296875, -0.143096923828125, -0.1385498046875, -0.134002685546875, -0.12945556640625, -0.124908447265625, -0.120361328125, -0.115814208984375, -0.11126708984375, -0.106719970703125, -0.1021728515625, -0.097625732421875, -0.09307861328125, -0.088531494140625, -0.083984375, -0.079437255859375, -0.07489013671875, -0.070343017578125, -0.0657958984375, -0.061248779296875, -0.05670166015625, -0.052154541015625, -0.047607421875, -0.043060302734375, -0.03851318359375, -0.033966064453125, -0.0294189453125, -0.024871826171875, -0.02032470703125, -0.015777587890625, -0.01123046875, -0.006683349609375, -0.00213623046875, 0.002410888671875, 0.0069580078125, 0.011505126953125, 0.01605224609375, 0.020599365234375, 0.025146484375, 0.029693603515625, 0.03424072265625, 0.038787841796875, 0.0433349609375, 0.047882080078125, 0.05242919921875, 0.056976318359375, 0.0615234375, 0.066070556640625, 0.07061767578125, 0.075164794921875, 0.0797119140625, 0.084259033203125, 0.08880615234375, 0.093353271484375, 0.097900390625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 6.0, 8.0, 12.0, 8.0, 12.0, 23.0, 33.0, 50.0, 71.0, 124.0, 215.0, 341.0, 654.0, 1353.0, 2812.0, 6963.0, 19483.0, 68093.0, 331146.0, 474962.0, 99506.0, 26700.0, 8982.0, 3537.0, 1591.0, 784.0, 421.0, 219.0, 152.0, 98.0, 47.0, 30.0, 29.0, 24.0, 20.0, 13.0, 10.0, 8.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.242431640625, -0.23553085327148438, -0.22863006591796875, -0.22172927856445312, -0.2148284912109375, -0.20792770385742188, -0.20102691650390625, -0.19412612915039062, -0.187225341796875, -0.18032455444335938, -0.17342376708984375, -0.16652297973632812, -0.1596221923828125, -0.15272140502929688, -0.14582061767578125, -0.13891983032226562, -0.13201904296875, -0.12511825561523438, -0.11821746826171875, -0.11131668090820312, -0.1044158935546875, -0.09751510620117188, -0.09061431884765625, -0.08371353149414062, -0.076812744140625, -0.06991195678710938, -0.06301116943359375, -0.056110382080078125, -0.0492095947265625, -0.042308807373046875, -0.03540802001953125, -0.028507232666015625, -0.0216064453125, -0.014705657958984375, -0.00780487060546875, -0.000904083251953125, 0.0059967041015625, 0.012897491455078125, 0.01979827880859375, 0.026699066162109375, 0.033599853515625, 0.040500640869140625, 0.04740142822265625, 0.054302215576171875, 0.0612030029296875, 0.06810379028320312, 0.07500457763671875, 0.08190536499023438, 0.08880615234375, 0.09570693969726562, 0.10260772705078125, 0.10950851440429688, 0.1164093017578125, 0.12331008911132812, 0.13021087646484375, 0.13711166381835938, 0.144012451171875, 0.15091323852539062, 0.15781402587890625, 0.16471481323242188, 0.1716156005859375, 0.17851638793945312, 0.18541717529296875, 0.19231796264648438, 0.19921875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 5.0, 9.0, 9.0, 20.0, 22.0, 17.0, 29.0, 27.0, 31.0, 36.0, 32.0, 27.0, 48.0, 43.0, 43.0, 50.0, 38.0, 66.0, 35.0, 37.0, 44.0, 42.0, 48.0, 38.0, 29.0, 30.0, 32.0, 14.0, 20.0, 22.0, 11.0, 12.0, 7.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.328857421875, -0.31906890869140625, -0.3092803955078125, -0.29949188232421875, -0.289703369140625, -0.27991485595703125, -0.2701263427734375, -0.26033782958984375, -0.25054931640625, -0.24076080322265625, -0.2309722900390625, -0.22118377685546875, -0.211395263671875, -0.20160675048828125, -0.1918182373046875, -0.18202972412109375, -0.1722412109375, -0.16245269775390625, -0.1526641845703125, -0.14287567138671875, -0.133087158203125, -0.12329864501953125, -0.1135101318359375, -0.10372161865234375, -0.09393310546875, -0.08414459228515625, -0.0743560791015625, -0.06456756591796875, -0.054779052734375, -0.04499053955078125, -0.0352020263671875, -0.02541351318359375, -0.015625, -0.00583648681640625, 0.0039520263671875, 0.01374053955078125, 0.023529052734375, 0.03331756591796875, 0.0431060791015625, 0.05289459228515625, 0.06268310546875, 0.07247161865234375, 0.0822601318359375, 0.09204864501953125, 0.101837158203125, 0.11162567138671875, 0.1214141845703125, 0.13120269775390625, 0.1409912109375, 0.15077972412109375, 0.1605682373046875, 0.17035675048828125, 0.180145263671875, 0.18993377685546875, 0.1997222900390625, 0.20951080322265625, 0.21929931640625, 0.22908782958984375, 0.2388763427734375, 0.24866485595703125, 0.258453369140625, 0.26824188232421875, 0.2780303955078125, 0.28781890869140625, 0.297607421875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 10.0, 7.0, 5.0, 9.0, 24.0, 36.0, 45.0, 68.0, 132.0, 207.0, 495.0, 1403.0, 4518.0, 19792.0, 213737.0, 755597.0, 40979.0, 7902.0, 2205.0, 696.0, 303.0, 142.0, 86.0, 55.0, 32.0, 26.0, 13.0, 11.0, 11.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.267333984375, -0.2608451843261719, -0.25435638427734375, -0.24786758422851562, -0.2413787841796875, -0.23488998413085938, -0.22840118408203125, -0.22191238403320312, -0.215423583984375, -0.20893478393554688, -0.20244598388671875, -0.19595718383789062, -0.1894683837890625, -0.18297958374023438, -0.17649078369140625, -0.17000198364257812, -0.16351318359375, -0.15702438354492188, -0.15053558349609375, -0.14404678344726562, -0.1375579833984375, -0.13106918334960938, -0.12458038330078125, -0.11809158325195312, -0.111602783203125, -0.10511398315429688, -0.09862518310546875, -0.09213638305664062, -0.0856475830078125, -0.07915878295898438, -0.07266998291015625, -0.06618118286132812, -0.0596923828125, -0.053203582763671875, -0.04671478271484375, -0.040225982666015625, -0.0337371826171875, -0.027248382568359375, -0.02075958251953125, -0.014270782470703125, -0.007781982421875, -0.001293182373046875, 0.00519561767578125, 0.011684417724609375, 0.0181732177734375, 0.024662017822265625, 0.03115081787109375, 0.037639617919921875, 0.04412841796875, 0.050617218017578125, 0.05710601806640625, 0.06359481811523438, 0.0700836181640625, 0.07657241821289062, 0.08306121826171875, 0.08955001831054688, 0.096038818359375, 0.10252761840820312, 0.10901641845703125, 0.11550521850585938, 0.1219940185546875, 0.12848281860351562, 0.13497161865234375, 0.14146041870117188, 0.14794921875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 10.0, 15.0, 38.0, 151.0, 378.0, 276.0, 89.0, 35.0, 7.0, 9.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005335807800292969, -0.0005232710391283035, -0.0005129612982273102, -0.0005026515573263168, -0.0004923418164253235, -0.00048203207552433014, -0.0004717223346233368, -0.00046141259372234344, -0.0004511028528213501, -0.00044079311192035675, -0.0004304833710193634, -0.00042017363011837006, -0.0004098638892173767, -0.00039955414831638336, -0.00038924440741539, -0.00037893466651439667, -0.0003686249256134033, -0.00035831518471241, -0.0003480054438114166, -0.0003376957029104233, -0.00032738596200942993, -0.0003170762211084366, -0.00030676648020744324, -0.0002964567393064499, -0.00028614699840545654, -0.0002758372575044632, -0.00026552751660346985, -0.0002552177757024765, -0.00024490803480148315, -0.0002345982939004898, -0.00022428855299949646, -0.0002139788120985031, -0.00020366907119750977, -0.00019335933029651642, -0.00018304958939552307, -0.00017273984849452972, -0.00016243010759353638, -0.00015212036669254303, -0.00014181062579154968, -0.00013150088489055634, -0.00012119114398956299, -0.00011088140308856964, -0.0001005716621875763, -9.026192128658295e-05, -7.99521803855896e-05, -6.964243948459625e-05, -5.9332698583602905e-05, -4.902295768260956e-05, -3.871321678161621e-05, -2.8403475880622864e-05, -1.8093734979629517e-05, -7.78399407863617e-06, 2.5257468223571777e-06, 1.2835487723350525e-05, 2.3145228624343872e-05, 3.345496952533722e-05, 4.3764710426330566e-05, 5.4074451327323914e-05, 6.438419222831726e-05, 7.469393312931061e-05, 8.500367403030396e-05, 9.53134149312973e-05, 0.00010562315583229065, 0.000115932896733284, 0.00012624263763427734]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 24.0, 67.0, 151.0, 385.0, 1278.0, 5440.0, 33291.0, 797426.0, 192295.0, 14252.0, 2827.0, 731.0, 228.0, 93.0, 33.0, 17.0, 10.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1373291015625, -0.1303882598876953, -0.12344741821289062, -0.11650657653808594, -0.10956573486328125, -0.10262489318847656, -0.09568405151367188, -0.08874320983886719, -0.0818023681640625, -0.07486152648925781, -0.06792068481445312, -0.06097984313964844, -0.05403900146484375, -0.04709815979003906, -0.040157318115234375, -0.03321647644042969, -0.026275634765625, -0.019334793090820312, -0.012393951416015625, -0.0054531097412109375, 0.00148773193359375, 0.008428573608398438, 0.015369415283203125, 0.022310256958007812, 0.0292510986328125, 0.03619194030761719, 0.043132781982421875, 0.05007362365722656, 0.05701446533203125, 0.06395530700683594, 0.07089614868164062, 0.07783699035644531, 0.08477783203125, 0.09171867370605469, 0.09865951538085938, 0.10560035705566406, 0.11254119873046875, 0.11948204040527344, 0.12642288208007812, 0.1333637237548828, 0.1403045654296875, 0.1472454071044922, 0.15418624877929688, 0.16112709045410156, 0.16806793212890625, 0.17500877380371094, 0.18194961547851562, 0.1888904571533203, 0.195831298828125, 0.2027721405029297, 0.20971298217773438, 0.21665382385253906, 0.22359466552734375, 0.23053550720214844, 0.23747634887695312, 0.2444171905517578, 0.2513580322265625, 0.2582988739013672, 0.2652397155761719, 0.27218055725097656, 0.27912139892578125, 0.28606224060058594, 0.2930030822753906, 0.2999439239501953, 0.306884765625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 9.0, 8.0, 6.0, 12.0, 17.0, 21.0, 35.0, 69.0, 114.0, 160.0, 145.0, 129.0, 106.0, 65.0, 47.0, 21.0, 19.0, 12.0, 3.0, 5.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1036376953125, -0.09825706481933594, -0.09287643432617188, -0.08749580383300781, -0.08211517333984375, -0.07673454284667969, -0.07135391235351562, -0.06597328186035156, -0.0605926513671875, -0.05521202087402344, -0.049831390380859375, -0.04445075988769531, -0.03907012939453125, -0.03368949890136719, -0.028308868408203125, -0.022928237915039062, -0.017547607421875, -0.012166976928710938, -0.006786346435546875, -0.0014057159423828125, 0.00397491455078125, 0.009355545043945312, 0.014736175537109375, 0.020116806030273438, 0.0254974365234375, 0.030878067016601562, 0.036258697509765625, 0.04163932800292969, 0.04701995849609375, 0.05240058898925781, 0.057781219482421875, 0.06316184997558594, 0.06854248046875, 0.07392311096191406, 0.07930374145507812, 0.08468437194824219, 0.09006500244140625, 0.09544563293457031, 0.10082626342773438, 0.10620689392089844, 0.1115875244140625, 0.11696815490722656, 0.12234878540039062, 0.1277294158935547, 0.13311004638671875, 0.1384906768798828, 0.14387130737304688, 0.14925193786621094, 0.154632568359375, 0.16001319885253906, 0.16539382934570312, 0.1707744598388672, 0.17615509033203125, 0.1815357208251953, 0.18691635131835938, 0.19229698181152344, 0.1976776123046875, 0.20305824279785156, 0.20843887329101562, 0.2138195037841797, 0.21920013427734375, 0.2245807647705078, 0.22996139526367188, 0.23534202575683594, 0.24072265625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 21.0, 36.0, 88.0, 185.0, 316.0, 197.0, 102.0, 44.0, 10.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1654329299926758, -1.063624620437622, -0.9618163108825684, -0.8600080609321594, -0.7581997513771057, -0.656391441822052, -0.5545831918716431, -0.45277488231658936, -0.35096657276153564, -0.24915827810764313, -0.1473499834537506, -0.04554170370101929, 0.056266605854034424, 0.15807491540908813, 0.25988316535949707, 0.3616914749145508, 0.4634997844696045, 0.5653080940246582, 0.6671164035797119, 0.7689246535301208, 0.8707329630851746, 0.9725412726402283, 1.0743495225906372, 1.176157832145691, 1.2779661417007446, 1.3797744512557983, 1.481582760810852, 1.5833909511566162, 1.68519926071167, 1.7870075702667236, 1.8888158798217773, 1.990624189376831, 2.0924324989318848, 2.1942408084869385, 2.296049118041992, 2.397857427597046, 2.4996657371520996, 2.6014740467071533, 2.703282356262207, 2.8050904273986816, 2.9068989753723145, 3.008707284927368, 3.110515594482422, 3.2123239040374756, 3.3141322135925293, 3.415940523147583, 3.5177488327026367, 3.6195569038391113, 3.721365213394165, 3.8231735229492188, 3.9249818325042725, 4.026790142059326, 4.128598213195801, 4.230406761169434, 4.332214832305908, 4.434023380279541, 4.535831451416016, 4.63763952255249, 4.739448070526123, 4.841256141662598, 4.9430646896362305, 5.044872760772705, 5.146681308746338, 5.2484893798828125, 5.350297927856445]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 7.0, 13.0, 10.0, 12.0, 8.0, 15.0, 14.0, 24.0, 22.0, 23.0, 29.0, 31.0, 32.0, 33.0, 40.0, 43.0, 51.0, 34.0, 49.0, 36.0, 46.0, 37.0, 45.0, 35.0, 35.0, 36.0, 39.0, 27.0, 27.0, 18.0, 27.0, 12.0, 15.0, 13.0, 10.0, 11.0, 13.0, 5.0, 9.0, 4.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.3125150203704834, -1.2703300714492798, -1.2281451225280762, -1.185960292816162, -1.1437753438949585, -1.1015903949737549, -1.0594055652618408, -1.0172206163406372, -0.9750356674194336, -0.93285071849823, -0.8906658291816711, -0.8484809398651123, -0.8062959909439087, -0.7641110420227051, -0.7219261527061462, -0.6797412633895874, -0.6375563144683838, -0.5953713655471802, -0.5531864762306213, -0.5110015869140625, -0.4688166379928589, -0.42663171887397766, -0.38444679975509644, -0.3422618806362152, -0.300076961517334, -0.25789204239845276, -0.21570712327957153, -0.1735222041606903, -0.13133728504180908, -0.08915236592292786, -0.04696744680404663, -0.004782527685165405, 0.03740251064300537, 0.0795874297618866, 0.12177234888076782, 0.16395726799964905, 0.20614218711853027, 0.2483271062374115, 0.2905120253562927, 0.33269694447517395, 0.3748818635940552, 0.4170667827129364, 0.4592517018318176, 0.5014365911483765, 0.5436215400695801, 0.5858064889907837, 0.6279913783073425, 0.6701762676239014, 0.712361216545105, 0.7545461654663086, 0.7967310547828674, 0.8389159440994263, 0.8811008930206299, 0.9232858419418335, 0.9654707312583923, 1.0076556205749512, 1.0498405694961548, 1.0920255184173584, 1.1342103481292725, 1.176395297050476, 1.2185802459716797, 1.2607651948928833, 1.302950143814087, 1.345134973526001, 1.3873199224472046]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 2.0, 10.0, 7.0, 7.0, 6.0, 8.0, 18.0, 28.0, 27.0, 44.0, 53.0, 81.0, 137.0, 238.0, 465.0, 973.0, 2223.0, 5479.0, 16774.0, 118767.0, 3971166.0, 57651.0, 12024.0, 4364.0, 1863.0, 837.0, 465.0, 223.0, 136.0, 98.0, 50.0, 20.0, 14.0, 9.0, 0.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.405029296875, -0.3956890106201172, -0.3863487243652344, -0.37700843811035156, -0.36766815185546875, -0.35832786560058594, -0.3489875793457031, -0.3396472930908203, -0.3303070068359375, -0.3209667205810547, -0.3116264343261719, -0.30228614807128906, -0.29294586181640625, -0.28360557556152344, -0.2742652893066406, -0.2649250030517578, -0.255584716796875, -0.2462444305419922, -0.23690414428710938, -0.22756385803222656, -0.21822357177734375, -0.20888328552246094, -0.19954299926757812, -0.1902027130126953, -0.1808624267578125, -0.1715221405029297, -0.16218185424804688, -0.15284156799316406, -0.14350128173828125, -0.13416099548339844, -0.12482070922851562, -0.11548042297363281, -0.10614013671875, -0.09679985046386719, -0.08745956420898438, -0.07811927795410156, -0.06877899169921875, -0.05943870544433594, -0.050098419189453125, -0.04075813293457031, -0.0314178466796875, -0.022077560424804688, -0.012737274169921875, -0.0033969879150390625, 0.00594329833984375, 0.015283584594726562, 0.024623870849609375, 0.03396415710449219, 0.043304443359375, 0.05264472961425781, 0.061985015869140625, 0.07132530212402344, 0.08066558837890625, 0.09000587463378906, 0.09934616088867188, 0.10868644714355469, 0.1180267333984375, 0.1273670196533203, 0.13670730590820312, 0.14604759216308594, 0.15538787841796875, 0.16472816467285156, 0.17406845092773438, 0.1834087371826172, 0.1927490234375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 12.0, 12.0, 14.0, 19.0, 38.0, 47.0, 36.0, 56.0, 69.0, 77.0, 67.0, 68.0, 76.0, 71.0, 59.0, 67.0, 50.0, 34.0, 37.0, 20.0, 20.0, 16.0, 10.0, 4.0, 8.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.17138671875, -0.1673755645751953, -0.16336441040039062, -0.15935325622558594, -0.15534210205078125, -0.15133094787597656, -0.14731979370117188, -0.1433086395263672, -0.1392974853515625, -0.1352863311767578, -0.13127517700195312, -0.12726402282714844, -0.12325286865234375, -0.11924171447753906, -0.11523056030273438, -0.11121940612792969, -0.107208251953125, -0.10319709777832031, -0.09918594360351562, -0.09517478942871094, -0.09116363525390625, -0.08715248107910156, -0.08314132690429688, -0.07913017272949219, -0.0751190185546875, -0.07110786437988281, -0.06709671020507812, -0.06308555603027344, -0.05907440185546875, -0.05506324768066406, -0.051052093505859375, -0.04704093933105469, -0.04302978515625, -0.03901863098144531, -0.035007476806640625, -0.030996322631835938, -0.02698516845703125, -0.022974014282226562, -0.018962860107421875, -0.014951705932617188, -0.0109405517578125, -0.0069293975830078125, -0.002918243408203125, 0.0010929107666015625, 0.00510406494140625, 0.009115219116210938, 0.013126373291015625, 0.017137527465820312, 0.021148681640625, 0.025159835815429688, 0.029170989990234375, 0.03318214416503906, 0.03719329833984375, 0.04120445251464844, 0.045215606689453125, 0.04922676086425781, 0.0532379150390625, 0.05724906921386719, 0.061260223388671875, 0.06527137756347656, 0.06928253173828125, 0.07329368591308594, 0.07730484008789062, 0.08131599426269531, 0.0853271484375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 10.0, 7.0, 12.0, 31.0, 39.0, 50.0, 67.0, 110.0, 171.0, 235.0, 482.0, 769.0, 1313.0, 2494.0, 4959.0, 12223.0, 46103.0, 3724894.0, 355081.0, 27429.0, 9063.0, 3963.0, 1990.0, 1085.0, 655.0, 380.0, 230.0, 152.0, 109.0, 49.0, 45.0, 31.0, 19.0, 8.0, 7.0, 3.0, 3.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1953125, -0.1887664794921875, -0.182220458984375, -0.1756744384765625, -0.16912841796875, -0.1625823974609375, -0.156036376953125, -0.1494903564453125, -0.1429443359375, -0.1363983154296875, -0.129852294921875, -0.1233062744140625, -0.11676025390625, -0.1102142333984375, -0.103668212890625, -0.0971221923828125, -0.090576171875, -0.0840301513671875, -0.077484130859375, -0.0709381103515625, -0.06439208984375, -0.0578460693359375, -0.051300048828125, -0.0447540283203125, -0.0382080078125, -0.0316619873046875, -0.025115966796875, -0.0185699462890625, -0.01202392578125, -0.0054779052734375, 0.001068115234375, 0.0076141357421875, 0.01416015625, 0.0207061767578125, 0.027252197265625, 0.0337982177734375, 0.04034423828125, 0.0468902587890625, 0.053436279296875, 0.0599822998046875, 0.0665283203125, 0.0730743408203125, 0.079620361328125, 0.0861663818359375, 0.09271240234375, 0.0992584228515625, 0.105804443359375, 0.1123504638671875, 0.118896484375, 0.1254425048828125, 0.131988525390625, 0.1385345458984375, 0.14508056640625, 0.1516265869140625, 0.158172607421875, 0.1647186279296875, 0.1712646484375, 0.1778106689453125, 0.184356689453125, 0.1909027099609375, 0.19744873046875, 0.2039947509765625, 0.210540771484375, 0.2170867919921875, 0.2236328125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 10.0, 5.0, 4.0, 6.0, 10.0, 11.0, 6.0, 20.0, 51.0, 94.0, 423.0, 2936.0, 285.0, 83.0, 42.0, 30.0, 16.0, 11.0, 9.0, 7.0, 3.0, 7.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09991455078125, -0.0965127944946289, -0.09311103820800781, -0.08970928192138672, -0.08630752563476562, -0.08290576934814453, -0.07950401306152344, -0.07610225677490234, -0.07270050048828125, -0.06929874420166016, -0.06589698791503906, -0.06249523162841797, -0.059093475341796875, -0.05569171905517578, -0.05228996276855469, -0.048888206481933594, -0.0454864501953125, -0.042084693908691406, -0.03868293762207031, -0.03528118133544922, -0.031879425048828125, -0.02847766876220703, -0.025075912475585938, -0.021674156188964844, -0.01827239990234375, -0.014870643615722656, -0.011468887329101562, -0.008067131042480469, -0.004665374755859375, -0.0012636184692382812, 0.0021381378173828125, 0.005539894104003906, 0.008941650390625, 0.012343406677246094, 0.015745162963867188, 0.01914691925048828, 0.022548675537109375, 0.02595043182373047, 0.029352188110351562, 0.032753944396972656, 0.03615570068359375, 0.039557456970214844, 0.04295921325683594, 0.04636096954345703, 0.049762725830078125, 0.05316448211669922, 0.05656623840332031, 0.059967994689941406, 0.0633697509765625, 0.0667715072631836, 0.07017326354980469, 0.07357501983642578, 0.07697677612304688, 0.08037853240966797, 0.08378028869628906, 0.08718204498291016, 0.09058380126953125, 0.09398555755615234, 0.09738731384277344, 0.10078907012939453, 0.10419082641601562, 0.10759258270263672, 0.11099433898925781, 0.1143960952758789, 0.1177978515625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 13.0, 58.0, 174.0, 328.0, 255.0, 111.0, 39.0, 15.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4735005795955658, -0.4494094252586365, -0.42531827092170715, -0.40122711658477783, -0.3771359622478485, -0.3530448079109192, -0.3289536237716675, -0.30486249923706055, -0.28077131509780884, -0.2566801607608795, -0.2325890064239502, -0.20849785208702087, -0.18440669775009155, -0.16031554341316223, -0.13622437417507172, -0.1121332198381424, -0.08804208040237427, -0.06395092606544495, -0.03985976800322533, -0.015768609941005707, 0.008322544395923615, 0.032413698732852936, 0.056504860520362854, 0.08059601485729218, 0.1046871691942215, 0.12877832353115082, 0.15286947786808014, 0.17696064710617065, 0.20105180144309998, 0.2251429557800293, 0.24923411011695862, 0.27332526445388794, 0.2974163889884949, 0.3215075433254242, 0.3455986976623535, 0.36968985199928284, 0.39378100633621216, 0.4178721606731415, 0.4419633150100708, 0.4660544991493225, 0.49014562368392944, 0.5142368078231812, 0.5383279323577881, 0.5624191164970398, 0.5865102410316467, 0.6106014251708984, 0.6346925497055054, 0.6587837338447571, 0.6828749179840088, 0.7069661021232605, 0.7310572266578674, 0.7551484107971191, 0.7792395353317261, 0.8033307194709778, 0.8274218440055847, 0.8515130281448364, 0.8756041526794434, 0.8996953368186951, 0.923786461353302, 0.9478776454925537, 0.9719687700271606, 0.9960599541664124, 1.020151138305664, 1.044242262840271, 1.068333387374878]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 7.0, 10.0, 10.0, 20.0, 37.0, 36.0, 43.0, 51.0, 63.0, 86.0, 79.0, 91.0, 75.0, 77.0, 71.0, 74.0, 55.0, 25.0, 30.0, 23.0, 15.0, 9.0, 12.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31004977226257324, -0.2992687523365021, -0.2884877026081085, -0.27770668268203735, -0.2669256329536438, -0.25614461302757263, -0.24536357820034027, -0.2345825433731079, -0.22380150854587555, -0.2130204737186432, -0.20223943889141083, -0.19145840406417847, -0.1806773841381073, -0.16989633440971375, -0.15911531448364258, -0.14833427965641022, -0.13755324482917786, -0.1267722100019455, -0.11599117517471313, -0.10521014779806137, -0.09442911297082901, -0.08364807814359665, -0.07286705076694489, -0.062086015939712524, -0.051304981112480164, -0.0405239462852478, -0.02974291518330574, -0.018961884081363678, -0.008180849254131317, 0.0026001855731010437, 0.013381212949752808, 0.02416224777698517, 0.03494328260421753, 0.04572431743144989, 0.05650534853339195, 0.06728637963533401, 0.07806741446256638, 0.08884844928979874, 0.0996294766664505, 0.11041051149368286, 0.12119154632091522, 0.13197258114814758, 0.14275361597537994, 0.1535346508026123, 0.16431567072868347, 0.17509672045707703, 0.1858777403831482, 0.19665877521038055, 0.20743981003761292, 0.21822084486484528, 0.22900187969207764, 0.2397828996181488, 0.25056394934654236, 0.2613449692726135, 0.2721260190010071, 0.28290703892707825, 0.2936880588531494, 0.3044690787792206, 0.31525012850761414, 0.3260311484336853, 0.33681219816207886, 0.34759321808815, 0.3583742380142212, 0.36915528774261475, 0.3799363374710083]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 12.0, 8.0, 20.0, 28.0, 42.0, 59.0, 85.0, 159.0, 264.0, 488.0, 891.0, 1708.0, 3500.0, 7421.0, 17548.0, 47439.0, 152569.0, 419980.0, 267551.0, 80562.0, 27452.0, 10906.0, 4846.0, 2261.0, 1188.0, 654.0, 366.0, 217.0, 112.0, 75.0, 46.0, 26.0, 17.0, 12.0, 7.0, 9.0, 4.0, 5.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.159423828125, -0.15387535095214844, -0.14832687377929688, -0.1427783966064453, -0.13722991943359375, -0.1316814422607422, -0.12613296508789062, -0.12058448791503906, -0.1150360107421875, -0.10948753356933594, -0.10393905639648438, -0.09839057922363281, -0.09284210205078125, -0.08729362487792969, -0.08174514770507812, -0.07619667053222656, -0.070648193359375, -0.06509971618652344, -0.059551239013671875, -0.05400276184082031, -0.04845428466796875, -0.04290580749511719, -0.037357330322265625, -0.03180885314941406, -0.0262603759765625, -0.020711898803710938, -0.015163421630859375, -0.009614944458007812, -0.00406646728515625, 0.0014820098876953125, 0.007030487060546875, 0.012578964233398438, 0.01812744140625, 0.023675918579101562, 0.029224395751953125, 0.03477287292480469, 0.04032135009765625, 0.04586982727050781, 0.051418304443359375, 0.05696678161621094, 0.0625152587890625, 0.06806373596191406, 0.07361221313476562, 0.07916069030761719, 0.08470916748046875, 0.09025764465332031, 0.09580612182617188, 0.10135459899902344, 0.106903076171875, 0.11245155334472656, 0.11800003051757812, 0.12354850769042969, 0.12909698486328125, 0.1346454620361328, 0.14019393920898438, 0.14574241638183594, 0.1512908935546875, 0.15683937072753906, 0.16238784790039062, 0.1679363250732422, 0.17348480224609375, 0.1790332794189453, 0.18458175659179688, 0.19013023376464844, 0.1956787109375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 8.0, 8.0, 15.0, 12.0, 23.0, 28.0, 46.0, 49.0, 60.0, 64.0, 65.0, 79.0, 74.0, 73.0, 65.0, 70.0, 64.0, 44.0, 36.0, 34.0, 19.0, 19.0, 17.0, 14.0, 7.0, 1.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.175537109375, -0.17142391204833984, -0.1673107147216797, -0.16319751739501953, -0.15908432006835938, -0.15497112274169922, -0.15085792541503906, -0.1467447280883789, -0.14263153076171875, -0.1385183334350586, -0.13440513610839844, -0.13029193878173828, -0.12617874145507812, -0.12206554412841797, -0.11795234680175781, -0.11383914947509766, -0.1097259521484375, -0.10561275482177734, -0.10149955749511719, -0.09738636016845703, -0.09327316284179688, -0.08915996551513672, -0.08504676818847656, -0.0809335708618164, -0.07682037353515625, -0.0727071762084961, -0.06859397888183594, -0.06448078155517578, -0.060367584228515625, -0.05625438690185547, -0.05214118957519531, -0.048027992248535156, -0.043914794921875, -0.039801597595214844, -0.03568840026855469, -0.03157520294189453, -0.027462005615234375, -0.02334880828857422, -0.019235610961914062, -0.015122413635253906, -0.01100921630859375, -0.006896018981933594, -0.0027828216552734375, 0.0013303756713867188, 0.005443572998046875, 0.009556770324707031, 0.013669967651367188, 0.017783164978027344, 0.0218963623046875, 0.026009559631347656, 0.030122756958007812, 0.03423595428466797, 0.038349151611328125, 0.04246234893798828, 0.04657554626464844, 0.050688743591308594, 0.05480194091796875, 0.058915138244628906, 0.06302833557128906, 0.06714153289794922, 0.07125473022460938, 0.07536792755126953, 0.07948112487792969, 0.08359432220458984, 0.08770751953125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 7.0, 4.0, 5.0, 15.0, 17.0, 17.0, 25.0, 22.0, 30.0, 36.0, 47.0, 67.0, 103.0, 164.0, 207.0, 389.0, 746.0, 1551.0, 4030.0, 11896.0, 42877.0, 240306.0, 605244.0, 104499.0, 23620.0, 7263.0, 2692.0, 1149.0, 558.0, 338.0, 186.0, 142.0, 77.0, 43.0, 44.0, 29.0, 40.0, 21.0, 14.0, 10.0, 7.0, 7.0, 5.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.272705078125, -0.26497650146484375, -0.2572479248046875, -0.24951934814453125, -0.241790771484375, -0.23406219482421875, -0.2263336181640625, -0.21860504150390625, -0.21087646484375, -0.20314788818359375, -0.1954193115234375, -0.18769073486328125, -0.179962158203125, -0.17223358154296875, -0.1645050048828125, -0.15677642822265625, -0.1490478515625, -0.14131927490234375, -0.1335906982421875, -0.12586212158203125, -0.118133544921875, -0.11040496826171875, -0.1026763916015625, -0.09494781494140625, -0.08721923828125, -0.07949066162109375, -0.0717620849609375, -0.06403350830078125, -0.056304931640625, -0.04857635498046875, -0.0408477783203125, -0.03311920166015625, -0.025390625, -0.01766204833984375, -0.0099334716796875, -0.00220489501953125, 0.005523681640625, 0.01325225830078125, 0.0209808349609375, 0.02870941162109375, 0.03643798828125, 0.04416656494140625, 0.0518951416015625, 0.05962371826171875, 0.067352294921875, 0.07508087158203125, 0.0828094482421875, 0.09053802490234375, 0.0982666015625, 0.10599517822265625, 0.1137237548828125, 0.12145233154296875, 0.129180908203125, 0.13690948486328125, 0.1446380615234375, 0.15236663818359375, 0.16009521484375, 0.16782379150390625, 0.1755523681640625, 0.18328094482421875, 0.191009521484375, 0.19873809814453125, 0.2064666748046875, 0.21419525146484375, 0.221923828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 6.0, 5.0, 9.0, 16.0, 12.0, 22.0, 15.0, 18.0, 16.0, 19.0, 17.0, 22.0, 29.0, 40.0, 30.0, 42.0, 31.0, 48.0, 34.0, 54.0, 46.0, 45.0, 29.0, 43.0, 33.0, 28.0, 30.0, 51.0, 37.0, 22.0, 20.0, 28.0, 21.0, 10.0, 11.0, 18.0, 8.0, 8.0, 3.0, 1.0, 6.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.330810546875, -0.3211669921875, -0.3115234375, -0.3018798828125, -0.292236328125, -0.2825927734375, -0.27294921875, -0.2633056640625, -0.253662109375, -0.2440185546875, -0.234375, -0.2247314453125, -0.215087890625, -0.2054443359375, -0.19580078125, -0.1861572265625, -0.176513671875, -0.1668701171875, -0.1572265625, -0.1475830078125, -0.137939453125, -0.1282958984375, -0.11865234375, -0.1090087890625, -0.099365234375, -0.0897216796875, -0.080078125, -0.0704345703125, -0.060791015625, -0.0511474609375, -0.04150390625, -0.0318603515625, -0.022216796875, -0.0125732421875, -0.0029296875, 0.0067138671875, 0.016357421875, 0.0260009765625, 0.03564453125, 0.0452880859375, 0.054931640625, 0.0645751953125, 0.07421875, 0.0838623046875, 0.093505859375, 0.1031494140625, 0.11279296875, 0.1224365234375, 0.132080078125, 0.1417236328125, 0.1513671875, 0.1610107421875, 0.170654296875, 0.1802978515625, 0.18994140625, 0.1995849609375, 0.209228515625, 0.2188720703125, 0.228515625, 0.2381591796875, 0.247802734375, 0.2574462890625, 0.26708984375, 0.2767333984375, 0.286376953125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 10.0, 12.0, 11.0, 20.0, 23.0, 43.0, 70.0, 92.0, 215.0, 327.0, 666.0, 1409.0, 3569.0, 10264.0, 38001.0, 312376.0, 601746.0, 57441.0, 13933.0, 4665.0, 1831.0, 854.0, 446.0, 212.0, 123.0, 74.0, 33.0, 34.0, 18.0, 13.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.131591796875, -0.12773609161376953, -0.12388038635253906, -0.1200246810913086, -0.11616897583007812, -0.11231327056884766, -0.10845756530761719, -0.10460186004638672, -0.10074615478515625, -0.09689044952392578, -0.09303474426269531, -0.08917903900146484, -0.08532333374023438, -0.0814676284790039, -0.07761192321777344, -0.07375621795654297, -0.0699005126953125, -0.06604480743408203, -0.06218910217285156, -0.058333396911621094, -0.054477691650390625, -0.050621986389160156, -0.04676628112792969, -0.04291057586669922, -0.03905487060546875, -0.03519916534423828, -0.03134346008300781, -0.027487754821777344, -0.023632049560546875, -0.019776344299316406, -0.015920639038085938, -0.012064933776855469, -0.008209228515625, -0.004353523254394531, -0.0004978179931640625, 0.0033578872680664062, 0.007213592529296875, 0.011069297790527344, 0.014925003051757812, 0.01878070831298828, 0.02263641357421875, 0.02649211883544922, 0.030347824096679688, 0.034203529357910156, 0.038059234619140625, 0.041914939880371094, 0.04577064514160156, 0.04962635040283203, 0.0534820556640625, 0.05733776092529297, 0.06119346618652344, 0.0650491714477539, 0.06890487670898438, 0.07276058197021484, 0.07661628723144531, 0.08047199249267578, 0.08432769775390625, 0.08818340301513672, 0.09203910827636719, 0.09589481353759766, 0.09975051879882812, 0.1036062240600586, 0.10746192932128906, 0.11131763458251953, 0.11517333984375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 3.0, 6.0, 3.0, 8.0, 22.0, 9.0, 10.0, 16.0, 24.0, 35.0, 23.0, 31.0, 43.0, 77.0, 114.0, 132.0, 120.0, 75.0, 60.0, 50.0, 38.0, 28.0, 19.0, 20.0, 14.0, 5.0, 6.0, 9.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5849552154541016e-05, -5.3017400205135345e-05, -5.0185248255729675e-05, -4.7353096306324005e-05, -4.4520944356918335e-05, -4.1688792407512665e-05, -3.8856640458106995e-05, -3.6024488508701324e-05, -3.3192336559295654e-05, -3.0360184609889984e-05, -2.7528032660484314e-05, -2.4695880711078644e-05, -2.1863728761672974e-05, -1.9031576812267303e-05, -1.6199424862861633e-05, -1.3367272913455963e-05, -1.0535120964050293e-05, -7.702969014644623e-06, -4.870817065238953e-06, -2.0386651158332825e-06, 7.934868335723877e-07, 3.625638782978058e-06, 6.457790732383728e-06, 9.289942681789398e-06, 1.2122094631195068e-05, 1.4954246580600739e-05, 1.778639853000641e-05, 2.061855047941208e-05, 2.345070242881775e-05, 2.628285437822342e-05, 2.911500632762909e-05, 3.194715827703476e-05, 3.477931022644043e-05, 3.76114621758461e-05, 4.044361412525177e-05, 4.327576607465744e-05, 4.610791802406311e-05, 4.894006997346878e-05, 5.177222192287445e-05, 5.460437387228012e-05, 5.743652582168579e-05, 6.026867777109146e-05, 6.310082972049713e-05, 6.59329816699028e-05, 6.876513361930847e-05, 7.159728556871414e-05, 7.442943751811981e-05, 7.726158946752548e-05, 8.009374141693115e-05, 8.292589336633682e-05, 8.575804531574249e-05, 8.859019726514816e-05, 9.142234921455383e-05, 9.42545011639595e-05, 9.708665311336517e-05, 9.991880506277084e-05, 0.00010275095701217651, 0.00010558310896158218, 0.00010841526091098785, 0.00011124741286039352, 0.0001140795648097992, 0.00011691171675920486, 0.00011974386870861053, 0.0001225760206580162, 0.00012540817260742188]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 2.0, 3.0, 10.0, 10.0, 20.0, 20.0, 35.0, 50.0, 72.0, 96.0, 166.0, 322.0, 606.0, 1293.0, 2860.0, 7074.0, 20673.0, 74122.0, 415575.0, 417245.0, 74435.0, 20885.0, 7341.0, 2836.0, 1280.0, 635.0, 338.0, 189.0, 126.0, 78.0, 45.0, 33.0, 21.0, 14.0, 10.0, 10.0, 10.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.105712890625, -0.10277652740478516, -0.09984016418457031, -0.09690380096435547, -0.09396743774414062, -0.09103107452392578, -0.08809471130371094, -0.0851583480834961, -0.08222198486328125, -0.0792856216430664, -0.07634925842285156, -0.07341289520263672, -0.07047653198242188, -0.06754016876220703, -0.06460380554199219, -0.061667442321777344, -0.0587310791015625, -0.055794715881347656, -0.05285835266113281, -0.04992198944091797, -0.046985626220703125, -0.04404926300048828, -0.04111289978027344, -0.038176536560058594, -0.03524017333984375, -0.032303810119628906, -0.029367446899414062, -0.02643108367919922, -0.023494720458984375, -0.02055835723876953, -0.017621994018554688, -0.014685630798339844, -0.011749267578125, -0.008812904357910156, -0.0058765411376953125, -0.0029401779174804688, -3.814697265625e-06, 0.0029325485229492188, 0.0058689117431640625, 0.008805274963378906, 0.01174163818359375, 0.014678001403808594, 0.017614364624023438, 0.02055072784423828, 0.023487091064453125, 0.02642345428466797, 0.029359817504882812, 0.032296180725097656, 0.0352325439453125, 0.038168907165527344, 0.04110527038574219, 0.04404163360595703, 0.046977996826171875, 0.04991436004638672, 0.05285072326660156, 0.055787086486816406, 0.05872344970703125, 0.061659812927246094, 0.06459617614746094, 0.06753253936767578, 0.07046890258789062, 0.07340526580810547, 0.07634162902832031, 0.07927799224853516, 0.08221435546875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 4.0, 13.0, 19.0, 28.0, 25.0, 34.0, 52.0, 66.0, 92.0, 110.0, 139.0, 107.0, 80.0, 55.0, 57.0, 30.0, 29.0, 15.0, 9.0, 11.0, 7.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.081298828125, -0.0774688720703125, -0.073638916015625, -0.0698089599609375, -0.06597900390625, -0.0621490478515625, -0.058319091796875, -0.0544891357421875, -0.0506591796875, -0.0468292236328125, -0.042999267578125, -0.0391693115234375, -0.03533935546875, -0.0315093994140625, -0.027679443359375, -0.0238494873046875, -0.02001953125, -0.0161895751953125, -0.012359619140625, -0.0085296630859375, -0.00469970703125, -0.0008697509765625, 0.002960205078125, 0.0067901611328125, 0.0106201171875, 0.0144500732421875, 0.018280029296875, 0.0221099853515625, 0.02593994140625, 0.0297698974609375, 0.033599853515625, 0.0374298095703125, 0.041259765625, 0.0450897216796875, 0.048919677734375, 0.0527496337890625, 0.05657958984375, 0.0604095458984375, 0.064239501953125, 0.0680694580078125, 0.0718994140625, 0.0757293701171875, 0.079559326171875, 0.0833892822265625, 0.08721923828125, 0.0910491943359375, 0.094879150390625, 0.0987091064453125, 0.1025390625, 0.1063690185546875, 0.110198974609375, 0.1140289306640625, 0.11785888671875, 0.1216888427734375, 0.125518798828125, 0.1293487548828125, 0.1331787109375, 0.1370086669921875, 0.140838623046875, 0.1446685791015625, 0.14849853515625, 0.1523284912109375, 0.156158447265625, 0.1599884033203125, 0.163818359375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 14.0, 62.0, 150.0, 400.0, 267.0, 94.0, 17.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.028061866760254, -0.8768825531005859, -0.7257032990455627, -0.5745240449905396, -0.4233447313308716, -0.2721654176712036, -0.12098616361618042, 0.030193090438842773, 0.18137240409851074, 0.3325516879558563, 0.4837309718132019, 0.6349102258682251, 0.7860895395278931, 0.937268853187561, 1.0884480476379395, 1.2396273612976074, 1.3908066749572754, 1.5419859886169434, 1.6931653022766113, 1.8443444967269897, 1.9955238103866577, 2.1467032432556152, 2.297882318496704, 2.449061632156372, 2.60024094581604, 2.751420259475708, 2.902599573135376, 3.053778886795044, 3.204957962036133, 3.356137275695801, 3.5073165893554688, 3.6584959030151367, 3.8096752166748047, 3.9608545303344727, 4.112033843994141, 4.263213157653809, 4.414392471313477, 4.5655717849731445, 4.7167510986328125, 4.8679304122924805, 5.019109725952148, 5.170289039611816, 5.321468353271484, 5.472647666931152, 5.62382698059082, 5.775006294250488, 5.926185607910156, 6.077364921569824, 6.228543758392334, 6.379723072052002, 6.53090238571167, 6.682081699371338, 6.833261013031006, 6.984440326690674, 7.135619640350342, 7.286798477172852, 7.4379777908325195, 7.5891571044921875, 7.7403364181518555, 7.891515731811523, 8.042695045471191, 8.19387435913086, 8.345053672790527, 8.496232986450195, 8.647412300109863]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 11.0, 4.0, 10.0, 10.0, 10.0, 12.0, 18.0, 15.0, 22.0, 28.0, 20.0, 28.0, 34.0, 25.0, 49.0, 40.0, 29.0, 37.0, 44.0, 48.0, 38.0, 46.0, 45.0, 30.0, 45.0, 36.0, 35.0, 28.0, 26.0, 39.0, 30.0, 22.0, 17.0, 11.0, 9.0, 17.0, 8.0, 11.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5384279489517212, -1.4869585037231445, -1.4354890584945679, -1.3840196132659912, -1.3325501680374146, -1.281080722808838, -1.2296111583709717, -1.1781418323516846, -1.1266722679138184, -1.0752028226852417, -1.023733377456665, -0.9722639322280884, -0.9207944869995117, -0.8693250417709351, -0.8178555369377136, -0.766386091709137, -0.7149167060852051, -0.6634472608566284, -0.6119778156280518, -0.5605083703994751, -0.5090389251708984, -0.4575694501399994, -0.40609997510910034, -0.3546305298805237, -0.303161084651947, -0.25169163942337036, -0.2002221792936325, -0.14875271916389465, -0.097283273935318, -0.04581382870674133, 0.005655646324157715, 0.057125091552734375, 0.10859441757202148, 0.16006386280059814, 0.211533322930336, 0.26300278306007385, 0.3144722282886505, 0.3659416735172272, 0.4174111485481262, 0.4688805937767029, 0.5203500390052795, 0.5718194842338562, 0.6232889294624329, 0.6747584342956543, 0.726227879524231, 0.7776973247528076, 0.8291667699813843, 0.8806362152099609, 0.9321056604385376, 0.9835751056671143, 1.035044550895691, 1.0865139961242676, 1.1379834413528442, 1.189452886581421, 1.240922451019287, 1.2923917770385742, 1.3438613414764404, 1.395330786705017, 1.4468002319335938, 1.4982696771621704, 1.549739122390747, 1.6012085676193237, 1.6526780128479004, 1.7041475772857666, 1.7556169033050537]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 1.0, 7.0, 13.0, 12.0, 14.0, 13.0, 24.0, 22.0, 28.0, 40.0, 57.0, 79.0, 105.0, 158.0, 194.0, 333.0, 618.0, 1136.0, 1845.0, 3949.0, 9611.0, 33717.0, 3206375.0, 889245.0, 29866.0, 8674.0, 3703.0, 1861.0, 921.0, 575.0, 386.0, 204.0, 135.0, 100.0, 71.0, 45.0, 35.0, 30.0, 22.0, 13.0, 17.0, 7.0, 6.0, 3.0, 5.0, 3.0, 1.0], "bins": [-0.2939453125, -0.2865886688232422, -0.2792320251464844, -0.27187538146972656, -0.26451873779296875, -0.25716209411621094, -0.24980545043945312, -0.2424488067626953, -0.2350921630859375, -0.2277355194091797, -0.22037887573242188, -0.21302223205566406, -0.20566558837890625, -0.19830894470214844, -0.19095230102539062, -0.1835956573486328, -0.176239013671875, -0.1688823699951172, -0.16152572631835938, -0.15416908264160156, -0.14681243896484375, -0.13945579528808594, -0.13209915161132812, -0.12474250793457031, -0.1173858642578125, -0.11002922058105469, -0.10267257690429688, -0.09531593322753906, -0.08795928955078125, -0.08060264587402344, -0.07324600219726562, -0.06588935852050781, -0.05853271484375, -0.05117607116699219, -0.043819427490234375, -0.03646278381347656, -0.02910614013671875, -0.021749496459960938, -0.014392852783203125, -0.0070362091064453125, 0.0003204345703125, 0.0076770782470703125, 0.015033721923828125, 0.022390365600585938, 0.02974700927734375, 0.03710365295410156, 0.044460296630859375, 0.05181694030761719, 0.059173583984375, 0.06653022766113281, 0.07388687133789062, 0.08124351501464844, 0.08860015869140625, 0.09595680236816406, 0.10331344604492188, 0.11067008972167969, 0.1180267333984375, 0.1253833770751953, 0.13274002075195312, 0.14009666442871094, 0.14745330810546875, 0.15480995178222656, 0.16216659545898438, 0.1695232391357422, 0.1768798828125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 9.0, 12.0, 17.0, 24.0, 25.0, 29.0, 40.0, 48.0, 38.0, 58.0, 75.0, 67.0, 69.0, 56.0, 72.0, 85.0, 57.0, 40.0, 51.0, 26.0, 24.0, 16.0, 18.0, 14.0, 9.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1748046875, -0.17061710357666016, -0.1664295196533203, -0.16224193572998047, -0.15805435180664062, -0.15386676788330078, -0.14967918395996094, -0.1454916000366211, -0.14130401611328125, -0.1371164321899414, -0.13292884826660156, -0.12874126434326172, -0.12455368041992188, -0.12036609649658203, -0.11617851257324219, -0.11199092864990234, -0.1078033447265625, -0.10361576080322266, -0.09942817687988281, -0.09524059295654297, -0.09105300903320312, -0.08686542510986328, -0.08267784118652344, -0.0784902572631836, -0.07430267333984375, -0.0701150894165039, -0.06592750549316406, -0.06173992156982422, -0.057552337646484375, -0.05336475372314453, -0.04917716979980469, -0.044989585876464844, -0.040802001953125, -0.036614418029785156, -0.03242683410644531, -0.02823925018310547, -0.024051666259765625, -0.01986408233642578, -0.015676498413085938, -0.011488914489746094, -0.00730133056640625, -0.0031137466430664062, 0.0010738372802734375, 0.005261421203613281, 0.009449005126953125, 0.013636589050292969, 0.017824172973632812, 0.022011756896972656, 0.0261993408203125, 0.030386924743652344, 0.03457450866699219, 0.03876209259033203, 0.042949676513671875, 0.04713726043701172, 0.05132484436035156, 0.055512428283691406, 0.05970001220703125, 0.0638875961303711, 0.06807518005371094, 0.07226276397705078, 0.07645034790039062, 0.08063793182373047, 0.08482551574707031, 0.08901309967041016, 0.09320068359375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 8.0, 4.0, 9.0, 13.0, 15.0, 25.0, 52.0, 50.0, 106.0, 156.0, 265.0, 489.0, 859.0, 1601.0, 3082.0, 6960.0, 24987.0, 1295279.0, 2819737.0, 26576.0, 7230.0, 3065.0, 1612.0, 899.0, 493.0, 296.0, 176.0, 81.0, 62.0, 35.0, 15.0, 18.0, 8.0, 6.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17724609375, -0.17016220092773438, -0.16307830810546875, -0.15599441528320312, -0.1489105224609375, -0.14182662963867188, -0.13474273681640625, -0.12765884399414062, -0.120574951171875, -0.11349105834960938, -0.10640716552734375, -0.09932327270507812, -0.0922393798828125, -0.08515548706054688, -0.07807159423828125, -0.07098770141601562, -0.06390380859375, -0.056819915771484375, -0.04973602294921875, -0.042652130126953125, -0.0355682373046875, -0.028484344482421875, -0.02140045166015625, -0.014316558837890625, -0.007232666015625, -0.000148773193359375, 0.00693511962890625, 0.014019012451171875, 0.0211029052734375, 0.028186798095703125, 0.03527069091796875, 0.042354583740234375, 0.0494384765625, 0.056522369384765625, 0.06360626220703125, 0.07069015502929688, 0.0777740478515625, 0.08485794067382812, 0.09194183349609375, 0.09902572631835938, 0.106109619140625, 0.11319351196289062, 0.12027740478515625, 0.12736129760742188, 0.1344451904296875, 0.14152908325195312, 0.14861297607421875, 0.15569686889648438, 0.16278076171875, 0.16986465454101562, 0.17694854736328125, 0.18403244018554688, 0.1911163330078125, 0.19820022583007812, 0.20528411865234375, 0.21236801147460938, 0.219451904296875, 0.22653579711914062, 0.23361968994140625, 0.24070358276367188, 0.2477874755859375, 0.2548713684082031, 0.26195526123046875, 0.2690391540527344, 0.276123046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 7.0, 13.0, 14.0, 23.0, 50.0, 89.0, 676.0, 2880.0, 141.0, 60.0, 37.0, 23.0, 13.0, 8.0, 7.0, 3.0, 2.0, 5.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1478271484375, -0.14308929443359375, -0.1383514404296875, -0.13361358642578125, -0.128875732421875, -0.12413787841796875, -0.1194000244140625, -0.11466217041015625, -0.10992431640625, -0.10518646240234375, -0.1004486083984375, -0.09571075439453125, -0.090972900390625, -0.08623504638671875, -0.0814971923828125, -0.07675933837890625, -0.072021484375, -0.06728363037109375, -0.0625457763671875, -0.05780792236328125, -0.053070068359375, -0.04833221435546875, -0.0435943603515625, -0.03885650634765625, -0.03411865234375, -0.02938079833984375, -0.0246429443359375, -0.01990509033203125, -0.015167236328125, -0.01042938232421875, -0.0056915283203125, -0.00095367431640625, 0.0037841796875, 0.00852203369140625, 0.0132598876953125, 0.01799774169921875, 0.022735595703125, 0.02747344970703125, 0.0322113037109375, 0.03694915771484375, 0.04168701171875, 0.04642486572265625, 0.0511627197265625, 0.05590057373046875, 0.060638427734375, 0.06537628173828125, 0.0701141357421875, 0.07485198974609375, 0.07958984375, 0.08432769775390625, 0.0890655517578125, 0.09380340576171875, 0.098541259765625, 0.10327911376953125, 0.1080169677734375, 0.11275482177734375, 0.11749267578125, 0.12223052978515625, 0.1269683837890625, 0.13170623779296875, 0.136444091796875, 0.14118194580078125, 0.1459197998046875, 0.15065765380859375, 0.1553955078125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 65.0, 778.0, 141.0, 18.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8055806756019592, -0.7213149666786194, -0.6370493173599243, -0.5527836084365845, -0.46851789951324463, -0.3842521905899048, -0.2999865412712097, -0.21572083234786987, -0.13145512342453003, -0.04718942940235138, 0.03707626461982727, 0.12134194374084473, 0.20560765266418457, 0.2898733615875244, 0.3741390109062195, 0.4584047198295593, 0.5426704287528992, 0.626936137676239, 0.7112017869949341, 0.7954674959182739, 0.8797332048416138, 0.9639989137649536, 1.048264503479004, 1.1325302124023438, 1.2167959213256836, 1.3010616302490234, 1.3853273391723633, 1.4695930480957031, 1.553858757019043, 1.6381244659423828, 1.722390055656433, 1.806655764579773, 1.8909215927124023, 1.9751873016357422, 2.059453010559082, 2.143718719482422, 2.2279844284057617, 2.3122501373291016, 2.3965158462524414, 2.4807815551757812, 2.565047264099121, 2.649312973022461, 2.733578681945801, 2.8178443908691406, 2.9021100997924805, 2.9863758087158203, 3.07064151763916, 3.1549072265625, 3.2391726970672607, 3.3234384059906006, 3.4077041149139404, 3.4919698238372803, 3.57623553276062, 3.66050124168396, 3.7447667121887207, 3.8290324211120605, 3.9132981300354004, 3.9975638389587402, 4.08182954788208, 4.16609525680542, 4.25036096572876, 4.3346266746521, 4.4188923835754395, 4.503158092498779, 4.587423801422119]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 3.0, 9.0, 10.0, 11.0, 25.0, 31.0, 39.0, 41.0, 60.0, 65.0, 52.0, 75.0, 70.0, 69.0, 77.0, 67.0, 48.0, 63.0, 53.0, 28.0, 29.0, 20.0, 17.0, 11.0, 11.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3940753936767578, -0.3810008764266968, -0.36792638897895813, -0.3548518717288971, -0.34177735447883606, -0.3287028670310974, -0.3156283497810364, -0.30255383253097534, -0.2894793152809143, -0.27640479803085327, -0.2633303105831146, -0.2502557933330536, -0.23718127608299255, -0.2241067737340927, -0.21103227138519287, -0.19795775413513184, -0.1848832666873932, -0.17180876433849335, -0.1587342470884323, -0.14565974473953247, -0.13258522748947144, -0.1195107251405716, -0.10643622279167175, -0.09336171299219131, -0.08028720319271088, -0.06721269339323044, -0.0541381873190403, -0.04106368124485016, -0.02798917144536972, -0.014914661645889282, -0.001840159296989441, 0.011234350502490997, 0.024308860301971436, 0.037383370101451874, 0.050457876175642014, 0.06353238224983215, 0.07660689204931259, 0.08968140184879303, 0.10275590419769287, 0.11583041399717331, 0.12890492379665375, 0.1419794261455536, 0.15505394339561462, 0.16812844574451447, 0.1812029480934143, 0.19427746534347534, 0.20735196769237518, 0.22042647004127502, 0.23350098729133606, 0.2465754896402359, 0.25964999198913574, 0.2727245092391968, 0.2857990264892578, 0.29887354373931885, 0.3119480311870575, 0.32502254843711853, 0.3380970358848572, 0.3511715531349182, 0.36424604058265686, 0.3773205578327179, 0.39039507508277893, 0.4034695625305176, 0.4165440797805786, 0.42961859703063965, 0.4426931142807007]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 7.0, 9.0, 26.0, 40.0, 55.0, 104.0, 188.0, 463.0, 1272.0, 3900.0, 14619.0, 70514.0, 523064.0, 366492.0, 51584.0, 11346.0, 3079.0, 1028.0, 386.0, 172.0, 79.0, 48.0, 16.0, 17.0, 13.0, 8.0, 7.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.371826171875, -0.36250877380371094, -0.3531913757324219, -0.3438739776611328, -0.33455657958984375, -0.3252391815185547, -0.3159217834472656, -0.30660438537597656, -0.2972869873046875, -0.28796958923339844, -0.2786521911621094, -0.2693347930908203, -0.26001739501953125, -0.2506999969482422, -0.24138259887695312, -0.23206520080566406, -0.222747802734375, -0.21343040466308594, -0.20411300659179688, -0.1947956085205078, -0.18547821044921875, -0.1761608123779297, -0.16684341430664062, -0.15752601623535156, -0.1482086181640625, -0.13889122009277344, -0.12957382202148438, -0.12025642395019531, -0.11093902587890625, -0.10162162780761719, -0.09230422973632812, -0.08298683166503906, -0.07366943359375, -0.06435203552246094, -0.055034637451171875, -0.04571723937988281, -0.03639984130859375, -0.027082443237304688, -0.017765045166015625, -0.008447647094726562, 0.0008697509765625, 0.010187149047851562, 0.019504547119140625, 0.028821945190429688, 0.03813934326171875, 0.04745674133300781, 0.056774139404296875, 0.06609153747558594, 0.075408935546875, 0.08472633361816406, 0.09404373168945312, 0.10336112976074219, 0.11267852783203125, 0.12199592590332031, 0.13131332397460938, 0.14063072204589844, 0.1499481201171875, 0.15926551818847656, 0.16858291625976562, 0.1779003143310547, 0.18721771240234375, 0.1965351104736328, 0.20585250854492188, 0.21516990661621094, 0.2244873046875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 11.0, 5.0, 15.0, 11.0, 35.0, 23.0, 31.0, 34.0, 39.0, 58.0, 51.0, 62.0, 81.0, 67.0, 61.0, 74.0, 77.0, 59.0, 46.0, 27.0, 35.0, 25.0, 14.0, 17.0, 15.0, 14.0, 6.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.171142578125, -0.16692733764648438, -0.16271209716796875, -0.15849685668945312, -0.1542816162109375, -0.15006637573242188, -0.14585113525390625, -0.14163589477539062, -0.137420654296875, -0.13320541381835938, -0.12899017333984375, -0.12477493286132812, -0.1205596923828125, -0.11634445190429688, -0.11212921142578125, -0.10791397094726562, -0.10369873046875, -0.09948348999023438, -0.09526824951171875, -0.09105300903320312, -0.0868377685546875, -0.08262252807617188, -0.07840728759765625, -0.07419204711914062, -0.069976806640625, -0.06576156616210938, -0.06154632568359375, -0.057331085205078125, -0.0531158447265625, -0.048900604248046875, -0.04468536376953125, -0.040470123291015625, -0.0362548828125, -0.032039642333984375, -0.02782440185546875, -0.023609161376953125, -0.0193939208984375, -0.015178680419921875, -0.01096343994140625, -0.006748199462890625, -0.002532958984375, 0.001682281494140625, 0.00589752197265625, 0.010112762451171875, 0.0143280029296875, 0.018543243408203125, 0.02275848388671875, 0.026973724365234375, 0.03118896484375, 0.035404205322265625, 0.03961944580078125, 0.043834686279296875, 0.0480499267578125, 0.052265167236328125, 0.05648040771484375, 0.060695648193359375, 0.064910888671875, 0.06912612915039062, 0.07334136962890625, 0.07755661010742188, 0.0817718505859375, 0.08598709106445312, 0.09020233154296875, 0.09441757202148438, 0.0986328125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 8.0, 14.0, 15.0, 24.0, 20.0, 40.0, 52.0, 67.0, 83.0, 95.0, 149.0, 285.0, 487.0, 1242.0, 5165.0, 29484.0, 359840.0, 599026.0, 42496.0, 6896.0, 1537.0, 550.0, 295.0, 186.0, 133.0, 92.0, 62.0, 56.0, 33.0, 27.0, 23.0, 16.0, 13.0, 11.0, 8.0, 9.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.385498046875, -0.3753776550292969, -0.36525726318359375, -0.3551368713378906, -0.3450164794921875, -0.3348960876464844, -0.32477569580078125, -0.3146553039550781, -0.304534912109375, -0.2944145202636719, -0.28429412841796875, -0.2741737365722656, -0.2640533447265625, -0.2539329528808594, -0.24381256103515625, -0.23369216918945312, -0.22357177734375, -0.21345138549804688, -0.20333099365234375, -0.19321060180664062, -0.1830902099609375, -0.17296981811523438, -0.16284942626953125, -0.15272903442382812, -0.142608642578125, -0.13248825073242188, -0.12236785888671875, -0.11224746704101562, -0.1021270751953125, -0.09200668334960938, -0.08188629150390625, -0.07176589965820312, -0.0616455078125, -0.051525115966796875, -0.04140472412109375, -0.031284332275390625, -0.0211639404296875, -0.011043548583984375, -0.00092315673828125, 0.009197235107421875, 0.019317626953125, 0.029438018798828125, 0.03955841064453125, 0.049678802490234375, 0.0597991943359375, 0.06991958618164062, 0.08003997802734375, 0.09016036987304688, 0.10028076171875, 0.11040115356445312, 0.12052154541015625, 0.13064193725585938, 0.1407623291015625, 0.15088272094726562, 0.16100311279296875, 0.17112350463867188, 0.181243896484375, 0.19136428833007812, 0.20148468017578125, 0.21160507202148438, 0.2217254638671875, 0.23184585571289062, 0.24196624755859375, 0.2520866394042969, 0.26220703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 4.0, 5.0, 6.0, 6.0, 5.0, 17.0, 2.0, 10.0, 10.0, 15.0, 15.0, 30.0, 20.0, 24.0, 24.0, 32.0, 28.0, 35.0, 27.0, 40.0, 37.0, 49.0, 32.0, 42.0, 48.0, 42.0, 33.0, 37.0, 24.0, 30.0, 29.0, 24.0, 24.0, 20.0, 28.0, 25.0, 18.0, 14.0, 14.0, 2.0, 12.0, 8.0, 7.0, 8.0, 8.0, 4.0, 7.0, 4.0, 7.0, 7.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.328125, -0.3183135986328125, -0.308502197265625, -0.2986907958984375, -0.28887939453125, -0.2790679931640625, -0.269256591796875, -0.2594451904296875, -0.2496337890625, -0.2398223876953125, -0.230010986328125, -0.2201995849609375, -0.21038818359375, -0.2005767822265625, -0.190765380859375, -0.1809539794921875, -0.171142578125, -0.1613311767578125, -0.151519775390625, -0.1417083740234375, -0.13189697265625, -0.1220855712890625, -0.112274169921875, -0.1024627685546875, -0.0926513671875, -0.0828399658203125, -0.073028564453125, -0.0632171630859375, -0.05340576171875, -0.0435943603515625, -0.033782958984375, -0.0239715576171875, -0.01416015625, -0.0043487548828125, 0.005462646484375, 0.0152740478515625, 0.02508544921875, 0.0348968505859375, 0.044708251953125, 0.0545196533203125, 0.0643310546875, 0.0741424560546875, 0.083953857421875, 0.0937652587890625, 0.10357666015625, 0.1133880615234375, 0.123199462890625, 0.1330108642578125, 0.142822265625, 0.1526336669921875, 0.162445068359375, 0.1722564697265625, 0.18206787109375, 0.1918792724609375, 0.201690673828125, 0.2115020751953125, 0.2213134765625, 0.2311248779296875, 0.240936279296875, 0.2507476806640625, 0.26055908203125, 0.2703704833984375, 0.280181884765625, 0.2899932861328125, 0.2998046875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 9.0, 9.0, 14.0, 17.0, 43.0, 43.0, 43.0, 73.0, 133.0, 212.0, 306.0, 523.0, 759.0, 1376.0, 2532.0, 5005.0, 10865.0, 31268.0, 232107.0, 679824.0, 53790.0, 15404.0, 6683.0, 3149.0, 1724.0, 995.0, 618.0, 363.0, 213.0, 133.0, 108.0, 65.0, 47.0, 34.0, 18.0, 17.0, 10.0, 5.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11114501953125, -0.10758113861083984, -0.10401725769042969, -0.10045337677001953, -0.09688949584960938, -0.09332561492919922, -0.08976173400878906, -0.0861978530883789, -0.08263397216796875, -0.0790700912475586, -0.07550621032714844, -0.07194232940673828, -0.06837844848632812, -0.06481456756591797, -0.06125068664550781, -0.057686805725097656, -0.0541229248046875, -0.050559043884277344, -0.04699516296386719, -0.04343128204345703, -0.039867401123046875, -0.03630352020263672, -0.03273963928222656, -0.029175758361816406, -0.02561187744140625, -0.022047996520996094, -0.018484115600585938, -0.014920234680175781, -0.011356353759765625, -0.007792472839355469, -0.0042285919189453125, -0.0006647109985351562, 0.002899169921875, 0.006463050842285156, 0.010026931762695312, 0.013590812683105469, 0.017154693603515625, 0.02071857452392578, 0.024282455444335938, 0.027846336364746094, 0.03141021728515625, 0.034974098205566406, 0.03853797912597656, 0.04210186004638672, 0.045665740966796875, 0.04922962188720703, 0.05279350280761719, 0.056357383728027344, 0.0599212646484375, 0.06348514556884766, 0.06704902648925781, 0.07061290740966797, 0.07417678833007812, 0.07774066925048828, 0.08130455017089844, 0.0848684310913086, 0.08843231201171875, 0.0919961929321289, 0.09556007385253906, 0.09912395477294922, 0.10268783569335938, 0.10625171661376953, 0.10981559753417969, 0.11337947845458984, 0.116943359375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 4.0, 2.0, 8.0, 9.0, 10.0, 10.0, 21.0, 19.0, 29.0, 28.0, 38.0, 41.0, 66.0, 70.0, 82.0, 83.0, 101.0, 76.0, 63.0, 52.0, 40.0, 32.0, 28.0, 22.0, 16.0, 10.0, 11.0, 10.0, 6.0, 4.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.89897346496582e-05, -8.60951840877533e-05, -8.320063352584839e-05, -8.030608296394348e-05, -7.741153240203857e-05, -7.451698184013367e-05, -7.162243127822876e-05, -6.872788071632385e-05, -6.583333015441895e-05, -6.293877959251404e-05, -6.004422903060913e-05, -5.7149678468704224e-05, -5.4255127906799316e-05, -5.136057734489441e-05, -4.84660267829895e-05, -4.5571476221084595e-05, -4.267692565917969e-05, -3.978237509727478e-05, -3.688782453536987e-05, -3.3993273973464966e-05, -3.109872341156006e-05, -2.820417284965515e-05, -2.5309622287750244e-05, -2.2415071725845337e-05, -1.952052116394043e-05, -1.6625970602035522e-05, -1.3731420040130615e-05, -1.0836869478225708e-05, -7.9423189163208e-06, -5.0477683544158936e-06, -2.1532177925109863e-06, 7.413327693939209e-07, 3.635883331298828e-06, 6.530433893203735e-06, 9.424984455108643e-06, 1.231953501701355e-05, 1.5214085578918457e-05, 1.8108636140823364e-05, 2.100318670272827e-05, 2.389773726463318e-05, 2.6792287826538086e-05, 2.9686838388442993e-05, 3.25813889503479e-05, 3.547593951225281e-05, 3.8370490074157715e-05, 4.126504063606262e-05, 4.415959119796753e-05, 4.7054141759872437e-05, 4.9948692321777344e-05, 5.284324288368225e-05, 5.573779344558716e-05, 5.8632344007492065e-05, 6.152689456939697e-05, 6.442144513130188e-05, 6.731599569320679e-05, 7.02105462551117e-05, 7.31050968170166e-05, 7.599964737892151e-05, 7.889419794082642e-05, 8.178874850273132e-05, 8.468329906463623e-05, 8.757784962654114e-05, 9.047240018844604e-05, 9.336695075035095e-05, 9.626150131225586e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 14.0, 19.0, 16.0, 26.0, 44.0, 79.0, 113.0, 189.0, 305.0, 567.0, 957.0, 1631.0, 3173.0, 7040.0, 20140.0, 110660.0, 778897.0, 92848.0, 18414.0, 6488.0, 3046.0, 1615.0, 917.0, 586.0, 290.0, 171.0, 115.0, 73.0, 53.0, 18.0, 20.0, 12.0, 10.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1376953125, -0.1340198516845703, -0.13034439086914062, -0.12666893005371094, -0.12299346923828125, -0.11931800842285156, -0.11564254760742188, -0.11196708679199219, -0.1082916259765625, -0.10461616516113281, -0.10094070434570312, -0.09726524353027344, -0.09358978271484375, -0.08991432189941406, -0.08623886108398438, -0.08256340026855469, -0.078887939453125, -0.07521247863769531, -0.07153701782226562, -0.06786155700683594, -0.06418609619140625, -0.06051063537597656, -0.056835174560546875, -0.05315971374511719, -0.0494842529296875, -0.04580879211425781, -0.042133331298828125, -0.03845787048339844, -0.03478240966796875, -0.031106948852539062, -0.027431488037109375, -0.023756027221679688, -0.02008056640625, -0.016405105590820312, -0.012729644775390625, -0.009054183959960938, -0.00537872314453125, -0.0017032623291015625, 0.001972198486328125, 0.0056476593017578125, 0.0093231201171875, 0.012998580932617188, 0.016674041748046875, 0.020349502563476562, 0.02402496337890625, 0.027700424194335938, 0.031375885009765625, 0.03505134582519531, 0.038726806640625, 0.04240226745605469, 0.046077728271484375, 0.04975318908691406, 0.05342864990234375, 0.05710411071777344, 0.060779571533203125, 0.06445503234863281, 0.0681304931640625, 0.07180595397949219, 0.07548141479492188, 0.07915687561035156, 0.08283233642578125, 0.08650779724121094, 0.09018325805664062, 0.09385871887207031, 0.0975341796875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 7.0, 7.0, 5.0, 7.0, 14.0, 15.0, 23.0, 30.0, 56.0, 70.0, 118.0, 153.0, 153.0, 114.0, 82.0, 50.0, 26.0, 16.0, 12.0, 11.0, 3.0, 10.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.134521484375, -0.13057327270507812, -0.12662506103515625, -0.12267684936523438, -0.1187286376953125, -0.11478042602539062, -0.11083221435546875, -0.10688400268554688, -0.102935791015625, -0.09898757934570312, -0.09503936767578125, -0.09109115600585938, -0.0871429443359375, -0.08319473266601562, -0.07924652099609375, -0.07529830932617188, -0.07135009765625, -0.06740188598632812, -0.06345367431640625, -0.059505462646484375, -0.0555572509765625, -0.051609039306640625, -0.04766082763671875, -0.043712615966796875, -0.039764404296875, -0.035816192626953125, -0.03186798095703125, -0.027919769287109375, -0.0239715576171875, -0.020023345947265625, -0.01607513427734375, -0.012126922607421875, -0.0081787109375, -0.004230499267578125, -0.00028228759765625, 0.003665924072265625, 0.0076141357421875, 0.011562347412109375, 0.01551055908203125, 0.019458770751953125, 0.023406982421875, 0.027355194091796875, 0.03130340576171875, 0.035251617431640625, 0.0391998291015625, 0.043148040771484375, 0.04709625244140625, 0.051044464111328125, 0.05499267578125, 0.058940887451171875, 0.06288909912109375, 0.06683731079101562, 0.0707855224609375, 0.07473373413085938, 0.07868194580078125, 0.08263015747070312, 0.086578369140625, 0.09052658081054688, 0.09447479248046875, 0.09842300415039062, 0.1023712158203125, 0.10631942749023438, 0.11026763916015625, 0.11421585083007812, 0.1181640625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 10.0, 16.0, 60.0, 116.0, 180.0, 221.0, 192.0, 97.0, 59.0, 28.0, 16.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0002601146697998, -0.9190535545349121, -0.8378469944000244, -0.7566404342651367, -0.675433874130249, -0.5942273139953613, -0.5130207538604736, -0.43181419372558594, -0.35060763359069824, -0.26940107345581055, -0.18819451332092285, -0.10698795318603516, -0.02578139305114746, 0.055425167083740234, 0.13663172721862793, 0.21783828735351562, 0.2990448474884033, 0.380251407623291, 0.4614579677581787, 0.5426645278930664, 0.6238710880279541, 0.7050776481628418, 0.7862842082977295, 0.8674907684326172, 0.9486973285675049, 1.0299038887023926, 1.1111104488372803, 1.192317008972168, 1.2735235691070557, 1.3547301292419434, 1.435936689376831, 1.5171432495117188, 1.5983495712280273, 1.679556131362915, 1.7607626914978027, 1.8419692516326904, 1.9231758117675781, 2.004382371902466, 2.0855889320373535, 2.166795492172241, 2.248002052307129, 2.3292086124420166, 2.4104151725769043, 2.491621732711792, 2.5728282928466797, 2.6540348529815674, 2.735241413116455, 2.8164479732513428, 2.8976545333862305, 2.978861093521118, 3.060067653656006, 3.1412742137908936, 3.2224807739257812, 3.303687334060669, 3.3848938941955566, 3.4661004543304443, 3.547307014465332, 3.6285135746002197, 3.7097201347351074, 3.790926694869995, 3.872133255004883, 3.9533398151397705, 4.034546375274658, 4.115753173828125, 4.196959495544434]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 9.0, 7.0, 13.0, 19.0, 26.0, 23.0, 25.0, 34.0, 38.0, 43.0, 53.0, 46.0, 54.0, 67.0, 52.0, 64.0, 57.0, 55.0, 57.0, 32.0, 30.0, 43.0, 25.0, 27.0, 17.0, 19.0, 10.0, 13.0, 6.0, 7.0, 7.0, 4.0, 6.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.409971237182617, -2.3364856243133545, -2.263000249862671, -2.189514636993408, -2.1160292625427246, -2.042543649673462, -1.9690580368041992, -1.895572543144226, -1.822087049484253, -1.7486015558242798, -1.6751160621643066, -1.601630449295044, -1.5281449556350708, -1.4546594619750977, -1.381173849105835, -1.3076883554458618, -1.2342028617858887, -1.1607173681259155, -1.0872318744659424, -1.0137462615966797, -0.9402607679367065, -0.8667752742767334, -0.7932897210121155, -0.7198041677474976, -0.6463186740875244, -0.5728331804275513, -0.49934762716293335, -0.4258621037006378, -0.3523765802383423, -0.27889105677604675, -0.20540553331375122, -0.1319199800491333, -0.05843472480773926, 0.015050798654556274, 0.0885363221168518, 0.16202184557914734, 0.23550736904144287, 0.3089928925037384, 0.38247841596603394, 0.45596396923065186, 0.529449462890625, 0.6029349565505981, 0.6764205098152161, 0.749906063079834, 0.8233915567398071, 0.8968770503997803, 0.9703626036643982, 1.0438481569290161, 1.1173336505889893, 1.1908191442489624, 1.2643046379089355, 1.3377902507781982, 1.4112757444381714, 1.4847612380981445, 1.5582468509674072, 1.6317323446273804, 1.7052178382873535, 1.7787033319473267, 1.8521888256072998, 1.9256744384765625, 1.9991599321365356, 2.072645425796509, 2.1461310386657715, 2.219616413116455, 2.2931020259857178]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 9.0, 5.0, 24.0, 36.0, 86.0, 207.0, 704.0, 5970.0, 4136410.0, 48134.0, 2064.0, 378.0, 120.0, 50.0, 27.0, 16.0, 6.0, 6.0, 3.0, 6.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.5380859375, -0.5270500183105469, -0.5160140991210938, -0.5049781799316406, -0.4939422607421875, -0.4829063415527344, -0.47187042236328125, -0.4608345031738281, -0.449798583984375, -0.4387626647949219, -0.42772674560546875, -0.4166908264160156, -0.4056549072265625, -0.3946189880371094, -0.38358306884765625, -0.3725471496582031, -0.36151123046875, -0.3504753112792969, -0.33943939208984375, -0.3284034729003906, -0.3173675537109375, -0.3063316345214844, -0.29529571533203125, -0.2842597961425781, -0.273223876953125, -0.2621879577636719, -0.25115203857421875, -0.24011611938476562, -0.2290802001953125, -0.21804428100585938, -0.20700836181640625, -0.19597244262695312, -0.1849365234375, -0.17390060424804688, -0.16286468505859375, -0.15182876586914062, -0.1407928466796875, -0.12975692749023438, -0.11872100830078125, -0.10768508911132812, -0.096649169921875, -0.08561325073242188, -0.07457733154296875, -0.06354141235351562, -0.0525054931640625, -0.041469573974609375, -0.03043365478515625, -0.019397735595703125, -0.00836181640625, 0.002674102783203125, 0.01371002197265625, 0.024745941162109375, 0.0357818603515625, 0.046817779541015625, 0.05785369873046875, 0.06888961791992188, 0.079925537109375, 0.09096145629882812, 0.10199737548828125, 0.11303329467773438, 0.1240692138671875, 0.13510513305664062, 0.14614105224609375, 0.15717697143554688, 0.168212890625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 11.0, 6.0, 12.0, 13.0, 15.0, 28.0, 25.0, 38.0, 55.0, 44.0, 60.0, 54.0, 73.0, 66.0, 68.0, 56.0, 51.0, 47.0, 51.0, 44.0, 43.0, 27.0, 29.0, 15.0, 18.0, 17.0, 13.0, 6.0, 9.0, 4.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0], "bins": [-0.17529296875, -0.17093753814697266, -0.1665821075439453, -0.16222667694091797, -0.15787124633789062, -0.15351581573486328, -0.14916038513183594, -0.1448049545288086, -0.14044952392578125, -0.1360940933227539, -0.13173866271972656, -0.12738323211669922, -0.12302780151367188, -0.11867237091064453, -0.11431694030761719, -0.10996150970458984, -0.1056060791015625, -0.10125064849853516, -0.09689521789550781, -0.09253978729248047, -0.08818435668945312, -0.08382892608642578, -0.07947349548339844, -0.0751180648803711, -0.07076263427734375, -0.0664072036743164, -0.06205177307128906, -0.05769634246826172, -0.053340911865234375, -0.04898548126220703, -0.04463005065917969, -0.040274620056152344, -0.035919189453125, -0.031563758850097656, -0.027208328247070312, -0.02285289764404297, -0.018497467041015625, -0.014142036437988281, -0.009786605834960938, -0.005431175231933594, -0.00107574462890625, 0.0032796859741210938, 0.0076351165771484375, 0.011990547180175781, 0.016345977783203125, 0.02070140838623047, 0.025056838989257812, 0.029412269592285156, 0.0337677001953125, 0.038123130798339844, 0.04247856140136719, 0.04683399200439453, 0.051189422607421875, 0.05554485321044922, 0.05990028381347656, 0.0642557144165039, 0.06861114501953125, 0.0729665756225586, 0.07732200622558594, 0.08167743682861328, 0.08603286743164062, 0.09038829803466797, 0.09474372863769531, 0.09909915924072266, 0.10345458984375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 7.0, 0.0, 8.0, 6.0, 8.0, 14.0, 17.0, 22.0, 23.0, 37.0, 70.0, 79.0, 113.0, 164.0, 276.0, 371.0, 694.0, 1628.0, 5222.0, 28842.0, 3970184.0, 168437.0, 12371.0, 2989.0, 1104.0, 530.0, 340.0, 227.0, 166.0, 112.0, 61.0, 49.0, 29.0, 24.0, 23.0, 15.0, 10.0, 10.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.124267578125, -0.12122058868408203, -0.11817359924316406, -0.1151266098022461, -0.11207962036132812, -0.10903263092041016, -0.10598564147949219, -0.10293865203857422, -0.09989166259765625, -0.09684467315673828, -0.09379768371582031, -0.09075069427490234, -0.08770370483398438, -0.0846567153930664, -0.08160972595214844, -0.07856273651123047, -0.0755157470703125, -0.07246875762939453, -0.06942176818847656, -0.0663747787475586, -0.06332778930664062, -0.060280799865722656, -0.05723381042480469, -0.05418682098388672, -0.05113983154296875, -0.04809284210205078, -0.04504585266113281, -0.041998863220214844, -0.038951873779296875, -0.035904884338378906, -0.03285789489746094, -0.02981090545654297, -0.026763916015625, -0.02371692657470703, -0.020669937133789062, -0.017622947692871094, -0.014575958251953125, -0.011528968811035156, -0.008481979370117188, -0.005434989929199219, -0.00238800048828125, 0.0006589889526367188, 0.0037059783935546875, 0.006752967834472656, 0.009799957275390625, 0.012846946716308594, 0.015893936157226562, 0.01894092559814453, 0.0219879150390625, 0.02503490447998047, 0.028081893920898438, 0.031128883361816406, 0.034175872802734375, 0.037222862243652344, 0.04026985168457031, 0.04331684112548828, 0.04636383056640625, 0.04941082000732422, 0.05245780944824219, 0.055504798889160156, 0.058551788330078125, 0.061598777770996094, 0.06464576721191406, 0.06769275665283203, 0.07073974609375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 9.0, 8.0, 6.0, 17.0, 40.0, 110.0, 3269.0, 474.0, 79.0, 31.0, 11.0, 10.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0209503173828125, -0.02013993263244629, -0.019329547882080078, -0.018519163131713867, -0.017708778381347656, -0.016898393630981445, -0.016088008880615234, -0.015277624130249023, -0.014467239379882812, -0.013656854629516602, -0.01284646987915039, -0.01203608512878418, -0.011225700378417969, -0.010415315628051758, -0.009604930877685547, -0.008794546127319336, -0.007984161376953125, -0.007173776626586914, -0.006363391876220703, -0.005553007125854492, -0.004742622375488281, -0.00393223762512207, -0.0031218528747558594, -0.0023114681243896484, -0.0015010833740234375, -0.0006906986236572266, 0.00011968612670898438, 0.0009300708770751953, 0.0017404556274414062, 0.002550840377807617, 0.003361225128173828, 0.004171609878540039, 0.00498199462890625, 0.005792379379272461, 0.006602764129638672, 0.007413148880004883, 0.008223533630371094, 0.009033918380737305, 0.009844303131103516, 0.010654687881469727, 0.011465072631835938, 0.012275457382202148, 0.01308584213256836, 0.01389622688293457, 0.014706611633300781, 0.015516996383666992, 0.016327381134033203, 0.017137765884399414, 0.017948150634765625, 0.018758535385131836, 0.019568920135498047, 0.020379304885864258, 0.02118968963623047, 0.02200007438659668, 0.02281045913696289, 0.0236208438873291, 0.024431228637695312, 0.025241613388061523, 0.026051998138427734, 0.026862382888793945, 0.027672767639160156, 0.028483152389526367, 0.029293537139892578, 0.03010392189025879, 0.030914306640625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 13.0, 30.0, 180.0, 415.0, 293.0, 70.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.35568585991859436, -0.34867897629737854, -0.3416720926761627, -0.3346652090549469, -0.3276583254337311, -0.32065144181251526, -0.31364455819129944, -0.3066376745700836, -0.2996307909488678, -0.292623907327652, -0.28561702370643616, -0.27861014008522034, -0.2716032564640045, -0.2645963728427887, -0.2575894892215729, -0.25058260560035706, -0.24357573688030243, -0.2365688532590866, -0.2295619696378708, -0.22255508601665497, -0.21554820239543915, -0.20854131877422333, -0.2015344500541687, -0.19452756643295288, -0.18752068281173706, -0.18051379919052124, -0.17350691556930542, -0.1665000319480896, -0.15949314832687378, -0.15248626470565796, -0.14547938108444214, -0.13847249746322632, -0.1314656287431717, -0.12445874512195587, -0.11745186150074005, -0.11044497787952423, -0.10343809425830841, -0.09643121063709259, -0.08942433446645737, -0.08241745084524155, -0.07541056722402573, -0.0684036836028099, -0.061396799981594086, -0.054389920085668564, -0.047383036464452744, -0.04037615284323692, -0.0333692729473114, -0.02636238932609558, -0.01935550570487976, -0.012348623014986515, -0.005341740325093269, 0.0016651414334774017, 0.008672025054693222, 0.015678908675909042, 0.022685788571834564, 0.029692672193050385, 0.036699555814266205, 0.043706439435482025, 0.050713323056697845, 0.05772020295262337, 0.06472708284854889, 0.07173396646976471, 0.07874085009098053, 0.08574773371219635, 0.09275461733341217]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 4.0, 3.0, 5.0, 4.0, 10.0, 9.0, 15.0, 20.0, 10.0, 15.0, 18.0, 20.0, 27.0, 27.0, 23.0, 38.0, 37.0, 47.0, 48.0, 39.0, 56.0, 50.0, 54.0, 51.0, 56.0, 41.0, 50.0, 38.0, 31.0, 25.0, 25.0, 21.0, 21.0, 15.0, 9.0, 9.0, 12.0, 9.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.04060918092727661, -0.03935711085796356, -0.03810504078865051, -0.03685297071933746, -0.035600900650024414, -0.034348830580711365, -0.033096760511398315, -0.031844690442085266, -0.030592620372772217, -0.029340550303459167, -0.028088480234146118, -0.02683641016483307, -0.02558434009552002, -0.02433227002620697, -0.02308019995689392, -0.02182812988758087, -0.020576059818267822, -0.019323989748954773, -0.018071919679641724, -0.016819849610328674, -0.015567779541015625, -0.014315709471702576, -0.013063639402389526, -0.011811569333076477, -0.010559499263763428, -0.009307429194450378, -0.008055359125137329, -0.00680328905582428, -0.0055512189865112305, -0.004299148917198181, -0.003047078847885132, -0.0017950087785720825, -0.0005429387092590332, 0.0007091313600540161, 0.0019612014293670654, 0.0032132714986801147, 0.004465341567993164, 0.005717411637306213, 0.006969481706619263, 0.008221551775932312, 0.009473621845245361, 0.01072569191455841, 0.01197776198387146, 0.01322983205318451, 0.014481902122497559, 0.015733972191810608, 0.016986042261123657, 0.018238112330436707, 0.019490182399749756, 0.020742252469062805, 0.021994322538375854, 0.023246392607688904, 0.024498462677001953, 0.025750532746315002, 0.027002602815628052, 0.0282546728849411, 0.02950674295425415, 0.0307588130235672, 0.03201088309288025, 0.0332629531621933, 0.03451502323150635, 0.0357670933008194, 0.037019163370132446, 0.038271233439445496, 0.039523303508758545]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 8.0, 5.0, 12.0, 8.0, 16.0, 25.0, 41.0, 82.0, 126.0, 185.0, 357.0, 711.0, 1766.0, 4891.0, 17222.0, 78759.0, 494945.0, 370648.0, 58201.0, 13578.0, 4131.0, 1460.0, 629.0, 302.0, 164.0, 107.0, 59.0, 46.0, 27.0, 18.0, 12.0, 9.0, 2.0, 6.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0], "bins": [-0.3408203125, -0.332489013671875, -0.32415771484375, -0.315826416015625, -0.3074951171875, -0.299163818359375, -0.29083251953125, -0.282501220703125, -0.274169921875, -0.265838623046875, -0.25750732421875, -0.249176025390625, -0.2408447265625, -0.232513427734375, -0.22418212890625, -0.215850830078125, -0.20751953125, -0.199188232421875, -0.19085693359375, -0.182525634765625, -0.1741943359375, -0.165863037109375, -0.15753173828125, -0.149200439453125, -0.140869140625, -0.132537841796875, -0.12420654296875, -0.115875244140625, -0.1075439453125, -0.099212646484375, -0.09088134765625, -0.082550048828125, -0.07421875, -0.065887451171875, -0.05755615234375, -0.049224853515625, -0.0408935546875, -0.032562255859375, -0.02423095703125, -0.015899658203125, -0.007568359375, 0.000762939453125, 0.00909423828125, 0.017425537109375, 0.0257568359375, 0.034088134765625, 0.04241943359375, 0.050750732421875, 0.05908203125, 0.067413330078125, 0.07574462890625, 0.084075927734375, 0.0924072265625, 0.100738525390625, 0.10906982421875, 0.117401123046875, 0.125732421875, 0.134063720703125, 0.14239501953125, 0.150726318359375, 0.1590576171875, 0.167388916015625, 0.17572021484375, 0.184051513671875, 0.1923828125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 11.0, 5.0, 20.0, 11.0, 25.0, 29.0, 38.0, 46.0, 48.0, 46.0, 57.0, 65.0, 70.0, 68.0, 53.0, 46.0, 54.0, 49.0, 44.0, 45.0, 34.0, 34.0, 17.0, 16.0, 17.0, 15.0, 11.0, 6.0, 6.0, 5.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0], "bins": [-0.1724853515625, -0.1682415008544922, -0.16399765014648438, -0.15975379943847656, -0.15550994873046875, -0.15126609802246094, -0.14702224731445312, -0.1427783966064453, -0.1385345458984375, -0.1342906951904297, -0.13004684448242188, -0.12580299377441406, -0.12155914306640625, -0.11731529235839844, -0.11307144165039062, -0.10882759094238281, -0.104583740234375, -0.10033988952636719, -0.09609603881835938, -0.09185218811035156, -0.08760833740234375, -0.08336448669433594, -0.07912063598632812, -0.07487678527832031, -0.0706329345703125, -0.06638908386230469, -0.062145233154296875, -0.05790138244628906, -0.05365753173828125, -0.04941368103027344, -0.045169830322265625, -0.04092597961425781, -0.03668212890625, -0.03243827819824219, -0.028194427490234375, -0.023950576782226562, -0.01970672607421875, -0.015462875366210938, -0.011219024658203125, -0.0069751739501953125, -0.0027313232421875, 0.0015125274658203125, 0.005756378173828125, 0.010000228881835938, 0.01424407958984375, 0.018487930297851562, 0.022731781005859375, 0.026975631713867188, 0.031219482421875, 0.03546333312988281, 0.039707183837890625, 0.04395103454589844, 0.04819488525390625, 0.05243873596191406, 0.056682586669921875, 0.06092643737792969, 0.0651702880859375, 0.06941413879394531, 0.07365798950195312, 0.07790184020996094, 0.08214569091796875, 0.08638954162597656, 0.09063339233398438, 0.09487724304199219, 0.09912109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 7.0, 9.0, 17.0, 17.0, 19.0, 22.0, 37.0, 55.0, 64.0, 92.0, 178.0, 265.0, 497.0, 1279.0, 4871.0, 34055.0, 679603.0, 302323.0, 19794.0, 3279.0, 947.0, 415.0, 255.0, 136.0, 81.0, 82.0, 49.0, 35.0, 26.0, 14.0, 12.0, 6.0, 5.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.343017578125, -0.33025360107421875, -0.3174896240234375, -0.30472564697265625, -0.291961669921875, -0.27919769287109375, -0.2664337158203125, -0.25366973876953125, -0.24090576171875, -0.22814178466796875, -0.2153778076171875, -0.20261383056640625, -0.189849853515625, -0.17708587646484375, -0.1643218994140625, -0.15155792236328125, -0.1387939453125, -0.12602996826171875, -0.1132659912109375, -0.10050201416015625, -0.087738037109375, -0.07497406005859375, -0.0622100830078125, -0.04944610595703125, -0.03668212890625, -0.02391815185546875, -0.0111541748046875, 0.00160980224609375, 0.014373779296875, 0.02713775634765625, 0.0399017333984375, 0.05266571044921875, 0.0654296875, 0.07819366455078125, 0.0909576416015625, 0.10372161865234375, 0.116485595703125, 0.12924957275390625, 0.1420135498046875, 0.15477752685546875, 0.16754150390625, 0.18030548095703125, 0.1930694580078125, 0.20583343505859375, 0.218597412109375, 0.23136138916015625, 0.2441253662109375, 0.25688934326171875, 0.2696533203125, 0.28241729736328125, 0.2951812744140625, 0.30794525146484375, 0.320709228515625, 0.33347320556640625, 0.3462371826171875, 0.35900115966796875, 0.37176513671875, 0.38452911376953125, 0.3972930908203125, 0.41005706787109375, 0.422821044921875, 0.43558502197265625, 0.4483489990234375, 0.46111297607421875, 0.473876953125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 12.0, 9.0, 5.0, 18.0, 13.0, 22.0, 20.0, 41.0, 35.0, 39.0, 52.0, 56.0, 70.0, 59.0, 62.0, 78.0, 56.0, 62.0, 60.0, 50.0, 44.0, 30.0, 20.0, 23.0, 18.0, 24.0, 5.0, 10.0, 12.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.716796875, -0.6979942321777344, -0.6791915893554688, -0.6603889465332031, -0.6415863037109375, -0.6227836608886719, -0.6039810180664062, -0.5851783752441406, -0.566375732421875, -0.5475730895996094, -0.5287704467773438, -0.5099678039550781, -0.4911651611328125, -0.4723625183105469, -0.45355987548828125, -0.4347572326660156, -0.41595458984375, -0.3971519470214844, -0.37834930419921875, -0.3595466613769531, -0.3407440185546875, -0.3219413757324219, -0.30313873291015625, -0.2843360900878906, -0.265533447265625, -0.24673080444335938, -0.22792816162109375, -0.20912551879882812, -0.1903228759765625, -0.17152023315429688, -0.15271759033203125, -0.13391494750976562, -0.1151123046875, -0.09630966186523438, -0.07750701904296875, -0.058704376220703125, -0.0399017333984375, -0.021099090576171875, -0.00229644775390625, 0.016506195068359375, 0.035308837890625, 0.054111480712890625, 0.07291412353515625, 0.09171676635742188, 0.1105194091796875, 0.12932205200195312, 0.14812469482421875, 0.16692733764648438, 0.18572998046875, 0.20453262329101562, 0.22333526611328125, 0.24213790893554688, 0.2609405517578125, 0.2797431945800781, 0.29854583740234375, 0.3173484802246094, 0.336151123046875, 0.3549537658691406, 0.37375640869140625, 0.3925590515136719, 0.4113616943359375, 0.4301643371582031, 0.44896697998046875, 0.4677696228027344, 0.486572265625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 12.0, 9.0, 20.0, 37.0, 52.0, 102.0, 187.0, 448.0, 1375.0, 6197.0, 74370.0, 932338.0, 28167.0, 3673.0, 872.0, 320.0, 137.0, 80.0, 56.0, 37.0, 14.0, 12.0, 8.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.33349609375, -0.32349395751953125, -0.3134918212890625, -0.30348968505859375, -0.293487548828125, -0.28348541259765625, -0.2734832763671875, -0.26348114013671875, -0.25347900390625, -0.24347686767578125, -0.2334747314453125, -0.22347259521484375, -0.213470458984375, -0.20346832275390625, -0.1934661865234375, -0.18346405029296875, -0.1734619140625, -0.16345977783203125, -0.1534576416015625, -0.14345550537109375, -0.133453369140625, -0.12345123291015625, -0.1134490966796875, -0.10344696044921875, -0.09344482421875, -0.08344268798828125, -0.0734405517578125, -0.06343841552734375, -0.053436279296875, -0.04343414306640625, -0.0334320068359375, -0.02342987060546875, -0.013427734375, -0.00342559814453125, 0.0065765380859375, 0.01657867431640625, 0.026580810546875, 0.03658294677734375, 0.0465850830078125, 0.05658721923828125, 0.06658935546875, 0.07659149169921875, 0.0865936279296875, 0.09659576416015625, 0.106597900390625, 0.11660003662109375, 0.1266021728515625, 0.13660430908203125, 0.1466064453125, 0.15660858154296875, 0.1666107177734375, 0.17661285400390625, 0.186614990234375, 0.19661712646484375, 0.2066192626953125, 0.21662139892578125, 0.22662353515625, 0.23662567138671875, 0.2466278076171875, 0.25662994384765625, 0.266632080078125, 0.27663421630859375, 0.2866363525390625, 0.29663848876953125, 0.306640625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 1.0, 4.0, 4.0, 6.0, 11.0, 25.0, 15.0, 20.0, 21.0, 37.0, 46.0, 53.0, 72.0, 90.0, 79.0, 100.0, 75.0, 86.0, 48.0, 44.0, 38.0, 21.0, 29.0, 20.0, 11.0, 15.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.246566772460938e-05, -6.01746141910553e-05, -5.788356065750122e-05, -5.5592507123947144e-05, -5.3301453590393066e-05, -5.101040005683899e-05, -4.871934652328491e-05, -4.6428292989730835e-05, -4.413723945617676e-05, -4.184618592262268e-05, -3.9555132389068604e-05, -3.7264078855514526e-05, -3.497302532196045e-05, -3.268197178840637e-05, -3.0390918254852295e-05, -2.8099864721298218e-05, -2.580881118774414e-05, -2.3517757654190063e-05, -2.1226704120635986e-05, -1.893565058708191e-05, -1.6644597053527832e-05, -1.4353543519973755e-05, -1.2062489986419678e-05, -9.7714364528656e-06, -7.4803829193115234e-06, -5.189329385757446e-06, -2.898275852203369e-06, -6.07222318649292e-07, 1.6838312149047852e-06, 3.974884748458862e-06, 6.2659382820129395e-06, 8.556991815567017e-06, 1.0848045349121094e-05, 1.3139098882675171e-05, 1.5430152416229248e-05, 1.7721205949783325e-05, 2.0012259483337402e-05, 2.230331301689148e-05, 2.4594366550445557e-05, 2.6885420083999634e-05, 2.917647361755371e-05, 3.146752715110779e-05, 3.3758580684661865e-05, 3.604963421821594e-05, 3.834068775177002e-05, 4.06317412853241e-05, 4.2922794818878174e-05, 4.521384835243225e-05, 4.750490188598633e-05, 4.9795955419540405e-05, 5.208700895309448e-05, 5.437806248664856e-05, 5.666911602020264e-05, 5.8960169553756714e-05, 6.125122308731079e-05, 6.354227662086487e-05, 6.583333015441895e-05, 6.812438368797302e-05, 7.04154372215271e-05, 7.270649075508118e-05, 7.499754428863525e-05, 7.728859782218933e-05, 7.957965135574341e-05, 8.187070488929749e-05, 8.416175842285156e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 6.0, 7.0, 7.0, 14.0, 23.0, 55.0, 77.0, 126.0, 314.0, 977.0, 5518.0, 139660.0, 886008.0, 13266.0, 1664.0, 474.0, 155.0, 86.0, 52.0, 26.0, 20.0, 12.0, 3.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.275146484375, -0.2637672424316406, -0.25238800048828125, -0.24100875854492188, -0.2296295166015625, -0.21825027465820312, -0.20687103271484375, -0.19549179077148438, -0.184112548828125, -0.17273330688476562, -0.16135406494140625, -0.14997482299804688, -0.1385955810546875, -0.12721633911132812, -0.11583709716796875, -0.10445785522460938, -0.09307861328125, -0.08169937133789062, -0.07032012939453125, -0.058940887451171875, -0.0475616455078125, -0.036182403564453125, -0.02480316162109375, -0.013423919677734375, -0.002044677734375, 0.009334564208984375, 0.02071380615234375, 0.032093048095703125, 0.0434722900390625, 0.054851531982421875, 0.06623077392578125, 0.07761001586914062, 0.0889892578125, 0.10036849975585938, 0.11174774169921875, 0.12312698364257812, 0.1345062255859375, 0.14588546752929688, 0.15726470947265625, 0.16864395141601562, 0.180023193359375, 0.19140243530273438, 0.20278167724609375, 0.21416091918945312, 0.2255401611328125, 0.23691940307617188, 0.24829864501953125, 0.2596778869628906, 0.27105712890625, 0.2824363708496094, 0.29381561279296875, 0.3051948547363281, 0.3165740966796875, 0.3279533386230469, 0.33933258056640625, 0.3507118225097656, 0.362091064453125, 0.3734703063964844, 0.38484954833984375, 0.3962287902832031, 0.4076080322265625, 0.4189872741699219, 0.43036651611328125, 0.4417457580566406, 0.453125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 28.0, 61.0, 325.0, 473.0, 67.0, 20.0, 10.0, 2.0, 5.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5390625, -0.5167236328125, -0.494384765625, -0.4720458984375, -0.44970703125, -0.4273681640625, -0.405029296875, -0.3826904296875, -0.3603515625, -0.3380126953125, -0.315673828125, -0.2933349609375, -0.27099609375, -0.2486572265625, -0.226318359375, -0.2039794921875, -0.181640625, -0.1593017578125, -0.136962890625, -0.1146240234375, -0.09228515625, -0.0699462890625, -0.047607421875, -0.0252685546875, -0.0029296875, 0.0194091796875, 0.041748046875, 0.0640869140625, 0.08642578125, 0.1087646484375, 0.131103515625, 0.1534423828125, 0.17578125, 0.1981201171875, 0.220458984375, 0.2427978515625, 0.26513671875, 0.2874755859375, 0.309814453125, 0.3321533203125, 0.3544921875, 0.3768310546875, 0.399169921875, 0.4215087890625, 0.44384765625, 0.4661865234375, 0.488525390625, 0.5108642578125, 0.533203125, 0.5555419921875, 0.577880859375, 0.6002197265625, 0.62255859375, 0.6448974609375, 0.667236328125, 0.6895751953125, 0.7119140625, 0.7342529296875, 0.756591796875, 0.7789306640625, 0.80126953125, 0.8236083984375, 0.845947265625, 0.8682861328125, 0.890625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 10.0, 28.0, 53.0, 100.0, 184.0, 213.0, 187.0, 127.0, 57.0, 20.0, 14.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9101192951202393, -2.815542221069336, -2.7209651470184326, -2.6263880729675293, -2.531810998916626, -2.4372339248657227, -2.3426566123962402, -2.248079776763916, -2.1535024642944336, -2.0589253902435303, -1.964348316192627, -1.8697712421417236, -1.7751941680908203, -1.680617094039917, -1.5860399007797241, -1.4914628267288208, -1.396885871887207, -1.3023087978363037, -1.2077317237854004, -1.113154649734497, -1.0185775756835938, -0.9240004420280457, -0.8294233083724976, -0.7348462343215942, -0.6402691602706909, -0.5456920862197876, -0.4511149823665619, -0.3565378785133362, -0.26196080446243286, -0.16738373041152954, -0.07280659675598145, 0.021770477294921875, 0.1163475513458252, 0.2109246402978897, 0.3055017292499542, 0.40007883310317993, 0.49465590715408325, 0.5892329812049866, 0.6838101148605347, 0.778387188911438, 0.8729642629623413, 0.9675413370132446, 1.062118411064148, 1.1566956043243408, 1.2512726783752441, 1.3458497524261475, 1.4404268264770508, 1.535003900527954, 1.6295809745788574, 1.7241580486297607, 1.818735122680664, 1.9133121967315674, 2.0078892707824707, 2.102466344833374, 2.1970434188842773, 2.2916207313537598, 2.386197566986084, 2.4807746410369873, 2.5753517150878906, 2.669928789138794, 2.7645058631896973, 2.8590829372406006, 2.953660011291504, 3.0482373237609863, 3.1428143978118896]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 9.0, 3.0, 8.0, 8.0, 10.0, 9.0, 13.0, 21.0, 25.0, 22.0, 18.0, 28.0, 34.0, 29.0, 37.0, 36.0, 30.0, 45.0, 43.0, 36.0, 48.0, 42.0, 43.0, 49.0, 37.0, 37.0, 32.0, 43.0, 37.0, 24.0, 20.0, 21.0, 20.0, 17.0, 10.0, 8.0, 8.0, 5.0, 9.0, 4.0, 14.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0], "bins": [-2.24587345123291, -2.182187795639038, -2.118502140045166, -2.054816484451294, -1.9911308288574219, -1.9274451732635498, -1.8637595176696777, -1.8000738620758057, -1.7363882064819336, -1.6727025508880615, -1.6090168952941895, -1.5453312397003174, -1.4816455841064453, -1.4179599285125732, -1.3542742729187012, -1.290588617324829, -1.2269030809402466, -1.1632174253463745, -1.0995317697525024, -1.0358461141586304, -0.9721604585647583, -0.9084748029708862, -0.8447892069816589, -0.7811035513877869, -0.7174178957939148, -0.6537322402000427, -0.5900465846061707, -0.5263609886169434, -0.4626753032207489, -0.39898964762687683, -0.33530402183532715, -0.2716183662414551, -0.207932710647583, -0.14424705505371094, -0.08056141436100006, -0.016875773668289185, 0.046809881925582886, 0.11049553751945496, 0.17418116331100464, 0.2378668189048767, 0.3015524744987488, 0.36523813009262085, 0.4289237856864929, 0.4926094114780426, 0.5562950372695923, 0.6199806928634644, 0.6836663484573364, 0.7473520040512085, 0.8110376596450806, 0.8747233152389526, 0.9384089708328247, 1.0020946264266968, 1.0657802820205688, 1.129465937614441, 1.1931514739990234, 1.2568371295928955, 1.3205227851867676, 1.3842084407806396, 1.4478940963745117, 1.5115797519683838, 1.5752654075622559, 1.638951063156128, 1.70263671875, 1.766322374343872, 1.8300080299377441]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 8.0, 9.0, 15.0, 16.0, 44.0, 67.0, 136.0, 326.0, 849.0, 3269.0, 25192.0, 4104669.0, 52720.0, 5026.0, 1193.0, 430.0, 158.0, 73.0, 39.0, 21.0, 8.0, 5.0, 7.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.369384765625, -0.3617868423461914, -0.3541889190673828, -0.3465909957885742, -0.3389930725097656, -0.33139514923095703, -0.32379722595214844, -0.31619930267333984, -0.30860137939453125, -0.30100345611572266, -0.29340553283691406, -0.28580760955810547, -0.2782096862792969, -0.2706117630004883, -0.2630138397216797, -0.2554159164428711, -0.2478179931640625, -0.2402200698852539, -0.2326221466064453, -0.22502422332763672, -0.21742630004882812, -0.20982837677001953, -0.20223045349121094, -0.19463253021240234, -0.18703460693359375, -0.17943668365478516, -0.17183876037597656, -0.16424083709716797, -0.15664291381835938, -0.14904499053955078, -0.1414470672607422, -0.1338491439819336, -0.126251220703125, -0.1186532974243164, -0.11105537414550781, -0.10345745086669922, -0.09585952758789062, -0.08826160430908203, -0.08066368103027344, -0.07306575775146484, -0.06546783447265625, -0.057869911193847656, -0.05027198791503906, -0.04267406463623047, -0.035076141357421875, -0.02747821807861328, -0.019880294799804688, -0.012282371520996094, -0.0046844482421875, 0.0029134750366210938, 0.010511398315429688, 0.01810932159423828, 0.025707244873046875, 0.03330516815185547, 0.04090309143066406, 0.048501014709472656, 0.05609893798828125, 0.06369686126708984, 0.07129478454589844, 0.07889270782470703, 0.08649063110351562, 0.09408855438232422, 0.10168647766113281, 0.1092844009399414, 0.11688232421875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 8.0, 10.0, 8.0, 13.0, 22.0, 30.0, 32.0, 42.0, 43.0, 58.0, 54.0, 81.0, 57.0, 61.0, 67.0, 54.0, 66.0, 60.0, 47.0, 42.0, 29.0, 28.0, 20.0, 14.0, 9.0, 10.0, 4.0, 9.0, 6.0, 3.0, 4.0, 3.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1707763671875, -0.16599273681640625, -0.1612091064453125, -0.15642547607421875, -0.151641845703125, -0.14685821533203125, -0.1420745849609375, -0.13729095458984375, -0.13250732421875, -0.12772369384765625, -0.1229400634765625, -0.11815643310546875, -0.113372802734375, -0.10858917236328125, -0.1038055419921875, -0.09902191162109375, -0.09423828125, -0.08945465087890625, -0.0846710205078125, -0.07988739013671875, -0.075103759765625, -0.07032012939453125, -0.0655364990234375, -0.06075286865234375, -0.05596923828125, -0.05118560791015625, -0.0464019775390625, -0.04161834716796875, -0.036834716796875, -0.03205108642578125, -0.0272674560546875, -0.02248382568359375, -0.0177001953125, -0.01291656494140625, -0.0081329345703125, -0.00334930419921875, 0.001434326171875, 0.00621795654296875, 0.0110015869140625, 0.01578521728515625, 0.02056884765625, 0.02535247802734375, 0.0301361083984375, 0.03491973876953125, 0.039703369140625, 0.04448699951171875, 0.0492706298828125, 0.05405426025390625, 0.058837890625, 0.06362152099609375, 0.0684051513671875, 0.07318878173828125, 0.077972412109375, 0.08275604248046875, 0.0875396728515625, 0.09232330322265625, 0.09710693359375, 0.10189056396484375, 0.1066741943359375, 0.11145782470703125, 0.116241455078125, 0.12102508544921875, 0.1258087158203125, 0.13059234619140625, 0.1353759765625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 2.0, 5.0, 10.0, 11.0, 9.0, 13.0, 20.0, 20.0, 25.0, 27.0, 32.0, 47.0, 63.0, 72.0, 74.0, 112.0, 164.0, 232.0, 428.0, 757.0, 1518.0, 3409.0, 12734.0, 237903.0, 3903507.0, 24090.0, 4767.0, 1781.0, 900.0, 506.0, 267.0, 174.0, 111.0, 88.0, 89.0, 57.0, 63.0, 33.0, 29.0, 24.0, 34.0, 12.0, 15.0, 8.0, 12.0, 7.0, 6.0, 9.0, 0.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.1446533203125, -0.1402912139892578, -0.13592910766601562, -0.13156700134277344, -0.12720489501953125, -0.12284278869628906, -0.11848068237304688, -0.11411857604980469, -0.1097564697265625, -0.10539436340332031, -0.10103225708007812, -0.09667015075683594, -0.09230804443359375, -0.08794593811035156, -0.08358383178710938, -0.07922172546386719, -0.074859619140625, -0.07049751281738281, -0.06613540649414062, -0.06177330017089844, -0.05741119384765625, -0.05304908752441406, -0.048686981201171875, -0.04432487487792969, -0.0399627685546875, -0.03560066223144531, -0.031238555908203125, -0.026876449584960938, -0.02251434326171875, -0.018152236938476562, -0.013790130615234375, -0.009428024291992188, -0.00506591796875, -0.0007038116455078125, 0.003658294677734375, 0.008020401000976562, 0.01238250732421875, 0.016744613647460938, 0.021106719970703125, 0.025468826293945312, 0.0298309326171875, 0.03419303894042969, 0.038555145263671875, 0.04291725158691406, 0.04727935791015625, 0.05164146423339844, 0.056003570556640625, 0.06036567687988281, 0.064727783203125, 0.06908988952636719, 0.07345199584960938, 0.07781410217285156, 0.08217620849609375, 0.08653831481933594, 0.09090042114257812, 0.09526252746582031, 0.0996246337890625, 0.10398674011230469, 0.10834884643554688, 0.11271095275878906, 0.11707305908203125, 0.12143516540527344, 0.12579727172851562, 0.1301593780517578, 0.134521484375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 6.0, 19.0, 26.0, 64.0, 217.0, 3328.0, 280.0, 70.0, 22.0, 15.0, 9.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0142974853515625, -0.013062238693237305, -0.01182699203491211, -0.010591745376586914, -0.009356498718261719, -0.008121252059936523, -0.006886005401611328, -0.005650758743286133, -0.0044155120849609375, -0.003180265426635742, -0.0019450187683105469, -0.0007097721099853516, 0.0005254745483398438, 0.001760721206665039, 0.0029959678649902344, 0.00423121452331543, 0.005466461181640625, 0.00670170783996582, 0.007936954498291016, 0.009172201156616211, 0.010407447814941406, 0.011642694473266602, 0.012877941131591797, 0.014113187789916992, 0.015348434448242188, 0.016583681106567383, 0.017818927764892578, 0.019054174423217773, 0.02028942108154297, 0.021524667739868164, 0.02275991439819336, 0.023995161056518555, 0.02523040771484375, 0.026465654373168945, 0.02770090103149414, 0.028936147689819336, 0.03017139434814453, 0.03140664100646973, 0.03264188766479492, 0.03387713432312012, 0.03511238098144531, 0.03634762763977051, 0.0375828742980957, 0.0388181209564209, 0.040053367614746094, 0.04128861427307129, 0.042523860931396484, 0.04375910758972168, 0.044994354248046875, 0.04622960090637207, 0.047464847564697266, 0.04870009422302246, 0.049935340881347656, 0.05117058753967285, 0.05240583419799805, 0.05364108085632324, 0.05487632751464844, 0.05611157417297363, 0.05734682083129883, 0.05858206748962402, 0.05981731414794922, 0.061052560806274414, 0.06228780746459961, 0.0635230541229248, 0.06475830078125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 7.0, 11.0, 9.0, 18.0, 27.0, 46.0, 52.0, 72.0, 93.0, 125.0, 111.0, 109.0, 83.0, 60.0, 48.0, 40.0, 23.0, 22.0, 9.0, 8.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1159844696521759, -0.11311082541942596, -0.11023718863725662, -0.10736354440450668, -0.10448990017175674, -0.1016162633895874, -0.09874261915683746, -0.09586897492408752, -0.09299533069133759, -0.09012168645858765, -0.0872480496764183, -0.08437440544366837, -0.08150076121091843, -0.07862712442874908, -0.07575348019599915, -0.0728798359632492, -0.07000619918107986, -0.06713255494832993, -0.06425891816616058, -0.061385273933410645, -0.058511629700660706, -0.055637989193201065, -0.052764348685741425, -0.049890704452991486, -0.047017063945531845, -0.044143423438072205, -0.041269779205322266, -0.038396138697862625, -0.035522498190402985, -0.032648853957653046, -0.029775213450193405, -0.026901571080088615, -0.024027928709983826, -0.021154286339879036, -0.018280643969774246, -0.015407003462314606, -0.012533361092209816, -0.009659718722105026, -0.006786078214645386, -0.003912435844540596, -0.0010387934744358063, 0.0018348484300076962, 0.004708490334451199, 0.007582131773233414, 0.010455774143338203, 0.013329416513442993, 0.016203057020902634, 0.019076699391007423, 0.021950341761112213, 0.024823984131217003, 0.027697626501321793, 0.030571267008781433, 0.03344491124153137, 0.03631855174899101, 0.03919219225645065, 0.04206583648920059, 0.04493947699666023, 0.04781311750411987, 0.05068676173686981, 0.05356040224432945, 0.05643404275178909, 0.05930768698453903, 0.06218132749199867, 0.06505496799945831, 0.06792861223220825]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 8.0, 4.0, 8.0, 8.0, 11.0, 13.0, 11.0, 20.0, 25.0, 32.0, 23.0, 41.0, 29.0, 35.0, 42.0, 42.0, 56.0, 45.0, 40.0, 46.0, 43.0, 49.0, 51.0, 36.0, 38.0, 33.0, 39.0, 26.0, 31.0, 18.0, 16.0, 15.0, 17.0, 20.0, 9.0, 14.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051313161849975586, -0.04919978976249695, -0.04708641767501831, -0.04497304558753967, -0.042859673500061035, -0.0407463014125824, -0.03863292932510376, -0.03651955723762512, -0.034406185150146484, -0.03229281306266785, -0.03017944097518921, -0.02806606888771057, -0.025952696800231934, -0.023839324712753296, -0.021725952625274658, -0.01961258053779602, -0.017499208450317383, -0.015385836362838745, -0.013272464275360107, -0.01115909218788147, -0.009045720100402832, -0.006932348012924194, -0.004818975925445557, -0.002705603837966919, -0.0005922317504882812, 0.0015211403369903564, 0.003634512424468994, 0.005747884511947632, 0.00786125659942627, 0.009974628686904907, 0.012088000774383545, 0.014201372861862183, 0.01631474494934082, 0.018428117036819458, 0.020541489124298096, 0.022654861211776733, 0.02476823329925537, 0.02688160538673401, 0.028994977474212646, 0.031108349561691284, 0.03322172164916992, 0.03533509373664856, 0.0374484658241272, 0.039561837911605835, 0.04167520999908447, 0.04378858208656311, 0.04590195417404175, 0.048015326261520386, 0.05012869834899902, 0.05224207043647766, 0.0543554425239563, 0.056468814611434937, 0.058582186698913574, 0.06069555878639221, 0.06280893087387085, 0.06492230296134949, 0.06703567504882812, 0.06914904713630676, 0.0712624192237854, 0.07337579131126404, 0.07548916339874268, 0.07760253548622131, 0.07971590757369995, 0.08182927966117859, 0.08394265174865723]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 15.0, 19.0, 21.0, 39.0, 70.0, 116.0, 146.0, 235.0, 427.0, 701.0, 1036.0, 1805.0, 3175.0, 6019.0, 11615.0, 26116.0, 73467.0, 271665.0, 441072.0, 133863.0, 41493.0, 17117.0, 8044.0, 4295.0, 2452.0, 1424.0, 771.0, 483.0, 296.0, 184.0, 130.0, 76.0, 51.0, 36.0, 27.0, 12.0, 9.0, 7.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.15576171875, -0.15077590942382812, -0.14579010009765625, -0.14080429077148438, -0.1358184814453125, -0.13083267211914062, -0.12584686279296875, -0.12086105346679688, -0.115875244140625, -0.11088943481445312, -0.10590362548828125, -0.10091781616210938, -0.0959320068359375, -0.09094619750976562, -0.08596038818359375, -0.08097457885742188, -0.07598876953125, -0.07100296020507812, -0.06601715087890625, -0.061031341552734375, -0.0560455322265625, -0.051059722900390625, -0.04607391357421875, -0.041088104248046875, -0.036102294921875, -0.031116485595703125, -0.02613067626953125, -0.021144866943359375, -0.0161590576171875, -0.011173248291015625, -0.00618743896484375, -0.001201629638671875, 0.0037841796875, 0.008769989013671875, 0.01375579833984375, 0.018741607666015625, 0.0237274169921875, 0.028713226318359375, 0.03369903564453125, 0.038684844970703125, 0.043670654296875, 0.048656463623046875, 0.05364227294921875, 0.058628082275390625, 0.0636138916015625, 0.06859970092773438, 0.07358551025390625, 0.07857131958007812, 0.08355712890625, 0.08854293823242188, 0.09352874755859375, 0.09851455688476562, 0.1035003662109375, 0.10848617553710938, 0.11347198486328125, 0.11845779418945312, 0.123443603515625, 0.12842941284179688, 0.13341522216796875, 0.13840103149414062, 0.1433868408203125, 0.14837265014648438, 0.15335845947265625, 0.15834426879882812, 0.163330078125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 2.0, 8.0, 7.0, 9.0, 13.0, 19.0, 25.0, 32.0, 29.0, 51.0, 57.0, 62.0, 54.0, 65.0, 75.0, 57.0, 69.0, 58.0, 66.0, 45.0, 41.0, 38.0, 23.0, 22.0, 18.0, 10.0, 15.0, 6.0, 9.0, 3.0, 5.0, 4.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.167724609375, -0.1629486083984375, -0.158172607421875, -0.1533966064453125, -0.14862060546875, -0.1438446044921875, -0.139068603515625, -0.1342926025390625, -0.1295166015625, -0.1247406005859375, -0.119964599609375, -0.1151885986328125, -0.11041259765625, -0.1056365966796875, -0.100860595703125, -0.0960845947265625, -0.09130859375, -0.0865325927734375, -0.081756591796875, -0.0769805908203125, -0.07220458984375, -0.0674285888671875, -0.062652587890625, -0.0578765869140625, -0.0531005859375, -0.0483245849609375, -0.043548583984375, -0.0387725830078125, -0.03399658203125, -0.0292205810546875, -0.024444580078125, -0.0196685791015625, -0.014892578125, -0.0101165771484375, -0.005340576171875, -0.0005645751953125, 0.00421142578125, 0.0089874267578125, 0.013763427734375, 0.0185394287109375, 0.0233154296875, 0.0280914306640625, 0.032867431640625, 0.0376434326171875, 0.04241943359375, 0.0471954345703125, 0.051971435546875, 0.0567474365234375, 0.0615234375, 0.0662994384765625, 0.071075439453125, 0.0758514404296875, 0.08062744140625, 0.0854034423828125, 0.090179443359375, 0.0949554443359375, 0.0997314453125, 0.1045074462890625, 0.109283447265625, 0.1140594482421875, 0.11883544921875, 0.1236114501953125, 0.128387451171875, 0.1331634521484375, 0.137939453125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 4.0, 7.0, 7.0, 16.0, 14.0, 24.0, 23.0, 40.0, 43.0, 41.0, 91.0, 134.0, 200.0, 347.0, 845.0, 3411.0, 22778.0, 418962.0, 567610.0, 27995.0, 3931.0, 973.0, 405.0, 215.0, 124.0, 79.0, 52.0, 53.0, 32.0, 17.0, 8.0, 18.0, 9.0, 5.0, 8.0, 9.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.347900390625, -0.3359222412109375, -0.323944091796875, -0.3119659423828125, -0.29998779296875, -0.2880096435546875, -0.276031494140625, -0.2640533447265625, -0.2520751953125, -0.2400970458984375, -0.228118896484375, -0.2161407470703125, -0.20416259765625, -0.1921844482421875, -0.180206298828125, -0.1682281494140625, -0.15625, -0.1442718505859375, -0.132293701171875, -0.1203155517578125, -0.10833740234375, -0.0963592529296875, -0.084381103515625, -0.0724029541015625, -0.0604248046875, -0.0484466552734375, -0.036468505859375, -0.0244903564453125, -0.01251220703125, -0.0005340576171875, 0.011444091796875, 0.0234222412109375, 0.035400390625, 0.0473785400390625, 0.059356689453125, 0.0713348388671875, 0.08331298828125, 0.0952911376953125, 0.107269287109375, 0.1192474365234375, 0.1312255859375, 0.1432037353515625, 0.155181884765625, 0.1671600341796875, 0.17913818359375, 0.1911163330078125, 0.203094482421875, 0.2150726318359375, 0.22705078125, 0.2390289306640625, 0.251007080078125, 0.2629852294921875, 0.27496337890625, 0.2869415283203125, 0.298919677734375, 0.3108978271484375, 0.3228759765625, 0.3348541259765625, 0.346832275390625, 0.3588104248046875, 0.37078857421875, 0.3827667236328125, 0.394744873046875, 0.4067230224609375, 0.418701171875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 8.0, 0.0, 7.0, 5.0, 7.0, 8.0, 16.0, 16.0, 19.0, 28.0, 18.0, 24.0, 31.0, 28.0, 29.0, 31.0, 31.0, 47.0, 47.0, 52.0, 43.0, 42.0, 41.0, 40.0, 42.0, 32.0, 49.0, 28.0, 33.0, 38.0, 24.0, 21.0, 18.0, 18.0, 18.0, 13.0, 10.0, 7.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.457763671875, -0.4443778991699219, -0.43099212646484375, -0.4176063537597656, -0.4042205810546875, -0.3908348083496094, -0.37744903564453125, -0.3640632629394531, -0.350677490234375, -0.3372917175292969, -0.32390594482421875, -0.3105201721191406, -0.2971343994140625, -0.2837486267089844, -0.27036285400390625, -0.2569770812988281, -0.24359130859375, -0.23020553588867188, -0.21681976318359375, -0.20343399047851562, -0.1900482177734375, -0.17666244506835938, -0.16327667236328125, -0.14989089965820312, -0.136505126953125, -0.12311935424804688, -0.10973358154296875, -0.09634780883789062, -0.0829620361328125, -0.06957626342773438, -0.05619049072265625, -0.042804718017578125, -0.0294189453125, -0.016033172607421875, -0.00264739990234375, 0.010738372802734375, 0.0241241455078125, 0.037509918212890625, 0.05089569091796875, 0.06428146362304688, 0.077667236328125, 0.09105300903320312, 0.10443878173828125, 0.11782455444335938, 0.1312103271484375, 0.14459609985351562, 0.15798187255859375, 0.17136764526367188, 0.18475341796875, 0.19813919067382812, 0.21152496337890625, 0.22491073608398438, 0.2382965087890625, 0.2516822814941406, 0.26506805419921875, 0.2784538269042969, 0.291839599609375, 0.3052253723144531, 0.31861114501953125, 0.3319969177246094, 0.3453826904296875, 0.3587684631347656, 0.37215423583984375, 0.3855400085449219, 0.39892578125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 8.0, 6.0, 9.0, 17.0, 22.0, 36.0, 75.0, 140.0, 349.0, 927.0, 5780.0, 851982.0, 184420.0, 3506.0, 747.0, 238.0, 145.0, 68.0, 30.0, 25.0, 14.0, 5.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.51318359375, -0.5009346008300781, -0.48868560791015625, -0.4764366149902344, -0.4641876220703125, -0.4519386291503906, -0.43968963623046875, -0.4274406433105469, -0.415191650390625, -0.4029426574707031, -0.39069366455078125, -0.3784446716308594, -0.3661956787109375, -0.3539466857910156, -0.34169769287109375, -0.3294486999511719, -0.31719970703125, -0.3049507141113281, -0.29270172119140625, -0.2804527282714844, -0.2682037353515625, -0.2559547424316406, -0.24370574951171875, -0.23145675659179688, -0.219207763671875, -0.20695877075195312, -0.19470977783203125, -0.18246078491210938, -0.1702117919921875, -0.15796279907226562, -0.14571380615234375, -0.13346481323242188, -0.1212158203125, -0.10896682739257812, -0.09671783447265625, -0.08446884155273438, -0.0722198486328125, -0.059970855712890625, -0.04772186279296875, -0.035472869873046875, -0.023223876953125, -0.010974884033203125, 0.00127410888671875, 0.013523101806640625, 0.0257720947265625, 0.038021087646484375, 0.05027008056640625, 0.06251907348632812, 0.07476806640625, 0.08701705932617188, 0.09926605224609375, 0.11151504516601562, 0.1237640380859375, 0.13601303100585938, 0.14826202392578125, 0.16051101684570312, 0.172760009765625, 0.18500900268554688, 0.19725799560546875, 0.20950698852539062, 0.2217559814453125, 0.23400497436523438, 0.24625396728515625, 0.2585029602050781, 0.270751953125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 5.0, 3.0, 5.0, 10.0, 4.0, 8.0, 13.0, 12.0, 17.0, 22.0, 31.0, 36.0, 42.0, 61.0, 80.0, 86.0, 85.0, 85.0, 64.0, 66.0, 48.0, 43.0, 47.0, 29.0, 21.0, 24.0, 21.0, 10.0, 8.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.309415817260742e-05, -4.1472725570201874e-05, -3.9851292967796326e-05, -3.822986036539078e-05, -3.660842776298523e-05, -3.498699516057968e-05, -3.336556255817413e-05, -3.1744129955768585e-05, -3.0122697353363037e-05, -2.850126475095749e-05, -2.687983214855194e-05, -2.5258399546146393e-05, -2.3636966943740845e-05, -2.2015534341335297e-05, -2.039410173892975e-05, -1.87726691365242e-05, -1.7151236534118652e-05, -1.5529803931713104e-05, -1.3908371329307556e-05, -1.2286938726902008e-05, -1.066550612449646e-05, -9.044073522090912e-06, -7.422640919685364e-06, -5.801208317279816e-06, -4.179775714874268e-06, -2.5583431124687195e-06, -9.369105100631714e-07, 6.845220923423767e-07, 2.305954694747925e-06, 3.927387297153473e-06, 5.548819899559021e-06, 7.170252501964569e-06, 8.791685104370117e-06, 1.0413117706775665e-05, 1.2034550309181213e-05, 1.3655982911586761e-05, 1.527741551399231e-05, 1.6898848116397858e-05, 1.8520280718803406e-05, 2.0141713321208954e-05, 2.1763145923614502e-05, 2.338457852602005e-05, 2.5006011128425598e-05, 2.6627443730831146e-05, 2.8248876333236694e-05, 2.9870308935642242e-05, 3.149174153804779e-05, 3.311317414045334e-05, 3.473460674285889e-05, 3.6356039345264435e-05, 3.797747194766998e-05, 3.959890455007553e-05, 4.122033715248108e-05, 4.284176975488663e-05, 4.4463202357292175e-05, 4.6084634959697723e-05, 4.770606756210327e-05, 4.932750016450882e-05, 5.094893276691437e-05, 5.2570365369319916e-05, 5.4191797971725464e-05, 5.581323057413101e-05, 5.743466317653656e-05, 5.905609577894211e-05, 6.0677528381347656e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 5.0, 15.0, 23.0, 57.0, 90.0, 173.0, 471.0, 2241.0, 22833.0, 957955.0, 59986.0, 3587.0, 683.0, 209.0, 89.0, 49.0, 29.0, 19.0, 10.0, 4.0, 10.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2344970703125, -0.2256908416748047, -0.21688461303710938, -0.20807838439941406, -0.19927215576171875, -0.19046592712402344, -0.18165969848632812, -0.1728534698486328, -0.1640472412109375, -0.1552410125732422, -0.14643478393554688, -0.13762855529785156, -0.12882232666015625, -0.12001609802246094, -0.11120986938476562, -0.10240364074707031, -0.093597412109375, -0.08479118347167969, -0.07598495483398438, -0.06717872619628906, -0.05837249755859375, -0.04956626892089844, -0.040760040283203125, -0.03195381164550781, -0.0231475830078125, -0.014341354370117188, -0.005535125732421875, 0.0032711029052734375, 0.01207733154296875, 0.020883560180664062, 0.029689788818359375, 0.03849601745605469, 0.04730224609375, 0.05610847473144531, 0.06491470336914062, 0.07372093200683594, 0.08252716064453125, 0.09133338928222656, 0.10013961791992188, 0.10894584655761719, 0.1177520751953125, 0.1265583038330078, 0.13536453247070312, 0.14417076110839844, 0.15297698974609375, 0.16178321838378906, 0.17058944702148438, 0.1793956756591797, 0.188201904296875, 0.1970081329345703, 0.20581436157226562, 0.21462059020996094, 0.22342681884765625, 0.23223304748535156, 0.24103927612304688, 0.2498455047607422, 0.2586517333984375, 0.2674579620361328, 0.2762641906738281, 0.28507041931152344, 0.29387664794921875, 0.30268287658691406, 0.3114891052246094, 0.3202953338623047, 0.3291015625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 10.0, 9.0, 9.0, 16.0, 34.0, 52.0, 98.0, 219.0, 255.0, 147.0, 64.0, 25.0, 15.0, 19.0, 14.0, 6.0, 5.0, 3.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.286376953125, -0.2774620056152344, -0.26854705810546875, -0.2596321105957031, -0.2507171630859375, -0.24180221557617188, -0.23288726806640625, -0.22397232055664062, -0.215057373046875, -0.20614242553710938, -0.19722747802734375, -0.18831253051757812, -0.1793975830078125, -0.17048263549804688, -0.16156768798828125, -0.15265274047851562, -0.14373779296875, -0.13482284545898438, -0.12590789794921875, -0.11699295043945312, -0.1080780029296875, -0.09916305541992188, -0.09024810791015625, -0.08133316040039062, -0.072418212890625, -0.06350326538085938, -0.05458831787109375, -0.045673370361328125, -0.0367584228515625, -0.027843475341796875, -0.01892852783203125, -0.010013580322265625, -0.0010986328125, 0.007816314697265625, 0.01673126220703125, 0.025646209716796875, 0.0345611572265625, 0.043476104736328125, 0.05239105224609375, 0.061305999755859375, 0.070220947265625, 0.07913589477539062, 0.08805084228515625, 0.09696578979492188, 0.1058807373046875, 0.11479568481445312, 0.12371063232421875, 0.13262557983398438, 0.14154052734375, 0.15045547485351562, 0.15937042236328125, 0.16828536987304688, 0.1772003173828125, 0.18611526489257812, 0.19503021240234375, 0.20394515991210938, 0.212860107421875, 0.22177505493164062, 0.23069000244140625, 0.23960494995117188, 0.2485198974609375, 0.2574348449707031, 0.26634979248046875, 0.2752647399902344, 0.2841796875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 10.0, 34.0, 149.0, 380.0, 290.0, 99.0, 36.0, 11.0, 3.0, 1.0, 2.0, 3.0], "bins": [-9.787286758422852, -9.611881256103516, -9.43647575378418, -9.261070251464844, -9.085664749145508, -8.910259246826172, -8.734853744506836, -8.5594482421875, -8.384041786193848, -8.208636283874512, -8.033230781555176, -7.85782527923584, -7.682419300079346, -7.50701379776001, -7.331608295440674, -7.156202793121338, -6.98079776763916, -6.805392265319824, -6.629986763000488, -6.454581260681152, -6.279175281524658, -6.103769779205322, -5.928364276885986, -5.75295877456665, -5.577552795410156, -5.40214729309082, -5.226741790771484, -5.051336288452148, -4.875930309295654, -4.700524806976318, -4.525119304656982, -4.3497138023376465, -4.1743083000183105, -3.9989027976989746, -3.8234970569610596, -3.6480915546417236, -3.4726860523223877, -3.2972803115844727, -3.1218748092651367, -2.946469306945801, -2.771063804626465, -2.595658302307129, -2.420252561569214, -2.244847059249878, -2.069441556930542, -1.8940359354019165, -1.718630313873291, -1.543224811553955, -1.36781907081604, -1.1924134492874146, -1.0170079469680786, -0.8416023254394531, -0.6661967635154724, -0.4907912015914917, -0.3153855800628662, -0.13998007774353027, 0.035425543785095215, 0.21083112061023712, 0.38623669743537903, 0.5616422891616821, 0.7370478510856628, 0.9124534130096436, 1.087859034538269, 1.263264536857605, 1.4386701583862305]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 7.0, 9.0, 17.0, 11.0, 9.0, 9.0, 12.0, 23.0, 18.0, 23.0, 34.0, 26.0, 39.0, 39.0, 38.0, 39.0, 34.0, 43.0, 41.0, 51.0, 50.0, 41.0, 44.0, 47.0, 32.0, 44.0, 39.0, 26.0, 25.0, 24.0, 12.0, 16.0, 15.0, 10.0, 9.0, 15.0, 6.0, 3.0, 5.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.28642201423645, -2.220757007598877, -2.1550920009613037, -2.0894269943237305, -2.023761749267578, -1.9580968618392944, -1.8924317359924316, -1.8267667293548584, -1.7611017227172852, -1.695436716079712, -1.6297717094421387, -1.5641065835952759, -1.4984415769577026, -1.4327765703201294, -1.3671114444732666, -1.3014464378356934, -1.2357814311981201, -1.1701164245605469, -1.1044514179229736, -1.0387862920761108, -0.9731212854385376, -0.9074562788009644, -0.8417912125587463, -0.7761261463165283, -0.7104611396789551, -0.6447961330413818, -0.5791310667991638, -0.5134660005569458, -0.44780099391937256, -0.38213595747947693, -0.3164709210395813, -0.25080588459968567, -0.18514108657836914, -0.11947605013847351, -0.05381101369857788, 0.011854022741317749, 0.07751905918121338, 0.143184095621109, 0.20884913206100464, 0.27451416850090027, 0.3401792049407959, 0.40584424138069153, 0.47150927782058716, 0.5371743440628052, 0.6028393507003784, 0.6685043573379517, 0.7341694235801697, 0.7998344898223877, 0.8654994964599609, 0.9311645030975342, 0.9968295693397522, 1.0624946355819702, 1.1281596422195435, 1.1938246488571167, 1.2594897747039795, 1.3251547813415527, 1.390819787979126, 1.4564847946166992, 1.5221498012542725, 1.5878149271011353, 1.6534799337387085, 1.7191449403762817, 1.7848100662231445, 1.8504750728607178, 1.916140079498291]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 2.0, 9.0, 13.0, 19.0, 37.0, 52.0, 78.0, 137.0, 197.0, 441.0, 940.0, 2582.0, 13675.0, 4113651.0, 55149.0, 4692.0, 1327.0, 534.0, 294.0, 164.0, 85.0, 71.0, 34.0, 27.0, 17.0, 18.0, 14.0, 6.0, 5.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3740234375, -0.3646068572998047, -0.3551902770996094, -0.34577369689941406, -0.33635711669921875, -0.32694053649902344, -0.3175239562988281, -0.3081073760986328, -0.2986907958984375, -0.2892742156982422, -0.2798576354980469, -0.27044105529785156, -0.26102447509765625, -0.25160789489746094, -0.24219131469726562, -0.2327747344970703, -0.223358154296875, -0.2139415740966797, -0.20452499389648438, -0.19510841369628906, -0.18569183349609375, -0.17627525329589844, -0.16685867309570312, -0.1574420928955078, -0.1480255126953125, -0.1386089324951172, -0.12919235229492188, -0.11977577209472656, -0.11035919189453125, -0.10094261169433594, -0.09152603149414062, -0.08210945129394531, -0.07269287109375, -0.06327629089355469, -0.053859710693359375, -0.04444313049316406, -0.03502655029296875, -0.025609970092773438, -0.016193389892578125, -0.0067768096923828125, 0.0026397705078125, 0.012056350708007812, 0.021472930908203125, 0.030889511108398438, 0.04030609130859375, 0.04972267150878906, 0.059139251708984375, 0.06855583190917969, 0.077972412109375, 0.08738899230957031, 0.09680557250976562, 0.10622215270996094, 0.11563873291015625, 0.12505531311035156, 0.13447189331054688, 0.1438884735107422, 0.1533050537109375, 0.1627216339111328, 0.17213821411132812, 0.18155479431152344, 0.19097137451171875, 0.20038795471191406, 0.20980453491210938, 0.2192211151123047, 0.2286376953125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 8.0, 5.0, 18.0, 17.0, 17.0, 26.0, 30.0, 25.0, 50.0, 46.0, 50.0, 55.0, 58.0, 66.0, 59.0, 60.0, 56.0, 61.0, 41.0, 46.0, 36.0, 26.0, 25.0, 26.0, 17.0, 12.0, 20.0, 13.0, 8.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0], "bins": [-0.1773681640625, -0.17307567596435547, -0.16878318786621094, -0.1644906997680664, -0.16019821166992188, -0.15590572357177734, -0.1516132354736328, -0.14732074737548828, -0.14302825927734375, -0.13873577117919922, -0.1344432830810547, -0.13015079498291016, -0.12585830688476562, -0.1215658187866211, -0.11727333068847656, -0.11298084259033203, -0.1086883544921875, -0.10439586639404297, -0.10010337829589844, -0.0958108901977539, -0.09151840209960938, -0.08722591400146484, -0.08293342590332031, -0.07864093780517578, -0.07434844970703125, -0.07005596160888672, -0.06576347351074219, -0.061470985412597656, -0.057178497314453125, -0.052886009216308594, -0.04859352111816406, -0.04430103302001953, -0.040008544921875, -0.03571605682373047, -0.03142356872558594, -0.027131080627441406, -0.022838592529296875, -0.018546104431152344, -0.014253616333007812, -0.009961128234863281, -0.00566864013671875, -0.0013761520385742188, 0.0029163360595703125, 0.007208824157714844, 0.011501312255859375, 0.015793800354003906, 0.020086288452148438, 0.02437877655029297, 0.0286712646484375, 0.03296375274658203, 0.03725624084472656, 0.041548728942871094, 0.045841217041015625, 0.050133705139160156, 0.05442619323730469, 0.05871868133544922, 0.06301116943359375, 0.06730365753173828, 0.07159614562988281, 0.07588863372802734, 0.08018112182617188, 0.0844736099243164, 0.08876609802246094, 0.09305858612060547, 0.09735107421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 6.0, 7.0, 10.0, 14.0, 16.0, 20.0, 36.0, 23.0, 45.0, 83.0, 93.0, 150.0, 229.0, 347.0, 469.0, 913.0, 1555.0, 3412.0, 10159.0, 84426.0, 4053152.0, 27178.0, 6193.0, 2456.0, 1202.0, 698.0, 439.0, 296.0, 214.0, 130.0, 83.0, 56.0, 47.0, 27.0, 15.0, 14.0, 13.0, 9.0, 8.0, 6.0, 11.0, 4.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.1888427734375, -0.18299484252929688, -0.17714691162109375, -0.17129898071289062, -0.1654510498046875, -0.15960311889648438, -0.15375518798828125, -0.14790725708007812, -0.142059326171875, -0.13621139526367188, -0.13036346435546875, -0.12451553344726562, -0.1186676025390625, -0.11281967163085938, -0.10697174072265625, -0.10112380981445312, -0.09527587890625, -0.08942794799804688, -0.08358001708984375, -0.07773208618164062, -0.0718841552734375, -0.06603622436523438, -0.06018829345703125, -0.054340362548828125, -0.048492431640625, -0.042644500732421875, -0.03679656982421875, -0.030948638916015625, -0.0251007080078125, -0.019252777099609375, -0.01340484619140625, -0.007556915283203125, -0.001708984375, 0.004138946533203125, 0.00998687744140625, 0.015834808349609375, 0.0216827392578125, 0.027530670166015625, 0.03337860107421875, 0.039226531982421875, 0.045074462890625, 0.050922393798828125, 0.05677032470703125, 0.06261825561523438, 0.0684661865234375, 0.07431411743164062, 0.08016204833984375, 0.08600997924804688, 0.09185791015625, 0.09770584106445312, 0.10355377197265625, 0.10940170288085938, 0.1152496337890625, 0.12109756469726562, 0.12694549560546875, 0.13279342651367188, 0.138641357421875, 0.14448928833007812, 0.15033721923828125, 0.15618515014648438, 0.1620330810546875, 0.16788101196289062, 0.17372894287109375, 0.17957687377929688, 0.1854248046875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 12.0, 18.0, 65.0, 606.0, 3237.0, 70.0, 23.0, 15.0, 9.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0694580078125, -0.067474365234375, -0.06549072265625, -0.063507080078125, -0.0615234375, -0.059539794921875, -0.05755615234375, -0.055572509765625, -0.0535888671875, -0.051605224609375, -0.04962158203125, -0.047637939453125, -0.045654296875, -0.043670654296875, -0.04168701171875, -0.039703369140625, -0.0377197265625, -0.035736083984375, -0.03375244140625, -0.031768798828125, -0.02978515625, -0.027801513671875, -0.02581787109375, -0.023834228515625, -0.0218505859375, -0.019866943359375, -0.01788330078125, -0.015899658203125, -0.013916015625, -0.011932373046875, -0.00994873046875, -0.007965087890625, -0.0059814453125, -0.003997802734375, -0.00201416015625, -3.0517578125e-05, 0.001953125, 0.003936767578125, 0.00592041015625, 0.007904052734375, 0.0098876953125, 0.011871337890625, 0.01385498046875, 0.015838623046875, 0.017822265625, 0.019805908203125, 0.02178955078125, 0.023773193359375, 0.0257568359375, 0.027740478515625, 0.02972412109375, 0.031707763671875, 0.03369140625, 0.035675048828125, 0.03765869140625, 0.039642333984375, 0.0416259765625, 0.043609619140625, 0.04559326171875, 0.047576904296875, 0.049560546875, 0.051544189453125, 0.05352783203125, 0.055511474609375, 0.0574951171875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 9.0, 26.0, 53.0, 121.0, 204.0, 272.0, 154.0, 89.0, 39.0, 17.0, 7.0, 5.0, 7.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2907010018825531, -0.28236693143844604, -0.2740328907966614, -0.2656988203525543, -0.25736477971076965, -0.2490307092666626, -0.24069665372371674, -0.23236259818077087, -0.22402852773666382, -0.21569447219371796, -0.2073604166507721, -0.19902634620666504, -0.19069229066371918, -0.18235823512077332, -0.17402417957782745, -0.1656901240348816, -0.15735606849193573, -0.14902201294898987, -0.140687957406044, -0.13235390186309814, -0.12401983141899109, -0.11568577587604523, -0.10735172033309937, -0.0990176647901535, -0.09068360179662704, -0.08234954625368118, -0.07401548326015472, -0.06568142771720886, -0.0573473684489727, -0.04901330918073654, -0.04067925363779068, -0.03234519436955452, -0.02401113510131836, -0.0156770758330822, -0.007343018427491188, 0.000991038978099823, 0.009325098246335983, 0.017659157514572144, 0.025993213057518005, 0.034327272325754166, 0.042661331593990326, 0.050995390862226486, 0.059329450130462646, 0.06766350567340851, 0.07599756121635437, 0.08433162420988083, 0.09266567975282669, 0.10099974274635315, 0.10933379828929901, 0.11766785383224487, 0.12600190937519073, 0.1343359649181366, 0.14267003536224365, 0.15100409090518951, 0.15933814644813538, 0.16767220199108124, 0.1760062575340271, 0.18434031307697296, 0.19267436861991882, 0.20100843906402588, 0.20934249460697174, 0.2176765501499176, 0.22601060569286346, 0.23434466123580933, 0.24267873167991638]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 4.0, 7.0, 8.0, 7.0, 15.0, 9.0, 10.0, 15.0, 19.0, 19.0, 21.0, 32.0, 24.0, 31.0, 37.0, 24.0, 27.0, 41.0, 44.0, 52.0, 36.0, 44.0, 43.0, 31.0, 31.0, 31.0, 36.0, 39.0, 34.0, 46.0, 27.0, 27.0, 17.0, 26.0, 14.0, 21.0, 9.0, 7.0, 11.0, 10.0, 7.0, 5.0, 2.0, 0.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07930302619934082, -0.07681325823068619, -0.07432348281145096, -0.07183371484279633, -0.0693439394235611, -0.06685417145490646, -0.06436440348625183, -0.0618746317923069, -0.05938486009836197, -0.05689508840441704, -0.05440531671047211, -0.051915548741817474, -0.04942577704787254, -0.04693600535392761, -0.04444623738527298, -0.04195646569132805, -0.03946669399738312, -0.03697692230343819, -0.034487150609493256, -0.03199738264083862, -0.029507610946893692, -0.02701783925294876, -0.02452806942164898, -0.022038299590349197, -0.019548527896404266, -0.017058756202459335, -0.014568986371159554, -0.012079215608537197, -0.00958944484591484, -0.007099674083292484, -0.004609903320670128, -0.002120133489370346, 0.00036963820457458496, 0.0028594089671969414, 0.005349179729819298, 0.007838950492441654, 0.01032872125506401, 0.012818492017686367, 0.015308262780308723, 0.017798032611608505, 0.020287804305553436, 0.022777575999498367, 0.02526734583079815, 0.02775711566209793, 0.030246887356042862, 0.03273665904998779, 0.035226427018642426, 0.03771619871258736, 0.04020597040653229, 0.04269574210047722, 0.04518551379442215, 0.04767528176307678, 0.05016505345702171, 0.052654825150966644, 0.05514459311962128, 0.05763436481356621, 0.06012413650751114, 0.06261390447616577, 0.065103679895401, 0.06759344786405563, 0.07008321583271027, 0.0725729912519455, 0.07506275922060013, 0.07755252718925476, 0.08004230260848999]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 7.0, 11.0, 7.0, 16.0, 42.0, 35.0, 64.0, 91.0, 177.0, 271.0, 575.0, 1046.0, 2191.0, 4829.0, 12037.0, 32383.0, 96335.0, 294787.0, 380861.0, 146169.0, 47390.0, 16841.0, 6649.0, 2822.0, 1337.0, 688.0, 357.0, 215.0, 109.0, 73.0, 49.0, 28.0, 24.0, 15.0, 8.0, 4.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11279296875, -0.10848426818847656, -0.10417556762695312, -0.09986686706542969, -0.09555816650390625, -0.09124946594238281, -0.08694076538085938, -0.08263206481933594, -0.0783233642578125, -0.07401466369628906, -0.06970596313476562, -0.06539726257324219, -0.06108856201171875, -0.05677986145019531, -0.052471160888671875, -0.04816246032714844, -0.043853759765625, -0.03954505920410156, -0.035236358642578125, -0.030927658081054688, -0.02661895751953125, -0.022310256958007812, -0.018001556396484375, -0.013692855834960938, -0.0093841552734375, -0.0050754547119140625, -0.000766754150390625, 0.0035419464111328125, 0.00785064697265625, 0.012159347534179688, 0.016468048095703125, 0.020776748657226562, 0.02508544921875, 0.029394149780273438, 0.033702850341796875, 0.03801155090332031, 0.04232025146484375, 0.04662895202636719, 0.050937652587890625, 0.05524635314941406, 0.0595550537109375, 0.06386375427246094, 0.06817245483398438, 0.07248115539550781, 0.07678985595703125, 0.08109855651855469, 0.08540725708007812, 0.08971595764160156, 0.094024658203125, 0.09833335876464844, 0.10264205932617188, 0.10695075988769531, 0.11125946044921875, 0.11556816101074219, 0.11987686157226562, 0.12418556213378906, 0.1284942626953125, 0.13280296325683594, 0.13711166381835938, 0.1414203643798828, 0.14572906494140625, 0.1500377655029297, 0.15434646606445312, 0.15865516662597656, 0.1629638671875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 4.0, 8.0, 10.0, 16.0, 14.0, 20.0, 25.0, 33.0, 32.0, 41.0, 46.0, 59.0, 64.0, 54.0, 75.0, 50.0, 62.0, 57.0, 56.0, 44.0, 38.0, 28.0, 32.0, 24.0, 23.0, 15.0, 20.0, 10.0, 14.0, 10.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0], "bins": [-0.17822265625, -0.17386817932128906, -0.16951370239257812, -0.1651592254638672, -0.16080474853515625, -0.1564502716064453, -0.15209579467773438, -0.14774131774902344, -0.1433868408203125, -0.13903236389160156, -0.13467788696289062, -0.1303234100341797, -0.12596893310546875, -0.12161445617675781, -0.11725997924804688, -0.11290550231933594, -0.108551025390625, -0.10419654846191406, -0.09984207153320312, -0.09548759460449219, -0.09113311767578125, -0.08677864074707031, -0.08242416381835938, -0.07806968688964844, -0.0737152099609375, -0.06936073303222656, -0.06500625610351562, -0.06065177917480469, -0.05629730224609375, -0.05194282531738281, -0.047588348388671875, -0.04323387145996094, -0.03887939453125, -0.03452491760253906, -0.030170440673828125, -0.025815963745117188, -0.02146148681640625, -0.017107009887695312, -0.012752532958984375, -0.008398056030273438, -0.0040435791015625, 0.0003108978271484375, 0.004665374755859375, 0.009019851684570312, 0.01337432861328125, 0.017728805541992188, 0.022083282470703125, 0.026437759399414062, 0.030792236328125, 0.03514671325683594, 0.039501190185546875, 0.04385566711425781, 0.04821014404296875, 0.05256462097167969, 0.056919097900390625, 0.06127357482910156, 0.0656280517578125, 0.06998252868652344, 0.07433700561523438, 0.07869148254394531, 0.08304595947265625, 0.08740043640136719, 0.09175491333007812, 0.09610939025878906, 0.1004638671875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 7.0, 9.0, 2.0, 7.0, 11.0, 14.0, 17.0, 17.0, 25.0, 25.0, 34.0, 54.0, 54.0, 67.0, 87.0, 114.0, 152.0, 286.0, 510.0, 1051.0, 2791.0, 10139.0, 53946.0, 430242.0, 474454.0, 58168.0, 10757.0, 2897.0, 1063.0, 540.0, 295.0, 187.0, 105.0, 93.0, 66.0, 54.0, 36.0, 39.0, 39.0, 22.0, 20.0, 14.0, 16.0, 5.0, 8.0, 7.0, 11.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.25048828125, -0.24333572387695312, -0.23618316650390625, -0.22903060913085938, -0.2218780517578125, -0.21472549438476562, -0.20757293701171875, -0.20042037963867188, -0.193267822265625, -0.18611526489257812, -0.17896270751953125, -0.17181015014648438, -0.1646575927734375, -0.15750503540039062, -0.15035247802734375, -0.14319992065429688, -0.13604736328125, -0.12889480590820312, -0.12174224853515625, -0.11458969116210938, -0.1074371337890625, -0.10028457641601562, -0.09313201904296875, -0.08597946166992188, -0.078826904296875, -0.07167434692382812, -0.06452178955078125, -0.057369232177734375, -0.0502166748046875, -0.043064117431640625, -0.03591156005859375, -0.028759002685546875, -0.0216064453125, -0.014453887939453125, -0.00730133056640625, -0.000148773193359375, 0.0070037841796875, 0.014156341552734375, 0.02130889892578125, 0.028461456298828125, 0.035614013671875, 0.042766571044921875, 0.04991912841796875, 0.057071685791015625, 0.0642242431640625, 0.07137680053710938, 0.07852935791015625, 0.08568191528320312, 0.09283447265625, 0.09998703002929688, 0.10713958740234375, 0.11429214477539062, 0.1214447021484375, 0.12859725952148438, 0.13574981689453125, 0.14290237426757812, 0.150054931640625, 0.15720748901367188, 0.16436004638671875, 0.17151260375976562, 0.1786651611328125, 0.18581771850585938, 0.19297027587890625, 0.20012283325195312, 0.207275390625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 10.0, 4.0, 14.0, 12.0, 15.0, 20.0, 22.0, 22.0, 23.0, 26.0, 45.0, 33.0, 52.0, 61.0, 51.0, 55.0, 46.0, 60.0, 57.0, 38.0, 49.0, 33.0, 37.0, 28.0, 25.0, 30.0, 27.0, 17.0, 23.0, 19.0, 11.0, 13.0, 8.0, 7.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57861328125, -0.5621910095214844, -0.5457687377929688, -0.5293464660644531, -0.5129241943359375, -0.4965019226074219, -0.48007965087890625, -0.4636573791503906, -0.447235107421875, -0.4308128356933594, -0.41439056396484375, -0.3979682922363281, -0.3815460205078125, -0.3651237487792969, -0.34870147705078125, -0.3322792053222656, -0.31585693359375, -0.2994346618652344, -0.28301239013671875, -0.2665901184082031, -0.2501678466796875, -0.23374557495117188, -0.21732330322265625, -0.20090103149414062, -0.184478759765625, -0.16805648803710938, -0.15163421630859375, -0.13521194458007812, -0.1187896728515625, -0.10236740112304688, -0.08594512939453125, -0.06952285766601562, -0.0531005859375, -0.036678314208984375, -0.02025604248046875, -0.003833770751953125, 0.0125885009765625, 0.029010772705078125, 0.04543304443359375, 0.061855316162109375, 0.078277587890625, 0.09469985961914062, 0.11112213134765625, 0.12754440307617188, 0.1439666748046875, 0.16038894653320312, 0.17681121826171875, 0.19323348999023438, 0.20965576171875, 0.22607803344726562, 0.24250030517578125, 0.2589225769042969, 0.2753448486328125, 0.2917671203613281, 0.30818939208984375, 0.3246116638183594, 0.341033935546875, 0.3574562072753906, 0.37387847900390625, 0.3903007507324219, 0.4067230224609375, 0.4231452941894531, 0.43956756591796875, 0.4559898376464844, 0.472412109375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 1.0, 6.0, 8.0, 7.0, 15.0, 24.0, 34.0, 44.0, 72.0, 126.0, 267.0, 615.0, 1608.0, 6094.0, 51659.0, 887314.0, 88952.0, 8331.0, 1966.0, 729.0, 297.0, 134.0, 72.0, 54.0, 41.0, 23.0, 14.0, 12.0, 11.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1829833984375, -0.1778411865234375, -0.172698974609375, -0.1675567626953125, -0.16241455078125, -0.1572723388671875, -0.152130126953125, -0.1469879150390625, -0.141845703125, -0.1367034912109375, -0.131561279296875, -0.1264190673828125, -0.12127685546875, -0.1161346435546875, -0.110992431640625, -0.1058502197265625, -0.1007080078125, -0.0955657958984375, -0.090423583984375, -0.0852813720703125, -0.08013916015625, -0.0749969482421875, -0.069854736328125, -0.0647125244140625, -0.0595703125, -0.0544281005859375, -0.049285888671875, -0.0441436767578125, -0.03900146484375, -0.0338592529296875, -0.028717041015625, -0.0235748291015625, -0.0184326171875, -0.0132904052734375, -0.008148193359375, -0.0030059814453125, 0.00213623046875, 0.0072784423828125, 0.012420654296875, 0.0175628662109375, 0.022705078125, 0.0278472900390625, 0.032989501953125, 0.0381317138671875, 0.04327392578125, 0.0484161376953125, 0.053558349609375, 0.0587005615234375, 0.0638427734375, 0.0689849853515625, 0.074127197265625, 0.0792694091796875, 0.08441162109375, 0.0895538330078125, 0.094696044921875, 0.0998382568359375, 0.10498046875, 0.1101226806640625, 0.115264892578125, 0.1204071044921875, 0.12554931640625, 0.1306915283203125, 0.135833740234375, 0.1409759521484375, 0.1461181640625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 2.0, 4.0, 4.0, 4.0, 8.0, 14.0, 12.0, 18.0, 26.0, 34.0, 55.0, 79.0, 127.0, 149.0, 133.0, 103.0, 65.0, 41.0, 32.0, 14.0, 20.0, 11.0, 12.0, 7.0, 3.0, 5.0, 5.0, 4.0, 1.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.693601608276367e-05, -6.500538438558578e-05, -6.30747526884079e-05, -6.114412099123001e-05, -5.9213489294052124e-05, -5.728285759687424e-05, -5.535222589969635e-05, -5.342159420251846e-05, -5.1490962505340576e-05, -4.956033080816269e-05, -4.76296991109848e-05, -4.5699067413806915e-05, -4.376843571662903e-05, -4.183780401945114e-05, -3.9907172322273254e-05, -3.797654062509537e-05, -3.604590892791748e-05, -3.4115277230739594e-05, -3.2184645533561707e-05, -3.025401383638382e-05, -2.8323382139205933e-05, -2.6392750442028046e-05, -2.446211874485016e-05, -2.2531487047672272e-05, -2.0600855350494385e-05, -1.8670223653316498e-05, -1.673959195613861e-05, -1.4808960258960724e-05, -1.2878328561782837e-05, -1.094769686460495e-05, -9.017065167427063e-06, -7.086433470249176e-06, -5.155801773071289e-06, -3.225170075893402e-06, -1.2945383787155151e-06, 6.360933184623718e-07, 2.566725015640259e-06, 4.497356712818146e-06, 6.427988409996033e-06, 8.35862010717392e-06, 1.0289251804351807e-05, 1.2219883501529694e-05, 1.415051519870758e-05, 1.6081146895885468e-05, 1.8011778593063354e-05, 1.994241029024124e-05, 2.187304198741913e-05, 2.3803673684597015e-05, 2.5734305381774902e-05, 2.766493707895279e-05, 2.9595568776130676e-05, 3.152620047330856e-05, 3.345683217048645e-05, 3.538746386766434e-05, 3.7318095564842224e-05, 3.924872726202011e-05, 4.1179358959198e-05, 4.3109990656375885e-05, 4.504062235355377e-05, 4.697125405073166e-05, 4.8901885747909546e-05, 5.083251744508743e-05, 5.276314914226532e-05, 5.469378083944321e-05, 5.6624412536621094e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 8.0, 5.0, 7.0, 7.0, 10.0, 27.0, 39.0, 50.0, 108.0, 187.0, 529.0, 1614.0, 6221.0, 46957.0, 814510.0, 162252.0, 11929.0, 2586.0, 786.0, 332.0, 146.0, 81.0, 49.0, 31.0, 29.0, 6.0, 9.0, 5.0, 5.0, 6.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1453857421875, -0.14064979553222656, -0.13591384887695312, -0.1311779022216797, -0.12644195556640625, -0.12170600891113281, -0.11697006225585938, -0.11223411560058594, -0.1074981689453125, -0.10276222229003906, -0.09802627563476562, -0.09329032897949219, -0.08855438232421875, -0.08381843566894531, -0.07908248901367188, -0.07434654235839844, -0.069610595703125, -0.06487464904785156, -0.060138702392578125, -0.05540275573730469, -0.05066680908203125, -0.04593086242675781, -0.041194915771484375, -0.03645896911621094, -0.0317230224609375, -0.026987075805664062, -0.022251129150390625, -0.017515182495117188, -0.01277923583984375, -0.008043289184570312, -0.003307342529296875, 0.0014286041259765625, 0.00616455078125, 0.010900497436523438, 0.015636444091796875, 0.020372390747070312, 0.02510833740234375, 0.029844284057617188, 0.034580230712890625, 0.03931617736816406, 0.0440521240234375, 0.04878807067871094, 0.053524017333984375, 0.05825996398925781, 0.06299591064453125, 0.06773185729980469, 0.07246780395507812, 0.07720375061035156, 0.081939697265625, 0.08667564392089844, 0.09141159057617188, 0.09614753723144531, 0.10088348388671875, 0.10561943054199219, 0.11035537719726562, 0.11509132385253906, 0.1198272705078125, 0.12456321716308594, 0.12929916381835938, 0.1340351104736328, 0.13877105712890625, 0.1435070037841797, 0.14824295043945312, 0.15297889709472656, 0.15771484375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 11.0, 21.0, 38.0, 88.0, 161.0, 232.0, 206.0, 103.0, 44.0, 28.0, 14.0, 11.0, 6.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35205078125, -0.3432121276855469, -0.33437347412109375, -0.3255348205566406, -0.3166961669921875, -0.3078575134277344, -0.29901885986328125, -0.2901802062988281, -0.281341552734375, -0.2725028991699219, -0.26366424560546875, -0.2548255920410156, -0.2459869384765625, -0.23714828491210938, -0.22830963134765625, -0.21947097778320312, -0.21063232421875, -0.20179367065429688, -0.19295501708984375, -0.18411636352539062, -0.1752777099609375, -0.16643905639648438, -0.15760040283203125, -0.14876174926757812, -0.139923095703125, -0.13108444213867188, -0.12224578857421875, -0.11340713500976562, -0.1045684814453125, -0.09572982788085938, -0.08689117431640625, -0.07805252075195312, -0.0692138671875, -0.060375213623046875, -0.05153656005859375, -0.042697906494140625, -0.0338592529296875, -0.025020599365234375, -0.01618194580078125, -0.007343292236328125, 0.001495361328125, 0.010334014892578125, 0.01917266845703125, 0.028011322021484375, 0.0368499755859375, 0.045688629150390625, 0.05452728271484375, 0.06336593627929688, 0.07220458984375, 0.08104324340820312, 0.08988189697265625, 0.09872055053710938, 0.1075592041015625, 0.11639785766601562, 0.12523651123046875, 0.13407516479492188, 0.142913818359375, 0.15175247192382812, 0.16059112548828125, 0.16942977905273438, 0.1782684326171875, 0.18710708618164062, 0.19594573974609375, 0.20478439331054688, 0.213623046875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 2.0, 5.0, 11.0, 7.0, 19.0, 48.0, 55.0, 79.0, 109.0, 139.0, 141.0, 142.0, 109.0, 47.0, 34.0, 23.0, 9.0, 16.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0867371559143066, -2.0298352241516113, -1.9729334115982056, -1.9160315990447998, -1.8591296672821045, -1.8022278547286987, -1.7453259229660034, -1.6884241104125977, -1.6315221786499023, -1.5746203660964966, -1.5177184343338013, -1.4608166217803955, -1.4039146900177002, -1.3470128774642944, -1.2901109457015991, -1.2332091331481934, -1.176307201385498, -1.1194053888320923, -1.062503457069397, -1.0056016445159912, -0.9486997127532959, -0.8917979001998901, -0.8348959684371948, -0.7779941558837891, -0.7210923433303833, -0.6641904711723328, -0.6072885990142822, -0.5503867268562317, -0.49348485469818115, -0.436583012342453, -0.37968114018440247, -0.32277926802635193, -0.265877366065979, -0.20897549390792847, -0.15207362174987793, -0.09517176449298859, -0.03826989233493805, 0.018631964921951294, 0.07553383708000183, 0.13243570923805237, 0.1893375813961029, 0.24623945355415344, 0.303141325712204, 0.36004316806793213, 0.41694504022598267, 0.4738469123840332, 0.5307487845420837, 0.5876506567001343, 0.6445525288581848, 0.7014544010162354, 0.7583562731742859, 0.8152581453323364, 0.872160017490387, 0.9290618896484375, 0.9859637022018433, 1.0428656339645386, 1.0997674465179443, 1.15666925907135, 1.2135711908340454, 1.2704730033874512, 1.3273749351501465, 1.3842767477035522, 1.4411786794662476, 1.4980804920196533, 1.5549824237823486]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 8.0, 7.0, 11.0, 7.0, 17.0, 13.0, 17.0, 12.0, 25.0, 27.0, 25.0, 24.0, 36.0, 30.0, 41.0, 54.0, 35.0, 55.0, 64.0, 50.0, 48.0, 47.0, 43.0, 36.0, 33.0, 46.0, 26.0, 33.0, 24.0, 18.0, 18.0, 12.0, 15.0, 10.0, 4.0, 6.0, 2.0, 8.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0074591636657715, -1.9423013925552368, -1.8771436214447021, -1.811985969543457, -1.7468281984329224, -1.6816704273223877, -1.6165127754211426, -1.551355004310608, -1.4861972332000732, -1.4210394620895386, -1.355881690979004, -1.2907240390777588, -1.2255662679672241, -1.1604084968566895, -1.0952508449554443, -1.0300930738449097, -0.964935302734375, -0.8997775316238403, -0.8346198201179504, -0.7694621086120605, -0.7043043375015259, -0.6391465663909912, -0.5739888548851013, -0.5088311433792114, -0.44367337226867676, -0.3785156309604645, -0.3133578896522522, -0.24820014834403992, -0.18304240703582764, -0.11788466572761536, -0.052726924419403076, 0.012430816888809204, 0.07758855819702148, 0.14274629950523376, 0.20790404081344604, 0.2730617821216583, 0.3382195234298706, 0.4033772647380829, 0.46853500604629517, 0.5336927175521851, 0.5988504886627197, 0.6640082597732544, 0.7291659712791443, 0.7943236827850342, 0.8594814538955688, 0.9246392250061035, 0.9897969365119934, 1.0549546480178833, 1.120112419128418, 1.1852701902389526, 1.2504279613494873, 1.3155856132507324, 1.380743384361267, 1.4459011554718018, 1.5110588073730469, 1.5762165784835815, 1.6413743495941162, 1.7065321207046509, 1.7716898918151855, 1.8368475437164307, 1.9020053148269653, 1.9671630859375, 2.032320737838745, 2.0974786281585693, 2.1626362800598145]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 5.0, 7.0, 11.0, 14.0, 24.0, 23.0, 35.0, 60.0, 99.0, 122.0, 170.0, 246.0, 374.0, 605.0, 963.0, 1760.0, 3468.0, 9282.0, 49489.0, 4014737.0, 91139.0, 12308.0, 4203.0, 2075.0, 1086.0, 684.0, 444.0, 265.0, 190.0, 105.0, 87.0, 55.0, 50.0, 30.0, 13.0, 14.0, 9.0, 5.0, 5.0, 10.0, 1.0, 4.0, 3.0], "bins": [-0.2254638671875, -0.2199115753173828, -0.21435928344726562, -0.20880699157714844, -0.20325469970703125, -0.19770240783691406, -0.19215011596679688, -0.1865978240966797, -0.1810455322265625, -0.1754932403564453, -0.16994094848632812, -0.16438865661621094, -0.15883636474609375, -0.15328407287597656, -0.14773178100585938, -0.1421794891357422, -0.136627197265625, -0.1310749053955078, -0.12552261352539062, -0.11997032165527344, -0.11441802978515625, -0.10886573791503906, -0.10331344604492188, -0.09776115417480469, -0.0922088623046875, -0.08665657043457031, -0.08110427856445312, -0.07555198669433594, -0.06999969482421875, -0.06444740295410156, -0.058895111083984375, -0.05334281921386719, -0.04779052734375, -0.04223823547363281, -0.036685943603515625, -0.031133651733398438, -0.02558135986328125, -0.020029067993164062, -0.014476776123046875, -0.008924484252929688, -0.0033721923828125, 0.0021800994873046875, 0.007732391357421875, 0.013284683227539062, 0.01883697509765625, 0.024389266967773438, 0.029941558837890625, 0.03549385070800781, 0.041046142578125, 0.04659843444824219, 0.052150726318359375, 0.05770301818847656, 0.06325531005859375, 0.06880760192871094, 0.07435989379882812, 0.07991218566894531, 0.0854644775390625, 0.09101676940917969, 0.09656906127929688, 0.10212135314941406, 0.10767364501953125, 0.11322593688964844, 0.11877822875976562, 0.12433052062988281, 0.1298828125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 4.0, 10.0, 8.0, 6.0, 16.0, 9.0, 18.0, 27.0, 27.0, 28.0, 39.0, 36.0, 40.0, 49.0, 58.0, 54.0, 70.0, 44.0, 53.0, 56.0, 50.0, 48.0, 46.0, 25.0, 30.0, 30.0, 21.0, 20.0, 16.0, 14.0, 11.0, 3.0, 8.0, 11.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 4.0], "bins": [-0.1556396484375, -0.15176105499267578, -0.14788246154785156, -0.14400386810302734, -0.14012527465820312, -0.1362466812133789, -0.1323680877685547, -0.12848949432373047, -0.12461090087890625, -0.12073230743408203, -0.11685371398925781, -0.1129751205444336, -0.10909652709960938, -0.10521793365478516, -0.10133934020996094, -0.09746074676513672, -0.0935821533203125, -0.08970355987548828, -0.08582496643066406, -0.08194637298583984, -0.07806777954101562, -0.0741891860961914, -0.07031059265136719, -0.06643199920654297, -0.06255340576171875, -0.05867481231689453, -0.05479621887207031, -0.050917625427246094, -0.047039031982421875, -0.043160438537597656, -0.03928184509277344, -0.03540325164794922, -0.031524658203125, -0.02764606475830078, -0.023767471313476562, -0.019888877868652344, -0.016010284423828125, -0.012131690979003906, -0.008253097534179688, -0.004374504089355469, -0.00049591064453125, 0.0033826828002929688, 0.0072612762451171875, 0.011139869689941406, 0.015018463134765625, 0.018897056579589844, 0.022775650024414062, 0.02665424346923828, 0.0305328369140625, 0.03441143035888672, 0.03829002380371094, 0.042168617248535156, 0.046047210693359375, 0.049925804138183594, 0.05380439758300781, 0.05768299102783203, 0.06156158447265625, 0.06544017791748047, 0.06931877136230469, 0.0731973648071289, 0.07707595825195312, 0.08095455169677734, 0.08483314514160156, 0.08871173858642578, 0.09259033203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 0.0, 3.0, 6.0, 9.0, 13.0, 14.0, 18.0, 28.0, 45.0, 57.0, 80.0, 104.0, 136.0, 229.0, 360.0, 644.0, 1120.0, 2456.0, 7450.0, 85443.0, 4066232.0, 21460.0, 4264.0, 1746.0, 854.0, 472.0, 307.0, 195.0, 138.0, 99.0, 80.0, 54.0, 43.0, 33.0, 27.0, 12.0, 8.0, 12.0, 13.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.300537109375, -0.29093170166015625, -0.2813262939453125, -0.27172088623046875, -0.262115478515625, -0.25251007080078125, -0.2429046630859375, -0.23329925537109375, -0.22369384765625, -0.21408843994140625, -0.2044830322265625, -0.19487762451171875, -0.185272216796875, -0.17566680908203125, -0.1660614013671875, -0.15645599365234375, -0.1468505859375, -0.13724517822265625, -0.1276397705078125, -0.11803436279296875, -0.108428955078125, -0.09882354736328125, -0.0892181396484375, -0.07961273193359375, -0.07000732421875, -0.06040191650390625, -0.0507965087890625, -0.04119110107421875, -0.031585693359375, -0.02198028564453125, -0.0123748779296875, -0.00276947021484375, 0.0068359375, 0.01644134521484375, 0.0260467529296875, 0.03565216064453125, 0.045257568359375, 0.05486297607421875, 0.0644683837890625, 0.07407379150390625, 0.08367919921875, 0.09328460693359375, 0.1028900146484375, 0.11249542236328125, 0.122100830078125, 0.13170623779296875, 0.1413116455078125, 0.15091705322265625, 0.1605224609375, 0.17012786865234375, 0.1797332763671875, 0.18933868408203125, 0.198944091796875, 0.20854949951171875, 0.2181549072265625, 0.22776031494140625, 0.23736572265625, 0.24697113037109375, 0.2565765380859375, 0.26618194580078125, 0.275787353515625, 0.28539276123046875, 0.2949981689453125, 0.30460357666015625, 0.314208984375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 10.0, 22.0, 128.0, 3610.0, 229.0, 43.0, 18.0, 7.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21435546875, -0.2073535919189453, -0.20035171508789062, -0.19334983825683594, -0.18634796142578125, -0.17934608459472656, -0.17234420776367188, -0.1653423309326172, -0.1583404541015625, -0.1513385772705078, -0.14433670043945312, -0.13733482360839844, -0.13033294677734375, -0.12333106994628906, -0.11632919311523438, -0.10932731628417969, -0.102325439453125, -0.09532356262207031, -0.08832168579101562, -0.08131980895996094, -0.07431793212890625, -0.06731605529785156, -0.060314178466796875, -0.05331230163574219, -0.0463104248046875, -0.03930854797363281, -0.032306671142578125, -0.025304794311523438, -0.01830291748046875, -0.011301040649414062, -0.004299163818359375, 0.0027027130126953125, 0.00970458984375, 0.016706466674804688, 0.023708343505859375, 0.030710220336914062, 0.03771209716796875, 0.04471397399902344, 0.051715850830078125, 0.05871772766113281, 0.0657196044921875, 0.07272148132324219, 0.07972335815429688, 0.08672523498535156, 0.09372711181640625, 0.10072898864746094, 0.10773086547851562, 0.11473274230957031, 0.121734619140625, 0.1287364959716797, 0.13573837280273438, 0.14274024963378906, 0.14974212646484375, 0.15674400329589844, 0.16374588012695312, 0.1707477569580078, 0.1777496337890625, 0.1847515106201172, 0.19175338745117188, 0.19875526428222656, 0.20575714111328125, 0.21275901794433594, 0.21976089477539062, 0.2267627716064453, 0.2337646484375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 9.0, 11.0, 23.0, 40.0, 58.0, 83.0, 121.0, 147.0, 184.0, 127.0, 79.0, 46.0, 31.0, 13.0, 10.0, 9.0, 3.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36494317650794983, -0.3513897657394409, -0.3378363847732544, -0.3242829740047455, -0.3107295632362366, -0.29717618227005005, -0.28362277150154114, -0.2700693607330322, -0.2565159797668457, -0.24296258389949799, -0.22940917313098907, -0.21585577726364136, -0.20230236649513245, -0.18874897062778473, -0.175195574760437, -0.1616421639919281, -0.1480887532234192, -0.13453535735607147, -0.12098194658756256, -0.10742855072021484, -0.09387514740228653, -0.08032174408435822, -0.0667683482170105, -0.053214944899082184, -0.03966154158115387, -0.026108140125870705, -0.01255473867058754, 0.000998660922050476, 0.01455206423997879, 0.028105467557907104, 0.04165886342525482, 0.055212266743183136, 0.06876569986343384, 0.08231910318136215, 0.09587250649929047, 0.10942590236663818, 0.1229793056845665, 0.1365327090024948, 0.15008610486984253, 0.16363951563835144, 0.17719291150569916, 0.19074630737304688, 0.2042997181415558, 0.2178531140089035, 0.23140650987625122, 0.24495992064476013, 0.25851333141326904, 0.27206671237945557, 0.2856201231479645, 0.2991735339164734, 0.3127269148826599, 0.3262803256511688, 0.33983373641967773, 0.35338711738586426, 0.36694052815437317, 0.3804939389228821, 0.3940473198890686, 0.4076007306575775, 0.42115411162376404, 0.43470752239227295, 0.44826093316078186, 0.46181434392929077, 0.4753677248954773, 0.4889211356639862, 0.5024745464324951]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 7.0, 10.0, 8.0, 14.0, 21.0, 22.0, 31.0, 38.0, 36.0, 38.0, 37.0, 45.0, 55.0, 54.0, 66.0, 52.0, 46.0, 52.0, 59.0, 59.0, 43.0, 33.0, 43.0, 26.0, 23.0, 20.0, 19.0, 13.0, 7.0, 8.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24484783411026, -0.23513230681419373, -0.22541677951812744, -0.21570125222206116, -0.20598572492599487, -0.1962701976299286, -0.1865546703338623, -0.17683914303779602, -0.16712361574172974, -0.15740808844566345, -0.14769256114959717, -0.13797703385353088, -0.1282615065574646, -0.11854597926139832, -0.10883045941591263, -0.09911493211984634, -0.08939941227436066, -0.07968388497829437, -0.06996835768222809, -0.0602528341114521, -0.05053730681538582, -0.040821779519319534, -0.03110625594854355, -0.021390728652477264, -0.01167520135641098, -0.0019596749916672707, 0.007755851373076439, 0.017471376806497574, 0.027186904102563858, 0.03690243139863014, 0.04661795496940613, 0.05633348226547241, 0.0660490095615387, 0.07576453685760498, 0.08548006415367126, 0.09519559144973755, 0.10491111874580383, 0.11462664604187012, 0.1243421658873558, 0.13405770063400269, 0.14377322793006897, 0.15348875522613525, 0.16320428252220154, 0.17291980981826782, 0.1826353371143341, 0.1923508644104004, 0.20206639170646667, 0.21178191900253296, 0.22149743139743805, 0.23121295869350433, 0.24092848598957062, 0.2506439983844757, 0.260359525680542, 0.2700750529766083, 0.27979058027267456, 0.28950610756874084, 0.29922163486480713, 0.3089371621608734, 0.3186526894569397, 0.328368216753006, 0.33808374404907227, 0.34779927134513855, 0.35751479864120483, 0.3672303259372711, 0.3769458532333374]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 13.0, 11.0, 19.0, 32.0, 27.0, 47.0, 85.0, 126.0, 244.0, 493.0, 1018.0, 2349.0, 6507.0, 22587.0, 104919.0, 523954.0, 310731.0, 54349.0, 13553.0, 4168.0, 1690.0, 732.0, 343.0, 214.0, 119.0, 78.0, 45.0, 31.0, 16.0, 16.0, 7.0, 10.0, 7.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.260986328125, -0.2538948059082031, -0.24680328369140625, -0.23971176147460938, -0.2326202392578125, -0.22552871704101562, -0.21843719482421875, -0.21134567260742188, -0.204254150390625, -0.19716262817382812, -0.19007110595703125, -0.18297958374023438, -0.1758880615234375, -0.16879653930664062, -0.16170501708984375, -0.15461349487304688, -0.14752197265625, -0.14043045043945312, -0.13333892822265625, -0.12624740600585938, -0.1191558837890625, -0.11206436157226562, -0.10497283935546875, -0.09788131713867188, -0.090789794921875, -0.08369827270507812, -0.07660675048828125, -0.06951522827148438, -0.0624237060546875, -0.055332183837890625, -0.04824066162109375, -0.041149139404296875, -0.0340576171875, -0.026966094970703125, -0.01987457275390625, -0.012783050537109375, -0.0056915283203125, 0.001399993896484375, 0.00849151611328125, 0.015583038330078125, 0.022674560546875, 0.029766082763671875, 0.03685760498046875, 0.043949127197265625, 0.0510406494140625, 0.058132171630859375, 0.06522369384765625, 0.07231521606445312, 0.07940673828125, 0.08649826049804688, 0.09358978271484375, 0.10068130493164062, 0.1077728271484375, 0.11486434936523438, 0.12195587158203125, 0.12904739379882812, 0.136138916015625, 0.14323043823242188, 0.15032196044921875, 0.15741348266601562, 0.1645050048828125, 0.17159652709960938, 0.17868804931640625, 0.18577957153320312, 0.19287109375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 9.0, 7.0, 13.0, 15.0, 12.0, 11.0, 20.0, 16.0, 35.0, 27.0, 33.0, 37.0, 51.0, 49.0, 36.0, 59.0, 51.0, 57.0, 54.0, 41.0, 48.0, 40.0, 43.0, 34.0, 30.0, 21.0, 27.0, 24.0, 21.0, 15.0, 12.0, 12.0, 8.0, 1.0, 15.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.147216796875, -0.1434640884399414, -0.1397113800048828, -0.13595867156982422, -0.13220596313476562, -0.12845325469970703, -0.12470054626464844, -0.12094783782958984, -0.11719512939453125, -0.11344242095947266, -0.10968971252441406, -0.10593700408935547, -0.10218429565429688, -0.09843158721923828, -0.09467887878417969, -0.0909261703491211, -0.0871734619140625, -0.0834207534790039, -0.07966804504394531, -0.07591533660888672, -0.07216262817382812, -0.06840991973876953, -0.06465721130371094, -0.060904502868652344, -0.05715179443359375, -0.053399085998535156, -0.04964637756347656, -0.04589366912841797, -0.042140960693359375, -0.03838825225830078, -0.03463554382324219, -0.030882835388183594, -0.027130126953125, -0.023377418518066406, -0.019624710083007812, -0.01587200164794922, -0.012119293212890625, -0.008366584777832031, -0.0046138763427734375, -0.0008611679077148438, 0.00289154052734375, 0.006644248962402344, 0.010396957397460938, 0.014149665832519531, 0.017902374267578125, 0.02165508270263672, 0.025407791137695312, 0.029160499572753906, 0.0329132080078125, 0.036665916442871094, 0.04041862487792969, 0.04417133331298828, 0.047924041748046875, 0.05167675018310547, 0.05542945861816406, 0.059182167053222656, 0.06293487548828125, 0.06668758392333984, 0.07044029235839844, 0.07419300079345703, 0.07794570922851562, 0.08169841766357422, 0.08545112609863281, 0.0892038345336914, 0.09295654296875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 5.0, 11.0, 11.0, 23.0, 31.0, 32.0, 42.0, 63.0, 97.0, 156.0, 257.0, 423.0, 940.0, 2405.0, 9137.0, 56664.0, 659879.0, 283628.0, 26044.0, 5401.0, 1654.0, 649.0, 358.0, 212.0, 130.0, 78.0, 48.0, 52.0, 32.0, 30.0, 14.0, 7.0, 7.0, 8.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25927734375, -0.2499542236328125, -0.240631103515625, -0.2313079833984375, -0.22198486328125, -0.2126617431640625, -0.203338623046875, -0.1940155029296875, -0.1846923828125, -0.1753692626953125, -0.166046142578125, -0.1567230224609375, -0.14739990234375, -0.1380767822265625, -0.128753662109375, -0.1194305419921875, -0.110107421875, -0.1007843017578125, -0.091461181640625, -0.0821380615234375, -0.07281494140625, -0.0634918212890625, -0.054168701171875, -0.0448455810546875, -0.0355224609375, -0.0261993408203125, -0.016876220703125, -0.0075531005859375, 0.00177001953125, 0.0110931396484375, 0.020416259765625, 0.0297393798828125, 0.0390625, 0.0483856201171875, 0.057708740234375, 0.0670318603515625, 0.07635498046875, 0.0856781005859375, 0.095001220703125, 0.1043243408203125, 0.1136474609375, 0.1229705810546875, 0.132293701171875, 0.1416168212890625, 0.15093994140625, 0.1602630615234375, 0.169586181640625, 0.1789093017578125, 0.188232421875, 0.1975555419921875, 0.206878662109375, 0.2162017822265625, 0.22552490234375, 0.2348480224609375, 0.244171142578125, 0.2534942626953125, 0.2628173828125, 0.2721405029296875, 0.281463623046875, 0.2907867431640625, 0.30010986328125, 0.3094329833984375, 0.318756103515625, 0.3280792236328125, 0.33740234375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 10.0, 12.0, 7.0, 10.0, 15.0, 12.0, 19.0, 23.0, 29.0, 27.0, 31.0, 39.0, 44.0, 37.0, 47.0, 38.0, 47.0, 51.0, 51.0, 47.0, 59.0, 44.0, 55.0, 35.0, 39.0, 36.0, 32.0, 16.0, 16.0, 8.0, 16.0, 8.0, 11.0, 8.0, 5.0, 4.0, 4.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4677734375, -0.4536552429199219, -0.43953704833984375, -0.4254188537597656, -0.4113006591796875, -0.3971824645996094, -0.38306427001953125, -0.3689460754394531, -0.354827880859375, -0.3407096862792969, -0.32659149169921875, -0.3124732971191406, -0.2983551025390625, -0.2842369079589844, -0.27011871337890625, -0.2560005187988281, -0.24188232421875, -0.22776412963867188, -0.21364593505859375, -0.19952774047851562, -0.1854095458984375, -0.17129135131835938, -0.15717315673828125, -0.14305496215820312, -0.128936767578125, -0.11481857299804688, -0.10070037841796875, -0.08658218383789062, -0.0724639892578125, -0.058345794677734375, -0.04422760009765625, -0.030109405517578125, -0.0159912109375, -0.001873016357421875, 0.01224517822265625, 0.026363372802734375, 0.0404815673828125, 0.054599761962890625, 0.06871795654296875, 0.08283615112304688, 0.096954345703125, 0.11107254028320312, 0.12519073486328125, 0.13930892944335938, 0.1534271240234375, 0.16754531860351562, 0.18166351318359375, 0.19578170776367188, 0.20989990234375, 0.22401809692382812, 0.23813629150390625, 0.2522544860839844, 0.2663726806640625, 0.2804908752441406, 0.29460906982421875, 0.3087272644042969, 0.322845458984375, 0.3369636535644531, 0.35108184814453125, 0.3652000427246094, 0.3793182373046875, 0.3934364318847656, 0.40755462646484375, 0.4216728210449219, 0.435791015625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 8.0, 3.0, 8.0, 12.0, 23.0, 36.0, 62.0, 75.0, 142.0, 276.0, 594.0, 1770.0, 7683.0, 83025.0, 876793.0, 68452.0, 6881.0, 1545.0, 540.0, 255.0, 133.0, 78.0, 54.0, 41.0, 15.0, 15.0, 10.0, 7.0, 3.0, 3.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1175537109375, -0.11381816864013672, -0.11008262634277344, -0.10634708404541016, -0.10261154174804688, -0.0988759994506836, -0.09514045715332031, -0.09140491485595703, -0.08766937255859375, -0.08393383026123047, -0.08019828796386719, -0.0764627456665039, -0.07272720336914062, -0.06899166107177734, -0.06525611877441406, -0.06152057647705078, -0.0577850341796875, -0.05404949188232422, -0.05031394958496094, -0.046578407287597656, -0.042842864990234375, -0.039107322692871094, -0.03537178039550781, -0.03163623809814453, -0.02790069580078125, -0.02416515350341797, -0.020429611206054688, -0.016694068908691406, -0.012958526611328125, -0.009222984313964844, -0.0054874420166015625, -0.0017518997192382812, 0.001983642578125, 0.005719184875488281, 0.009454727172851562, 0.013190269470214844, 0.016925811767578125, 0.020661354064941406, 0.024396896362304688, 0.02813243865966797, 0.03186798095703125, 0.03560352325439453, 0.03933906555175781, 0.043074607849121094, 0.046810150146484375, 0.050545692443847656, 0.05428123474121094, 0.05801677703857422, 0.0617523193359375, 0.06548786163330078, 0.06922340393066406, 0.07295894622802734, 0.07669448852539062, 0.0804300308227539, 0.08416557312011719, 0.08790111541748047, 0.09163665771484375, 0.09537220001220703, 0.09910774230957031, 0.1028432846069336, 0.10657882690429688, 0.11031436920166016, 0.11404991149902344, 0.11778545379638672, 0.12152099609375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 9.0, 9.0, 7.0, 16.0, 13.0, 20.0, 14.0, 29.0, 30.0, 43.0, 58.0, 72.0, 119.0, 94.0, 123.0, 86.0, 56.0, 62.0, 26.0, 28.0, 17.0, 11.0, 11.0, 8.0, 7.0, 9.0, 4.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-5.358457565307617e-05, -5.211867392063141e-05, -5.0652772188186646e-05, -4.918687045574188e-05, -4.772096872329712e-05, -4.6255066990852356e-05, -4.478916525840759e-05, -4.332326352596283e-05, -4.1857361793518066e-05, -4.03914600610733e-05, -3.892555832862854e-05, -3.745965659618378e-05, -3.5993754863739014e-05, -3.452785313129425e-05, -3.306195139884949e-05, -3.1596049666404724e-05, -3.013014793395996e-05, -2.8664246201515198e-05, -2.7198344469070435e-05, -2.573244273662567e-05, -2.4266541004180908e-05, -2.2800639271736145e-05, -2.1334737539291382e-05, -1.986883580684662e-05, -1.8402934074401855e-05, -1.6937032341957092e-05, -1.547113060951233e-05, -1.4005228877067566e-05, -1.2539327144622803e-05, -1.107342541217804e-05, -9.607523679733276e-06, -8.141621947288513e-06, -6.67572021484375e-06, -5.209818482398987e-06, -3.7439167499542236e-06, -2.2780150175094604e-06, -8.121132850646973e-07, 6.537884473800659e-07, 2.119690179824829e-06, 3.5855919122695923e-06, 5.0514936447143555e-06, 6.517395377159119e-06, 7.983297109603882e-06, 9.449198842048645e-06, 1.0915100574493408e-05, 1.2381002306938171e-05, 1.3846904039382935e-05, 1.5312805771827698e-05, 1.677870750427246e-05, 1.8244609236717224e-05, 1.9710510969161987e-05, 2.117641270160675e-05, 2.2642314434051514e-05, 2.4108216166496277e-05, 2.557411789894104e-05, 2.7040019631385803e-05, 2.8505921363830566e-05, 2.997182309627533e-05, 3.143772482872009e-05, 3.2903626561164856e-05, 3.436952829360962e-05, 3.583543002605438e-05, 3.7301331758499146e-05, 3.876723349094391e-05, 4.023313522338867e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 3.0, 1.0, 4.0, 9.0, 12.0, 20.0, 49.0, 92.0, 242.0, 928.0, 5940.0, 281365.0, 748002.0, 10119.0, 1195.0, 321.0, 121.0, 72.0, 28.0, 11.0, 11.0, 9.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.271728515625, -0.2655668258666992, -0.25940513610839844, -0.25324344635009766, -0.24708175659179688, -0.2409200668334961, -0.2347583770751953, -0.22859668731689453, -0.22243499755859375, -0.21627330780029297, -0.2101116180419922, -0.2039499282836914, -0.19778823852539062, -0.19162654876708984, -0.18546485900878906, -0.17930316925048828, -0.1731414794921875, -0.16697978973388672, -0.16081809997558594, -0.15465641021728516, -0.14849472045898438, -0.1423330307006836, -0.1361713409423828, -0.13000965118408203, -0.12384796142578125, -0.11768627166748047, -0.11152458190917969, -0.1053628921508789, -0.09920120239257812, -0.09303951263427734, -0.08687782287597656, -0.08071613311767578, -0.074554443359375, -0.06839275360107422, -0.06223106384277344, -0.056069374084472656, -0.049907684326171875, -0.043745994567871094, -0.03758430480957031, -0.03142261505126953, -0.02526092529296875, -0.01909923553466797, -0.012937545776367188, -0.006775856018066406, -0.000614166259765625, 0.005547523498535156, 0.011709213256835938, 0.01787090301513672, 0.0240325927734375, 0.03019428253173828, 0.03635597229003906, 0.042517662048339844, 0.048679351806640625, 0.054841041564941406, 0.06100273132324219, 0.06716442108154297, 0.07332611083984375, 0.07948780059814453, 0.08564949035644531, 0.0918111801147461, 0.09797286987304688, 0.10413455963134766, 0.11029624938964844, 0.11645793914794922, 0.12261962890625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 9.0, 11.0, 18.0, 18.0, 30.0, 54.0, 85.0, 127.0, 143.0, 144.0, 147.0, 85.0, 37.0, 23.0, 19.0, 13.0, 13.0, 8.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09625244140625, -0.09143543243408203, -0.08661842346191406, -0.0818014144897461, -0.07698440551757812, -0.07216739654541016, -0.06735038757324219, -0.06253337860107422, -0.05771636962890625, -0.05289936065673828, -0.04808235168457031, -0.043265342712402344, -0.038448333740234375, -0.033631324768066406, -0.028814315795898438, -0.02399730682373047, -0.0191802978515625, -0.014363288879394531, -0.009546279907226562, -0.004729270935058594, 8.7738037109375e-05, 0.004904747009277344, 0.009721755981445312, 0.014538764953613281, 0.01935577392578125, 0.02417278289794922, 0.028989791870117188, 0.033806800842285156, 0.038623809814453125, 0.043440818786621094, 0.04825782775878906, 0.05307483673095703, 0.057891845703125, 0.06270885467529297, 0.06752586364746094, 0.0723428726196289, 0.07715988159179688, 0.08197689056396484, 0.08679389953613281, 0.09161090850830078, 0.09642791748046875, 0.10124492645263672, 0.10606193542480469, 0.11087894439697266, 0.11569595336914062, 0.1205129623413086, 0.12532997131347656, 0.13014698028564453, 0.1349639892578125, 0.13978099822998047, 0.14459800720214844, 0.1494150161743164, 0.15423202514648438, 0.15904903411865234, 0.1638660430908203, 0.16868305206298828, 0.17350006103515625, 0.17831707000732422, 0.1831340789794922, 0.18795108795166016, 0.19276809692382812, 0.1975851058959961, 0.20240211486816406, 0.20721912384033203, 0.2120361328125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 9.0, 12.0, 72.0, 194.0, 342.0, 243.0, 92.0, 26.0, 14.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.448692321777344, -5.31413459777832, -5.179576873779297, -5.045019149780273, -4.91046142578125, -4.775903701782227, -4.641345977783203, -4.50678825378418, -4.372230529785156, -4.237672805786133, -4.103115081787109, -3.968557357788086, -3.8339996337890625, -3.699441909790039, -3.5648841857910156, -3.430326461791992, -3.295768976211548, -3.1612112522125244, -3.026653528213501, -2.8920958042144775, -2.757538080215454, -2.6229803562164307, -2.4884228706359863, -2.353865146636963, -2.2193074226379395, -2.084749698638916, -1.9501919746398926, -1.8156342506408691, -1.6810765266418457, -1.5465188026428223, -1.4119611978530884, -1.277403473854065, -1.142845630645752, -1.0082879066467285, -0.8737301826477051, -0.7391725182533264, -0.604614794254303, -0.47005707025527954, -0.3354994058609009, -0.20094168186187744, -0.066383957862854, 0.06817375123500824, 0.20273146033287048, 0.33728915452957153, 0.47184687852859497, 0.6064046025276184, 0.7409622669219971, 0.8755199909210205, 1.010077714920044, 1.1446354389190674, 1.2791931629180908, 1.4137508869171143, 1.5483086109161377, 1.6828663349151611, 1.817423939704895, 1.9519816637039185, 2.0865392684936523, 2.221096992492676, 2.355654716491699, 2.4902124404907227, 2.624770164489746, 2.7593278884887695, 2.893885612487793, 3.0284433364868164, 3.16300106048584]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 4.0, 7.0, 6.0, 12.0, 10.0, 13.0, 12.0, 22.0, 22.0, 23.0, 26.0, 28.0, 38.0, 47.0, 43.0, 50.0, 52.0, 56.0, 54.0, 72.0, 56.0, 58.0, 41.0, 39.0, 34.0, 37.0, 37.0, 23.0, 12.0, 11.0, 15.0, 9.0, 14.0, 11.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0071139335632324, -1.9408154487609863, -1.8745168447494507, -1.8082183599472046, -1.7419198751449585, -1.6756212711334229, -1.6093227863311768, -1.5430243015289307, -1.4767258167266846, -1.4104273319244385, -1.3441287279129028, -1.2778302431106567, -1.2115317583084106, -1.145233154296875, -1.078934669494629, -1.0126361846923828, -0.9463375806808472, -0.8800390362739563, -0.8137405514717102, -0.7474420070648193, -0.6811435222625732, -0.6148449778556824, -0.5485464334487915, -0.482247918844223, -0.41594940423965454, -0.34965088963508606, -0.2833523750305176, -0.2170538306236267, -0.15075531601905823, -0.08445680141448975, -0.018158257007598877, 0.048140257596969604, 0.11443877220153809, 0.18073728680610657, 0.24703581631183624, 0.3133343458175659, 0.3796328604221344, 0.4459313750267029, 0.5122299194335938, 0.5785284042358398, 0.6448269486427307, 0.7111254930496216, 0.7774239778518677, 0.8437225222587585, 0.9100210666656494, 0.9763195514678955, 1.0426180362701416, 1.1089166402816772, 1.1752151250839233, 1.2415136098861694, 1.307812213897705, 1.3741106986999512, 1.4404091835021973, 1.5067076683044434, 1.573006272315979, 1.639304757118225, 1.7056033611297607, 1.7719018459320068, 1.8382004499435425, 1.9044989347457886, 1.9707974195480347, 2.0370960235595703, 2.1033945083618164, 2.1696929931640625, 2.2359914779663086]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 5.0, 6.0, 6.0, 8.0, 10.0, 16.0, 18.0, 28.0, 41.0, 42.0, 64.0, 82.0, 145.0, 239.0, 341.0, 539.0, 965.0, 1924.0, 4066.0, 9648.0, 31947.0, 394353.0, 3572750.0, 141243.0, 21139.0, 7595.0, 3271.0, 1590.0, 893.0, 458.0, 292.0, 158.0, 123.0, 62.0, 58.0, 34.0, 33.0, 23.0, 11.0, 10.0, 9.0, 17.0, 4.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1802978515625, -0.17489242553710938, -0.16948699951171875, -0.16408157348632812, -0.1586761474609375, -0.15327072143554688, -0.14786529541015625, -0.14245986938476562, -0.137054443359375, -0.13164901733398438, -0.12624359130859375, -0.12083816528320312, -0.1154327392578125, -0.11002731323242188, -0.10462188720703125, -0.09921646118164062, -0.09381103515625, -0.08840560913085938, -0.08300018310546875, -0.07759475708007812, -0.0721893310546875, -0.06678390502929688, -0.06137847900390625, -0.055973052978515625, -0.050567626953125, -0.045162200927734375, -0.03975677490234375, -0.034351348876953125, -0.0289459228515625, -0.023540496826171875, -0.01813507080078125, -0.012729644775390625, -0.00732421875, -0.001918792724609375, 0.00348663330078125, 0.008892059326171875, 0.0142974853515625, 0.019702911376953125, 0.02510833740234375, 0.030513763427734375, 0.035919189453125, 0.041324615478515625, 0.04673004150390625, 0.052135467529296875, 0.0575408935546875, 0.06294631958007812, 0.06835174560546875, 0.07375717163085938, 0.07916259765625, 0.08456802368164062, 0.08997344970703125, 0.09537887573242188, 0.1007843017578125, 0.10618972778320312, 0.11159515380859375, 0.11700057983398438, 0.122406005859375, 0.12781143188476562, 0.13321685791015625, 0.13862228393554688, 0.1440277099609375, 0.14943313598632812, 0.15483856201171875, 0.16024398803710938, 0.1656494140625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 5.0, 12.0, 10.0, 12.0, 11.0, 17.0, 30.0, 29.0, 45.0, 42.0, 45.0, 56.0, 34.0, 58.0, 68.0, 61.0, 50.0, 42.0, 57.0, 52.0, 39.0, 40.0, 32.0, 26.0, 29.0, 19.0, 19.0, 12.0, 7.0, 7.0, 5.0, 8.0, 4.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.12646484375, -0.1226968765258789, -0.11892890930175781, -0.11516094207763672, -0.11139297485351562, -0.10762500762939453, -0.10385704040527344, -0.10008907318115234, -0.09632110595703125, -0.09255313873291016, -0.08878517150878906, -0.08501720428466797, -0.08124923706054688, -0.07748126983642578, -0.07371330261230469, -0.0699453353881836, -0.0661773681640625, -0.062409400939941406, -0.05864143371582031, -0.05487346649169922, -0.051105499267578125, -0.04733753204345703, -0.04356956481933594, -0.039801597595214844, -0.03603363037109375, -0.032265663146972656, -0.028497695922851562, -0.02472972869873047, -0.020961761474609375, -0.01719379425048828, -0.013425827026367188, -0.009657859802246094, -0.005889892578125, -0.0021219253540039062, 0.0016460418701171875, 0.005414009094238281, 0.009181976318359375, 0.012949943542480469, 0.016717910766601562, 0.020485877990722656, 0.02425384521484375, 0.028021812438964844, 0.03178977966308594, 0.03555774688720703, 0.039325714111328125, 0.04309368133544922, 0.04686164855957031, 0.050629615783691406, 0.0543975830078125, 0.058165550231933594, 0.06193351745605469, 0.06570148468017578, 0.06946945190429688, 0.07323741912841797, 0.07700538635253906, 0.08077335357666016, 0.08454132080078125, 0.08830928802490234, 0.09207725524902344, 0.09584522247314453, 0.09961318969726562, 0.10338115692138672, 0.10714912414550781, 0.1109170913696289, 0.11468505859375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 6.0, 2.0, 8.0, 13.0, 18.0, 40.0, 64.0, 121.0, 295.0, 1006.0, 6280.0, 111165.0, 4045129.0, 26463.0, 2677.0, 616.0, 199.0, 70.0, 30.0, 25.0, 17.0, 9.0, 6.0, 5.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.455322265625, -0.44077301025390625, -0.4262237548828125, -0.41167449951171875, -0.397125244140625, -0.38257598876953125, -0.3680267333984375, -0.35347747802734375, -0.33892822265625, -0.32437896728515625, -0.3098297119140625, -0.29528045654296875, -0.280731201171875, -0.26618194580078125, -0.2516326904296875, -0.23708343505859375, -0.2225341796875, -0.20798492431640625, -0.1934356689453125, -0.17888641357421875, -0.164337158203125, -0.14978790283203125, -0.1352386474609375, -0.12068939208984375, -0.10614013671875, -0.09159088134765625, -0.0770416259765625, -0.06249237060546875, -0.047943115234375, -0.03339385986328125, -0.0188446044921875, -0.00429534912109375, 0.01025390625, 0.02480316162109375, 0.0393524169921875, 0.05390167236328125, 0.068450927734375, 0.08300018310546875, 0.0975494384765625, 0.11209869384765625, 0.12664794921875, 0.14119720458984375, 0.1557464599609375, 0.17029571533203125, 0.184844970703125, 0.19939422607421875, 0.2139434814453125, 0.22849273681640625, 0.2430419921875, 0.25759124755859375, 0.2721405029296875, 0.28668975830078125, 0.301239013671875, 0.31578826904296875, 0.3303375244140625, 0.34488677978515625, 0.35943603515625, 0.37398529052734375, 0.3885345458984375, 0.40308380126953125, 0.417633056640625, 0.43218231201171875, 0.4467315673828125, 0.46128082275390625, 0.475830078125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 3.0, 4.0, 13.0, 12.0, 13.0, 29.0, 41.0, 101.0, 368.0, 1894.0, 1191.0, 211.0, 73.0, 42.0, 18.0, 17.0, 15.0, 7.0, 6.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3994140625, -0.3885650634765625, -0.377716064453125, -0.3668670654296875, -0.35601806640625, -0.3451690673828125, -0.334320068359375, -0.3234710693359375, -0.3126220703125, -0.3017730712890625, -0.290924072265625, -0.2800750732421875, -0.26922607421875, -0.2583770751953125, -0.247528076171875, -0.2366790771484375, -0.225830078125, -0.2149810791015625, -0.204132080078125, -0.1932830810546875, -0.18243408203125, -0.1715850830078125, -0.160736083984375, -0.1498870849609375, -0.1390380859375, -0.1281890869140625, -0.117340087890625, -0.1064910888671875, -0.09564208984375, -0.0847930908203125, -0.073944091796875, -0.0630950927734375, -0.05224609375, -0.0413970947265625, -0.030548095703125, -0.0196990966796875, -0.00885009765625, 0.0019989013671875, 0.012847900390625, 0.0236968994140625, 0.0345458984375, 0.0453948974609375, 0.056243896484375, 0.0670928955078125, 0.07794189453125, 0.0887908935546875, 0.099639892578125, 0.1104888916015625, 0.121337890625, 0.1321868896484375, 0.143035888671875, 0.1538848876953125, 0.16473388671875, 0.1755828857421875, 0.186431884765625, 0.1972808837890625, 0.2081298828125, 0.2189788818359375, 0.229827880859375, 0.2406768798828125, 0.25152587890625, 0.2623748779296875, 0.273223876953125, 0.2840728759765625, 0.294921875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 8.0, 12.0, 26.0, 83.0, 195.0, 343.0, 209.0, 83.0, 22.0, 13.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.519117832183838, -3.4436111450195312, -3.3681044578552246, -3.292597770690918, -3.2170910835266113, -3.1415841579437256, -3.066077470779419, -2.9905707836151123, -2.9150640964508057, -2.839557409286499, -2.7640507221221924, -2.6885440349578857, -2.613037109375, -2.5375304222106934, -2.4620237350463867, -2.38651704788208, -2.3110103607177734, -2.235503673553467, -2.15999698638916, -2.0844902992248535, -2.008983612060547, -1.9334768056869507, -1.8579699993133545, -1.7824633121490479, -1.7069566249847412, -1.6314499378204346, -1.555943250656128, -1.4804364442825317, -1.404929757118225, -1.3294230699539185, -1.2539162635803223, -1.1784095764160156, -1.1029026508331299, -1.0273959636688232, -0.9518892168998718, -0.8763824701309204, -0.8008757829666138, -0.7253690958023071, -0.6498623490333557, -0.5743556022644043, -0.49884891510009766, -0.42334219813346863, -0.3478354811668396, -0.27232876420021057, -0.19682204723358154, -0.12131533026695251, -0.045808613300323486, 0.02969813346862793, 0.10520482063293457, 0.1807115375995636, 0.2562182545661926, 0.33172497153282166, 0.4072316884994507, 0.4827384054660797, 0.5582451224327087, 0.6337518692016602, 0.7092585563659668, 0.7847652435302734, 0.8602719902992249, 0.9357787370681763, 1.011285424232483, 1.0867921113967896, 1.1622989177703857, 1.2378056049346924, 1.313312292098999]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 7.0, 6.0, 7.0, 5.0, 10.0, 16.0, 11.0, 29.0, 32.0, 31.0, 25.0, 47.0, 57.0, 68.0, 68.0, 77.0, 73.0, 60.0, 57.0, 64.0, 51.0, 43.0, 36.0, 25.0, 28.0, 22.0, 15.0, 12.0, 12.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.303004503250122, -1.2634862661361694, -1.2239681482315063, -1.1844499111175537, -1.1449317932128906, -1.105413556098938, -1.0658953189849854, -1.0263772010803223, -0.9868589639663696, -0.9473407864570618, -0.9078226089477539, -0.8683043718338013, -0.8287861943244934, -0.7892680168151855, -0.7497497797012329, -0.710231602191925, -0.6707134246826172, -0.6311952471733093, -0.5916770696640015, -0.5521588325500488, -0.512640655040741, -0.4731224775314331, -0.43360427021980286, -0.3940860629081726, -0.35456788539886475, -0.3150497078895569, -0.27553150057792664, -0.23601330816745758, -0.19649511575698853, -0.15697692334651947, -0.11745873093605042, -0.07794052362442017, -0.038422346115112305, 0.0010958462953567505, 0.040614038705825806, 0.08013223111629486, 0.11965042352676392, 0.15916861593723297, 0.19868680834770203, 0.23820501565933228, 0.27772319316864014, 0.317241370677948, 0.35675957798957825, 0.3962777853012085, 0.43579596281051636, 0.4753141403198242, 0.5148323774337769, 0.5543505549430847, 0.5938687324523926, 0.6333869099617004, 0.6729050874710083, 0.7124233245849609, 0.7519415020942688, 0.7914596796035767, 0.8309779167175293, 0.8704960942268372, 0.910014271736145, 0.9495324492454529, 0.9890506267547607, 1.0285688638687134, 1.068087100982666, 1.107605218887329, 1.1471234560012817, 1.1866416931152344, 1.2261598110198975]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 6.0, 4.0, 7.0, 11.0, 16.0, 30.0, 36.0, 44.0, 96.0, 140.0, 228.0, 393.0, 665.0, 1098.0, 1944.0, 3664.0, 7096.0, 14437.0, 32246.0, 72979.0, 170191.0, 301194.0, 241664.0, 110778.0, 47277.0, 20969.0, 10000.0, 5097.0, 2618.0, 1454.0, 864.0, 462.0, 296.0, 189.0, 113.0, 70.0, 71.0, 31.0, 33.0, 18.0, 9.0, 11.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.102294921875, -0.09943294525146484, -0.09657096862792969, -0.09370899200439453, -0.09084701538085938, -0.08798503875732422, -0.08512306213378906, -0.0822610855102539, -0.07939910888671875, -0.0765371322631836, -0.07367515563964844, -0.07081317901611328, -0.06795120239257812, -0.06508922576904297, -0.06222724914550781, -0.059365272521972656, -0.0565032958984375, -0.053641319274902344, -0.05077934265136719, -0.04791736602783203, -0.045055389404296875, -0.04219341278076172, -0.03933143615722656, -0.036469459533691406, -0.03360748291015625, -0.030745506286621094, -0.027883529663085938, -0.02502155303955078, -0.022159576416015625, -0.01929759979248047, -0.016435623168945312, -0.013573646545410156, -0.010711669921875, -0.007849693298339844, -0.0049877166748046875, -0.0021257400512695312, 0.000736236572265625, 0.0035982131958007812, 0.0064601898193359375, 0.009322166442871094, 0.01218414306640625, 0.015046119689941406, 0.017908096313476562, 0.02077007293701172, 0.023632049560546875, 0.02649402618408203, 0.029356002807617188, 0.032217979431152344, 0.0350799560546875, 0.037941932678222656, 0.04080390930175781, 0.04366588592529297, 0.046527862548828125, 0.04938983917236328, 0.05225181579589844, 0.055113792419433594, 0.05797576904296875, 0.060837745666503906, 0.06369972229003906, 0.06656169891357422, 0.06942367553710938, 0.07228565216064453, 0.07514762878417969, 0.07800960540771484, 0.08087158203125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 7.0, 7.0, 10.0, 18.0, 17.0, 21.0, 15.0, 22.0, 27.0, 36.0, 49.0, 41.0, 52.0, 44.0, 52.0, 65.0, 56.0, 43.0, 66.0, 46.0, 37.0, 36.0, 51.0, 30.0, 26.0, 32.0, 22.0, 17.0, 13.0, 9.0, 4.0, 6.0, 8.0, 5.0, 6.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1270751953125, -0.12338829040527344, -0.11970138549804688, -0.11601448059082031, -0.11232757568359375, -0.10864067077636719, -0.10495376586914062, -0.10126686096191406, -0.0975799560546875, -0.09389305114746094, -0.09020614624023438, -0.08651924133300781, -0.08283233642578125, -0.07914543151855469, -0.07545852661132812, -0.07177162170410156, -0.068084716796875, -0.06439781188964844, -0.060710906982421875, -0.05702400207519531, -0.05333709716796875, -0.04965019226074219, -0.045963287353515625, -0.04227638244628906, -0.0385894775390625, -0.03490257263183594, -0.031215667724609375, -0.027528762817382812, -0.02384185791015625, -0.020154953002929688, -0.016468048095703125, -0.012781143188476562, -0.00909423828125, -0.0054073333740234375, -0.001720428466796875, 0.0019664764404296875, 0.00565338134765625, 0.009340286254882812, 0.013027191162109375, 0.016714096069335938, 0.0204010009765625, 0.024087905883789062, 0.027774810791015625, 0.03146171569824219, 0.03514862060546875, 0.03883552551269531, 0.042522430419921875, 0.04620933532714844, 0.049896240234375, 0.05358314514160156, 0.057270050048828125, 0.06095695495605469, 0.06464385986328125, 0.06833076477050781, 0.07201766967773438, 0.07570457458496094, 0.0793914794921875, 0.08307838439941406, 0.08676528930664062, 0.09045219421386719, 0.09413909912109375, 0.09782600402832031, 0.10151290893554688, 0.10519981384277344, 0.10888671875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 3.0, 4.0, 9.0, 10.0, 13.0, 31.0, 39.0, 73.0, 96.0, 215.0, 342.0, 706.0, 1490.0, 6621.0, 152694.0, 852601.0, 28297.0, 3040.0, 1062.0, 469.0, 285.0, 168.0, 90.0, 67.0, 34.0, 31.0, 17.0, 15.0, 9.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33349609375, -0.32210540771484375, -0.3107147216796875, -0.29932403564453125, -0.287933349609375, -0.27654266357421875, -0.2651519775390625, -0.25376129150390625, -0.24237060546875, -0.23097991943359375, -0.2195892333984375, -0.20819854736328125, -0.196807861328125, -0.18541717529296875, -0.1740264892578125, -0.16263580322265625, -0.1512451171875, -0.13985443115234375, -0.1284637451171875, -0.11707305908203125, -0.105682373046875, -0.09429168701171875, -0.0829010009765625, -0.07151031494140625, -0.06011962890625, -0.04872894287109375, -0.0373382568359375, -0.02594757080078125, -0.014556884765625, -0.00316619873046875, 0.0082244873046875, 0.01961517333984375, 0.031005859375, 0.04239654541015625, 0.0537872314453125, 0.06517791748046875, 0.076568603515625, 0.08795928955078125, 0.0993499755859375, 0.11074066162109375, 0.12213134765625, 0.13352203369140625, 0.1449127197265625, 0.15630340576171875, 0.167694091796875, 0.17908477783203125, 0.1904754638671875, 0.20186614990234375, 0.2132568359375, 0.22464752197265625, 0.2360382080078125, 0.24742889404296875, 0.258819580078125, 0.27021026611328125, 0.2816009521484375, 0.29299163818359375, 0.30438232421875, 0.31577301025390625, 0.3271636962890625, 0.33855438232421875, 0.349945068359375, 0.36133575439453125, 0.3727264404296875, 0.38411712646484375, 0.3955078125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 2.0, 4.0, 14.0, 12.0, 23.0, 22.0, 19.0, 33.0, 31.0, 26.0, 31.0, 33.0, 35.0, 35.0, 34.0, 38.0, 40.0, 49.0, 45.0, 51.0, 36.0, 42.0, 46.0, 34.0, 42.0, 35.0, 30.0, 25.0, 23.0, 13.0, 22.0, 14.0, 17.0, 12.0, 6.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.408447265625, -0.3973045349121094, -0.38616180419921875, -0.3750190734863281, -0.3638763427734375, -0.3527336120605469, -0.34159088134765625, -0.3304481506347656, -0.319305419921875, -0.3081626892089844, -0.29701995849609375, -0.2858772277832031, -0.2747344970703125, -0.2635917663574219, -0.25244903564453125, -0.24130630493164062, -0.23016357421875, -0.21902084350585938, -0.20787811279296875, -0.19673538208007812, -0.1855926513671875, -0.17444992065429688, -0.16330718994140625, -0.15216445922851562, -0.141021728515625, -0.12987899780273438, -0.11873626708984375, -0.10759353637695312, -0.0964508056640625, -0.08530807495117188, -0.07416534423828125, -0.06302261352539062, -0.0518798828125, -0.040737152099609375, -0.02959442138671875, -0.018451690673828125, -0.0073089599609375, 0.003833770751953125, 0.01497650146484375, 0.026119232177734375, 0.037261962890625, 0.048404693603515625, 0.05954742431640625, 0.07069015502929688, 0.0818328857421875, 0.09297561645507812, 0.10411834716796875, 0.11526107788085938, 0.12640380859375, 0.13754653930664062, 0.14868927001953125, 0.15983200073242188, 0.1709747314453125, 0.18211746215820312, 0.19326019287109375, 0.20440292358398438, 0.215545654296875, 0.22668838500976562, 0.23783111572265625, 0.24897384643554688, 0.2601165771484375, 0.2712593078613281, 0.28240203857421875, 0.2935447692871094, 0.3046875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 9.0, 9.0, 10.0, 10.0, 20.0, 38.0, 44.0, 111.0, 182.0, 476.0, 1395.0, 6219.0, 278479.0, 750242.0, 8615.0, 1649.0, 524.0, 252.0, 106.0, 60.0, 34.0, 26.0, 11.0, 7.0, 9.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2130126953125, -0.20615768432617188, -0.19930267333984375, -0.19244766235351562, -0.1855926513671875, -0.17873764038085938, -0.17188262939453125, -0.16502761840820312, -0.158172607421875, -0.15131759643554688, -0.14446258544921875, -0.13760757446289062, -0.1307525634765625, -0.12389755249023438, -0.11704254150390625, -0.11018753051757812, -0.10333251953125, -0.09647750854492188, -0.08962249755859375, -0.08276748657226562, -0.0759124755859375, -0.06905746459960938, -0.06220245361328125, -0.055347442626953125, -0.048492431640625, -0.041637420654296875, -0.03478240966796875, -0.027927398681640625, -0.0210723876953125, -0.014217376708984375, -0.00736236572265625, -0.000507354736328125, 0.00634765625, 0.013202667236328125, 0.02005767822265625, 0.026912689208984375, 0.0337677001953125, 0.040622711181640625, 0.04747772216796875, 0.054332733154296875, 0.061187744140625, 0.06804275512695312, 0.07489776611328125, 0.08175277709960938, 0.0886077880859375, 0.09546279907226562, 0.10231781005859375, 0.10917282104492188, 0.11602783203125, 0.12288284301757812, 0.12973785400390625, 0.13659286499023438, 0.1434478759765625, 0.15030288696289062, 0.15715789794921875, 0.16401290893554688, 0.170867919921875, 0.17772293090820312, 0.18457794189453125, 0.19143295288085938, 0.1982879638671875, 0.20514297485351562, 0.21199798583984375, 0.21885299682617188, 0.2257080078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 9.0, 7.0, 9.0, 13.0, 7.0, 14.0, 13.0, 22.0, 27.0, 45.0, 58.0, 81.0, 112.0, 135.0, 100.0, 77.0, 62.0, 48.0, 34.0, 26.0, 15.0, 15.0, 15.0, 10.0, 6.0, 6.0, 7.0, 1.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.166364669799805e-05, -4.0024518966674805e-05, -3.838539123535156e-05, -3.674626350402832e-05, -3.510713577270508e-05, -3.3468008041381836e-05, -3.1828880310058594e-05, -3.018975257873535e-05, -2.855062484741211e-05, -2.6911497116088867e-05, -2.5272369384765625e-05, -2.3633241653442383e-05, -2.199411392211914e-05, -2.03549861907959e-05, -1.8715858459472656e-05, -1.7076730728149414e-05, -1.5437602996826172e-05, -1.379847526550293e-05, -1.2159347534179688e-05, -1.0520219802856445e-05, -8.881092071533203e-06, -7.241964340209961e-06, -5.602836608886719e-06, -3.9637088775634766e-06, -2.3245811462402344e-06, -6.854534149169922e-07, 9.5367431640625e-07, 2.592802047729492e-06, 4.231929779052734e-06, 5.8710575103759766e-06, 7.510185241699219e-06, 9.149312973022461e-06, 1.0788440704345703e-05, 1.2427568435668945e-05, 1.4066696166992188e-05, 1.570582389831543e-05, 1.7344951629638672e-05, 1.8984079360961914e-05, 2.0623207092285156e-05, 2.22623348236084e-05, 2.390146255493164e-05, 2.5540590286254883e-05, 2.7179718017578125e-05, 2.8818845748901367e-05, 3.045797348022461e-05, 3.209710121154785e-05, 3.3736228942871094e-05, 3.5375356674194336e-05, 3.701448440551758e-05, 3.865361213684082e-05, 4.029273986816406e-05, 4.1931867599487305e-05, 4.357099533081055e-05, 4.521012306213379e-05, 4.684925079345703e-05, 4.8488378524780273e-05, 5.0127506256103516e-05, 5.176663398742676e-05, 5.340576171875e-05, 5.504488945007324e-05, 5.6684017181396484e-05, 5.8323144912719727e-05, 5.996227264404297e-05, 6.160140037536621e-05, 6.324052810668945e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 10.0, 4.0, 15.0, 18.0, 21.0, 39.0, 47.0, 65.0, 104.0, 170.0, 335.0, 627.0, 1488.0, 3738.0, 12848.0, 117029.0, 819553.0, 76319.0, 10476.0, 3071.0, 1246.0, 573.0, 270.0, 156.0, 99.0, 73.0, 33.0, 35.0, 17.0, 15.0, 13.0, 7.0, 7.0, 10.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.1064453125, -0.10326099395751953, -0.10007667541503906, -0.0968923568725586, -0.09370803833007812, -0.09052371978759766, -0.08733940124511719, -0.08415508270263672, -0.08097076416015625, -0.07778644561767578, -0.07460212707519531, -0.07141780853271484, -0.06823348999023438, -0.0650491714477539, -0.06186485290527344, -0.05868053436279297, -0.0554962158203125, -0.05231189727783203, -0.04912757873535156, -0.045943260192871094, -0.042758941650390625, -0.039574623107910156, -0.03639030456542969, -0.03320598602294922, -0.03002166748046875, -0.02683734893798828, -0.023653030395507812, -0.020468711853027344, -0.017284393310546875, -0.014100074768066406, -0.010915756225585938, -0.007731437683105469, -0.004547119140625, -0.0013628005981445312, 0.0018215179443359375, 0.005005836486816406, 0.008190155029296875, 0.011374473571777344, 0.014558792114257812, 0.01774311065673828, 0.02092742919921875, 0.02411174774169922, 0.027296066284179688, 0.030480384826660156, 0.033664703369140625, 0.036849021911621094, 0.04003334045410156, 0.04321765899658203, 0.0464019775390625, 0.04958629608154297, 0.05277061462402344, 0.055954933166503906, 0.059139251708984375, 0.062323570251464844, 0.06550788879394531, 0.06869220733642578, 0.07187652587890625, 0.07506084442138672, 0.07824516296386719, 0.08142948150634766, 0.08461380004882812, 0.0877981185913086, 0.09098243713378906, 0.09416675567626953, 0.09735107421875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 7.0, 2.0, 0.0, 6.0, 5.0, 5.0, 13.0, 16.0, 19.0, 37.0, 40.0, 51.0, 62.0, 76.0, 113.0, 92.0, 92.0, 88.0, 71.0, 63.0, 30.0, 38.0, 22.0, 14.0, 10.0, 5.0, 6.0, 5.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08599853515625, -0.08277416229248047, -0.07954978942871094, -0.0763254165649414, -0.07310104370117188, -0.06987667083740234, -0.06665229797363281, -0.06342792510986328, -0.06020355224609375, -0.05697917938232422, -0.05375480651855469, -0.050530433654785156, -0.047306060791015625, -0.044081687927246094, -0.04085731506347656, -0.03763294219970703, -0.0344085693359375, -0.03118419647216797, -0.027959823608398438, -0.024735450744628906, -0.021511077880859375, -0.018286705017089844, -0.015062332153320312, -0.011837959289550781, -0.00861358642578125, -0.005389213562011719, -0.0021648406982421875, 0.0010595321655273438, 0.004283905029296875, 0.007508277893066406, 0.010732650756835938, 0.013957023620605469, 0.017181396484375, 0.02040576934814453, 0.023630142211914062, 0.026854515075683594, 0.030078887939453125, 0.033303260803222656, 0.03652763366699219, 0.03975200653076172, 0.04297637939453125, 0.04620075225830078, 0.04942512512207031, 0.052649497985839844, 0.055873870849609375, 0.059098243713378906, 0.06232261657714844, 0.06554698944091797, 0.0687713623046875, 0.07199573516845703, 0.07522010803222656, 0.0784444808959961, 0.08166885375976562, 0.08489322662353516, 0.08811759948730469, 0.09134197235107422, 0.09456634521484375, 0.09779071807861328, 0.10101509094238281, 0.10423946380615234, 0.10746383666992188, 0.1106882095336914, 0.11391258239746094, 0.11713695526123047, 0.120361328125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 8.0, 11.0, 33.0, 63.0, 128.0, 219.0, 200.0, 173.0, 76.0, 45.0, 13.0, 6.0, 11.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.728104829788208, -1.6668163537979126, -1.6055278778076172, -1.5442395210266113, -1.482951045036316, -1.4216625690460205, -1.360374093055725, -1.2990856170654297, -1.2377972602844238, -1.1765087842941284, -1.115220308303833, -1.0539319515228271, -0.9926434755325317, -0.9313549995422363, -0.8700665235519409, -0.8087780475616455, -0.7474895715713501, -0.6862010955810547, -0.624912679195404, -0.5636242032051086, -0.502335786819458, -0.4410473108291626, -0.3797588348388672, -0.31847038865089417, -0.25718194246292114, -0.19589349627494812, -0.1346050351858139, -0.07331657409667969, -0.012028127908706665, 0.04926031827926636, 0.11054879426956177, 0.1718372404575348, 0.2331256866455078, 0.29441413283348083, 0.35570257902145386, 0.41699105501174927, 0.4782795011997223, 0.5395679473876953, 0.6008564233779907, 0.6621448993682861, 0.7234333157539368, 0.7847217917442322, 0.8460102081298828, 0.9072986841201782, 0.9685871601104736, 1.0298755168914795, 1.0911641120910645, 1.1524524688720703, 1.2137409448623657, 1.2750294208526611, 1.3363178968429565, 1.397606372833252, 1.4588947296142578, 1.5201832056045532, 1.5814716815948486, 1.642760157585144, 1.7040486335754395, 1.7653371095657349, 1.8266255855560303, 1.8879139423370361, 1.9492024183273315, 2.010490894317627, 2.071779251098633, 2.1330678462982178, 2.1943562030792236]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 8.0, 14.0, 10.0, 21.0, 15.0, 19.0, 22.0, 25.0, 28.0, 40.0, 45.0, 52.0, 53.0, 58.0, 62.0, 69.0, 51.0, 63.0, 45.0, 37.0, 30.0, 36.0, 38.0, 23.0, 24.0, 21.0, 20.0, 15.0, 17.0, 14.0, 5.0, 3.0, 2.0, 7.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.066498041152954, -2.0110204219818115, -1.955542802810669, -1.9000651836395264, -1.8445875644683838, -1.7891099452972412, -1.733632206916809, -1.6781545877456665, -1.622676968574524, -1.5671993494033813, -1.5117217302322388, -1.4562441110610962, -1.400766372680664, -1.3452887535095215, -1.289811134338379, -1.2343335151672363, -1.1788558959960938, -1.1233782768249512, -1.0679006576538086, -1.012423038482666, -0.9569453597068787, -0.9014677405357361, -0.8459900617599487, -0.7905124425888062, -0.7350348234176636, -0.679557204246521, -0.6240795850753784, -0.5686019062995911, -0.5131242871284485, -0.4576466679573059, -0.40216901898384094, -0.346691370010376, -0.29121363162994385, -0.23573599755764008, -0.1802583634853363, -0.12478072941303253, -0.06930309534072876, -0.013825476169586182, 0.041652172803878784, 0.09712982177734375, 0.15260744094848633, 0.2080850750207901, 0.26356270909309387, 0.31904035806655884, 0.3745179772377014, 0.429995596408844, 0.48547324538230896, 0.5409508943557739, 0.5964285135269165, 0.6519061326980591, 0.7073837518692017, 0.762861430644989, 0.8183390498161316, 0.8738166689872742, 0.9292943477630615, 0.9847719669342041, 1.0402495861053467, 1.0957272052764893, 1.1512048244476318, 1.2066824436187744, 1.262160062789917, 1.3176376819610596, 1.3731154203414917, 1.4285930395126343, 1.4840706586837769]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 7.0, 7.0, 9.0, 14.0, 13.0, 19.0, 33.0, 32.0, 54.0, 63.0, 89.0, 114.0, 154.0, 246.0, 618.0, 5236.0, 4162781.0, 22934.0, 870.0, 300.0, 176.0, 105.0, 90.0, 64.0, 54.0, 43.0, 39.0, 19.0, 20.0, 13.0, 13.0, 9.0, 7.0, 8.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.8193359375, -0.7956924438476562, -0.7720489501953125, -0.7484054565429688, -0.724761962890625, -0.7011184692382812, -0.6774749755859375, -0.6538314819335938, -0.63018798828125, -0.6065444946289062, -0.5829010009765625, -0.5592575073242188, -0.535614013671875, -0.5119705200195312, -0.4883270263671875, -0.46468353271484375, -0.4410400390625, -0.41739654541015625, -0.3937530517578125, -0.37010955810546875, -0.346466064453125, -0.32282257080078125, -0.2991790771484375, -0.27553558349609375, -0.25189208984375, -0.22824859619140625, -0.2046051025390625, -0.18096160888671875, -0.157318115234375, -0.13367462158203125, -0.1100311279296875, -0.08638763427734375, -0.062744140625, -0.03910064697265625, -0.0154571533203125, 0.00818634033203125, 0.031829833984375, 0.05547332763671875, 0.0791168212890625, 0.10276031494140625, 0.12640380859375, 0.15004730224609375, 0.1736907958984375, 0.19733428955078125, 0.220977783203125, 0.24462127685546875, 0.2682647705078125, 0.29190826416015625, 0.3155517578125, 0.33919525146484375, 0.3628387451171875, 0.38648223876953125, 0.410125732421875, 0.43376922607421875, 0.4574127197265625, 0.48105621337890625, 0.50469970703125, 0.5283432006835938, 0.5519866943359375, 0.5756301879882812, 0.599273681640625, 0.6229171752929688, 0.6465606689453125, 0.6702041625976562, 0.69384765625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 8.0, 9.0, 19.0, 20.0, 22.0, 30.0, 43.0, 68.0, 68.0, 76.0, 84.0, 94.0, 85.0, 78.0, 63.0, 53.0, 54.0, 40.0, 25.0, 25.0, 19.0, 4.0, 5.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2431640625, -0.23758316040039062, -0.23200225830078125, -0.22642135620117188, -0.2208404541015625, -0.21525955200195312, -0.20967864990234375, -0.20409774780273438, -0.198516845703125, -0.19293594360351562, -0.18735504150390625, -0.18177413940429688, -0.1761932373046875, -0.17061233520507812, -0.16503143310546875, -0.15945053100585938, -0.15386962890625, -0.14828872680664062, -0.14270782470703125, -0.13712692260742188, -0.1315460205078125, -0.12596511840820312, -0.12038421630859375, -0.11480331420898438, -0.109222412109375, -0.10364151000976562, -0.09806060791015625, -0.09247970581054688, -0.0868988037109375, -0.08131790161132812, -0.07573699951171875, -0.07015609741210938, -0.0645751953125, -0.058994293212890625, -0.05341339111328125, -0.047832489013671875, -0.0422515869140625, -0.036670684814453125, -0.03108978271484375, -0.025508880615234375, -0.019927978515625, -0.014347076416015625, -0.00876617431640625, -0.003185272216796875, 0.0023956298828125, 0.007976531982421875, 0.01355743408203125, 0.019138336181640625, 0.02471923828125, 0.030300140380859375, 0.03588104248046875, 0.041461944580078125, 0.0470428466796875, 0.052623748779296875, 0.05820465087890625, 0.06378555297851562, 0.069366455078125, 0.07494735717773438, 0.08052825927734375, 0.08610916137695312, 0.0916900634765625, 0.09727096557617188, 0.10285186767578125, 0.10843276977539062, 0.114013671875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 5.0, 9.0, 14.0, 16.0, 28.0, 38.0, 91.0, 144.0, 309.0, 752.0, 2727.0, 15411.0, 371750.0, 3757211.0, 37793.0, 5735.0, 1335.0, 472.0, 204.0, 113.0, 37.0, 38.0, 22.0, 10.0, 10.0, 6.0, 4.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28759765625, -0.2789344787597656, -0.27027130126953125, -0.2616081237792969, -0.2529449462890625, -0.24428176879882812, -0.23561859130859375, -0.22695541381835938, -0.218292236328125, -0.20962905883789062, -0.20096588134765625, -0.19230270385742188, -0.1836395263671875, -0.17497634887695312, -0.16631317138671875, -0.15764999389648438, -0.14898681640625, -0.14032363891601562, -0.13166046142578125, -0.12299728393554688, -0.1143341064453125, -0.10567092895507812, -0.09700775146484375, -0.08834457397460938, -0.079681396484375, -0.07101821899414062, -0.06235504150390625, -0.053691864013671875, -0.0450286865234375, -0.036365509033203125, -0.02770233154296875, -0.019039154052734375, -0.0103759765625, -0.001712799072265625, 0.00695037841796875, 0.015613555908203125, 0.0242767333984375, 0.032939910888671875, 0.04160308837890625, 0.050266265869140625, 0.058929443359375, 0.06759262084960938, 0.07625579833984375, 0.08491897583007812, 0.0935821533203125, 0.10224533081054688, 0.11090850830078125, 0.11957168579101562, 0.12823486328125, 0.13689804077148438, 0.14556121826171875, 0.15422439575195312, 0.1628875732421875, 0.17155075073242188, 0.18021392822265625, 0.18887710571289062, 0.197540283203125, 0.20620346069335938, 0.21486663818359375, 0.22352981567382812, 0.2321929931640625, 0.24085617065429688, 0.24951934814453125, 0.2581825256347656, 0.266845703125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 9.0, 12.0, 11.0, 25.0, 51.0, 114.0, 436.0, 1818.0, 1183.0, 245.0, 79.0, 26.0, 15.0, 20.0, 12.0, 9.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.300537109375, -0.29137420654296875, -0.2822113037109375, -0.27304840087890625, -0.263885498046875, -0.25472259521484375, -0.2455596923828125, -0.23639678955078125, -0.22723388671875, -0.21807098388671875, -0.2089080810546875, -0.19974517822265625, -0.190582275390625, -0.18141937255859375, -0.1722564697265625, -0.16309356689453125, -0.1539306640625, -0.14476776123046875, -0.1356048583984375, -0.12644195556640625, -0.117279052734375, -0.10811614990234375, -0.0989532470703125, -0.08979034423828125, -0.08062744140625, -0.07146453857421875, -0.0623016357421875, -0.05313873291015625, -0.043975830078125, -0.03481292724609375, -0.0256500244140625, -0.01648712158203125, -0.00732421875, 0.00183868408203125, 0.0110015869140625, 0.02016448974609375, 0.029327392578125, 0.03849029541015625, 0.0476531982421875, 0.05681610107421875, 0.06597900390625, 0.07514190673828125, 0.0843048095703125, 0.09346771240234375, 0.102630615234375, 0.11179351806640625, 0.1209564208984375, 0.13011932373046875, 0.1392822265625, 0.14844512939453125, 0.1576080322265625, 0.16677093505859375, 0.175933837890625, 0.18509674072265625, 0.1942596435546875, 0.20342254638671875, 0.21258544921875, 0.22174835205078125, 0.2309112548828125, 0.24007415771484375, 0.249237060546875, 0.25839996337890625, 0.2675628662109375, 0.27672576904296875, 0.285888671875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 9.0, 27.0, 40.0, 89.0, 151.0, 216.0, 196.0, 147.0, 62.0, 28.0, 13.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7672268152236938, -0.7290539741516113, -0.6908811330795288, -0.6527082920074463, -0.6145354509353638, -0.5763626098632812, -0.5381898283958435, -0.500016987323761, -0.46184414625167847, -0.42367130517959595, -0.3854984641075134, -0.3473256528377533, -0.3091528117656708, -0.27097997069358826, -0.23280714452266693, -0.1946343183517456, -0.15646147727966309, -0.11828864365816116, -0.08011581003665924, -0.04194297641515732, -0.0037701427936553955, 0.034402698278427124, 0.07257552444934845, 0.11074835062026978, 0.1489211916923523, 0.18709403276443481, 0.22526685893535614, 0.26343968510627747, 0.30161252617836, 0.3397853672504425, 0.37795817852020264, 0.41613101959228516, 0.4543037414550781, 0.49247658252716064, 0.5306494235992432, 0.5688222646713257, 0.6069951057434082, 0.6451679468154907, 0.6833407282829285, 0.721513569355011, 0.7596864104270935, 0.797859251499176, 0.8360320925712585, 0.8742049336433411, 0.9123777151107788, 0.9505505561828613, 0.9887233972549438, 1.0268962383270264, 1.0650690793991089, 1.1032419204711914, 1.141414761543274, 1.1795876026153564, 1.217760443687439, 1.2559332847595215, 1.294106125831604, 1.3322789669036865, 1.3704516887664795, 1.408624529838562, 1.4467973709106445, 1.484970211982727, 1.5231430530548096, 1.561315894126892, 1.5994887351989746, 1.6376614570617676, 1.6758344173431396]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 5.0, 6.0, 9.0, 16.0, 13.0, 22.0, 19.0, 24.0, 19.0, 48.0, 42.0, 51.0, 55.0, 60.0, 46.0, 68.0, 64.0, 50.0, 63.0, 47.0, 50.0, 39.0, 39.0, 31.0, 22.0, 19.0, 22.0, 12.0, 6.0, 9.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6847864985466003, -0.6613394618034363, -0.6378924250602722, -0.6144454479217529, -0.5909984111785889, -0.5675513744354248, -0.5441043376922607, -0.5206573009490967, -0.497210294008255, -0.47376325726509094, -0.45031625032424927, -0.4268692135810852, -0.40342217683792114, -0.37997516989707947, -0.3565281331539154, -0.33308112621307373, -0.30963408946990967, -0.2861870527267456, -0.26274004578590393, -0.23929300904273987, -0.215845987200737, -0.19239896535873413, -0.16895192861557007, -0.1455049067735672, -0.12205788493156433, -0.09861086308956146, -0.075163833796978, -0.05171680450439453, -0.028269782662391663, -0.004822760820388794, 0.01862427592277527, 0.04207129776477814, 0.06551837921142578, 0.08896540105342865, 0.11241243034601212, 0.13585945963859558, 0.15930648148059845, 0.18275350332260132, 0.20620054006576538, 0.22964756190776825, 0.2530945837497711, 0.2765416204929352, 0.29998862743377686, 0.3234356641769409, 0.346882700920105, 0.37032970786094666, 0.3937767446041107, 0.4172237515449524, 0.44067078828811646, 0.4641178250312805, 0.4875648319721222, 0.5110118389129639, 0.5344588756561279, 0.557905912399292, 0.581352949142456, 0.6047999858856201, 0.6282470226287842, 0.6516940593719482, 0.6751410961151123, 0.6985881328582764, 0.7220351099967957, 0.7454821467399597, 0.7689291834831238, 0.7923762202262878, 0.8158231973648071]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 3.0, 13.0, 10.0, 14.0, 14.0, 34.0, 44.0, 74.0, 104.0, 130.0, 205.0, 335.0, 443.0, 735.0, 1181.0, 2089.0, 4275.0, 8979.0, 22648.0, 64458.0, 191831.0, 382698.0, 236689.0, 81884.0, 27672.0, 11006.0, 4817.0, 2528.0, 1276.0, 821.0, 516.0, 349.0, 199.0, 143.0, 102.0, 65.0, 56.0, 50.0, 25.0, 13.0, 6.0, 4.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12261962890625, -0.11861324310302734, -0.11460685729980469, -0.11060047149658203, -0.10659408569335938, -0.10258769989013672, -0.09858131408691406, -0.0945749282836914, -0.09056854248046875, -0.0865621566772461, -0.08255577087402344, -0.07854938507080078, -0.07454299926757812, -0.07053661346435547, -0.06653022766113281, -0.06252384185791016, -0.0585174560546875, -0.054511070251464844, -0.05050468444824219, -0.04649829864501953, -0.042491912841796875, -0.03848552703857422, -0.03447914123535156, -0.030472755432128906, -0.02646636962890625, -0.022459983825683594, -0.018453598022460938, -0.014447212219238281, -0.010440826416015625, -0.006434440612792969, -0.0024280548095703125, 0.0015783309936523438, 0.005584716796875, 0.009591102600097656, 0.013597488403320312, 0.01760387420654297, 0.021610260009765625, 0.02561664581298828, 0.029623031616210938, 0.033629417419433594, 0.03763580322265625, 0.041642189025878906, 0.04564857482910156, 0.04965496063232422, 0.053661346435546875, 0.05766773223876953, 0.06167411804199219, 0.06568050384521484, 0.0696868896484375, 0.07369327545166016, 0.07769966125488281, 0.08170604705810547, 0.08571243286132812, 0.08971881866455078, 0.09372520446777344, 0.0977315902709961, 0.10173797607421875, 0.1057443618774414, 0.10975074768066406, 0.11375713348388672, 0.11776351928710938, 0.12176990509033203, 0.1257762908935547, 0.12978267669677734, 0.1337890625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 4.0, 14.0, 13.0, 14.0, 13.0, 21.0, 27.0, 16.0, 35.0, 38.0, 49.0, 56.0, 53.0, 55.0, 56.0, 61.0, 64.0, 59.0, 42.0, 38.0, 42.0, 39.0, 36.0, 31.0, 27.0, 15.0, 26.0, 10.0, 14.0, 10.0, 3.0, 8.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12298583984375, -0.11921977996826172, -0.11545372009277344, -0.11168766021728516, -0.10792160034179688, -0.1041555404663086, -0.10038948059082031, -0.09662342071533203, -0.09285736083984375, -0.08909130096435547, -0.08532524108886719, -0.0815591812133789, -0.07779312133789062, -0.07402706146240234, -0.07026100158691406, -0.06649494171142578, -0.0627288818359375, -0.05896282196044922, -0.05519676208496094, -0.051430702209472656, -0.047664642333984375, -0.043898582458496094, -0.04013252258300781, -0.03636646270751953, -0.03260040283203125, -0.02883434295654297, -0.025068283081054688, -0.021302223205566406, -0.017536163330078125, -0.013770103454589844, -0.010004043579101562, -0.006237983703613281, -0.002471923828125, 0.0012941360473632812, 0.0050601959228515625, 0.008826255798339844, 0.012592315673828125, 0.016358375549316406, 0.020124435424804688, 0.02389049530029297, 0.02765655517578125, 0.03142261505126953, 0.03518867492675781, 0.038954734802246094, 0.042720794677734375, 0.046486854553222656, 0.05025291442871094, 0.05401897430419922, 0.0577850341796875, 0.06155109405517578, 0.06531715393066406, 0.06908321380615234, 0.07284927368164062, 0.0766153335571289, 0.08038139343261719, 0.08414745330810547, 0.08791351318359375, 0.09167957305908203, 0.09544563293457031, 0.0992116928100586, 0.10297775268554688, 0.10674381256103516, 0.11050987243652344, 0.11427593231201172, 0.1180419921875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 10.0, 9.0, 12.0, 25.0, 53.0, 88.0, 189.0, 534.0, 1543.0, 12218.0, 745987.0, 279809.0, 6230.0, 1094.0, 395.0, 180.0, 79.0, 40.0, 22.0, 8.0, 4.0, 7.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.501953125, -0.48668670654296875, -0.4714202880859375, -0.45615386962890625, -0.440887451171875, -0.42562103271484375, -0.4103546142578125, -0.39508819580078125, -0.37982177734375, -0.36455535888671875, -0.3492889404296875, -0.33402252197265625, -0.318756103515625, -0.30348968505859375, -0.2882232666015625, -0.27295684814453125, -0.2576904296875, -0.24242401123046875, -0.2271575927734375, -0.21189117431640625, -0.196624755859375, -0.18135833740234375, -0.1660919189453125, -0.15082550048828125, -0.13555908203125, -0.12029266357421875, -0.1050262451171875, -0.08975982666015625, -0.074493408203125, -0.05922698974609375, -0.0439605712890625, -0.02869415283203125, -0.013427734375, 0.00183868408203125, 0.0171051025390625, 0.03237152099609375, 0.047637939453125, 0.06290435791015625, 0.0781707763671875, 0.09343719482421875, 0.10870361328125, 0.12397003173828125, 0.1392364501953125, 0.15450286865234375, 0.169769287109375, 0.18503570556640625, 0.2003021240234375, 0.21556854248046875, 0.2308349609375, 0.24610137939453125, 0.2613677978515625, 0.27663421630859375, 0.291900634765625, 0.30716705322265625, 0.3224334716796875, 0.33769989013671875, 0.35296630859375, 0.36823272705078125, 0.3834991455078125, 0.39876556396484375, 0.414031982421875, 0.42929840087890625, 0.4445648193359375, 0.45983123779296875, 0.47509765625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 7.0, 7.0, 7.0, 11.0, 14.0, 16.0, 28.0, 28.0, 34.0, 33.0, 44.0, 46.0, 52.0, 45.0, 51.0, 50.0, 57.0, 52.0, 58.0, 44.0, 49.0, 43.0, 39.0, 25.0, 27.0, 23.0, 20.0, 24.0, 14.0, 15.0, 10.0, 9.0, 4.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.338134765625, -0.3258781433105469, -0.31362152099609375, -0.3013648986816406, -0.2891082763671875, -0.2768516540527344, -0.26459503173828125, -0.2523384094238281, -0.240081787109375, -0.22782516479492188, -0.21556854248046875, -0.20331192016601562, -0.1910552978515625, -0.17879867553710938, -0.16654205322265625, -0.15428543090820312, -0.14202880859375, -0.12977218627929688, -0.11751556396484375, -0.10525894165039062, -0.0930023193359375, -0.08074569702148438, -0.06848907470703125, -0.056232452392578125, -0.043975830078125, -0.031719207763671875, -0.01946258544921875, -0.007205963134765625, 0.0050506591796875, 0.017307281494140625, 0.02956390380859375, 0.041820526123046875, 0.0540771484375, 0.06633377075195312, 0.07859039306640625, 0.09084701538085938, 0.1031036376953125, 0.11536026000976562, 0.12761688232421875, 0.13987350463867188, 0.152130126953125, 0.16438674926757812, 0.17664337158203125, 0.18889999389648438, 0.2011566162109375, 0.21341323852539062, 0.22566986083984375, 0.23792648315429688, 0.25018310546875, 0.2624397277832031, 0.27469635009765625, 0.2869529724121094, 0.2992095947265625, 0.3114662170410156, 0.32372283935546875, 0.3359794616699219, 0.348236083984375, 0.3604927062988281, 0.37274932861328125, 0.3850059509277344, 0.3972625732421875, 0.4095191955566406, 0.42177581787109375, 0.4340324401855469, 0.4462890625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 2.0, 9.0, 10.0, 14.0, 19.0, 15.0, 32.0, 61.0, 118.0, 209.0, 568.0, 1444.0, 5924.0, 84547.0, 919813.0, 30148.0, 3730.0, 1055.0, 393.0, 193.0, 95.0, 56.0, 21.0, 20.0, 24.0, 4.0, 5.0, 5.0, 0.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.193359375, -0.1871929168701172, -0.18102645874023438, -0.17486000061035156, -0.16869354248046875, -0.16252708435058594, -0.15636062622070312, -0.1501941680908203, -0.1440277099609375, -0.1378612518310547, -0.13169479370117188, -0.12552833557128906, -0.11936187744140625, -0.11319541931152344, -0.10702896118164062, -0.10086250305175781, -0.094696044921875, -0.08852958679199219, -0.08236312866210938, -0.07619667053222656, -0.07003021240234375, -0.06386375427246094, -0.057697296142578125, -0.05153083801269531, -0.0453643798828125, -0.03919792175292969, -0.033031463623046875, -0.026865005493164062, -0.02069854736328125, -0.014532089233398438, -0.008365631103515625, -0.0021991729736328125, 0.00396728515625, 0.010133743286132812, 0.016300201416015625, 0.022466659545898438, 0.02863311767578125, 0.03479957580566406, 0.040966033935546875, 0.04713249206542969, 0.0532989501953125, 0.05946540832519531, 0.06563186645507812, 0.07179832458496094, 0.07796478271484375, 0.08413124084472656, 0.09029769897460938, 0.09646415710449219, 0.102630615234375, 0.10879707336425781, 0.11496353149414062, 0.12112998962402344, 0.12729644775390625, 0.13346290588378906, 0.13962936401367188, 0.1457958221435547, 0.1519622802734375, 0.1581287384033203, 0.16429519653320312, 0.17046165466308594, 0.17662811279296875, 0.18279457092285156, 0.18896102905273438, 0.1951274871826172, 0.2012939453125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 6.0, 12.0, 11.0, 9.0, 12.0, 17.0, 24.0, 27.0, 48.0, 63.0, 92.0, 113.0, 128.0, 107.0, 75.0, 55.0, 54.0, 19.0, 21.0, 18.0, 10.0, 12.0, 11.0, 8.0, 10.0, 7.0, 1.0, 4.0, 4.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.267692565917969e-05, -4.1171908378601074e-05, -3.966689109802246e-05, -3.816187381744385e-05, -3.6656856536865234e-05, -3.515183925628662e-05, -3.364682197570801e-05, -3.2141804695129395e-05, -3.063678741455078e-05, -2.9131770133972168e-05, -2.7626752853393555e-05, -2.612173557281494e-05, -2.4616718292236328e-05, -2.3111701011657715e-05, -2.16066837310791e-05, -2.0101666450500488e-05, -1.8596649169921875e-05, -1.7091631889343262e-05, -1.558661460876465e-05, -1.4081597328186035e-05, -1.2576580047607422e-05, -1.1071562767028809e-05, -9.566545486450195e-06, -8.061528205871582e-06, -6.556510925292969e-06, -5.0514936447143555e-06, -3.546476364135742e-06, -2.041459083557129e-06, -5.364418029785156e-07, 9.685754776000977e-07, 2.473592758178711e-06, 3.978610038757324e-06, 5.4836273193359375e-06, 6.988644599914551e-06, 8.493661880493164e-06, 9.998679161071777e-06, 1.150369644165039e-05, 1.3008713722229004e-05, 1.4513731002807617e-05, 1.601874828338623e-05, 1.7523765563964844e-05, 1.9028782844543457e-05, 2.053380012512207e-05, 2.2038817405700684e-05, 2.3543834686279297e-05, 2.504885196685791e-05, 2.6553869247436523e-05, 2.8058886528015137e-05, 2.956390380859375e-05, 3.106892108917236e-05, 3.2573938369750977e-05, 3.407895565032959e-05, 3.55839729309082e-05, 3.7088990211486816e-05, 3.859400749206543e-05, 4.009902477264404e-05, 4.1604042053222656e-05, 4.310905933380127e-05, 4.461407661437988e-05, 4.6119093894958496e-05, 4.762411117553711e-05, 4.912912845611572e-05, 5.0634145736694336e-05, 5.213916301727295e-05, 5.364418029785156e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 2.0, 14.0, 13.0, 17.0, 22.0, 28.0, 55.0, 92.0, 168.0, 271.0, 508.0, 1148.0, 3082.0, 11838.0, 81626.0, 695092.0, 221694.0, 24401.0, 5216.0, 1719.0, 687.0, 318.0, 197.0, 109.0, 75.0, 46.0, 32.0, 26.0, 15.0, 7.0, 7.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1024169921875, -0.09937858581542969, -0.09634017944335938, -0.09330177307128906, -0.09026336669921875, -0.08722496032714844, -0.08418655395507812, -0.08114814758300781, -0.0781097412109375, -0.07507133483886719, -0.07203292846679688, -0.06899452209472656, -0.06595611572265625, -0.06291770935058594, -0.059879302978515625, -0.05684089660644531, -0.053802490234375, -0.05076408386230469, -0.047725677490234375, -0.04468727111816406, -0.04164886474609375, -0.03861045837402344, -0.035572052001953125, -0.03253364562988281, -0.0294952392578125, -0.026456832885742188, -0.023418426513671875, -0.020380020141601562, -0.01734161376953125, -0.014303207397460938, -0.011264801025390625, -0.008226394653320312, -0.00518798828125, -0.0021495819091796875, 0.000888824462890625, 0.0039272308349609375, 0.00696563720703125, 0.010004043579101562, 0.013042449951171875, 0.016080856323242188, 0.0191192626953125, 0.022157669067382812, 0.025196075439453125, 0.028234481811523438, 0.03127288818359375, 0.03431129455566406, 0.037349700927734375, 0.04038810729980469, 0.043426513671875, 0.04646492004394531, 0.049503326416015625, 0.05254173278808594, 0.05558013916015625, 0.05861854553222656, 0.061656951904296875, 0.06469535827636719, 0.0677337646484375, 0.07077217102050781, 0.07381057739257812, 0.07684898376464844, 0.07988739013671875, 0.08292579650878906, 0.08596420288085938, 0.08900260925292969, 0.092041015625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 9.0, 6.0, 13.0, 20.0, 17.0, 28.0, 44.0, 50.0, 83.0, 83.0, 107.0, 112.0, 104.0, 91.0, 78.0, 48.0, 36.0, 20.0, 17.0, 20.0, 7.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1544189453125, -0.15040969848632812, -0.14640045166015625, -0.14239120483398438, -0.1383819580078125, -0.13437271118164062, -0.13036346435546875, -0.12635421752929688, -0.122344970703125, -0.11833572387695312, -0.11432647705078125, -0.11031723022460938, -0.1063079833984375, -0.10229873657226562, -0.09828948974609375, -0.09428024291992188, -0.09027099609375, -0.08626174926757812, -0.08225250244140625, -0.07824325561523438, -0.0742340087890625, -0.07022476196289062, -0.06621551513671875, -0.062206268310546875, -0.058197021484375, -0.054187774658203125, -0.05017852783203125, -0.046169281005859375, -0.0421600341796875, -0.038150787353515625, -0.03414154052734375, -0.030132293701171875, -0.026123046875, -0.022113800048828125, -0.01810455322265625, -0.014095306396484375, -0.0100860595703125, -0.006076812744140625, -0.00206756591796875, 0.001941680908203125, 0.005950927734375, 0.009960174560546875, 0.01396942138671875, 0.017978668212890625, 0.0219879150390625, 0.025997161865234375, 0.03000640869140625, 0.034015655517578125, 0.03802490234375, 0.042034149169921875, 0.04604339599609375, 0.050052642822265625, 0.0540618896484375, 0.058071136474609375, 0.06208038330078125, 0.06608963012695312, 0.070098876953125, 0.07410812377929688, 0.07811737060546875, 0.08212661743164062, 0.0861358642578125, 0.09014511108398438, 0.09415435791015625, 0.09816360473632812, 0.1021728515625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 12.0, 42.0, 133.0, 327.0, 335.0, 103.0, 28.0, 4.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.97115159034729, -3.8614532947540283, -3.7517549991607666, -3.642056465148926, -3.532358169555664, -3.4226598739624023, -3.3129615783691406, -3.203263282775879, -3.093564987182617, -2.9838666915893555, -2.8741683959960938, -2.764470100402832, -2.654771566390991, -2.5450732707977295, -2.4353749752044678, -2.325676679611206, -2.2159781455993652, -2.1062798500061035, -1.9965814352035522, -1.8868831396102905, -1.7771847248077393, -1.6674864292144775, -1.5577881336212158, -1.448089838027954, -1.3383914232254028, -1.2286931276321411, -1.1189947128295898, -1.0092964172363281, -0.8995980620384216, -0.7898997068405151, -0.6802014112472534, -0.5705030560493469, -0.46080493927001953, -0.35110658407211304, -0.24140825867652893, -0.13170993328094482, -0.02201157808303833, 0.08768677711486816, 0.19738507270812988, 0.3070834279060364, 0.41678178310394287, 0.5264801383018494, 0.6361784934997559, 0.7458767890930176, 0.8555751442909241, 0.9652734994888306, 1.0749717950820923, 1.1846702098846436, 1.2943685054779053, 1.404066801071167, 1.5137652158737183, 1.62346351146698, 1.7331619262695312, 1.842860221862793, 1.9525585174560547, 2.0622568130493164, 2.171955108642578, 2.28165340423584, 2.3913516998291016, 2.5010499954223633, 2.610748529434204, 2.720446825027466, 2.8301451206207275, 2.9398434162139893, 3.04954195022583]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 7.0, 13.0, 12.0, 16.0, 19.0, 17.0, 27.0, 25.0, 32.0, 43.0, 36.0, 46.0, 62.0, 61.0, 79.0, 55.0, 70.0, 61.0, 40.0, 36.0, 45.0, 31.0, 46.0, 31.0, 21.0, 14.0, 14.0, 10.0, 7.0, 13.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1596269607543945, -2.102816581726074, -2.046006202697754, -1.9891958236694336, -1.9323853254318237, -1.8755749464035034, -1.818764567375183, -1.7619541883468628, -1.705143690109253, -1.6483333110809326, -1.5915229320526123, -1.534712553024292, -1.4779020547866821, -1.4210916757583618, -1.3642812967300415, -1.3074709177017212, -1.2506605386734009, -1.1938501596450806, -1.1370397806167603, -1.0802292823791504, -1.02341890335083, -0.9666085243225098, -0.9097981452941895, -0.8529877662658691, -0.796177327632904, -0.7393669486045837, -0.6825565099716187, -0.6257461309432983, -0.568935751914978, -0.5121253132820129, -0.4553149342536926, -0.3985045254230499, -0.3416941165924072, -0.2848837077617645, -0.22807331383228302, -0.1712629199028015, -0.11445251107215881, -0.05764210224151611, -0.0008317232131958008, 0.0559786856174469, 0.1127890944480896, 0.1695995032787323, 0.2264098972082138, 0.2832202911376953, 0.340030699968338, 0.3968411087989807, 0.453651487827301, 0.5104619264602661, 0.5672723054885864, 0.6240826845169067, 0.6808931231498718, 0.7377035021781921, 0.7945139408111572, 0.8513243198394775, 0.9081346988677979, 0.9649450778961182, 1.0217554569244385, 1.0785658359527588, 1.135376214981079, 1.1921865940093994, 1.2489970922470093, 1.3058074712753296, 1.36261785030365, 1.4194282293319702, 1.47623872756958]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 9.0, 12.0, 19.0, 11.0, 12.0, 42.0, 41.0, 44.0, 71.0, 97.0, 161.0, 248.0, 389.0, 761.0, 1925.0, 5772.0, 31786.0, 670293.0, 3325494.0, 134805.0, 15242.0, 4037.0, 1514.0, 634.0, 287.0, 172.0, 120.0, 76.0, 56.0, 40.0, 30.0, 16.0, 19.0, 10.0, 8.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18359375, -0.17790603637695312, -0.17221832275390625, -0.16653060913085938, -0.1608428955078125, -0.15515518188476562, -0.14946746826171875, -0.14377975463867188, -0.138092041015625, -0.13240432739257812, -0.12671661376953125, -0.12102890014648438, -0.1153411865234375, -0.10965347290039062, -0.10396575927734375, -0.09827804565429688, -0.09259033203125, -0.08690261840820312, -0.08121490478515625, -0.07552719116210938, -0.0698394775390625, -0.06415176391601562, -0.05846405029296875, -0.052776336669921875, -0.047088623046875, -0.041400909423828125, -0.03571319580078125, -0.030025482177734375, -0.0243377685546875, -0.018650054931640625, -0.01296234130859375, -0.007274627685546875, -0.0015869140625, 0.004100799560546875, 0.00978851318359375, 0.015476226806640625, 0.0211639404296875, 0.026851654052734375, 0.03253936767578125, 0.038227081298828125, 0.043914794921875, 0.049602508544921875, 0.05529022216796875, 0.060977935791015625, 0.0666656494140625, 0.07235336303710938, 0.07804107666015625, 0.08372879028320312, 0.08941650390625, 0.09510421752929688, 0.10079193115234375, 0.10647964477539062, 0.1121673583984375, 0.11785507202148438, 0.12354278564453125, 0.12923049926757812, 0.134918212890625, 0.14060592651367188, 0.14629364013671875, 0.15198135375976562, 0.1576690673828125, 0.16335678100585938, 0.16904449462890625, 0.17473220825195312, 0.180419921875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 12.0, 10.0, 20.0, 23.0, 37.0, 38.0, 58.0, 79.0, 92.0, 104.0, 103.0, 108.0, 70.0, 69.0, 44.0, 38.0, 28.0, 33.0, 17.0, 9.0, 2.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.2685546875, -0.26274871826171875, -0.2569427490234375, -0.25113677978515625, -0.245330810546875, -0.23952484130859375, -0.2337188720703125, -0.22791290283203125, -0.22210693359375, -0.21630096435546875, -0.2104949951171875, -0.20468902587890625, -0.198883056640625, -0.19307708740234375, -0.1872711181640625, -0.18146514892578125, -0.1756591796875, -0.16985321044921875, -0.1640472412109375, -0.15824127197265625, -0.152435302734375, -0.14662933349609375, -0.1408233642578125, -0.13501739501953125, -0.12921142578125, -0.12340545654296875, -0.1175994873046875, -0.11179351806640625, -0.105987548828125, -0.10018157958984375, -0.0943756103515625, -0.08856964111328125, -0.082763671875, -0.07695770263671875, -0.0711517333984375, -0.06534576416015625, -0.059539794921875, -0.05373382568359375, -0.0479278564453125, -0.04212188720703125, -0.03631591796875, -0.03050994873046875, -0.0247039794921875, -0.01889801025390625, -0.013092041015625, -0.00728607177734375, -0.0014801025390625, 0.00432586669921875, 0.0101318359375, 0.01593780517578125, 0.0217437744140625, 0.02754974365234375, 0.033355712890625, 0.03916168212890625, 0.0449676513671875, 0.05077362060546875, 0.05657958984375, 0.06238555908203125, 0.0681915283203125, 0.07399749755859375, 0.079803466796875, 0.08560943603515625, 0.0914154052734375, 0.09722137451171875, 0.10302734375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 7.0, 13.0, 11.0, 19.0, 21.0, 27.0, 36.0, 76.0, 122.0, 189.0, 370.0, 894.0, 2475.0, 8909.0, 43807.0, 638513.0, 3361160.0, 109522.0, 19186.0, 5291.0, 1843.0, 788.0, 404.0, 219.0, 125.0, 74.0, 51.0, 33.0, 25.0, 17.0, 12.0, 7.0, 10.0, 6.0, 2.0, 2.0, 7.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.187744140625, -0.181915283203125, -0.17608642578125, -0.170257568359375, -0.1644287109375, -0.158599853515625, -0.15277099609375, -0.146942138671875, -0.14111328125, -0.135284423828125, -0.12945556640625, -0.123626708984375, -0.1177978515625, -0.111968994140625, -0.10614013671875, -0.100311279296875, -0.094482421875, -0.088653564453125, -0.08282470703125, -0.076995849609375, -0.0711669921875, -0.065338134765625, -0.05950927734375, -0.053680419921875, -0.0478515625, -0.042022705078125, -0.03619384765625, -0.030364990234375, -0.0245361328125, -0.018707275390625, -0.01287841796875, -0.007049560546875, -0.001220703125, 0.004608154296875, 0.01043701171875, 0.016265869140625, 0.0220947265625, 0.027923583984375, 0.03375244140625, 0.039581298828125, 0.04541015625, 0.051239013671875, 0.05706787109375, 0.062896728515625, 0.0687255859375, 0.074554443359375, 0.08038330078125, 0.086212158203125, 0.092041015625, 0.097869873046875, 0.10369873046875, 0.109527587890625, 0.1153564453125, 0.121185302734375, 0.12701416015625, 0.132843017578125, 0.138671875, 0.144500732421875, 0.15032958984375, 0.156158447265625, 0.1619873046875, 0.167816162109375, 0.17364501953125, 0.179473876953125, 0.185302734375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 8.0, 10.0, 15.0, 16.0, 13.0, 33.0, 37.0, 61.0, 105.0, 230.0, 609.0, 1042.0, 912.0, 432.0, 192.0, 102.0, 58.0, 51.0, 41.0, 20.0, 19.0, 17.0, 13.0, 5.0, 9.0, 3.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.172607421875, -0.16594314575195312, -0.15927886962890625, -0.15261459350585938, -0.1459503173828125, -0.13928604125976562, -0.13262176513671875, -0.12595748901367188, -0.119293212890625, -0.11262893676757812, -0.10596466064453125, -0.09930038452148438, -0.0926361083984375, -0.08597183227539062, -0.07930755615234375, -0.07264328002929688, -0.06597900390625, -0.059314727783203125, -0.05265045166015625, -0.045986175537109375, -0.0393218994140625, -0.032657623291015625, -0.02599334716796875, -0.019329071044921875, -0.012664794921875, -0.006000518798828125, 0.00066375732421875, 0.007328033447265625, 0.0139923095703125, 0.020656585693359375, 0.02732086181640625, 0.033985137939453125, 0.0406494140625, 0.047313690185546875, 0.05397796630859375, 0.060642242431640625, 0.0673065185546875, 0.07397079467773438, 0.08063507080078125, 0.08729934692382812, 0.093963623046875, 0.10062789916992188, 0.10729217529296875, 0.11395645141601562, 0.1206207275390625, 0.12728500366210938, 0.13394927978515625, 0.14061355590820312, 0.14727783203125, 0.15394210815429688, 0.16060638427734375, 0.16727066040039062, 0.1739349365234375, 0.18059921264648438, 0.18726348876953125, 0.19392776489257812, 0.200592041015625, 0.20725631713867188, 0.21392059326171875, 0.22058486938476562, 0.2272491455078125, 0.23391342163085938, 0.24057769775390625, 0.24724197387695312, 0.25390625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 0.0, 4.0, 18.0, 41.0, 94.0, 210.0, 268.0, 197.0, 91.0, 43.0, 13.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.014565944671631, -1.9520026445388794, -1.8894392251968384, -1.826875925064087, -1.764312505722046, -1.7017492055892944, -1.639185905456543, -1.576622486114502, -1.514059066772461, -1.4514957666397095, -1.3889323472976685, -1.326369047164917, -1.263805627822876, -1.2012423276901245, -1.138679027557373, -1.076115608215332, -1.0135523080825806, -0.9509889483451843, -0.8884255886077881, -0.8258622884750366, -0.7632988691329956, -0.7007355690002441, -0.6381722092628479, -0.5756088495254517, -0.5130454897880554, -0.4504821300506592, -0.38791877031326294, -0.3253554403781891, -0.26279208064079285, -0.2002287209033966, -0.13766539096832275, -0.07510203123092651, -0.012538790702819824, 0.05002456158399582, 0.11258791387081146, 0.1751512587070465, 0.23771461844444275, 0.300277978181839, 0.36284130811691284, 0.4254046678543091, 0.4879680275917053, 0.5505313873291016, 0.6130947470664978, 0.675658106803894, 0.7382214069366455, 0.8007848262786865, 0.863348126411438, 0.9259114861488342, 0.9884748458862305, 1.051038146018982, 1.113601565361023, 1.1761648654937744, 1.2387282848358154, 1.301291584968567, 1.3638548851013184, 1.4264183044433594, 1.4889817237854004, 1.5515450239181519, 1.6141084432601929, 1.6766717433929443, 1.7392351627349854, 1.8017984628677368, 1.8643617630004883, 1.9269251823425293, 1.9894884824752808]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 0.0, 5.0, 4.0, 9.0, 8.0, 12.0, 16.0, 23.0, 24.0, 22.0, 46.0, 46.0, 47.0, 58.0, 67.0, 61.0, 74.0, 58.0, 63.0, 56.0, 56.0, 55.0, 44.0, 38.0, 24.0, 24.0, 23.0, 8.0, 15.0, 6.0, 7.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7212209105491638, -0.6860234141349792, -0.6508259177207947, -0.6156283617019653, -0.5804308652877808, -0.5452333688735962, -0.5100358724594116, -0.47483837604522705, -0.4396408498287201, -0.4044433534145355, -0.36924582719802856, -0.334048330783844, -0.2988508343696594, -0.26365330815315247, -0.2284558117389679, -0.19325830042362213, -0.15806078910827637, -0.1228632777929306, -0.08766577392816544, -0.05246827006340027, -0.017270758748054504, 0.01792675256729126, 0.05312424898147583, 0.0883217602968216, 0.12351927161216736, 0.15871678292751312, 0.1939142942428589, 0.22911179065704346, 0.264309287071228, 0.299506813287735, 0.33470430970191956, 0.3699018359184265, 0.40509939193725586, 0.44029688835144043, 0.4754944145679474, 0.5106918811798096, 0.5458894371986389, 0.5810869336128235, 0.6162844300270081, 0.6514819264411926, 0.686679482460022, 0.7218769788742065, 0.7570744752883911, 0.7922719717025757, 0.827469527721405, 0.8626670241355896, 0.8978645205497742, 0.9330620169639587, 0.9682595133781433, 1.0034570693969727, 1.0386545658111572, 1.0738520622253418, 1.1090495586395264, 1.144247055053711, 1.1794445514678955, 1.21464204788208, 1.2498395442962646, 1.2850370407104492, 1.3202345371246338, 1.3554320335388184, 1.390629529953003, 1.4258270263671875, 1.461024522781372, 1.4962221384048462, 1.5314196348190308]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 8.0, 13.0, 19.0, 31.0, 34.0, 43.0, 57.0, 91.0, 148.0, 269.0, 371.0, 512.0, 827.0, 1328.0, 2168.0, 3888.0, 6837.0, 12653.0, 24614.0, 49564.0, 100206.0, 182891.0, 243787.0, 194956.0, 109760.0, 55021.0, 26907.0, 13635.0, 7287.0, 4193.0, 2400.0, 1413.0, 925.0, 553.0, 388.0, 252.0, 154.0, 103.0, 64.0, 52.0, 39.0, 24.0, 14.0, 16.0, 11.0, 6.0, 12.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.069091796875, -0.06690311431884766, -0.06471443176269531, -0.06252574920654297, -0.060337066650390625, -0.05814838409423828, -0.05595970153808594, -0.053771018981933594, -0.05158233642578125, -0.049393653869628906, -0.04720497131347656, -0.04501628875732422, -0.042827606201171875, -0.04063892364501953, -0.03845024108886719, -0.036261558532714844, -0.0340728759765625, -0.031884193420410156, -0.029695510864257812, -0.02750682830810547, -0.025318145751953125, -0.02312946319580078, -0.020940780639648438, -0.018752098083496094, -0.01656341552734375, -0.014374732971191406, -0.012186050415039062, -0.009997367858886719, -0.007808685302734375, -0.005620002746582031, -0.0034313201904296875, -0.0012426376342773438, 0.000946044921875, 0.0031347274780273438, 0.0053234100341796875, 0.007512092590332031, 0.009700775146484375, 0.011889457702636719, 0.014078140258789062, 0.016266822814941406, 0.01845550537109375, 0.020644187927246094, 0.022832870483398438, 0.02502155303955078, 0.027210235595703125, 0.02939891815185547, 0.03158760070800781, 0.033776283264160156, 0.0359649658203125, 0.038153648376464844, 0.04034233093261719, 0.04253101348876953, 0.044719696044921875, 0.04690837860107422, 0.04909706115722656, 0.051285743713378906, 0.05347442626953125, 0.055663108825683594, 0.05785179138183594, 0.06004047393798828, 0.062229156494140625, 0.06441783905029297, 0.06660652160644531, 0.06879520416259766, 0.07098388671875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 7.0, 10.0, 19.0, 13.0, 13.0, 26.0, 23.0, 30.0, 35.0, 30.0, 43.0, 42.0, 50.0, 58.0, 67.0, 61.0, 48.0, 57.0, 68.0, 42.0, 48.0, 40.0, 20.0, 15.0, 27.0, 17.0, 14.0, 9.0, 25.0, 8.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.115234375, -0.11187267303466797, -0.10851097106933594, -0.1051492691040039, -0.10178756713867188, -0.09842586517333984, -0.09506416320800781, -0.09170246124267578, -0.08834075927734375, -0.08497905731201172, -0.08161735534667969, -0.07825565338134766, -0.07489395141601562, -0.0715322494506836, -0.06817054748535156, -0.06480884552001953, -0.0614471435546875, -0.05808544158935547, -0.05472373962402344, -0.051362037658691406, -0.048000335693359375, -0.044638633728027344, -0.04127693176269531, -0.03791522979736328, -0.03455352783203125, -0.03119182586669922, -0.027830123901367188, -0.024468421936035156, -0.021106719970703125, -0.017745018005371094, -0.014383316040039062, -0.011021614074707031, -0.007659912109375, -0.004298210144042969, -0.0009365081787109375, 0.0024251937866210938, 0.005786895751953125, 0.009148597717285156, 0.012510299682617188, 0.01587200164794922, 0.01923370361328125, 0.02259540557861328, 0.025957107543945312, 0.029318809509277344, 0.032680511474609375, 0.036042213439941406, 0.03940391540527344, 0.04276561737060547, 0.0461273193359375, 0.04948902130126953, 0.05285072326660156, 0.056212425231933594, 0.059574127197265625, 0.06293582916259766, 0.06629753112792969, 0.06965923309326172, 0.07302093505859375, 0.07638263702392578, 0.07974433898925781, 0.08310604095458984, 0.08646774291992188, 0.0898294448852539, 0.09319114685058594, 0.09655284881591797, 0.09991455078125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 11.0, 4.0, 14.0, 24.0, 40.0, 31.0, 39.0, 64.0, 99.0, 107.0, 166.0, 221.0, 308.0, 507.0, 830.0, 1842.0, 7054.0, 75239.0, 860427.0, 89399.0, 7765.0, 1901.0, 843.0, 525.0, 295.0, 224.0, 162.0, 97.0, 90.0, 47.0, 51.0, 25.0, 28.0, 15.0, 15.0, 16.0, 7.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.340576171875, -0.3304176330566406, -0.32025909423828125, -0.3101005554199219, -0.2999420166015625, -0.2897834777832031, -0.27962493896484375, -0.2694664001464844, -0.259307861328125, -0.24914932250976562, -0.23899078369140625, -0.22883224487304688, -0.2186737060546875, -0.20851516723632812, -0.19835662841796875, -0.18819808959960938, -0.17803955078125, -0.16788101196289062, -0.15772247314453125, -0.14756393432617188, -0.1374053955078125, -0.12724685668945312, -0.11708831787109375, -0.10692977905273438, -0.096771240234375, -0.08661270141601562, -0.07645416259765625, -0.06629562377929688, -0.0561370849609375, -0.045978546142578125, -0.03582000732421875, -0.025661468505859375, -0.0155029296875, -0.005344390869140625, 0.00481414794921875, 0.014972686767578125, 0.0251312255859375, 0.035289764404296875, 0.04544830322265625, 0.055606842041015625, 0.065765380859375, 0.07592391967773438, 0.08608245849609375, 0.09624099731445312, 0.1063995361328125, 0.11655807495117188, 0.12671661376953125, 0.13687515258789062, 0.14703369140625, 0.15719223022460938, 0.16735076904296875, 0.17750930786132812, 0.1876678466796875, 0.19782638549804688, 0.20798492431640625, 0.21814346313476562, 0.228302001953125, 0.23846054077148438, 0.24861907958984375, 0.2587776184082031, 0.2689361572265625, 0.2790946960449219, 0.28925323486328125, 0.2994117736816406, 0.3095703125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 2.0, 8.0, 15.0, 4.0, 10.0, 15.0, 18.0, 16.0, 18.0, 28.0, 31.0, 39.0, 59.0, 50.0, 41.0, 59.0, 60.0, 51.0, 67.0, 63.0, 47.0, 59.0, 44.0, 34.0, 39.0, 31.0, 24.0, 12.0, 12.0, 10.0, 10.0, 4.0, 6.0, 3.0, 3.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.5546875, -0.5394172668457031, -0.5241470336914062, -0.5088768005371094, -0.4936065673828125, -0.4783363342285156, -0.46306610107421875, -0.4477958679199219, -0.432525634765625, -0.4172554016113281, -0.40198516845703125, -0.3867149353027344, -0.3714447021484375, -0.3561744689941406, -0.34090423583984375, -0.3256340026855469, -0.31036376953125, -0.2950935363769531, -0.27982330322265625, -0.2645530700683594, -0.2492828369140625, -0.23401260375976562, -0.21874237060546875, -0.20347213745117188, -0.188201904296875, -0.17293167114257812, -0.15766143798828125, -0.14239120483398438, -0.1271209716796875, -0.11185073852539062, -0.09658050537109375, -0.08131027221679688, -0.0660400390625, -0.050769805908203125, -0.03549957275390625, -0.020229339599609375, -0.0049591064453125, 0.010311126708984375, 0.02558135986328125, 0.040851593017578125, 0.056121826171875, 0.07139205932617188, 0.08666229248046875, 0.10193252563476562, 0.1172027587890625, 0.13247299194335938, 0.14774322509765625, 0.16301345825195312, 0.17828369140625, 0.19355392456054688, 0.20882415771484375, 0.22409439086914062, 0.2393646240234375, 0.2546348571777344, 0.26990509033203125, 0.2851753234863281, 0.300445556640625, 0.3157157897949219, 0.33098602294921875, 0.3462562561035156, 0.3615264892578125, 0.3767967224121094, 0.39206695556640625, 0.4073371887207031, 0.422607421875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 8.0, 14.0, 7.0, 16.0, 16.0, 21.0, 36.0, 50.0, 58.0, 100.0, 120.0, 238.0, 354.0, 665.0, 1125.0, 1997.0, 4113.0, 9325.0, 26780.0, 133848.0, 689891.0, 134382.0, 26984.0, 9317.0, 4257.0, 2038.0, 1066.0, 647.0, 396.0, 220.0, 145.0, 95.0, 58.0, 52.0, 36.0, 22.0, 18.0, 8.0, 10.0, 7.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0635986328125, -0.06157970428466797, -0.05956077575683594, -0.057541847229003906, -0.055522918701171875, -0.053503990173339844, -0.05148506164550781, -0.04946613311767578, -0.04744720458984375, -0.04542827606201172, -0.04340934753417969, -0.041390419006347656, -0.039371490478515625, -0.037352561950683594, -0.03533363342285156, -0.03331470489501953, -0.0312957763671875, -0.02927684783935547, -0.027257919311523438, -0.025238990783691406, -0.023220062255859375, -0.021201133728027344, -0.019182205200195312, -0.01716327667236328, -0.01514434814453125, -0.013125419616699219, -0.011106491088867188, -0.009087562561035156, -0.007068634033203125, -0.005049705505371094, -0.0030307769775390625, -0.0010118484497070312, 0.001007080078125, 0.0030260086059570312, 0.0050449371337890625, 0.007063865661621094, 0.009082794189453125, 0.011101722717285156, 0.013120651245117188, 0.015139579772949219, 0.01715850830078125, 0.01917743682861328, 0.021196365356445312, 0.023215293884277344, 0.025234222412109375, 0.027253150939941406, 0.029272079467773438, 0.03129100799560547, 0.0333099365234375, 0.03532886505126953, 0.03734779357910156, 0.039366722106933594, 0.041385650634765625, 0.043404579162597656, 0.04542350769042969, 0.04744243621826172, 0.04946136474609375, 0.05148029327392578, 0.05349922180175781, 0.055518150329589844, 0.057537078857421875, 0.059556007385253906, 0.06157493591308594, 0.06359386444091797, 0.06561279296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 5.0, 5.0, 9.0, 3.0, 10.0, 10.0, 21.0, 27.0, 37.0, 49.0, 46.0, 76.0, 112.0, 102.0, 107.0, 108.0, 73.0, 50.0, 36.0, 21.0, 29.0, 10.0, 16.0, 6.0, 8.0, 9.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6597251892089844e-05, -3.492087125778198e-05, -3.324449062347412e-05, -3.156810998916626e-05, -2.98917293548584e-05, -2.8215348720550537e-05, -2.6538968086242676e-05, -2.4862587451934814e-05, -2.3186206817626953e-05, -2.1509826183319092e-05, -1.983344554901123e-05, -1.815706491470337e-05, -1.6480684280395508e-05, -1.4804303646087646e-05, -1.3127923011779785e-05, -1.1451542377471924e-05, -9.775161743164062e-06, -8.098781108856201e-06, -6.42240047454834e-06, -4.7460198402404785e-06, -3.069639205932617e-06, -1.3932585716247559e-06, 2.8312206268310547e-07, 1.959502696990967e-06, 3.635883331298828e-06, 5.3122639656066895e-06, 6.988644599914551e-06, 8.665025234222412e-06, 1.0341405868530273e-05, 1.2017786502838135e-05, 1.3694167137145996e-05, 1.5370547771453857e-05, 1.704692840576172e-05, 1.872330904006958e-05, 2.039968967437744e-05, 2.2076070308685303e-05, 2.3752450942993164e-05, 2.5428831577301025e-05, 2.7105212211608887e-05, 2.8781592845916748e-05, 3.045797348022461e-05, 3.213435411453247e-05, 3.381073474884033e-05, 3.548711538314819e-05, 3.7163496017456055e-05, 3.8839876651763916e-05, 4.051625728607178e-05, 4.219263792037964e-05, 4.38690185546875e-05, 4.554539918899536e-05, 4.722177982330322e-05, 4.8898160457611084e-05, 5.0574541091918945e-05, 5.225092172622681e-05, 5.392730236053467e-05, 5.560368299484253e-05, 5.728006362915039e-05, 5.895644426345825e-05, 6.063282489776611e-05, 6.230920553207397e-05, 6.398558616638184e-05, 6.56619668006897e-05, 6.733834743499756e-05, 6.901472806930542e-05, 7.069110870361328e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 2.0, 4.0, 8.0, 6.0, 10.0, 14.0, 16.0, 18.0, 32.0, 34.0, 55.0, 72.0, 121.0, 189.0, 248.0, 436.0, 703.0, 1449.0, 2748.0, 6026.0, 15561.0, 61828.0, 559409.0, 329060.0, 46565.0, 13170.0, 5299.0, 2424.0, 1216.0, 668.0, 363.0, 246.0, 156.0, 104.0, 85.0, 52.0, 28.0, 23.0, 14.0, 20.0, 14.0, 19.0, 4.0, 8.0, 8.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0587158203125, -0.05675315856933594, -0.054790496826171875, -0.05282783508300781, -0.05086517333984375, -0.04890251159667969, -0.046939849853515625, -0.04497718811035156, -0.0430145263671875, -0.04105186462402344, -0.039089202880859375, -0.03712654113769531, -0.03516387939453125, -0.03320121765136719, -0.031238555908203125, -0.029275894165039062, -0.027313232421875, -0.025350570678710938, -0.023387908935546875, -0.021425247192382812, -0.01946258544921875, -0.017499923706054688, -0.015537261962890625, -0.013574600219726562, -0.0116119384765625, -0.009649276733398438, -0.007686614990234375, -0.0057239532470703125, -0.00376129150390625, -0.0017986297607421875, 0.000164031982421875, 0.0021266937255859375, 0.00408935546875, 0.0060520172119140625, 0.008014678955078125, 0.009977340698242188, 0.01194000244140625, 0.013902664184570312, 0.015865325927734375, 0.017827987670898438, 0.0197906494140625, 0.021753311157226562, 0.023715972900390625, 0.025678634643554688, 0.02764129638671875, 0.029603958129882812, 0.031566619873046875, 0.03352928161621094, 0.035491943359375, 0.03745460510253906, 0.039417266845703125, 0.04137992858886719, 0.04334259033203125, 0.04530525207519531, 0.047267913818359375, 0.04923057556152344, 0.0511932373046875, 0.05315589904785156, 0.055118560791015625, 0.05708122253417969, 0.05904388427734375, 0.06100654602050781, 0.06296920776367188, 0.06493186950683594, 0.06689453125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 1.0, 5.0, 5.0, 4.0, 7.0, 9.0, 12.0, 17.0, 29.0, 29.0, 25.0, 60.0, 64.0, 68.0, 75.0, 72.0, 76.0, 77.0, 66.0, 52.0, 66.0, 37.0, 41.0, 24.0, 17.0, 10.0, 10.0, 13.0, 7.0, 4.0, 5.0, 5.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059661865234375, -0.0573582649230957, -0.055054664611816406, -0.05275106430053711, -0.05044746398925781, -0.048143863677978516, -0.04584026336669922, -0.04353666305541992, -0.041233062744140625, -0.03892946243286133, -0.03662586212158203, -0.034322261810302734, -0.03201866149902344, -0.02971506118774414, -0.027411460876464844, -0.025107860565185547, -0.02280426025390625, -0.020500659942626953, -0.018197059631347656, -0.01589345932006836, -0.013589859008789062, -0.011286258697509766, -0.008982658386230469, -0.006679058074951172, -0.004375457763671875, -0.002071857452392578, 0.00023174285888671875, 0.0025353431701660156, 0.0048389434814453125, 0.007142543792724609, 0.009446144104003906, 0.011749744415283203, 0.0140533447265625, 0.016356945037841797, 0.018660545349121094, 0.02096414566040039, 0.023267745971679688, 0.025571346282958984, 0.02787494659423828, 0.030178546905517578, 0.032482147216796875, 0.03478574752807617, 0.03708934783935547, 0.039392948150634766, 0.04169654846191406, 0.04400014877319336, 0.046303749084472656, 0.04860734939575195, 0.05091094970703125, 0.05321455001831055, 0.055518150329589844, 0.05782175064086914, 0.06012535095214844, 0.062428951263427734, 0.06473255157470703, 0.06703615188598633, 0.06933975219726562, 0.07164335250854492, 0.07394695281982422, 0.07625055313110352, 0.07855415344238281, 0.08085775375366211, 0.0831613540649414, 0.0854649543762207, 0.0877685546875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 9.0, 44.0, 153.0, 492.0, 237.0, 42.0, 16.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28227424621582, -5.1458940505981445, -5.009513854980469, -4.873133659362793, -4.736753463745117, -4.600373268127441, -4.463993072509766, -4.327612400054932, -4.191232204437256, -4.05485200881958, -3.9184718132019043, -3.7820916175842285, -3.6457111835479736, -3.509330987930298, -3.372950792312622, -3.2365705966949463, -3.1001904010772705, -2.9638102054595947, -2.827430009841919, -2.691049575805664, -2.5546693801879883, -2.4182891845703125, -2.2819089889526367, -2.145528793334961, -2.009148597717285, -1.8727684020996094, -1.736388087272644, -1.6000078916549683, -1.463627576828003, -1.3272473812103271, -1.1908671855926514, -1.0544869899749756, -0.9181063175201416, -0.781726062297821, -0.6453458070755005, -0.5089656114578247, -0.37258535623550415, -0.2362051010131836, -0.09982490539550781, 0.036555349826812744, 0.1729356050491333, 0.30931586027145386, 0.445696085691452, 0.5820763111114502, 0.7184565663337708, 0.8548368215560913, 0.9912170171737671, 1.1275973320007324, 1.2639775276184082, 1.400357723236084, 1.5367380380630493, 1.673118233680725, 1.8094985485076904, 1.9458787441253662, 2.082258939743042, 2.2186391353607178, 2.3550195693969727, 2.4913997650146484, 2.627779960632324, 2.76416015625, 2.900540590286255, 3.0369207859039307, 3.1733009815216064, 3.3096811771392822, 3.446061372756958]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 2.0, 6.0, 6.0, 4.0, 9.0, 12.0, 10.0, 24.0, 23.0, 21.0, 31.0, 21.0, 35.0, 46.0, 32.0, 51.0, 64.0, 76.0, 66.0, 56.0, 53.0, 39.0, 42.0, 39.0, 33.0, 31.0, 28.0, 19.0, 19.0, 16.0, 14.0, 19.0, 10.0, 8.0, 7.0, 5.0, 8.0, 4.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3647549152374268, -1.3149229288101196, -1.2650909423828125, -1.2152589559555054, -1.1654269695281982, -1.1155951023101807, -1.0657631158828735, -1.0159311294555664, -0.9660991430282593, -0.9162671566009521, -0.866435170173645, -0.8166032433509827, -0.7667712569236755, -0.7169392704963684, -0.667107343673706, -0.6172753572463989, -0.5674433708190918, -0.5176113843917847, -0.4677794277667999, -0.4179474711418152, -0.36811548471450806, -0.3182834982872009, -0.2684515416622162, -0.21861958503723145, -0.16878759860992432, -0.11895562708377838, -0.06912365555763245, -0.01929168403148651, 0.030540287494659424, 0.08037225902080536, 0.1302042305469513, 0.18003618717193604, 0.2298680543899536, 0.27970004081726074, 0.3295319974422455, 0.3793639540672302, 0.42919594049453735, 0.4790279269218445, 0.5288598537445068, 0.578691840171814, 0.6285238265991211, 0.6783558130264282, 0.7281877994537354, 0.7780197262763977, 0.8278517127037048, 0.877683699131012, 0.9275156259536743, 0.9773476123809814, 1.0271795988082886, 1.0770115852355957, 1.1268435716629028, 1.17667555809021, 1.2265074253082275, 1.2763394117355347, 1.3261713981628418, 1.376003384590149, 1.425835371017456, 1.4756673574447632, 1.5254993438720703, 1.5753313302993774, 1.6251633167266846, 1.6749951839447021, 1.7248271703720093, 1.7746591567993164, 1.8244911432266235]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 11.0, 12.0, 19.0, 24.0, 45.0, 72.0, 118.0, 180.0, 320.0, 638.0, 1331.0, 3576.0, 12619.0, 70933.0, 761820.0, 2830092.0, 449841.0, 47231.0, 10051.0, 2975.0, 1092.0, 549.0, 279.0, 176.0, 102.0, 68.0, 42.0, 26.0, 18.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.140380859375, -0.13690567016601562, -0.13343048095703125, -0.12995529174804688, -0.1264801025390625, -0.12300491333007812, -0.11952972412109375, -0.11605453491210938, -0.112579345703125, -0.10910415649414062, -0.10562896728515625, -0.10215377807617188, -0.0986785888671875, -0.09520339965820312, -0.09172821044921875, -0.08825302124023438, -0.08477783203125, -0.08130264282226562, -0.07782745361328125, -0.07435226440429688, -0.0708770751953125, -0.06740188598632812, -0.06392669677734375, -0.060451507568359375, -0.056976318359375, -0.053501129150390625, -0.05002593994140625, -0.046550750732421875, -0.0430755615234375, -0.039600372314453125, -0.03612518310546875, -0.032649993896484375, -0.0291748046875, -0.025699615478515625, -0.02222442626953125, -0.018749237060546875, -0.0152740478515625, -0.011798858642578125, -0.00832366943359375, -0.004848480224609375, -0.001373291015625, 0.002101898193359375, 0.00557708740234375, 0.009052276611328125, 0.0125274658203125, 0.016002655029296875, 0.01947784423828125, 0.022953033447265625, 0.02642822265625, 0.029903411865234375, 0.03337860107421875, 0.036853790283203125, 0.0403289794921875, 0.043804168701171875, 0.04727935791015625, 0.050754547119140625, 0.054229736328125, 0.057704925537109375, 0.06118011474609375, 0.06465530395507812, 0.0681304931640625, 0.07160568237304688, 0.07508087158203125, 0.07855606079101562, 0.08203125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 10.0, 8.0, 10.0, 16.0, 17.0, 19.0, 23.0, 30.0, 30.0, 48.0, 47.0, 51.0, 53.0, 49.0, 57.0, 61.0, 68.0, 53.0, 54.0, 44.0, 55.0, 37.0, 24.0, 23.0, 20.0, 24.0, 19.0, 17.0, 9.0, 5.0, 8.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.1279296875, -0.12450313568115234, -0.12107658386230469, -0.11765003204345703, -0.11422348022460938, -0.11079692840576172, -0.10737037658691406, -0.1039438247680664, -0.10051727294921875, -0.0970907211303711, -0.09366416931152344, -0.09023761749267578, -0.08681106567382812, -0.08338451385498047, -0.07995796203613281, -0.07653141021728516, -0.0731048583984375, -0.06967830657958984, -0.06625175476074219, -0.06282520294189453, -0.059398651123046875, -0.05597209930419922, -0.05254554748535156, -0.049118995666503906, -0.04569244384765625, -0.042265892028808594, -0.03883934020996094, -0.03541278839111328, -0.031986236572265625, -0.02855968475341797, -0.025133132934570312, -0.021706581115722656, -0.018280029296875, -0.014853477478027344, -0.011426925659179688, -0.008000373840332031, -0.004573822021484375, -0.0011472702026367188, 0.0022792816162109375, 0.005705833435058594, 0.00913238525390625, 0.012558937072753906, 0.015985488891601562, 0.01941204071044922, 0.022838592529296875, 0.02626514434814453, 0.029691696166992188, 0.033118247985839844, 0.0365447998046875, 0.039971351623535156, 0.04339790344238281, 0.04682445526123047, 0.050251007080078125, 0.05367755889892578, 0.05710411071777344, 0.060530662536621094, 0.06395721435546875, 0.0673837661743164, 0.07081031799316406, 0.07423686981201172, 0.07766342163085938, 0.08108997344970703, 0.08451652526855469, 0.08794307708740234, 0.09136962890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 8.0, 9.0, 19.0, 30.0, 42.0, 62.0, 116.0, 210.0, 491.0, 1380.0, 5966.0, 46306.0, 2637082.0, 1453441.0, 39236.0, 6631.0, 1760.0, 638.0, 333.0, 193.0, 105.0, 90.0, 51.0, 24.0, 19.0, 13.0, 8.0, 6.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.18896484375, -0.18220138549804688, -0.17543792724609375, -0.16867446899414062, -0.1619110107421875, -0.15514755249023438, -0.14838409423828125, -0.14162063598632812, -0.134857177734375, -0.12809371948242188, -0.12133026123046875, -0.11456680297851562, -0.1078033447265625, -0.10103988647460938, -0.09427642822265625, -0.08751296997070312, -0.08074951171875, -0.07398605346679688, -0.06722259521484375, -0.060459136962890625, -0.0536956787109375, -0.046932220458984375, -0.04016876220703125, -0.033405303955078125, -0.026641845703125, -0.019878387451171875, -0.01311492919921875, -0.006351470947265625, 0.0004119873046875, 0.007175445556640625, 0.01393890380859375, 0.020702362060546875, 0.0274658203125, 0.034229278564453125, 0.04099273681640625, 0.047756195068359375, 0.0545196533203125, 0.061283111572265625, 0.06804656982421875, 0.07481002807617188, 0.081573486328125, 0.08833694458007812, 0.09510040283203125, 0.10186386108398438, 0.1086273193359375, 0.11539077758789062, 0.12215423583984375, 0.12891769409179688, 0.13568115234375, 0.14244461059570312, 0.14920806884765625, 0.15597152709960938, 0.1627349853515625, 0.16949844360351562, 0.17626190185546875, 0.18302536010742188, 0.189788818359375, 0.19655227661132812, 0.20331573486328125, 0.21007919311523438, 0.2168426513671875, 0.22360610961914062, 0.23036956787109375, 0.23713302612304688, 0.243896484375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 7.0, 7.0, 17.0, 18.0, 41.0, 49.0, 89.0, 188.0, 493.0, 987.0, 1059.0, 549.0, 245.0, 107.0, 69.0, 45.0, 28.0, 15.0, 12.0, 8.0, 10.0, 8.0, 3.0, 2.0, 2.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1968994140625, -0.18987464904785156, -0.18284988403320312, -0.1758251190185547, -0.16880035400390625, -0.1617755889892578, -0.15475082397460938, -0.14772605895996094, -0.1407012939453125, -0.13367652893066406, -0.12665176391601562, -0.11962699890136719, -0.11260223388671875, -0.10557746887207031, -0.09855270385742188, -0.09152793884277344, -0.084503173828125, -0.07747840881347656, -0.07045364379882812, -0.06342887878417969, -0.05640411376953125, -0.04937934875488281, -0.042354583740234375, -0.03532981872558594, -0.0283050537109375, -0.021280288696289062, -0.014255523681640625, -0.0072307586669921875, -0.00020599365234375, 0.0068187713623046875, 0.013843536376953125, 0.020868301391601562, 0.02789306640625, 0.03491783142089844, 0.041942596435546875, 0.04896736145019531, 0.05599212646484375, 0.06301689147949219, 0.07004165649414062, 0.07706642150878906, 0.0840911865234375, 0.09111595153808594, 0.09814071655273438, 0.10516548156738281, 0.11219024658203125, 0.11921501159667969, 0.12623977661132812, 0.13326454162597656, 0.140289306640625, 0.14731407165527344, 0.15433883666992188, 0.1613636016845703, 0.16838836669921875, 0.1754131317138672, 0.18243789672851562, 0.18946266174316406, 0.1964874267578125, 0.20351219177246094, 0.21053695678710938, 0.2175617218017578, 0.22458648681640625, 0.2316112518310547, 0.23863601684570312, 0.24566078186035156, 0.252685546875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 9.0, 18.0, 49.0, 148.0, 243.0, 263.0, 149.0, 58.0, 24.0, 10.0, 10.0, 6.0, 7.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.006287097930908, -2.943056344985962, -2.8798258304595947, -2.8165950775146484, -2.7533645629882812, -2.690133810043335, -2.6269030570983887, -2.5636725425720215, -2.500441789627075, -2.437211036682129, -2.3739805221557617, -2.3107497692108154, -2.247519016265869, -2.184288501739502, -2.1210577487945557, -2.0578272342681885, -1.9945964813232422, -1.9313658475875854, -1.8681352138519287, -1.8049044609069824, -1.7416738271713257, -1.678443193435669, -1.6152124404907227, -1.551981806755066, -1.4887511730194092, -1.4255205392837524, -1.3622899055480957, -1.2990591526031494, -1.2358285188674927, -1.172597885131836, -1.1093671321868896, -1.046136498451233, -0.9829059839248657, -0.919675350189209, -0.8564446568489075, -0.793213963508606, -0.7299833297729492, -0.6667526960372925, -0.603522002696991, -0.5402913093566895, -0.4770606756210327, -0.4138300120830536, -0.35059934854507446, -0.28736868500709534, -0.2241380214691162, -0.16090735793113708, -0.09767669439315796, -0.03444603085517883, 0.028784632682800293, 0.09201529622077942, 0.15524595975875854, 0.21847662329673767, 0.2817072868347168, 0.3449379503726959, 0.40816861391067505, 0.4713992774486542, 0.5346299409866333, 0.59786057472229, 0.6610912680625916, 0.7243219614028931, 0.7875525951385498, 0.8507832288742065, 0.9140139222145081, 0.9772446155548096, 1.0404752492904663]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 9.0, 6.0, 12.0, 8.0, 14.0, 16.0, 18.0, 26.0, 22.0, 32.0, 35.0, 45.0, 52.0, 53.0, 38.0, 45.0, 55.0, 50.0, 57.0, 55.0, 38.0, 37.0, 48.0, 32.0, 29.0, 27.0, 21.0, 18.0, 26.0, 18.0, 13.0, 10.0, 11.0, 6.0, 6.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7946150898933411, -0.7675920724868774, -0.7405691146850586, -0.713546097278595, -0.6865230798721313, -0.6595000624656677, -0.6324770450592041, -0.6054540872573853, -0.5784310698509216, -0.551408052444458, -0.5243850946426392, -0.49736207723617554, -0.4703390598297119, -0.4433160424232483, -0.41629305481910706, -0.3892700672149658, -0.3622470498085022, -0.3352240324020386, -0.30820104479789734, -0.2811780571937561, -0.2541550397872925, -0.22713203728199005, -0.20010903477668762, -0.1730860322713852, -0.14606302976608276, -0.11904002726078033, -0.0920170247554779, -0.06499402225017548, -0.03797101974487305, -0.010948017239570618, 0.01607498526573181, 0.04309798777103424, 0.0701209306716919, 0.09714393317699432, 0.12416693568229675, 0.15118993818759918, 0.1782129406929016, 0.20523594319820404, 0.23225894570350647, 0.2592819333076477, 0.28630495071411133, 0.31332796812057495, 0.3403509557247162, 0.3673739433288574, 0.39439696073532104, 0.42141997814178467, 0.4484429657459259, 0.47546595335006714, 0.5024889707565308, 0.5295119881629944, 0.556535005569458, 0.5835579633712769, 0.6105809807777405, 0.6376039981842041, 0.664626955986023, 0.6916499733924866, 0.7186729907989502, 0.7456960082054138, 0.7727190256118774, 0.7997419834136963, 0.8267650008201599, 0.8537880182266235, 0.8808109760284424, 0.907833993434906, 0.9348570108413696]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 1.0, 10.0, 7.0, 5.0, 11.0, 22.0, 27.0, 33.0, 62.0, 79.0, 115.0, 166.0, 236.0, 390.0, 629.0, 924.0, 1544.0, 2423.0, 4066.0, 6855.0, 11802.0, 20516.0, 35765.0, 61733.0, 103554.0, 163118.0, 202800.0, 168355.0, 109053.0, 64756.0, 37061.0, 21510.0, 12348.0, 7173.0, 4289.0, 2537.0, 1621.0, 1047.0, 620.0, 439.0, 297.0, 178.0, 133.0, 64.0, 63.0, 39.0, 15.0, 19.0, 16.0, 8.0, 13.0, 8.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.06524658203125, -0.06330156326293945, -0.061356544494628906, -0.05941152572631836, -0.05746650695800781, -0.055521488189697266, -0.05357646942138672, -0.05163145065307617, -0.049686431884765625, -0.04774141311645508, -0.04579639434814453, -0.043851375579833984, -0.04190635681152344, -0.03996133804321289, -0.038016319274902344, -0.0360713005065918, -0.03412628173828125, -0.0321812629699707, -0.030236244201660156, -0.02829122543334961, -0.026346206665039062, -0.024401187896728516, -0.02245616912841797, -0.020511150360107422, -0.018566131591796875, -0.016621112823486328, -0.014676094055175781, -0.012731075286865234, -0.010786056518554688, -0.00884103775024414, -0.006896018981933594, -0.004951000213623047, -0.0030059814453125, -0.0010609626770019531, 0.0008840560913085938, 0.0028290748596191406, 0.0047740936279296875, 0.006719112396240234, 0.008664131164550781, 0.010609149932861328, 0.012554168701171875, 0.014499187469482422, 0.01644420623779297, 0.018389225006103516, 0.020334243774414062, 0.02227926254272461, 0.024224281311035156, 0.026169300079345703, 0.02811431884765625, 0.030059337615966797, 0.032004356384277344, 0.03394937515258789, 0.03589439392089844, 0.037839412689208984, 0.03978443145751953, 0.04172945022583008, 0.043674468994140625, 0.04561948776245117, 0.04756450653076172, 0.049509525299072266, 0.05145454406738281, 0.05339956283569336, 0.055344581604003906, 0.05728960037231445, 0.059234619140625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 3.0, 5.0, 4.0, 13.0, 11.0, 17.0, 19.0, 28.0, 30.0, 36.0, 50.0, 34.0, 60.0, 42.0, 59.0, 68.0, 62.0, 55.0, 60.0, 64.0, 57.0, 35.0, 34.0, 25.0, 34.0, 24.0, 23.0, 10.0, 18.0, 8.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.1268310546875, -0.12324714660644531, -0.11966323852539062, -0.11607933044433594, -0.11249542236328125, -0.10891151428222656, -0.10532760620117188, -0.10174369812011719, -0.0981597900390625, -0.09457588195800781, -0.09099197387695312, -0.08740806579589844, -0.08382415771484375, -0.08024024963378906, -0.07665634155273438, -0.07307243347167969, -0.069488525390625, -0.06590461730957031, -0.062320709228515625, -0.05873680114746094, -0.05515289306640625, -0.05156898498535156, -0.047985076904296875, -0.04440116882324219, -0.0408172607421875, -0.03723335266113281, -0.033649444580078125, -0.030065536499023438, -0.02648162841796875, -0.022897720336914062, -0.019313812255859375, -0.015729904174804688, -0.01214599609375, -0.008562088012695312, -0.004978179931640625, -0.0013942718505859375, 0.00218963623046875, 0.0057735443115234375, 0.009357452392578125, 0.012941360473632812, 0.0165252685546875, 0.020109176635742188, 0.023693084716796875, 0.027276992797851562, 0.03086090087890625, 0.03444480895996094, 0.038028717041015625, 0.04161262512207031, 0.045196533203125, 0.04878044128417969, 0.052364349365234375, 0.05594825744628906, 0.05953216552734375, 0.06311607360839844, 0.06669998168945312, 0.07028388977050781, 0.0738677978515625, 0.07745170593261719, 0.08103561401367188, 0.08461952209472656, 0.08820343017578125, 0.09178733825683594, 0.09537124633789062, 0.09895515441894531, 0.1025390625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 11.0, 9.0, 16.0, 15.0, 21.0, 31.0, 54.0, 73.0, 94.0, 128.0, 175.0, 230.0, 384.0, 540.0, 1078.0, 2311.0, 9678.0, 104328.0, 812785.0, 101916.0, 9664.0, 2266.0, 1013.0, 542.0, 346.0, 216.0, 194.0, 111.0, 77.0, 60.0, 50.0, 46.0, 24.0, 21.0, 9.0, 12.0, 6.0, 5.0, 4.0, 0.0, 4.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.27099609375, -0.2614860534667969, -0.25197601318359375, -0.24246597290039062, -0.2329559326171875, -0.22344589233398438, -0.21393585205078125, -0.20442581176757812, -0.194915771484375, -0.18540573120117188, -0.17589569091796875, -0.16638565063476562, -0.1568756103515625, -0.14736557006835938, -0.13785552978515625, -0.12834548950195312, -0.11883544921875, -0.10932540893554688, -0.09981536865234375, -0.09030532836914062, -0.0807952880859375, -0.07128524780273438, -0.06177520751953125, -0.052265167236328125, -0.042755126953125, -0.033245086669921875, -0.02373504638671875, -0.014225006103515625, -0.0047149658203125, 0.004795074462890625, 0.01430511474609375, 0.023815155029296875, 0.0333251953125, 0.042835235595703125, 0.05234527587890625, 0.061855316162109375, 0.0713653564453125, 0.08087539672851562, 0.09038543701171875, 0.09989547729492188, 0.109405517578125, 0.11891555786132812, 0.12842559814453125, 0.13793563842773438, 0.1474456787109375, 0.15695571899414062, 0.16646575927734375, 0.17597579956054688, 0.18548583984375, 0.19499588012695312, 0.20450592041015625, 0.21401596069335938, 0.2235260009765625, 0.23303604125976562, 0.24254608154296875, 0.2520561218261719, 0.261566162109375, 0.2710762023925781, 0.28058624267578125, 0.2900962829589844, 0.2996063232421875, 0.3091163635253906, 0.31862640380859375, 0.3281364440917969, 0.337646484375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 2.0, 4.0, 5.0, 4.0, 5.0, 7.0, 12.0, 11.0, 17.0, 21.0, 14.0, 21.0, 30.0, 29.0, 34.0, 47.0, 43.0, 43.0, 59.0, 55.0, 60.0, 57.0, 50.0, 60.0, 53.0, 35.0, 37.0, 38.0, 31.0, 21.0, 16.0, 21.0, 12.0, 12.0, 9.0, 8.0, 10.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.294189453125, -0.281829833984375, -0.26947021484375, -0.257110595703125, -0.2447509765625, -0.232391357421875, -0.22003173828125, -0.207672119140625, -0.1953125, -0.182952880859375, -0.17059326171875, -0.158233642578125, -0.1458740234375, -0.133514404296875, -0.12115478515625, -0.108795166015625, -0.096435546875, -0.084075927734375, -0.07171630859375, -0.059356689453125, -0.0469970703125, -0.034637451171875, -0.02227783203125, -0.009918212890625, 0.00244140625, 0.014801025390625, 0.02716064453125, 0.039520263671875, 0.0518798828125, 0.064239501953125, 0.07659912109375, 0.088958740234375, 0.101318359375, 0.113677978515625, 0.12603759765625, 0.138397216796875, 0.1507568359375, 0.163116455078125, 0.17547607421875, 0.187835693359375, 0.2001953125, 0.212554931640625, 0.22491455078125, 0.237274169921875, 0.2496337890625, 0.261993408203125, 0.27435302734375, 0.286712646484375, 0.299072265625, 0.311431884765625, 0.32379150390625, 0.336151123046875, 0.3485107421875, 0.360870361328125, 0.37322998046875, 0.385589599609375, 0.39794921875, 0.410308837890625, 0.42266845703125, 0.435028076171875, 0.4473876953125, 0.459747314453125, 0.47210693359375, 0.484466552734375, 0.496826171875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 8.0, 16.0, 16.0, 23.0, 27.0, 37.0, 51.0, 97.0, 123.0, 256.0, 453.0, 888.0, 1817.0, 4407.0, 13150.0, 53313.0, 318406.0, 559332.0, 70364.0, 16373.0, 5218.0, 1991.0, 906.0, 505.0, 287.0, 171.0, 101.0, 67.0, 36.0, 38.0, 22.0, 14.0, 15.0, 5.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07110595703125, -0.06888961791992188, -0.06667327880859375, -0.06445693969726562, -0.0622406005859375, -0.060024261474609375, -0.05780792236328125, -0.055591583251953125, -0.053375244140625, -0.051158905029296875, -0.04894256591796875, -0.046726226806640625, -0.0445098876953125, -0.042293548583984375, -0.04007720947265625, -0.037860870361328125, -0.03564453125, -0.033428192138671875, -0.03121185302734375, -0.028995513916015625, -0.0267791748046875, -0.024562835693359375, -0.02234649658203125, -0.020130157470703125, -0.017913818359375, -0.015697479248046875, -0.01348114013671875, -0.011264801025390625, -0.0090484619140625, -0.006832122802734375, -0.00461578369140625, -0.002399444580078125, -0.00018310546875, 0.002033233642578125, 0.00424957275390625, 0.006465911865234375, 0.0086822509765625, 0.010898590087890625, 0.01311492919921875, 0.015331268310546875, 0.017547607421875, 0.019763946533203125, 0.02198028564453125, 0.024196624755859375, 0.0264129638671875, 0.028629302978515625, 0.03084564208984375, 0.033061981201171875, 0.0352783203125, 0.037494659423828125, 0.03971099853515625, 0.041927337646484375, 0.0441436767578125, 0.046360015869140625, 0.04857635498046875, 0.050792694091796875, 0.053009033203125, 0.055225372314453125, 0.05744171142578125, 0.059658050537109375, 0.0618743896484375, 0.06409072875976562, 0.06630706787109375, 0.06852340698242188, 0.07073974609375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 0.0, 2.0, 4.0, 0.0, 3.0, 6.0, 6.0, 5.0, 6.0, 10.0, 10.0, 7.0, 14.0, 20.0, 30.0, 28.0, 26.0, 53.0, 69.0, 78.0, 95.0, 101.0, 83.0, 79.0, 62.0, 45.0, 26.0, 27.0, 16.0, 17.0, 16.0, 12.0, 3.0, 6.0, 8.0, 7.0, 7.0, 3.0, 0.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.227327346801758e-05, -5.0661154091358185e-05, -4.904903471469879e-05, -4.74369153380394e-05, -4.5824795961380005e-05, -4.421267658472061e-05, -4.260055720806122e-05, -4.0988437831401825e-05, -3.937631845474243e-05, -3.776419907808304e-05, -3.6152079701423645e-05, -3.453996032476425e-05, -3.292784094810486e-05, -3.1315721571445465e-05, -2.9703602194786072e-05, -2.809148281812668e-05, -2.6479363441467285e-05, -2.4867244064807892e-05, -2.32551246881485e-05, -2.1643005311489105e-05, -2.0030885934829712e-05, -1.841876655817032e-05, -1.6806647181510925e-05, -1.5194527804851532e-05, -1.3582408428192139e-05, -1.1970289051532745e-05, -1.0358169674873352e-05, -8.746050298213959e-06, -7.1339309215545654e-06, -5.521811544895172e-06, -3.909692168235779e-06, -2.2975727915763855e-06, -6.854534149169922e-07, 9.266659617424011e-07, 2.5387853384017944e-06, 4.150904715061188e-06, 5.763024091720581e-06, 7.375143468379974e-06, 8.987262845039368e-06, 1.0599382221698761e-05, 1.2211501598358154e-05, 1.3823620975017548e-05, 1.543574035167694e-05, 1.7047859728336334e-05, 1.8659979104995728e-05, 2.027209848165512e-05, 2.1884217858314514e-05, 2.3496337234973907e-05, 2.51084566116333e-05, 2.6720575988292694e-05, 2.8332695364952087e-05, 2.994481474161148e-05, 3.1556934118270874e-05, 3.316905349493027e-05, 3.478117287158966e-05, 3.6393292248249054e-05, 3.800541162490845e-05, 3.961753100156784e-05, 4.1229650378227234e-05, 4.284176975488663e-05, 4.445388913154602e-05, 4.6066008508205414e-05, 4.767812788486481e-05, 4.92902472615242e-05, 5.0902366638183594e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 2.0, 7.0, 9.0, 7.0, 6.0, 14.0, 27.0, 34.0, 49.0, 72.0, 143.0, 223.0, 438.0, 764.0, 1438.0, 3576.0, 11125.0, 52283.0, 510219.0, 399832.0, 50749.0, 10896.0, 3473.0, 1470.0, 668.0, 416.0, 222.0, 134.0, 75.0, 50.0, 44.0, 24.0, 17.0, 12.0, 10.0, 6.0, 7.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.083984375, -0.0816507339477539, -0.07931709289550781, -0.07698345184326172, -0.07464981079101562, -0.07231616973876953, -0.06998252868652344, -0.06764888763427734, -0.06531524658203125, -0.06298160552978516, -0.06064796447753906, -0.05831432342529297, -0.055980682373046875, -0.05364704132080078, -0.05131340026855469, -0.048979759216308594, -0.0466461181640625, -0.044312477111816406, -0.04197883605957031, -0.03964519500732422, -0.037311553955078125, -0.03497791290283203, -0.03264427185058594, -0.030310630798339844, -0.02797698974609375, -0.025643348693847656, -0.023309707641601562, -0.02097606658935547, -0.018642425537109375, -0.01630878448486328, -0.013975143432617188, -0.011641502380371094, -0.009307861328125, -0.006974220275878906, -0.0046405792236328125, -0.0023069381713867188, 2.6702880859375e-05, 0.0023603439331054688, 0.0046939849853515625, 0.007027626037597656, 0.00936126708984375, 0.011694908142089844, 0.014028549194335938, 0.01636219024658203, 0.018695831298828125, 0.02102947235107422, 0.023363113403320312, 0.025696754455566406, 0.0280303955078125, 0.030364036560058594, 0.03269767761230469, 0.03503131866455078, 0.037364959716796875, 0.03969860076904297, 0.04203224182128906, 0.044365882873535156, 0.04669952392578125, 0.049033164978027344, 0.05136680603027344, 0.05370044708251953, 0.056034088134765625, 0.05836772918701172, 0.06070137023925781, 0.0630350112915039, 0.06536865234375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 8.0, 8.0, 9.0, 10.0, 18.0, 27.0, 31.0, 49.0, 59.0, 71.0, 59.0, 83.0, 91.0, 97.0, 77.0, 70.0, 57.0, 34.0, 39.0, 24.0, 16.0, 15.0, 7.0, 11.0, 10.0, 1.0, 4.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08868408203125, -0.0861978530883789, -0.08371162414550781, -0.08122539520263672, -0.07873916625976562, -0.07625293731689453, -0.07376670837402344, -0.07128047943115234, -0.06879425048828125, -0.06630802154541016, -0.06382179260253906, -0.06133556365966797, -0.058849334716796875, -0.05636310577392578, -0.05387687683105469, -0.051390647888183594, -0.0489044189453125, -0.046418190002441406, -0.04393196105957031, -0.04144573211669922, -0.038959503173828125, -0.03647327423095703, -0.03398704528808594, -0.031500816345214844, -0.02901458740234375, -0.026528358459472656, -0.024042129516601562, -0.02155590057373047, -0.019069671630859375, -0.01658344268798828, -0.014097213745117188, -0.011610984802246094, -0.009124755859375, -0.006638526916503906, -0.0041522979736328125, -0.0016660690307617188, 0.000820159912109375, 0.0033063888549804688, 0.0057926177978515625, 0.008278846740722656, 0.01076507568359375, 0.013251304626464844, 0.015737533569335938, 0.01822376251220703, 0.020709991455078125, 0.02319622039794922, 0.025682449340820312, 0.028168678283691406, 0.0306549072265625, 0.033141136169433594, 0.03562736511230469, 0.03811359405517578, 0.040599822998046875, 0.04308605194091797, 0.04557228088378906, 0.048058509826660156, 0.05054473876953125, 0.053030967712402344, 0.05551719665527344, 0.05800342559814453, 0.060489654541015625, 0.06297588348388672, 0.06546211242675781, 0.0679483413696289, 0.0704345703125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 16.0, 37.0, 59.0, 125.0, 194.0, 309.0, 128.0, 54.0, 32.0, 11.0, 5.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1691173315048218, -1.1052755117416382, -1.0414338111877441, -0.9775919914245605, -0.9137502908706665, -0.8499084711074829, -0.7860667109489441, -0.7222249507904053, -0.6583831906318665, -0.5945414304733276, -0.5306996703147888, -0.4668578803539276, -0.4030161201953888, -0.33917436003685, -0.27533257007598877, -0.21149080991744995, -0.14764904975891113, -0.08380728214979172, -0.019965514540672302, 0.04387626051902771, 0.10771802067756653, 0.17155978083610535, 0.23540157079696655, 0.29924333095550537, 0.3630850911140442, 0.426926851272583, 0.4907686114311218, 0.5546103715896606, 0.6184521913528442, 0.6822938919067383, 0.7461357116699219, 0.8099774718284607, 0.87381911277771, 0.9376608729362488, 1.0015026330947876, 1.0653444528579712, 1.1291861534118652, 1.1930279731750488, 1.2568697929382324, 1.3207114934921265, 1.3845531940460205, 1.448395013809204, 1.5122367143630981, 1.5760785341262817, 1.6399202346801758, 1.7037620544433594, 1.767603874206543, 1.831445574760437, 1.8952873945236206, 1.9591292142868042, 2.0229709148406982, 2.086812734603882, 2.1506545543670654, 2.21449613571167, 2.2783379554748535, 2.342179775238037, 2.4060215950012207, 2.4698634147644043, 2.533705234527588, 2.5975468158721924, 2.661388635635376, 2.7252304553985596, 2.789072275161743, 2.8529138565063477, 2.9167556762695312]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 3.0, 3.0, 7.0, 5.0, 8.0, 10.0, 13.0, 18.0, 10.0, 16.0, 15.0, 21.0, 17.0, 27.0, 34.0, 26.0, 35.0, 30.0, 33.0, 60.0, 77.0, 68.0, 55.0, 41.0, 37.0, 41.0, 39.0, 32.0, 18.0, 21.0, 25.0, 23.0, 19.0, 14.0, 19.0, 13.0, 12.0, 5.0, 4.0, 10.0, 2.0, 7.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0], "bins": [-1.3760292530059814, -1.334822416305542, -1.2936155796051025, -1.2524088621139526, -1.2112020254135132, -1.1699951887130737, -1.1287884712219238, -1.0875816345214844, -1.046374797821045, -1.0051679611206055, -0.9639611840248108, -0.9227544069290161, -0.8815475702285767, -0.8403407335281372, -0.7991339564323425, -0.7579271793365479, -0.7167203426361084, -0.675513505935669, -0.6343067288398743, -0.5930999517440796, -0.5518931150436401, -0.5106862783432007, -0.469479501247406, -0.42827269434928894, -0.3870658874511719, -0.3458590805530548, -0.30465227365493774, -0.2634454667568207, -0.2222386598587036, -0.18103185296058655, -0.13982504606246948, -0.09861823916435242, -0.05741143226623535, -0.016204625368118286, 0.02500218152999878, 0.06620898842811584, 0.10741579532623291, 0.14862260222434998, 0.18982940912246704, 0.2310362160205841, 0.27224302291870117, 0.31344982981681824, 0.3546566367149353, 0.39586344361305237, 0.43707025051116943, 0.4782770574092865, 0.5194838643074036, 0.5606906414031982, 0.6018974781036377, 0.6431043148040771, 0.6843110918998718, 0.7255178689956665, 0.766724705696106, 0.8079315423965454, 0.8491383194923401, 0.8903450965881348, 0.9315519332885742, 0.9727587699890137, 1.0139656066894531, 1.055172324180603, 1.0963791608810425, 1.137585997581482, 1.1787927150726318, 1.2199995517730713, 1.2612063884735107]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 5.0, 11.0, 7.0, 17.0, 21.0, 31.0, 52.0, 74.0, 96.0, 165.0, 239.0, 403.0, 748.0, 1827.0, 5343.0, 23953.0, 183521.0, 2011857.0, 1784221.0, 151240.0, 21146.0, 5549.0, 1922.0, 764.0, 383.0, 234.0, 153.0, 103.0, 68.0, 38.0, 29.0, 18.0, 12.0, 11.0, 5.0, 4.0, 2.0, 0.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.12451171875, -0.12095069885253906, -0.11738967895507812, -0.11382865905761719, -0.11026763916015625, -0.10670661926269531, -0.10314559936523438, -0.09958457946777344, -0.0960235595703125, -0.09246253967285156, -0.08890151977539062, -0.08534049987792969, -0.08177947998046875, -0.07821846008300781, -0.07465744018554688, -0.07109642028808594, -0.067535400390625, -0.06397438049316406, -0.060413360595703125, -0.05685234069824219, -0.05329132080078125, -0.04973030090332031, -0.046169281005859375, -0.04260826110839844, -0.0390472412109375, -0.03548622131347656, -0.031925201416015625, -0.028364181518554688, -0.02480316162109375, -0.021242141723632812, -0.017681121826171875, -0.014120101928710938, -0.01055908203125, -0.0069980621337890625, -0.003437042236328125, 0.0001239776611328125, 0.00368499755859375, 0.0072460174560546875, 0.010807037353515625, 0.014368057250976562, 0.0179290771484375, 0.021490097045898438, 0.025051116943359375, 0.028612136840820312, 0.03217315673828125, 0.03573417663574219, 0.039295196533203125, 0.04285621643066406, 0.046417236328125, 0.04997825622558594, 0.053539276123046875, 0.05710029602050781, 0.06066131591796875, 0.06422233581542969, 0.06778335571289062, 0.07134437561035156, 0.0749053955078125, 0.07846641540527344, 0.08202743530273438, 0.08558845520019531, 0.08914947509765625, 0.09271049499511719, 0.09627151489257812, 0.09983253479003906, 0.1033935546875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 10.0, 13.0, 15.0, 26.0, 29.0, 37.0, 46.0, 45.0, 65.0, 54.0, 54.0, 56.0, 68.0, 60.0, 70.0, 58.0, 48.0, 43.0, 39.0, 39.0, 24.0, 31.0, 21.0, 16.0, 13.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.1368408203125, -0.13320446014404297, -0.12956809997558594, -0.1259317398071289, -0.12229537963867188, -0.11865901947021484, -0.11502265930175781, -0.11138629913330078, -0.10774993896484375, -0.10411357879638672, -0.10047721862792969, -0.09684085845947266, -0.09320449829101562, -0.0895681381225586, -0.08593177795410156, -0.08229541778564453, -0.0786590576171875, -0.07502269744873047, -0.07138633728027344, -0.0677499771118164, -0.06411361694335938, -0.060477256774902344, -0.05684089660644531, -0.05320453643798828, -0.04956817626953125, -0.04593181610107422, -0.04229545593261719, -0.038659095764160156, -0.035022735595703125, -0.031386375427246094, -0.027750015258789062, -0.02411365509033203, -0.020477294921875, -0.01684093475341797, -0.013204574584960938, -0.009568214416503906, -0.005931854248046875, -0.0022954940795898438, 0.0013408660888671875, 0.004977226257324219, 0.00861358642578125, 0.012249946594238281, 0.015886306762695312, 0.019522666931152344, 0.023159027099609375, 0.026795387268066406, 0.030431747436523438, 0.03406810760498047, 0.0377044677734375, 0.04134082794189453, 0.04497718811035156, 0.048613548278808594, 0.052249908447265625, 0.055886268615722656, 0.05952262878417969, 0.06315898895263672, 0.06679534912109375, 0.07043170928955078, 0.07406806945800781, 0.07770442962646484, 0.08134078979492188, 0.0849771499633789, 0.08861351013183594, 0.09224987030029297, 0.09588623046875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 11.0, 14.0, 17.0, 33.0, 61.0, 67.0, 118.0, 201.0, 336.0, 660.0, 2262.0, 21291.0, 3799107.0, 360489.0, 6963.0, 1253.0, 468.0, 298.0, 218.0, 154.0, 97.0, 69.0, 29.0, 24.0, 21.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42431640625, -0.41246795654296875, -0.4006195068359375, -0.38877105712890625, -0.376922607421875, -0.36507415771484375, -0.3532257080078125, -0.34137725830078125, -0.32952880859375, -0.31768035888671875, -0.3058319091796875, -0.29398345947265625, -0.282135009765625, -0.27028656005859375, -0.2584381103515625, -0.24658966064453125, -0.2347412109375, -0.22289276123046875, -0.2110443115234375, -0.19919586181640625, -0.187347412109375, -0.17549896240234375, -0.1636505126953125, -0.15180206298828125, -0.13995361328125, -0.12810516357421875, -0.1162567138671875, -0.10440826416015625, -0.092559814453125, -0.08071136474609375, -0.0688629150390625, -0.05701446533203125, -0.045166015625, -0.03331756591796875, -0.0214691162109375, -0.00962066650390625, 0.002227783203125, 0.01407623291015625, 0.0259246826171875, 0.03777313232421875, 0.04962158203125, 0.06147003173828125, 0.0733184814453125, 0.08516693115234375, 0.097015380859375, 0.10886383056640625, 0.1207122802734375, 0.13256072998046875, 0.1444091796875, 0.15625762939453125, 0.1681060791015625, 0.17995452880859375, 0.191802978515625, 0.20365142822265625, 0.2154998779296875, 0.22734832763671875, 0.23919677734375, 0.25104522705078125, 0.2628936767578125, 0.27474212646484375, 0.286590576171875, 0.29843902587890625, 0.3102874755859375, 0.32213592529296875, 0.333984375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 10.0, 16.0, 22.0, 33.0, 53.0, 130.0, 325.0, 1118.0, 1382.0, 638.0, 186.0, 67.0, 46.0, 23.0, 8.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1553955078125, -0.1451396942138672, -0.13488388061523438, -0.12462806701660156, -0.11437225341796875, -0.10411643981933594, -0.09386062622070312, -0.08360481262207031, -0.0733489990234375, -0.06309318542480469, -0.052837371826171875, -0.04258155822753906, -0.03232574462890625, -0.022069931030273438, -0.011814117431640625, -0.0015583038330078125, 0.008697509765625, 0.018953323364257812, 0.029209136962890625, 0.03946495056152344, 0.04972076416015625, 0.05997657775878906, 0.07023239135742188, 0.08048820495605469, 0.0907440185546875, 0.10099983215332031, 0.11125564575195312, 0.12151145935058594, 0.13176727294921875, 0.14202308654785156, 0.15227890014648438, 0.1625347137451172, 0.17279052734375, 0.1830463409423828, 0.19330215454101562, 0.20355796813964844, 0.21381378173828125, 0.22406959533691406, 0.23432540893554688, 0.2445812225341797, 0.2548370361328125, 0.2650928497314453, 0.2753486633300781, 0.28560447692871094, 0.29586029052734375, 0.30611610412597656, 0.3163719177246094, 0.3266277313232422, 0.336883544921875, 0.3471393585205078, 0.3573951721191406, 0.36765098571777344, 0.37790679931640625, 0.38816261291503906, 0.3984184265136719, 0.4086742401123047, 0.4189300537109375, 0.4291858673095703, 0.4394416809082031, 0.44969749450683594, 0.45995330810546875, 0.47020912170410156, 0.4804649353027344, 0.4907207489013672, 0.5009765625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 8.0, 8.0, 9.0, 21.0, 40.0, 58.0, 100.0, 192.0, 192.0, 155.0, 91.0, 50.0, 29.0, 18.0, 8.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6926915645599365, -1.6430004835128784, -1.5933094024658203, -1.5436183214187622, -1.493927240371704, -1.444236159324646, -1.394545078277588, -1.3448539972305298, -1.2951629161834717, -1.2454718351364136, -1.1957807540893555, -1.1460896730422974, -1.0963985919952393, -1.0467075109481812, -0.997016429901123, -0.9473253488540649, -0.8976342678070068, -0.8479431867599487, -0.7982521057128906, -0.7485610246658325, -0.6988699436187744, -0.6491788625717163, -0.5994877815246582, -0.5497967004776001, -0.500105619430542, -0.4504145383834839, -0.4007234573364258, -0.3510323762893677, -0.30134129524230957, -0.25165021419525146, -0.20195913314819336, -0.15226805210113525, -0.1025770902633667, -0.052886009216308594, -0.0031949281692504883, 0.04649615287780762, 0.09618723392486572, 0.14587831497192383, 0.19556939601898193, 0.24526047706604004, 0.29495155811309814, 0.34464263916015625, 0.39433372020721436, 0.44402480125427246, 0.49371588230133057, 0.5434069633483887, 0.5930980443954468, 0.6427891254425049, 0.692480206489563, 0.7421712875366211, 0.7918623685836792, 0.8415534496307373, 0.8912445306777954, 0.9409356117248535, 0.9906266927719116, 1.0403177738189697, 1.0900088548660278, 1.139699935913086, 1.189391016960144, 1.2390820980072021, 1.2887731790542603, 1.3384642601013184, 1.3881553411483765, 1.4378464221954346, 1.4875375032424927]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 3.0, 5.0, 5.0, 7.0, 9.0, 8.0, 13.0, 17.0, 22.0, 28.0, 34.0, 25.0, 27.0, 41.0, 50.0, 40.0, 51.0, 40.0, 51.0, 41.0, 46.0, 40.0, 54.0, 45.0, 40.0, 34.0, 42.0, 29.0, 28.0, 14.0, 29.0, 8.0, 15.0, 12.0, 13.0, 12.0, 5.0, 6.0, 3.0, 7.0, 2.0, 7.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0612034797668457, -1.0328896045684814, -1.0045758485794067, -0.9762619733810425, -0.9479480981826782, -0.9196342825889587, -0.8913204669952393, -0.863006591796875, -0.8346927165985107, -0.8063789010047913, -0.778065025806427, -0.7497512102127075, -0.7214373350143433, -0.6931235194206238, -0.6648097038269043, -0.63649582862854, -0.6081820130348206, -0.5798681974411011, -0.5515543222427368, -0.5232405066490173, -0.4949266314506531, -0.4666128158569336, -0.4382989704608917, -0.40998512506484985, -0.381671279668808, -0.3533574342727661, -0.32504358887672424, -0.2967297434806824, -0.2684159278869629, -0.24010206758975983, -0.21178823709487915, -0.18347439169883728, -0.15516048669815063, -0.12684664130210876, -0.09853280335664749, -0.07021896541118622, -0.04190512001514435, -0.013591274619102478, 0.014722555875778198, 0.04303640127182007, 0.07135024666786194, 0.09966409206390381, 0.12797793745994568, 0.15629176795482635, 0.18460561335086823, 0.2129194587469101, 0.24123328924179077, 0.26954713463783264, 0.2978609800338745, 0.3261748254299164, 0.35448867082595825, 0.38280248641967773, 0.411116361618042, 0.4394301772117615, 0.46774402260780334, 0.4960578680038452, 0.5243717432022095, 0.552685558795929, 0.5809994339942932, 0.6093132495880127, 0.637627124786377, 0.6659409403800964, 0.6942547559738159, 0.7225686311721802, 0.7508824467658997]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 10.0, 11.0, 12.0, 22.0, 32.0, 51.0, 53.0, 114.0, 155.0, 238.0, 361.0, 533.0, 807.0, 1318.0, 2086.0, 3574.0, 6294.0, 11526.0, 21723.0, 42127.0, 82722.0, 150509.0, 226814.0, 214682.0, 132910.0, 71037.0, 36102.0, 18722.0, 10093.0, 5476.0, 3213.0, 1923.0, 1195.0, 669.0, 504.0, 287.0, 196.0, 148.0, 88.0, 60.0, 49.0, 27.0, 28.0, 20.0, 18.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.07720947265625, -0.07478809356689453, -0.07236671447753906, -0.0699453353881836, -0.06752395629882812, -0.06510257720947266, -0.06268119812011719, -0.06025981903076172, -0.05783843994140625, -0.05541706085205078, -0.05299568176269531, -0.050574302673339844, -0.048152923583984375, -0.045731544494628906, -0.04331016540527344, -0.04088878631591797, -0.0384674072265625, -0.03604602813720703, -0.03362464904785156, -0.031203269958496094, -0.028781890869140625, -0.026360511779785156, -0.023939132690429688, -0.02151775360107422, -0.01909637451171875, -0.01667499542236328, -0.014253616333007812, -0.011832237243652344, -0.009410858154296875, -0.006989479064941406, -0.0045680999755859375, -0.0021467208862304688, 0.000274658203125, 0.0026960372924804688, 0.0051174163818359375, 0.007538795471191406, 0.009960174560546875, 0.012381553649902344, 0.014802932739257812, 0.01722431182861328, 0.01964569091796875, 0.02206707000732422, 0.024488449096679688, 0.026909828186035156, 0.029331207275390625, 0.031752586364746094, 0.03417396545410156, 0.03659534454345703, 0.0390167236328125, 0.04143810272216797, 0.04385948181152344, 0.046280860900878906, 0.048702239990234375, 0.051123619079589844, 0.05354499816894531, 0.05596637725830078, 0.05838775634765625, 0.06080913543701172, 0.06323051452636719, 0.06565189361572266, 0.06807327270507812, 0.0704946517944336, 0.07291603088378906, 0.07533740997314453, 0.0777587890625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 8.0, 29.0, 19.0, 24.0, 42.0, 47.0, 40.0, 44.0, 49.0, 57.0, 57.0, 67.0, 66.0, 57.0, 60.0, 53.0, 49.0, 35.0, 35.0, 32.0, 36.0, 23.0, 17.0, 16.0, 8.0, 13.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1353759765625, -0.13173294067382812, -0.12808990478515625, -0.12444686889648438, -0.1208038330078125, -0.11716079711914062, -0.11351776123046875, -0.10987472534179688, -0.106231689453125, -0.10258865356445312, -0.09894561767578125, -0.09530258178710938, -0.0916595458984375, -0.08801651000976562, -0.08437347412109375, -0.08073043823242188, -0.07708740234375, -0.07344436645507812, -0.06980133056640625, -0.06615829467773438, -0.0625152587890625, -0.058872222900390625, -0.05522918701171875, -0.051586151123046875, -0.047943115234375, -0.044300079345703125, -0.04065704345703125, -0.037014007568359375, -0.0333709716796875, -0.029727935791015625, -0.02608489990234375, -0.022441864013671875, -0.018798828125, -0.015155792236328125, -0.01151275634765625, -0.007869720458984375, -0.0042266845703125, -0.000583648681640625, 0.00305938720703125, 0.006702423095703125, 0.010345458984375, 0.013988494873046875, 0.01763153076171875, 0.021274566650390625, 0.0249176025390625, 0.028560638427734375, 0.03220367431640625, 0.035846710205078125, 0.03948974609375, 0.043132781982421875, 0.04677581787109375, 0.050418853759765625, 0.0540618896484375, 0.057704925537109375, 0.06134796142578125, 0.06499099731445312, 0.068634033203125, 0.07227706909179688, 0.07592010498046875, 0.07956314086914062, 0.0832061767578125, 0.08684921264648438, 0.09049224853515625, 0.09413528442382812, 0.0977783203125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 5.0, 3.0, 2.0, 6.0, 3.0, 3.0, 10.0, 9.0, 10.0, 9.0, 13.0, 12.0, 18.0, 35.0, 44.0, 69.0, 65.0, 100.0, 162.0, 237.0, 416.0, 1062.0, 2720.0, 9716.0, 45393.0, 256048.0, 610161.0, 96289.0, 18221.0, 4546.0, 1507.0, 652.0, 333.0, 198.0, 129.0, 77.0, 69.0, 49.0, 41.0, 24.0, 17.0, 17.0, 18.0, 12.0, 8.0, 8.0, 7.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19287109375, -0.18626976013183594, -0.17966842651367188, -0.1730670928955078, -0.16646575927734375, -0.1598644256591797, -0.15326309204101562, -0.14666175842285156, -0.1400604248046875, -0.13345909118652344, -0.12685775756835938, -0.12025642395019531, -0.11365509033203125, -0.10705375671386719, -0.10045242309570312, -0.09385108947753906, -0.087249755859375, -0.08064842224121094, -0.07404708862304688, -0.06744575500488281, -0.06084442138671875, -0.05424308776855469, -0.047641754150390625, -0.04104042053222656, -0.0344390869140625, -0.027837753295898438, -0.021236419677734375, -0.014635086059570312, -0.00803375244140625, -0.0014324188232421875, 0.005168914794921875, 0.011770248413085938, 0.01837158203125, 0.024972915649414062, 0.031574249267578125, 0.03817558288574219, 0.04477691650390625, 0.05137825012207031, 0.057979583740234375, 0.06458091735839844, 0.0711822509765625, 0.07778358459472656, 0.08438491821289062, 0.09098625183105469, 0.09758758544921875, 0.10418891906738281, 0.11079025268554688, 0.11739158630371094, 0.123992919921875, 0.13059425354003906, 0.13719558715820312, 0.1437969207763672, 0.15039825439453125, 0.1569995880126953, 0.16360092163085938, 0.17020225524902344, 0.1768035888671875, 0.18340492248535156, 0.19000625610351562, 0.1966075897216797, 0.20320892333984375, 0.2098102569580078, 0.21641159057617188, 0.22301292419433594, 0.2296142578125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 7.0, 11.0, 10.0, 8.0, 15.0, 9.0, 16.0, 13.0, 19.0, 24.0, 23.0, 41.0, 33.0, 42.0, 32.0, 42.0, 53.0, 45.0, 49.0, 58.0, 49.0, 43.0, 39.0, 47.0, 31.0, 40.0, 35.0, 24.0, 24.0, 25.0, 20.0, 12.0, 16.0, 6.0, 10.0, 10.0, 5.0, 4.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.267578125, -0.2579994201660156, -0.24842071533203125, -0.23884201049804688, -0.2292633056640625, -0.21968460083007812, -0.21010589599609375, -0.20052719116210938, -0.190948486328125, -0.18136978149414062, -0.17179107666015625, -0.16221237182617188, -0.1526336669921875, -0.14305496215820312, -0.13347625732421875, -0.12389755249023438, -0.11431884765625, -0.10474014282226562, -0.09516143798828125, -0.08558273315429688, -0.0760040283203125, -0.06642532348632812, -0.05684661865234375, -0.047267913818359375, -0.037689208984375, -0.028110504150390625, -0.01853179931640625, -0.008953094482421875, 0.0006256103515625, 0.010204315185546875, 0.01978302001953125, 0.029361724853515625, 0.0389404296875, 0.048519134521484375, 0.05809783935546875, 0.06767654418945312, 0.0772552490234375, 0.08683395385742188, 0.09641265869140625, 0.10599136352539062, 0.115570068359375, 0.12514877319335938, 0.13472747802734375, 0.14430618286132812, 0.1538848876953125, 0.16346359252929688, 0.17304229736328125, 0.18262100219726562, 0.19219970703125, 0.20177841186523438, 0.21135711669921875, 0.22093582153320312, 0.2305145263671875, 0.24009323120117188, 0.24967193603515625, 0.2592506408691406, 0.268829345703125, 0.2784080505371094, 0.28798675537109375, 0.2975654602050781, 0.3071441650390625, 0.3167228698730469, 0.32630157470703125, 0.3358802795410156, 0.345458984375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 10.0, 3.0, 10.0, 7.0, 22.0, 21.0, 35.0, 44.0, 66.0, 74.0, 145.0, 225.0, 341.0, 585.0, 1078.0, 2042.0, 4062.0, 9630.0, 24833.0, 76381.0, 268753.0, 506857.0, 100031.0, 31355.0, 11690.0, 4920.0, 2410.0, 1103.0, 675.0, 368.0, 261.0, 160.0, 114.0, 78.0, 44.0, 30.0, 22.0, 18.0, 14.0, 13.0, 2.0, 3.0, 4.0, 4.0, 2.0, 2.0, 6.0, 1.0], "bins": [-0.06805419921875, -0.06622028350830078, -0.06438636779785156, -0.06255245208740234, -0.060718536376953125, -0.058884620666503906, -0.05705070495605469, -0.05521678924560547, -0.05338287353515625, -0.05154895782470703, -0.04971504211425781, -0.047881126403808594, -0.046047210693359375, -0.044213294982910156, -0.04237937927246094, -0.04054546356201172, -0.0387115478515625, -0.03687763214111328, -0.03504371643066406, -0.033209800720214844, -0.031375885009765625, -0.029541969299316406, -0.027708053588867188, -0.02587413787841797, -0.02404022216796875, -0.02220630645751953, -0.020372390747070312, -0.018538475036621094, -0.016704559326171875, -0.014870643615722656, -0.013036727905273438, -0.011202812194824219, -0.009368896484375, -0.007534980773925781, -0.0057010650634765625, -0.0038671493530273438, -0.002033233642578125, -0.00019931793212890625, 0.0016345977783203125, 0.0034685134887695312, 0.00530242919921875, 0.007136344909667969, 0.008970260620117188, 0.010804176330566406, 0.012638092041015625, 0.014472007751464844, 0.016305923461914062, 0.01813983917236328, 0.0199737548828125, 0.02180767059326172, 0.023641586303710938, 0.025475502014160156, 0.027309417724609375, 0.029143333435058594, 0.030977249145507812, 0.03281116485595703, 0.03464508056640625, 0.03647899627685547, 0.03831291198730469, 0.040146827697753906, 0.041980743408203125, 0.043814659118652344, 0.04564857482910156, 0.04748249053955078, 0.04931640625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 6.0, 4.0, 7.0, 11.0, 11.0, 27.0, 42.0, 54.0, 74.0, 83.0, 96.0, 119.0, 98.0, 98.0, 70.0, 69.0, 41.0, 24.0, 16.0, 16.0, 6.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.929304122924805e-05, -4.795379936695099e-05, -4.661455750465393e-05, -4.527531564235687e-05, -4.3936073780059814e-05, -4.2596831917762756e-05, -4.12575900554657e-05, -3.991834819316864e-05, -3.857910633087158e-05, -3.7239864468574524e-05, -3.5900622606277466e-05, -3.456138074398041e-05, -3.322213888168335e-05, -3.188289701938629e-05, -3.0543655157089233e-05, -2.9204413294792175e-05, -2.7865171432495117e-05, -2.652592957019806e-05, -2.5186687707901e-05, -2.3847445845603943e-05, -2.2508203983306885e-05, -2.1168962121009827e-05, -1.982972025871277e-05, -1.849047839641571e-05, -1.7151236534118652e-05, -1.5811994671821594e-05, -1.4472752809524536e-05, -1.3133510947227478e-05, -1.179426908493042e-05, -1.0455027222633362e-05, -9.115785360336304e-06, -7.776543498039246e-06, -6.4373016357421875e-06, -5.098059773445129e-06, -3.7588179111480713e-06, -2.419576048851013e-06, -1.080334186553955e-06, 2.5890767574310303e-07, 1.5981495380401611e-06, 2.9373914003372192e-06, 4.276633262634277e-06, 5.6158751249313354e-06, 6.9551169872283936e-06, 8.294358849525452e-06, 9.63360071182251e-06, 1.0972842574119568e-05, 1.2312084436416626e-05, 1.3651326298713684e-05, 1.4990568161010742e-05, 1.63298100233078e-05, 1.766905188560486e-05, 1.9008293747901917e-05, 2.0347535610198975e-05, 2.1686777472496033e-05, 2.302601933479309e-05, 2.436526119709015e-05, 2.5704503059387207e-05, 2.7043744921684265e-05, 2.8382986783981323e-05, 2.972222864627838e-05, 3.106147050857544e-05, 3.24007123708725e-05, 3.3739954233169556e-05, 3.5079196095466614e-05, 3.641843795776367e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 5.0, 15.0, 12.0, 31.0, 44.0, 87.0, 161.0, 404.0, 1086.0, 3202.0, 12832.0, 69203.0, 606003.0, 298139.0, 44489.0, 8846.0, 2547.0, 776.0, 344.0, 139.0, 67.0, 42.0, 30.0, 13.0, 10.0, 7.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07598876953125, -0.07305240631103516, -0.07011604309082031, -0.06717967987060547, -0.06424331665039062, -0.06130695343017578, -0.05837059020996094, -0.055434226989746094, -0.05249786376953125, -0.049561500549316406, -0.04662513732910156, -0.04368877410888672, -0.040752410888671875, -0.03781604766845703, -0.03487968444824219, -0.031943321228027344, -0.0290069580078125, -0.026070594787597656, -0.023134231567382812, -0.02019786834716797, -0.017261505126953125, -0.014325141906738281, -0.011388778686523438, -0.008452415466308594, -0.00551605224609375, -0.0025796890258789062, 0.0003566741943359375, 0.0032930374145507812, 0.006229400634765625, 0.009165763854980469, 0.012102127075195312, 0.015038490295410156, 0.017974853515625, 0.020911216735839844, 0.023847579956054688, 0.02678394317626953, 0.029720306396484375, 0.03265666961669922, 0.03559303283691406, 0.038529396057128906, 0.04146575927734375, 0.044402122497558594, 0.04733848571777344, 0.05027484893798828, 0.053211212158203125, 0.05614757537841797, 0.05908393859863281, 0.062020301818847656, 0.0649566650390625, 0.06789302825927734, 0.07082939147949219, 0.07376575469970703, 0.07670211791992188, 0.07963848114013672, 0.08257484436035156, 0.0855112075805664, 0.08844757080078125, 0.0913839340209961, 0.09432029724121094, 0.09725666046142578, 0.10019302368164062, 0.10312938690185547, 0.10606575012207031, 0.10900211334228516, 0.1119384765625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 8.0, 10.0, 14.0, 17.0, 21.0, 42.0, 46.0, 58.0, 53.0, 68.0, 74.0, 84.0, 83.0, 83.0, 89.0, 46.0, 53.0, 39.0, 35.0, 15.0, 21.0, 8.0, 14.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.09307861328125, -0.09049606323242188, -0.08791351318359375, -0.08533096313476562, -0.0827484130859375, -0.08016586303710938, -0.07758331298828125, -0.07500076293945312, -0.072418212890625, -0.06983566284179688, -0.06725311279296875, -0.06467056274414062, -0.0620880126953125, -0.059505462646484375, -0.05692291259765625, -0.054340362548828125, -0.0517578125, -0.049175262451171875, -0.04659271240234375, -0.044010162353515625, -0.0414276123046875, -0.038845062255859375, -0.03626251220703125, -0.033679962158203125, -0.031097412109375, -0.028514862060546875, -0.02593231201171875, -0.023349761962890625, -0.0207672119140625, -0.018184661865234375, -0.01560211181640625, -0.013019561767578125, -0.01043701171875, -0.007854461669921875, -0.00527191162109375, -0.002689361572265625, -0.0001068115234375, 0.002475738525390625, 0.00505828857421875, 0.007640838623046875, 0.010223388671875, 0.012805938720703125, 0.01538848876953125, 0.017971038818359375, 0.0205535888671875, 0.023136138916015625, 0.02571868896484375, 0.028301239013671875, 0.0308837890625, 0.033466339111328125, 0.03604888916015625, 0.038631439208984375, 0.0412139892578125, 0.043796539306640625, 0.04637908935546875, 0.048961639404296875, 0.051544189453125, 0.054126739501953125, 0.05670928955078125, 0.059291839599609375, 0.0618743896484375, 0.06445693969726562, 0.06703948974609375, 0.06962203979492188, 0.07220458984375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 15.0, 35.0, 66.0, 94.0, 185.0, 275.0, 160.0, 60.0, 51.0, 21.0, 9.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.5156450271606445, -2.453484296798706, -2.3913238048553467, -2.329163074493408, -2.267002582550049, -2.2048418521881104, -2.142681360244751, -2.0805206298828125, -2.018360137939453, -1.9561995267868042, -1.8940389156341553, -1.8318783044815063, -1.7697176933288574, -1.707556962966919, -1.6453964710235596, -1.583235740661621, -1.5210750102996826, -1.4589143991470337, -1.3967537879943848, -1.3345931768417358, -1.272432565689087, -1.2102718353271484, -1.148111343383789, -1.0859506130218506, -1.0237901210784912, -0.9616295099258423, -0.8994688987731934, -0.8373082876205444, -0.7751476168632507, -0.7129870057106018, -0.6508263945579529, -0.5886657238006592, -0.5265051126480103, -0.46434450149536133, -0.40218386054039, -0.3400232493877411, -0.2778626084327698, -0.21570199728012085, -0.15354138612747192, -0.09138074517250061, -0.029220134019851685, 0.03294048830866814, 0.09510111063718796, 0.15726172924041748, 0.2194223552942276, 0.2815829813480377, 0.34374359250068665, 0.40590423345565796, 0.4680648446083069, 0.5302254557609558, 0.5923860669136047, 0.6545467376708984, 0.7167073488235474, 0.7788679599761963, 0.8410285711288452, 0.9031891822814941, 0.9653497934341431, 1.027510404586792, 1.089671015739441, 1.1518316268920898, 1.2139922380447388, 1.2761528491973877, 1.3383135795593262, 1.400474190711975, 1.462634801864624]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 7.0, 7.0, 7.0, 8.0, 9.0, 14.0, 10.0, 9.0, 20.0, 25.0, 24.0, 22.0, 29.0, 23.0, 32.0, 43.0, 41.0, 51.0, 65.0, 78.0, 70.0, 50.0, 48.0, 35.0, 36.0, 38.0, 26.0, 31.0, 23.0, 17.0, 18.0, 14.0, 17.0, 8.0, 9.0, 12.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0125527381896973, -0.9771116971969604, -0.9416706562042236, -0.9062296152114868, -0.87078857421875, -0.8353475332260132, -0.7999064922332764, -0.7644654512405396, -0.7290244102478027, -0.6935833692550659, -0.6581423282623291, -0.6227012872695923, -0.5872602462768555, -0.5518192052841187, -0.5163781642913818, -0.48093709349632263, -0.4454960227012634, -0.4100549817085266, -0.3746139407157898, -0.339172899723053, -0.30373185873031616, -0.26829081773757935, -0.23284974694252014, -0.19740870594978333, -0.1619676649570465, -0.1265266239643097, -0.09108557552099228, -0.055644527077674866, -0.02020348608493805, 0.015237554907798767, 0.05067861080169678, 0.0861196517944336, 0.12156069278717041, 0.15700173377990723, 0.19244277477264404, 0.22788383066654205, 0.2633248567581177, 0.2987658977508545, 0.3342069685459137, 0.3696480095386505, 0.40508905053138733, 0.44053009152412415, 0.47597113251686096, 0.5114122033119202, 0.546853244304657, 0.5822942852973938, 0.6177353262901306, 0.6531763672828674, 0.6886174082756042, 0.7240584492683411, 0.7594994902610779, 0.7949405312538147, 0.8303815722465515, 0.8658226132392883, 0.9012637138366699, 0.9367047548294067, 0.9721457958221436, 1.0075868368148804, 1.0430278778076172, 1.078468918800354, 1.1139099597930908, 1.1493510007858276, 1.1847920417785645, 1.2202330827713013, 1.255674123764038]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 1.0, 2.0, 5.0, 1.0, 8.0, 5.0, 10.0, 9.0, 19.0, 17.0, 27.0, 37.0, 45.0, 85.0, 97.0, 148.0, 215.0, 294.0, 414.0, 738.0, 1231.0, 2574.0, 6562.0, 23199.0, 124371.0, 929319.0, 2398549.0, 596089.0, 82412.0, 16962.0, 5549.0, 2237.0, 1108.0, 656.0, 383.0, 267.0, 173.0, 141.0, 69.0, 79.0, 58.0, 24.0, 28.0, 22.0, 19.0, 11.0, 8.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0888671875, -0.08584308624267578, -0.08281898498535156, -0.07979488372802734, -0.07677078247070312, -0.0737466812133789, -0.07072257995605469, -0.06769847869873047, -0.06467437744140625, -0.06165027618408203, -0.05862617492675781, -0.055602073669433594, -0.052577972412109375, -0.049553871154785156, -0.04652976989746094, -0.04350566864013672, -0.0404815673828125, -0.03745746612548828, -0.03443336486816406, -0.031409263610839844, -0.028385162353515625, -0.025361061096191406, -0.022336959838867188, -0.01931285858154297, -0.01628875732421875, -0.013264656066894531, -0.010240554809570312, -0.007216453552246094, -0.004192352294921875, -0.0011682510375976562, 0.0018558502197265625, 0.004879951477050781, 0.007904052734375, 0.010928153991699219, 0.013952255249023438, 0.016976356506347656, 0.020000457763671875, 0.023024559020996094, 0.026048660278320312, 0.02907276153564453, 0.03209686279296875, 0.03512096405029297, 0.03814506530761719, 0.041169166564941406, 0.044193267822265625, 0.047217369079589844, 0.05024147033691406, 0.05326557159423828, 0.0562896728515625, 0.05931377410888672, 0.06233787536621094, 0.06536197662353516, 0.06838607788085938, 0.0714101791381836, 0.07443428039550781, 0.07745838165283203, 0.08048248291015625, 0.08350658416748047, 0.08653068542480469, 0.0895547866821289, 0.09257888793945312, 0.09560298919677734, 0.09862709045410156, 0.10165119171142578, 0.10467529296875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 5.0, 12.0, 12.0, 12.0, 13.0, 21.0, 32.0, 28.0, 37.0, 37.0, 38.0, 57.0, 45.0, 45.0, 65.0, 55.0, 46.0, 61.0, 59.0, 57.0, 48.0, 37.0, 37.0, 29.0, 22.0, 23.0, 14.0, 16.0, 7.0, 6.0, 8.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1190185546875, -0.11565780639648438, -0.11229705810546875, -0.10893630981445312, -0.1055755615234375, -0.10221481323242188, -0.09885406494140625, -0.09549331665039062, -0.092132568359375, -0.08877182006835938, -0.08541107177734375, -0.08205032348632812, -0.0786895751953125, -0.07532882690429688, -0.07196807861328125, -0.06860733032226562, -0.06524658203125, -0.061885833740234375, -0.05852508544921875, -0.055164337158203125, -0.0518035888671875, -0.048442840576171875, -0.04508209228515625, -0.041721343994140625, -0.038360595703125, -0.034999847412109375, -0.03163909912109375, -0.028278350830078125, -0.0249176025390625, -0.021556854248046875, -0.01819610595703125, -0.014835357666015625, -0.011474609375, -0.008113861083984375, -0.00475311279296875, -0.001392364501953125, 0.0019683837890625, 0.005329132080078125, 0.00868988037109375, 0.012050628662109375, 0.015411376953125, 0.018772125244140625, 0.02213287353515625, 0.025493621826171875, 0.0288543701171875, 0.032215118408203125, 0.03557586669921875, 0.038936614990234375, 0.04229736328125, 0.045658111572265625, 0.04901885986328125, 0.052379608154296875, 0.0557403564453125, 0.059101104736328125, 0.06246185302734375, 0.06582260131835938, 0.069183349609375, 0.07254409790039062, 0.07590484619140625, 0.07926559448242188, 0.0826263427734375, 0.08598709106445312, 0.08934783935546875, 0.09270858764648438, 0.0960693359375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 10.0, 8.0, 19.0, 55.0, 138.0, 377.0, 1928.0, 114556.0, 4070438.0, 5687.0, 723.0, 205.0, 75.0, 34.0, 8.0, 5.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78271484375, -0.7591476440429688, -0.7355804443359375, -0.7120132446289062, -0.688446044921875, -0.6648788452148438, -0.6413116455078125, -0.6177444458007812, -0.59417724609375, -0.5706100463867188, -0.5470428466796875, -0.5234756469726562, -0.499908447265625, -0.47634124755859375, -0.4527740478515625, -0.42920684814453125, -0.4056396484375, -0.38207244873046875, -0.3585052490234375, -0.33493804931640625, -0.311370849609375, -0.28780364990234375, -0.2642364501953125, -0.24066925048828125, -0.21710205078125, -0.19353485107421875, -0.1699676513671875, -0.14640045166015625, -0.122833251953125, -0.09926605224609375, -0.0756988525390625, -0.05213165283203125, -0.028564453125, -0.00499725341796875, 0.0185699462890625, 0.04213714599609375, 0.065704345703125, 0.08927154541015625, 0.1128387451171875, 0.13640594482421875, 0.15997314453125, 0.18354034423828125, 0.2071075439453125, 0.23067474365234375, 0.254241943359375, 0.27780914306640625, 0.3013763427734375, 0.32494354248046875, 0.3485107421875, 0.37207794189453125, 0.3956451416015625, 0.41921234130859375, 0.442779541015625, 0.46634674072265625, 0.4899139404296875, 0.5134811401367188, 0.53704833984375, 0.5606155395507812, 0.5841827392578125, 0.6077499389648438, 0.631317138671875, 0.6548843383789062, 0.6784515380859375, 0.7020187377929688, 0.7255859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 16.0, 14.0, 17.0, 36.0, 88.0, 189.0, 503.0, 1222.0, 1184.0, 430.0, 189.0, 86.0, 39.0, 31.0, 8.0, 8.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.42578125, -0.4156208038330078, -0.4054603576660156, -0.39529991149902344, -0.38513946533203125, -0.37497901916503906, -0.3648185729980469, -0.3546581268310547, -0.3444976806640625, -0.3343372344970703, -0.3241767883300781, -0.31401634216308594, -0.30385589599609375, -0.29369544982910156, -0.2835350036621094, -0.2733745574951172, -0.263214111328125, -0.2530536651611328, -0.24289321899414062, -0.23273277282714844, -0.22257232666015625, -0.21241188049316406, -0.20225143432617188, -0.1920909881591797, -0.1819305419921875, -0.1717700958251953, -0.16160964965820312, -0.15144920349121094, -0.14128875732421875, -0.13112831115722656, -0.12096786499023438, -0.11080741882324219, -0.10064697265625, -0.09048652648925781, -0.08032608032226562, -0.07016563415527344, -0.06000518798828125, -0.04984474182128906, -0.039684295654296875, -0.029523849487304688, -0.0193634033203125, -0.009202957153320312, 0.000957489013671875, 0.011117935180664062, 0.02127838134765625, 0.03143882751464844, 0.041599273681640625, 0.05175971984863281, 0.061920166015625, 0.07208061218261719, 0.08224105834960938, 0.09240150451660156, 0.10256195068359375, 0.11272239685058594, 0.12288284301757812, 0.1330432891845703, 0.1432037353515625, 0.1533641815185547, 0.16352462768554688, 0.17368507385253906, 0.18384552001953125, 0.19400596618652344, 0.20416641235351562, 0.2143268585205078, 0.2244873046875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 11.0, 17.0, 41.0, 61.0, 141.0, 210.0, 197.0, 141.0, 94.0, 41.0, 26.0, 9.0, 2.0, 2.0, 1.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.719484806060791, -2.6601996421813965, -2.600914239883423, -2.5416290760040283, -2.482343912124634, -2.42305850982666, -2.3637733459472656, -2.304488182067871, -2.2452027797698975, -2.185917615890503, -2.1266322135925293, -2.0673470497131348, -2.0080618858337402, -1.9487764835357666, -1.889491319656372, -1.830206036567688, -1.7709208726882935, -1.7116355895996094, -1.6523504257202148, -1.5930651426315308, -1.5337798595428467, -1.4744946956634521, -1.415209412574768, -1.355924129486084, -1.2966389656066895, -1.2373536825180054, -1.1780685186386108, -1.1187832355499268, -1.0594979524612427, -1.0002126693725586, -0.9409275054931641, -0.88164222240448, -0.8223570585250854, -0.7630718350410461, -0.7037865519523621, -0.6445013284683228, -0.5852160453796387, -0.5259308218955994, -0.46664559841156006, -0.40736034512519836, -0.34807509183883667, -0.288789838552475, -0.22950460016727448, -0.17021936178207397, -0.11093410849571228, -0.051648855209350586, 0.007636368274688721, 0.06692162156105042, 0.1262068748474121, 0.1854921281337738, 0.2447773665189743, 0.3040626049041748, 0.3633478581905365, 0.4226331114768982, 0.4819183349609375, 0.5412036180496216, 0.6004888415336609, 0.6597740650177002, 0.7190593481063843, 0.7783445715904236, 0.8376297950744629, 0.896915078163147, 0.9562003016471863, 1.0154855251312256, 1.0747708082199097]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 0.0, 6.0, 3.0, 8.0, 12.0, 13.0, 14.0, 11.0, 25.0, 27.0, 19.0, 22.0, 28.0, 31.0, 35.0, 41.0, 51.0, 50.0, 44.0, 40.0, 37.0, 51.0, 44.0, 48.0, 40.0, 40.0, 34.0, 32.0, 28.0, 17.0, 27.0, 21.0, 18.0, 11.0, 18.0, 12.0, 17.0, 6.0, 6.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.8045223355293274, -0.7798269391059875, -0.7551315426826477, -0.7304361462593079, -0.7057408094406128, -0.681045413017273, -0.6563500165939331, -0.6316546201705933, -0.6069592237472534, -0.5822638273239136, -0.5575684309005737, -0.5328730344772339, -0.508177638053894, -0.4834822714328766, -0.45878690481185913, -0.4340915083885193, -0.40939611196517944, -0.3847007155418396, -0.36000531911849976, -0.3353099524974823, -0.31061455607414246, -0.2859191596508026, -0.26122379302978516, -0.2365283966064453, -0.21183300018310547, -0.18713760375976562, -0.16244222223758698, -0.13774684071540833, -0.11305144429206848, -0.08835605531930923, -0.06366066634654999, -0.03896528482437134, -0.014269888401031494, 0.010425500571727753, 0.035120889544487, 0.059816278517246246, 0.0845116674900055, 0.10920705646276474, 0.133902445435524, 0.15859782695770264, 0.18329322338104248, 0.20798861980438232, 0.23268400132656097, 0.2573793828487396, 0.28207477927207947, 0.3067701756954193, 0.33146554231643677, 0.3561609387397766, 0.38085633516311646, 0.4055517315864563, 0.43024712800979614, 0.4549424946308136, 0.47963789105415344, 0.5043332576751709, 0.5290286540985107, 0.5537240505218506, 0.5784194469451904, 0.6031148433685303, 0.6278102397918701, 0.65250563621521, 0.6772010326385498, 0.7018963694572449, 0.7265917658805847, 0.7512871623039246, 0.7759825587272644]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 4.0, 12.0, 13.0, 19.0, 25.0, 38.0, 46.0, 81.0, 123.0, 199.0, 260.0, 424.0, 704.0, 1169.0, 1981.0, 3435.0, 6015.0, 11214.0, 21115.0, 41993.0, 82110.0, 161936.0, 259839.0, 216985.0, 116299.0, 58546.0, 29579.0, 15322.0, 8101.0, 4532.0, 2474.0, 1510.0, 917.0, 531.0, 320.0, 207.0, 154.0, 95.0, 71.0, 39.0, 42.0, 28.0, 10.0, 12.0, 7.0, 7.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07135009765625, -0.06895160675048828, -0.06655311584472656, -0.06415462493896484, -0.061756134033203125, -0.059357643127441406, -0.05695915222167969, -0.05456066131591797, -0.05216217041015625, -0.04976367950439453, -0.04736518859863281, -0.044966697692871094, -0.042568206787109375, -0.040169715881347656, -0.03777122497558594, -0.03537273406982422, -0.0329742431640625, -0.03057575225830078, -0.028177261352539062, -0.025778770446777344, -0.023380279541015625, -0.020981788635253906, -0.018583297729492188, -0.01618480682373047, -0.01378631591796875, -0.011387825012207031, -0.008989334106445312, -0.006590843200683594, -0.004192352294921875, -0.0017938613891601562, 0.0006046295166015625, 0.0030031204223632812, 0.005401611328125, 0.007800102233886719, 0.010198593139648438, 0.012597084045410156, 0.014995574951171875, 0.017394065856933594, 0.019792556762695312, 0.02219104766845703, 0.02458953857421875, 0.02698802947998047, 0.029386520385742188, 0.031785011291503906, 0.034183502197265625, 0.036581993103027344, 0.03898048400878906, 0.04137897491455078, 0.0437774658203125, 0.04617595672607422, 0.04857444763183594, 0.050972938537597656, 0.053371429443359375, 0.055769920349121094, 0.05816841125488281, 0.06056690216064453, 0.06296539306640625, 0.06536388397216797, 0.06776237487792969, 0.0701608657836914, 0.07255935668945312, 0.07495784759521484, 0.07735633850097656, 0.07975482940673828, 0.0821533203125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 9.0, 13.0, 8.0, 17.0, 13.0, 13.0, 29.0, 26.0, 30.0, 35.0, 32.0, 50.0, 50.0, 49.0, 33.0, 59.0, 47.0, 58.0, 65.0, 53.0, 45.0, 47.0, 41.0, 39.0, 29.0, 24.0, 12.0, 17.0, 22.0, 6.0, 7.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1192626953125, -0.11587905883789062, -0.11249542236328125, -0.10911178588867188, -0.1057281494140625, -0.10234451293945312, -0.09896087646484375, -0.09557723999023438, -0.092193603515625, -0.08880996704101562, -0.08542633056640625, -0.08204269409179688, -0.0786590576171875, -0.07527542114257812, -0.07189178466796875, -0.06850814819335938, -0.06512451171875, -0.061740875244140625, -0.05835723876953125, -0.054973602294921875, -0.0515899658203125, -0.048206329345703125, -0.04482269287109375, -0.041439056396484375, -0.038055419921875, -0.034671783447265625, -0.03128814697265625, -0.027904510498046875, -0.0245208740234375, -0.021137237548828125, -0.01775360107421875, -0.014369964599609375, -0.010986328125, -0.007602691650390625, -0.00421905517578125, -0.000835418701171875, 0.0025482177734375, 0.005931854248046875, 0.00931549072265625, 0.012699127197265625, 0.016082763671875, 0.019466400146484375, 0.02285003662109375, 0.026233673095703125, 0.0296173095703125, 0.033000946044921875, 0.03638458251953125, 0.039768218994140625, 0.04315185546875, 0.046535491943359375, 0.04991912841796875, 0.053302764892578125, 0.0566864013671875, 0.060070037841796875, 0.06345367431640625, 0.06683731079101562, 0.070220947265625, 0.07360458374023438, 0.07698822021484375, 0.08037185668945312, 0.0837554931640625, 0.08713912963867188, 0.09052276611328125, 0.09390640258789062, 0.0972900390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 8.0, 3.0, 10.0, 3.0, 10.0, 14.0, 17.0, 21.0, 51.0, 41.0, 73.0, 91.0, 128.0, 193.0, 274.0, 511.0, 991.0, 2297.0, 7997.0, 44482.0, 615634.0, 329124.0, 35348.0, 6860.0, 2087.0, 823.0, 493.0, 271.0, 213.0, 147.0, 82.0, 70.0, 49.0, 34.0, 24.0, 18.0, 10.0, 13.0, 10.0, 8.0, 6.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.271240234375, -0.26274871826171875, -0.2542572021484375, -0.24576568603515625, -0.237274169921875, -0.22878265380859375, -0.2202911376953125, -0.21179962158203125, -0.20330810546875, -0.19481658935546875, -0.1863250732421875, -0.17783355712890625, -0.169342041015625, -0.16085052490234375, -0.1523590087890625, -0.14386749267578125, -0.1353759765625, -0.12688446044921875, -0.1183929443359375, -0.10990142822265625, -0.101409912109375, -0.09291839599609375, -0.0844268798828125, -0.07593536376953125, -0.06744384765625, -0.05895233154296875, -0.0504608154296875, -0.04196929931640625, -0.033477783203125, -0.02498626708984375, -0.0164947509765625, -0.00800323486328125, 0.00048828125, 0.00897979736328125, 0.0174713134765625, 0.02596282958984375, 0.034454345703125, 0.04294586181640625, 0.0514373779296875, 0.05992889404296875, 0.06842041015625, 0.07691192626953125, 0.0854034423828125, 0.09389495849609375, 0.102386474609375, 0.11087799072265625, 0.1193695068359375, 0.12786102294921875, 0.1363525390625, 0.14484405517578125, 0.1533355712890625, 0.16182708740234375, 0.170318603515625, 0.17881011962890625, 0.1873016357421875, 0.19579315185546875, 0.20428466796875, 0.21277618408203125, 0.2212677001953125, 0.22975921630859375, 0.238250732421875, 0.24674224853515625, 0.2552337646484375, 0.26372528076171875, 0.272216796875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 9.0, 6.0, 12.0, 16.0, 25.0, 14.0, 34.0, 43.0, 52.0, 49.0, 58.0, 69.0, 72.0, 71.0, 84.0, 76.0, 59.0, 51.0, 41.0, 34.0, 30.0, 27.0, 15.0, 13.0, 14.0, 6.0, 5.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52490234375, -0.5081634521484375, -0.491424560546875, -0.4746856689453125, -0.45794677734375, -0.4412078857421875, -0.424468994140625, -0.4077301025390625, -0.3909912109375, -0.3742523193359375, -0.357513427734375, -0.3407745361328125, -0.32403564453125, -0.3072967529296875, -0.290557861328125, -0.2738189697265625, -0.257080078125, -0.2403411865234375, -0.223602294921875, -0.2068634033203125, -0.19012451171875, -0.1733856201171875, -0.156646728515625, -0.1399078369140625, -0.1231689453125, -0.1064300537109375, -0.089691162109375, -0.0729522705078125, -0.05621337890625, -0.0394744873046875, -0.022735595703125, -0.0059967041015625, 0.0107421875, 0.0274810791015625, 0.044219970703125, 0.0609588623046875, 0.07769775390625, 0.0944366455078125, 0.111175537109375, 0.1279144287109375, 0.1446533203125, 0.1613922119140625, 0.178131103515625, 0.1948699951171875, 0.21160888671875, 0.2283477783203125, 0.245086669921875, 0.2618255615234375, 0.278564453125, 0.2953033447265625, 0.312042236328125, 0.3287811279296875, 0.34552001953125, 0.3622589111328125, 0.378997802734375, 0.3957366943359375, 0.4124755859375, 0.4292144775390625, 0.445953369140625, 0.4626922607421875, 0.47943115234375, 0.4961700439453125, 0.512908935546875, 0.5296478271484375, 0.54638671875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 10.0, 7.0, 9.0, 7.0, 16.0, 27.0, 39.0, 59.0, 92.0, 140.0, 292.0, 561.0, 1199.0, 2931.0, 7671.0, 25654.0, 124552.0, 741216.0, 108153.0, 23538.0, 7302.0, 2706.0, 1162.0, 562.0, 281.0, 163.0, 86.0, 47.0, 24.0, 18.0, 18.0, 10.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09222412109375, -0.08954811096191406, -0.08687210083007812, -0.08419609069824219, -0.08152008056640625, -0.07884407043457031, -0.07616806030273438, -0.07349205017089844, -0.0708160400390625, -0.06814002990722656, -0.06546401977539062, -0.06278800964355469, -0.06011199951171875, -0.05743598937988281, -0.054759979248046875, -0.05208396911621094, -0.049407958984375, -0.04673194885253906, -0.044055938720703125, -0.04137992858886719, -0.03870391845703125, -0.03602790832519531, -0.033351898193359375, -0.030675888061523438, -0.0279998779296875, -0.025323867797851562, -0.022647857666015625, -0.019971847534179688, -0.01729583740234375, -0.014619827270507812, -0.011943817138671875, -0.009267807006835938, -0.006591796875, -0.0039157867431640625, -0.001239776611328125, 0.0014362335205078125, 0.00411224365234375, 0.0067882537841796875, 0.009464263916015625, 0.012140274047851562, 0.0148162841796875, 0.017492294311523438, 0.020168304443359375, 0.022844314575195312, 0.02552032470703125, 0.028196334838867188, 0.030872344970703125, 0.03354835510253906, 0.036224365234375, 0.03890037536621094, 0.041576385498046875, 0.04425239562988281, 0.04692840576171875, 0.04960441589355469, 0.052280426025390625, 0.05495643615722656, 0.0576324462890625, 0.06030845642089844, 0.06298446655273438, 0.06566047668457031, 0.06833648681640625, 0.07101249694824219, 0.07368850708007812, 0.07636451721191406, 0.07904052734375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 6.0, 5.0, 5.0, 16.0, 7.0, 15.0, 16.0, 24.0, 29.0, 36.0, 67.0, 92.0, 118.0, 117.0, 122.0, 83.0, 58.0, 46.0, 28.0, 26.0, 24.0, 8.0, 9.0, 8.0, 9.0, 3.0, 7.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1961669921875e-05, -4.074070602655411e-05, -3.9519742131233215e-05, -3.829877823591232e-05, -3.707781434059143e-05, -3.585685044527054e-05, -3.4635886549949646e-05, -3.3414922654628754e-05, -3.219395875930786e-05, -3.097299486398697e-05, -2.9752030968666077e-05, -2.8531067073345184e-05, -2.7310103178024292e-05, -2.60891392827034e-05, -2.4868175387382507e-05, -2.3647211492061615e-05, -2.2426247596740723e-05, -2.120528370141983e-05, -1.9984319806098938e-05, -1.8763355910778046e-05, -1.7542392015457153e-05, -1.632142812013626e-05, -1.5100464224815369e-05, -1.3879500329494476e-05, -1.2658536434173584e-05, -1.1437572538852692e-05, -1.02166086435318e-05, -8.995644748210907e-06, -7.774680852890015e-06, -6.553716957569122e-06, -5.33275306224823e-06, -4.111789166927338e-06, -2.8908252716064453e-06, -1.669861376285553e-06, -4.4889748096466064e-07, 7.720664143562317e-07, 1.993030309677124e-06, 3.2139942049980164e-06, 4.434958100318909e-06, 5.655921995639801e-06, 6.876885890960693e-06, 8.097849786281586e-06, 9.318813681602478e-06, 1.053977757692337e-05, 1.1760741472244263e-05, 1.2981705367565155e-05, 1.4202669262886047e-05, 1.542363315820694e-05, 1.6644597053527832e-05, 1.7865560948848724e-05, 1.9086524844169617e-05, 2.030748873949051e-05, 2.15284526348114e-05, 2.2749416530132294e-05, 2.3970380425453186e-05, 2.519134432077408e-05, 2.641230821609497e-05, 2.7633272111415863e-05, 2.8854236006736755e-05, 3.0075199902057648e-05, 3.129616379737854e-05, 3.251712769269943e-05, 3.3738091588020325e-05, 3.495905548334122e-05, 3.618001937866211e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 9.0, 15.0, 16.0, 23.0, 34.0, 68.0, 102.0, 202.0, 394.0, 915.0, 2607.0, 9587.0, 62196.0, 792126.0, 155123.0, 18554.0, 4177.0, 1288.0, 552.0, 234.0, 118.0, 71.0, 44.0, 39.0, 21.0, 17.0, 8.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.149169921875, -0.14550399780273438, -0.14183807373046875, -0.13817214965820312, -0.1345062255859375, -0.13084030151367188, -0.12717437744140625, -0.12350845336914062, -0.119842529296875, -0.11617660522460938, -0.11251068115234375, -0.10884475708007812, -0.1051788330078125, -0.10151290893554688, -0.09784698486328125, -0.09418106079101562, -0.09051513671875, -0.08684921264648438, -0.08318328857421875, -0.07951736450195312, -0.0758514404296875, -0.07218551635742188, -0.06851959228515625, -0.06485366821289062, -0.061187744140625, -0.057521820068359375, -0.05385589599609375, -0.050189971923828125, -0.0465240478515625, -0.042858123779296875, -0.03919219970703125, -0.035526275634765625, -0.0318603515625, -0.028194427490234375, -0.02452850341796875, -0.020862579345703125, -0.0171966552734375, -0.013530731201171875, -0.00986480712890625, -0.006198883056640625, -0.002532958984375, 0.001132965087890625, 0.00479888916015625, 0.008464813232421875, 0.0121307373046875, 0.015796661376953125, 0.01946258544921875, 0.023128509521484375, 0.02679443359375, 0.030460357666015625, 0.03412628173828125, 0.037792205810546875, 0.0414581298828125, 0.045124053955078125, 0.04878997802734375, 0.052455902099609375, 0.056121826171875, 0.059787750244140625, 0.06345367431640625, 0.06711959838867188, 0.0707855224609375, 0.07445144653320312, 0.07811737060546875, 0.08178329467773438, 0.08544921875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 9.0, 2.0, 8.0, 6.0, 8.0, 9.0, 18.0, 20.0, 22.0, 31.0, 51.0, 57.0, 81.0, 106.0, 120.0, 103.0, 101.0, 53.0, 37.0, 40.0, 22.0, 22.0, 17.0, 22.0, 15.0, 7.0, 7.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.128173828125, -0.12515735626220703, -0.12214088439941406, -0.1191244125366211, -0.11610794067382812, -0.11309146881103516, -0.11007499694824219, -0.10705852508544922, -0.10404205322265625, -0.10102558135986328, -0.09800910949707031, -0.09499263763427734, -0.09197616577148438, -0.0889596939086914, -0.08594322204589844, -0.08292675018310547, -0.0799102783203125, -0.07689380645751953, -0.07387733459472656, -0.0708608627319336, -0.06784439086914062, -0.06482791900634766, -0.06181144714355469, -0.05879497528076172, -0.05577850341796875, -0.05276203155517578, -0.04974555969238281, -0.046729087829589844, -0.043712615966796875, -0.040696144104003906, -0.03767967224121094, -0.03466320037841797, -0.031646728515625, -0.02863025665283203, -0.025613784790039062, -0.022597312927246094, -0.019580841064453125, -0.016564369201660156, -0.013547897338867188, -0.010531425476074219, -0.00751495361328125, -0.004498481750488281, -0.0014820098876953125, 0.0015344619750976562, 0.004550933837890625, 0.007567405700683594, 0.010583877563476562, 0.013600349426269531, 0.0166168212890625, 0.01963329315185547, 0.022649765014648438, 0.025666236877441406, 0.028682708740234375, 0.031699180603027344, 0.03471565246582031, 0.03773212432861328, 0.04074859619140625, 0.04376506805419922, 0.04678153991699219, 0.049798011779785156, 0.052814483642578125, 0.055830955505371094, 0.05884742736816406, 0.06186389923095703, 0.06488037109375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 9.0, 13.0, 19.0, 32.0, 52.0, 107.0, 148.0, 301.0, 117.0, 75.0, 45.0, 33.0, 17.0, 11.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1613118648529053, -2.1052229404449463, -2.0491340160369873, -1.9930450916290283, -1.9369560480117798, -1.8808671236038208, -1.8247781991958618, -1.7686892747879028, -1.7126003503799438, -1.6565114259719849, -1.6004225015640259, -1.5443334579467773, -1.4882445335388184, -1.4321556091308594, -1.3760666847229004, -1.3199777603149414, -1.2638888359069824, -1.2077999114990234, -1.1517109870910645, -1.0956220626831055, -1.039533019065857, -0.983444094657898, -0.927355170249939, -0.87126624584198, -0.8151772022247314, -0.7590882778167725, -0.7029992938041687, -0.6469103693962097, -0.5908214449882507, -0.534732460975647, -0.478643536567688, -0.422554612159729, -0.36646568775177, -0.31037673354148865, -0.25428780913352966, -0.1981988549232483, -0.1421099156141281, -0.08602097630500793, -0.029932022094726562, 0.026156902313232422, 0.0822458565235138, 0.13833479583263397, 0.19442373514175415, 0.2505126893520355, 0.3066016435623169, 0.3626905679702759, 0.41877952218055725, 0.47486844658851624, 0.5309574007987976, 0.5870463252067566, 0.6431353092193604, 0.6992242336273193, 0.7553131580352783, 0.8114020824432373, 0.8674910664558411, 0.9235799908638, 0.9796689748764038, 1.0357578992843628, 1.0918468236923218, 1.1479358673095703, 1.2040247917175293, 1.2601137161254883, 1.3162026405334473, 1.3722915649414062, 1.4283804893493652]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 7.0, 3.0, 7.0, 9.0, 14.0, 14.0, 10.0, 14.0, 17.0, 14.0, 23.0, 23.0, 29.0, 20.0, 30.0, 36.0, 43.0, 69.0, 103.0, 101.0, 72.0, 46.0, 42.0, 29.0, 29.0, 29.0, 19.0, 20.0, 14.0, 15.0, 18.0, 10.0, 10.0, 7.0, 4.0, 6.0, 7.0, 8.0, 2.0, 8.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3526108264923096, -1.3089009523391724, -1.2651911973953247, -1.2214813232421875, -1.1777715682983398, -1.1340616941452026, -1.0903518199920654, -1.0466420650482178, -1.0029321908950806, -0.9592223763465881, -0.9155125617980957, -0.8718026876449585, -0.8280928730964661, -0.7843830585479736, -0.7406731843948364, -0.696963369846344, -0.6532535552978516, -0.6095437407493591, -0.5658339262008667, -0.5221240520477295, -0.47841423749923706, -0.43470442295074463, -0.3909945785999298, -0.347284734249115, -0.30357491970062256, -0.2598651051521301, -0.2161552608013153, -0.17244543135166168, -0.12873560190200806, -0.08502577245235443, -0.041315943002700806, 0.0023939013481140137, 0.046103835105895996, 0.08981366455554962, 0.13352349400520325, 0.17723332345485687, 0.2209431529045105, 0.26465296745300293, 0.30836281180381775, 0.35207265615463257, 0.395782470703125, 0.43949228525161743, 0.48320212960243225, 0.5269119739532471, 0.5706217885017395, 0.6143316030502319, 0.6580414772033691, 0.7017512917518616, 0.745461106300354, 0.7891709208488464, 0.8328807353973389, 0.8765906095504761, 0.9203004240989685, 0.9640102386474609, 1.0077201128005981, 1.0514299869537354, 1.095139741897583, 1.1388496160507202, 1.1825593709945679, 1.226269245147705, 1.2699790000915527, 1.31368887424469, 1.3573987483978271, 1.4011085033416748, 1.444818377494812]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 8.0, 15.0, 14.0, 19.0, 23.0, 29.0, 43.0, 41.0, 53.0, 70.0, 109.0, 182.0, 299.0, 605.0, 1388.0, 4393.0, 25314.0, 392459.0, 3037558.0, 679716.0, 42491.0, 6054.0, 1780.0, 688.0, 286.0, 183.0, 92.0, 71.0, 54.0, 55.0, 41.0, 35.0, 33.0, 19.0, 17.0, 13.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15380859375, -0.14861106872558594, -0.14341354370117188, -0.1382160186767578, -0.13301849365234375, -0.1278209686279297, -0.12262344360351562, -0.11742591857910156, -0.1122283935546875, -0.10703086853027344, -0.10183334350585938, -0.09663581848144531, -0.09143829345703125, -0.08624076843261719, -0.08104324340820312, -0.07584571838378906, -0.070648193359375, -0.06545066833496094, -0.060253143310546875, -0.05505561828613281, -0.04985809326171875, -0.04466056823730469, -0.039463043212890625, -0.03426551818847656, -0.0290679931640625, -0.023870468139648438, -0.018672943115234375, -0.013475418090820312, -0.00827789306640625, -0.0030803680419921875, 0.002117156982421875, 0.0073146820068359375, 0.01251220703125, 0.017709732055664062, 0.022907257080078125, 0.028104782104492188, 0.03330230712890625, 0.03849983215332031, 0.043697357177734375, 0.04889488220214844, 0.0540924072265625, 0.05928993225097656, 0.06448745727539062, 0.06968498229980469, 0.07488250732421875, 0.08008003234863281, 0.08527755737304688, 0.09047508239746094, 0.095672607421875, 0.10087013244628906, 0.10606765747070312, 0.11126518249511719, 0.11646270751953125, 0.12166023254394531, 0.12685775756835938, 0.13205528259277344, 0.1372528076171875, 0.14245033264160156, 0.14764785766601562, 0.1528453826904297, 0.15804290771484375, 0.1632404327392578, 0.16843795776367188, 0.17363548278808594, 0.1788330078125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 8.0, 8.0, 4.0, 12.0, 14.0, 13.0, 22.0, 26.0, 24.0, 38.0, 37.0, 38.0, 47.0, 30.0, 59.0, 46.0, 42.0, 56.0, 39.0, 55.0, 60.0, 42.0, 35.0, 42.0, 40.0, 35.0, 19.0, 20.0, 20.0, 18.0, 11.0, 9.0, 6.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11773681640625, -0.11440181732177734, -0.11106681823730469, -0.10773181915283203, -0.10439682006835938, -0.10106182098388672, -0.09772682189941406, -0.0943918228149414, -0.09105682373046875, -0.0877218246459961, -0.08438682556152344, -0.08105182647705078, -0.07771682739257812, -0.07438182830810547, -0.07104682922363281, -0.06771183013916016, -0.0643768310546875, -0.061041831970214844, -0.05770683288574219, -0.05437183380126953, -0.051036834716796875, -0.04770183563232422, -0.04436683654785156, -0.041031837463378906, -0.03769683837890625, -0.034361839294433594, -0.031026840209960938, -0.02769184112548828, -0.024356842041015625, -0.02102184295654297, -0.017686843872070312, -0.014351844787597656, -0.011016845703125, -0.007681846618652344, -0.0043468475341796875, -0.0010118484497070312, 0.002323150634765625, 0.005658149719238281, 0.008993148803710938, 0.012328147888183594, 0.01566314697265625, 0.018998146057128906, 0.022333145141601562, 0.02566814422607422, 0.029003143310546875, 0.03233814239501953, 0.03567314147949219, 0.039008140563964844, 0.0423431396484375, 0.045678138732910156, 0.04901313781738281, 0.05234813690185547, 0.055683135986328125, 0.05901813507080078, 0.06235313415527344, 0.0656881332397461, 0.06902313232421875, 0.0723581314086914, 0.07569313049316406, 0.07902812957763672, 0.08236312866210938, 0.08569812774658203, 0.08903312683105469, 0.09236812591552734, 0.095703125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 13.0, 14.0, 24.0, 36.0, 67.0, 128.0, 255.0, 738.0, 2635.0, 32149.0, 3936723.0, 213263.0, 6369.0, 1098.0, 374.0, 188.0, 75.0, 45.0, 30.0, 15.0, 13.0, 2.0, 8.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.50390625, -0.49018096923828125, -0.4764556884765625, -0.46273040771484375, -0.449005126953125, -0.43527984619140625, -0.4215545654296875, -0.40782928466796875, -0.39410400390625, -0.38037872314453125, -0.3666534423828125, -0.35292816162109375, -0.339202880859375, -0.32547760009765625, -0.3117523193359375, -0.29802703857421875, -0.2843017578125, -0.27057647705078125, -0.2568511962890625, -0.24312591552734375, -0.229400634765625, -0.21567535400390625, -0.2019500732421875, -0.18822479248046875, -0.17449951171875, -0.16077423095703125, -0.1470489501953125, -0.13332366943359375, -0.119598388671875, -0.10587310791015625, -0.0921478271484375, -0.07842254638671875, -0.064697265625, -0.05097198486328125, -0.0372467041015625, -0.02352142333984375, -0.009796142578125, 0.00392913818359375, 0.0176544189453125, 0.03137969970703125, 0.04510498046875, 0.05883026123046875, 0.0725555419921875, 0.08628082275390625, 0.100006103515625, 0.11373138427734375, 0.1274566650390625, 0.14118194580078125, 0.1549072265625, 0.16863250732421875, 0.1823577880859375, 0.19608306884765625, 0.209808349609375, 0.22353363037109375, 0.2372589111328125, 0.25098419189453125, 0.26470947265625, 0.27843475341796875, 0.2921600341796875, 0.30588531494140625, 0.319610595703125, 0.33333587646484375, 0.3470611572265625, 0.36078643798828125, 0.37451171875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 4.0, 4.0, 5.0, 4.0, 19.0, 25.0, 30.0, 38.0, 69.0, 103.0, 178.0, 336.0, 640.0, 892.0, 728.0, 420.0, 248.0, 114.0, 79.0, 49.0, 24.0, 21.0, 14.0, 9.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2020263671875, -0.19414329528808594, -0.18626022338867188, -0.1783771514892578, -0.17049407958984375, -0.1626110076904297, -0.15472793579101562, -0.14684486389160156, -0.1389617919921875, -0.13107872009277344, -0.12319564819335938, -0.11531257629394531, -0.10742950439453125, -0.09954643249511719, -0.09166336059570312, -0.08378028869628906, -0.075897216796875, -0.06801414489746094, -0.060131072998046875, -0.05224800109863281, -0.04436492919921875, -0.03648185729980469, -0.028598785400390625, -0.020715713500976562, -0.0128326416015625, -0.0049495697021484375, 0.002933502197265625, 0.010816574096679688, 0.01869964599609375, 0.026582717895507812, 0.034465789794921875, 0.04234886169433594, 0.05023193359375, 0.05811500549316406, 0.06599807739257812, 0.07388114929199219, 0.08176422119140625, 0.08964729309082031, 0.09753036499023438, 0.10541343688964844, 0.1132965087890625, 0.12117958068847656, 0.12906265258789062, 0.1369457244873047, 0.14482879638671875, 0.1527118682861328, 0.16059494018554688, 0.16847801208496094, 0.176361083984375, 0.18424415588378906, 0.19212722778320312, 0.2000102996826172, 0.20789337158203125, 0.2157764434814453, 0.22365951538085938, 0.23154258728027344, 0.2394256591796875, 0.24730873107910156, 0.2551918029785156, 0.2630748748779297, 0.27095794677734375, 0.2788410186767578, 0.2867240905761719, 0.29460716247558594, 0.302490234375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 13.0, 34.0, 64.0, 223.0, 317.0, 208.0, 98.0, 18.0, 14.0, 8.0, 4.0, 2.0], "bins": [-5.664047718048096, -5.56368350982666, -5.463318824768066, -5.362954616546631, -5.262590408325195, -5.162225723266602, -5.061861515045166, -4.9614973068237305, -4.861132621765137, -4.760768413543701, -4.660403728485107, -4.560039520263672, -4.459675312042236, -4.359310626983643, -4.258946418762207, -4.158581733703613, -4.058217525482178, -3.957853078842163, -3.8574888706207275, -3.757124423980713, -3.6567599773406982, -3.5563955307006836, -3.456031322479248, -3.3556668758392334, -3.255302667617798, -3.154938220977783, -3.0545740127563477, -2.954209566116333, -2.8538451194763184, -2.753480911254883, -2.653116464614868, -2.5527520179748535, -2.4523873329162598, -2.352022886276245, -2.2516586780548096, -2.151294231414795, -2.0509297847747803, -1.9505654573440552, -1.85020112991333, -1.7498366832733154, -1.6494724750518799, -1.5491081476211548, -1.4487437009811401, -1.348379373550415, -1.2480149269104004, -1.1476505994796753, -1.0472862720489502, -0.9469218254089355, -0.8465573787689209, -0.746192991733551, -0.6458286046981812, -0.545464277267456, -0.4450998604297638, -0.3447355031967163, -0.24437111616134644, -0.14400672912597656, -0.04364234209060669, 0.05672203749418259, 0.15708641707897186, 0.25745078921318054, 0.3578151762485504, 0.4581795334815979, 0.5585439205169678, 0.6589083075523376, 0.7592726945877075]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 3.0, 8.0, 9.0, 5.0, 8.0, 11.0, 13.0, 20.0, 32.0, 24.0, 23.0, 27.0, 41.0, 36.0, 40.0, 41.0, 58.0, 66.0, 58.0, 52.0, 60.0, 46.0, 53.0, 30.0, 40.0, 38.0, 22.0, 29.0, 22.0, 16.0, 16.0, 13.0, 6.0, 6.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8728641867637634, -0.8426277041435242, -0.8123912215232849, -0.7821547985076904, -0.7519183158874512, -0.7216818332672119, -0.6914453506469727, -0.6612088680267334, -0.6309723854064941, -0.6007359027862549, -0.5704994201660156, -0.5402629375457764, -0.5100265145301819, -0.4797900319099426, -0.44955354928970337, -0.4193170666694641, -0.38908064365386963, -0.35884416103363037, -0.3286077082157135, -0.29837122559547424, -0.2681347727775574, -0.23789829015731812, -0.20766180753707886, -0.1774253398180008, -0.14718887209892273, -0.11695240437984467, -0.086715929210186, -0.056479454040527344, -0.02624298632144928, 0.003993481397628784, 0.03422996401786804, 0.0644664317369461, 0.0947028398513794, 0.12493930757045746, 0.15517577528953552, 0.18541225790977478, 0.21564872562885284, 0.2458851933479309, 0.27612167596817017, 0.3063581585884094, 0.3365946114063263, 0.36683109402656555, 0.3970675468444824, 0.4273040294647217, 0.45754051208496094, 0.4877769649028778, 0.5180134773254395, 0.5482499003410339, 0.5784863829612732, 0.6087228655815125, 0.6389593482017517, 0.6691957712173462, 0.6994322538375854, 0.7296687364578247, 0.759905219078064, 0.7901417016983032, 0.8203781843185425, 0.8506146669387817, 0.880851149559021, 0.9110876321792603, 0.9413240551948547, 0.971560537815094, 1.0017969608306885, 1.0320334434509277, 1.062269926071167]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 8.0, 8.0, 12.0, 13.0, 20.0, 34.0, 42.0, 72.0, 113.0, 180.0, 295.0, 442.0, 801.0, 1307.0, 2262.0, 3975.0, 7678.0, 15827.0, 35103.0, 83079.0, 219813.0, 369613.0, 180276.0, 69035.0, 29699.0, 13546.0, 6869.0, 3565.0, 1871.0, 1169.0, 667.0, 408.0, 279.0, 155.0, 119.0, 60.0, 53.0, 25.0, 19.0, 21.0, 8.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12261962890625, -0.1187143325805664, -0.11480903625488281, -0.11090373992919922, -0.10699844360351562, -0.10309314727783203, -0.09918785095214844, -0.09528255462646484, -0.09137725830078125, -0.08747196197509766, -0.08356666564941406, -0.07966136932373047, -0.07575607299804688, -0.07185077667236328, -0.06794548034667969, -0.0640401840209961, -0.0601348876953125, -0.056229591369628906, -0.05232429504394531, -0.04841899871826172, -0.044513702392578125, -0.04060840606689453, -0.03670310974121094, -0.032797813415527344, -0.02889251708984375, -0.024987220764160156, -0.021081924438476562, -0.01717662811279297, -0.013271331787109375, -0.009366035461425781, -0.0054607391357421875, -0.0015554428100585938, 0.002349853515625, 0.006255149841308594, 0.010160446166992188, 0.014065742492675781, 0.017971038818359375, 0.02187633514404297, 0.025781631469726562, 0.029686927795410156, 0.03359222412109375, 0.037497520446777344, 0.04140281677246094, 0.04530811309814453, 0.049213409423828125, 0.05311870574951172, 0.05702400207519531, 0.060929298400878906, 0.0648345947265625, 0.0687398910522461, 0.07264518737792969, 0.07655048370361328, 0.08045578002929688, 0.08436107635498047, 0.08826637268066406, 0.09217166900634766, 0.09607696533203125, 0.09998226165771484, 0.10388755798339844, 0.10779285430908203, 0.11169815063476562, 0.11560344696044922, 0.11950874328613281, 0.1234140396118164, 0.1273193359375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 5.0, 6.0, 16.0, 12.0, 10.0, 22.0, 21.0, 18.0, 27.0, 29.0, 38.0, 40.0, 53.0, 44.0, 47.0, 62.0, 24.0, 52.0, 38.0, 56.0, 51.0, 47.0, 37.0, 27.0, 29.0, 34.0, 22.0, 24.0, 19.0, 15.0, 19.0, 11.0, 12.0, 6.0, 4.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.11328125, -0.11006927490234375, -0.1068572998046875, -0.10364532470703125, -0.100433349609375, -0.09722137451171875, -0.0940093994140625, -0.09079742431640625, -0.08758544921875, -0.08437347412109375, -0.0811614990234375, -0.07794952392578125, -0.074737548828125, -0.07152557373046875, -0.0683135986328125, -0.06510162353515625, -0.0618896484375, -0.05867767333984375, -0.0554656982421875, -0.05225372314453125, -0.049041748046875, -0.04582977294921875, -0.0426177978515625, -0.03940582275390625, -0.03619384765625, -0.03298187255859375, -0.0297698974609375, -0.02655792236328125, -0.023345947265625, -0.02013397216796875, -0.0169219970703125, -0.01371002197265625, -0.010498046875, -0.00728607177734375, -0.0040740966796875, -0.00086212158203125, 0.002349853515625, 0.00556182861328125, 0.0087738037109375, 0.01198577880859375, 0.01519775390625, 0.01840972900390625, 0.0216217041015625, 0.02483367919921875, 0.028045654296875, 0.03125762939453125, 0.0344696044921875, 0.03768157958984375, 0.0408935546875, 0.04410552978515625, 0.0473175048828125, 0.05052947998046875, 0.053741455078125, 0.05695343017578125, 0.0601654052734375, 0.06337738037109375, 0.06658935546875, 0.06980133056640625, 0.0730133056640625, 0.07622528076171875, 0.079437255859375, 0.08264923095703125, 0.0858612060546875, 0.08907318115234375, 0.09228515625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 7.0, 9.0, 16.0, 17.0, 17.0, 35.0, 40.0, 80.0, 102.0, 131.0, 290.0, 475.0, 943.0, 2185.0, 10887.0, 338912.0, 677141.0, 12686.0, 2350.0, 990.0, 469.0, 277.0, 177.0, 109.0, 68.0, 44.0, 26.0, 26.0, 15.0, 12.0, 11.0, 3.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.448974609375, -0.4345054626464844, -0.42003631591796875, -0.4055671691894531, -0.3910980224609375, -0.3766288757324219, -0.36215972900390625, -0.3476905822753906, -0.333221435546875, -0.3187522888183594, -0.30428314208984375, -0.2898139953613281, -0.2753448486328125, -0.2608757019042969, -0.24640655517578125, -0.23193740844726562, -0.21746826171875, -0.20299911499023438, -0.18852996826171875, -0.17406082153320312, -0.1595916748046875, -0.14512252807617188, -0.13065338134765625, -0.11618423461914062, -0.101715087890625, -0.08724594116210938, -0.07277679443359375, -0.058307647705078125, -0.0438385009765625, -0.029369354248046875, -0.01490020751953125, -0.000431060791015625, 0.0140380859375, 0.028507232666015625, 0.04297637939453125, 0.057445526123046875, 0.0719146728515625, 0.08638381958007812, 0.10085296630859375, 0.11532211303710938, 0.129791259765625, 0.14426040649414062, 0.15872955322265625, 0.17319869995117188, 0.1876678466796875, 0.20213699340820312, 0.21660614013671875, 0.23107528686523438, 0.24554443359375, 0.2600135803222656, 0.27448272705078125, 0.2889518737792969, 0.3034210205078125, 0.3178901672363281, 0.33235931396484375, 0.3468284606933594, 0.361297607421875, 0.3757667541503906, 0.39023590087890625, 0.4047050476074219, 0.4191741943359375, 0.4336433410644531, 0.44811248779296875, 0.4625816345214844, 0.47705078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 5.0, 10.0, 4.0, 5.0, 10.0, 18.0, 20.0, 22.0, 36.0, 40.0, 55.0, 57.0, 62.0, 86.0, 64.0, 79.0, 81.0, 62.0, 60.0, 47.0, 51.0, 27.0, 24.0, 17.0, 14.0, 15.0, 7.0, 3.0, 5.0, 5.0, 4.0, 1.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57861328125, -0.5628204345703125, -0.547027587890625, -0.5312347412109375, -0.51544189453125, -0.4996490478515625, -0.483856201171875, -0.4680633544921875, -0.4522705078125, -0.4364776611328125, -0.420684814453125, -0.4048919677734375, -0.38909912109375, -0.3733062744140625, -0.357513427734375, -0.3417205810546875, -0.325927734375, -0.3101348876953125, -0.294342041015625, -0.2785491943359375, -0.26275634765625, -0.2469635009765625, -0.231170654296875, -0.2153778076171875, -0.1995849609375, -0.1837921142578125, -0.167999267578125, -0.1522064208984375, -0.13641357421875, -0.1206207275390625, -0.104827880859375, -0.0890350341796875, -0.0732421875, -0.0574493408203125, -0.041656494140625, -0.0258636474609375, -0.01007080078125, 0.0057220458984375, 0.021514892578125, 0.0373077392578125, 0.0531005859375, 0.0688934326171875, 0.084686279296875, 0.1004791259765625, 0.11627197265625, 0.1320648193359375, 0.147857666015625, 0.1636505126953125, 0.179443359375, 0.1952362060546875, 0.211029052734375, 0.2268218994140625, 0.24261474609375, 0.2584075927734375, 0.274200439453125, 0.2899932861328125, 0.3057861328125, 0.3215789794921875, 0.337371826171875, 0.3531646728515625, 0.36895751953125, 0.3847503662109375, 0.400543212890625, 0.4163360595703125, 0.43212890625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 4.0, 4.0, 3.0, 9.0, 7.0, 10.0, 12.0, 20.0, 36.0, 60.0, 91.0, 147.0, 319.0, 710.0, 2046.0, 7701.0, 43152.0, 768306.0, 198129.0, 20833.0, 4462.0, 1366.0, 518.0, 227.0, 140.0, 76.0, 49.0, 24.0, 15.0, 14.0, 11.0, 14.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08660888671875, -0.08388614654541016, -0.08116340637207031, -0.07844066619873047, -0.07571792602539062, -0.07299518585205078, -0.07027244567871094, -0.0675497055053711, -0.06482696533203125, -0.062104225158691406, -0.05938148498535156, -0.05665874481201172, -0.053936004638671875, -0.05121326446533203, -0.04849052429199219, -0.045767784118652344, -0.0430450439453125, -0.040322303771972656, -0.03759956359863281, -0.03487682342529297, -0.032154083251953125, -0.02943134307861328, -0.026708602905273438, -0.023985862731933594, -0.02126312255859375, -0.018540382385253906, -0.015817642211914062, -0.013094902038574219, -0.010372161865234375, -0.007649421691894531, -0.0049266815185546875, -0.0022039413452148438, 0.000518798828125, 0.0032415390014648438, 0.0059642791748046875, 0.008687019348144531, 0.011409759521484375, 0.014132499694824219, 0.016855239868164062, 0.019577980041503906, 0.02230072021484375, 0.025023460388183594, 0.027746200561523438, 0.03046894073486328, 0.033191680908203125, 0.03591442108154297, 0.03863716125488281, 0.041359901428222656, 0.0440826416015625, 0.046805381774902344, 0.04952812194824219, 0.05225086212158203, 0.054973602294921875, 0.05769634246826172, 0.06041908264160156, 0.0631418228149414, 0.06586456298828125, 0.0685873031616211, 0.07131004333496094, 0.07403278350830078, 0.07675552368164062, 0.07947826385498047, 0.08220100402832031, 0.08492374420166016, 0.087646484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 7.0, 8.0, 2.0, 3.0, 8.0, 11.0, 10.0, 16.0, 22.0, 16.0, 16.0, 30.0, 27.0, 39.0, 55.0, 71.0, 79.0, 86.0, 89.0, 80.0, 65.0, 46.0, 53.0, 33.0, 24.0, 23.0, 16.0, 21.0, 9.0, 6.0, 5.0, 3.0, 6.0, 4.0, 3.0, 4.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.9981136322021484e-05, -2.9012560844421387e-05, -2.804398536682129e-05, -2.707540988922119e-05, -2.6106834411621094e-05, -2.5138258934020996e-05, -2.41696834564209e-05, -2.32011079788208e-05, -2.2232532501220703e-05, -2.1263957023620605e-05, -2.0295381546020508e-05, -1.932680606842041e-05, -1.8358230590820312e-05, -1.7389655113220215e-05, -1.6421079635620117e-05, -1.545250415802002e-05, -1.4483928680419922e-05, -1.3515353202819824e-05, -1.2546777725219727e-05, -1.1578202247619629e-05, -1.0609626770019531e-05, -9.641051292419434e-06, -8.672475814819336e-06, -7.703900337219238e-06, -6.735324859619141e-06, -5.766749382019043e-06, -4.798173904418945e-06, -3.829598426818848e-06, -2.86102294921875e-06, -1.8924474716186523e-06, -9.238719940185547e-07, 4.470348358154297e-08, 1.0132789611816406e-06, 1.9818544387817383e-06, 2.950429916381836e-06, 3.919005393981934e-06, 4.887580871582031e-06, 5.856156349182129e-06, 6.8247318267822266e-06, 7.793307304382324e-06, 8.761882781982422e-06, 9.73045825958252e-06, 1.0699033737182617e-05, 1.1667609214782715e-05, 1.2636184692382812e-05, 1.360476016998291e-05, 1.4573335647583008e-05, 1.5541911125183105e-05, 1.6510486602783203e-05, 1.74790620803833e-05, 1.84476375579834e-05, 1.9416213035583496e-05, 2.0384788513183594e-05, 2.135336399078369e-05, 2.232193946838379e-05, 2.3290514945983887e-05, 2.4259090423583984e-05, 2.5227665901184082e-05, 2.619624137878418e-05, 2.7164816856384277e-05, 2.8133392333984375e-05, 2.9101967811584473e-05, 3.007054328918457e-05, 3.103911876678467e-05, 3.2007694244384766e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 6.0, 15.0, 9.0, 25.0, 38.0, 44.0, 81.0, 131.0, 173.0, 367.0, 691.0, 1622.0, 4513.0, 17840.0, 122369.0, 790389.0, 89436.0, 14170.0, 3755.0, 1369.0, 642.0, 328.0, 173.0, 111.0, 70.0, 44.0, 40.0, 29.0, 22.0, 9.0, 7.0, 6.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06842041015625, -0.06609535217285156, -0.06377029418945312, -0.06144523620605469, -0.05912017822265625, -0.05679512023925781, -0.054470062255859375, -0.05214500427246094, -0.0498199462890625, -0.04749488830566406, -0.045169830322265625, -0.04284477233886719, -0.04051971435546875, -0.03819465637207031, -0.035869598388671875, -0.03354454040527344, -0.031219482421875, -0.028894424438476562, -0.026569366455078125, -0.024244308471679688, -0.02191925048828125, -0.019594192504882812, -0.017269134521484375, -0.014944076538085938, -0.0126190185546875, -0.010293960571289062, -0.007968902587890625, -0.0056438446044921875, -0.00331878662109375, -0.0009937286376953125, 0.001331329345703125, 0.0036563873291015625, 0.0059814453125, 0.008306503295898438, 0.010631561279296875, 0.012956619262695312, 0.01528167724609375, 0.017606735229492188, 0.019931793212890625, 0.022256851196289062, 0.0245819091796875, 0.026906967163085938, 0.029232025146484375, 0.03155708312988281, 0.03388214111328125, 0.03620719909667969, 0.038532257080078125, 0.04085731506347656, 0.043182373046875, 0.04550743103027344, 0.047832489013671875, 0.05015754699707031, 0.05248260498046875, 0.05480766296386719, 0.057132720947265625, 0.05945777893066406, 0.0617828369140625, 0.06410789489746094, 0.06643295288085938, 0.06875801086425781, 0.07108306884765625, 0.07340812683105469, 0.07573318481445312, 0.07805824279785156, 0.08038330078125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 3.0, 8.0, 15.0, 14.0, 15.0, 29.0, 19.0, 40.0, 57.0, 84.0, 150.0, 127.0, 115.0, 87.0, 61.0, 54.0, 27.0, 32.0, 17.0, 7.0, 14.0, 7.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0650634765625, -0.062419891357421875, -0.05977630615234375, -0.057132720947265625, -0.0544891357421875, -0.051845550537109375, -0.04920196533203125, -0.046558380126953125, -0.043914794921875, -0.041271209716796875, -0.03862762451171875, -0.035984039306640625, -0.0333404541015625, -0.030696868896484375, -0.02805328369140625, -0.025409698486328125, -0.02276611328125, -0.020122528076171875, -0.01747894287109375, -0.014835357666015625, -0.0121917724609375, -0.009548187255859375, -0.00690460205078125, -0.004261016845703125, -0.001617431640625, 0.001026153564453125, 0.00366973876953125, 0.006313323974609375, 0.0089569091796875, 0.011600494384765625, 0.01424407958984375, 0.016887664794921875, 0.01953125, 0.022174835205078125, 0.02481842041015625, 0.027462005615234375, 0.0301055908203125, 0.032749176025390625, 0.03539276123046875, 0.038036346435546875, 0.040679931640625, 0.043323516845703125, 0.04596710205078125, 0.048610687255859375, 0.0512542724609375, 0.053897857666015625, 0.05654144287109375, 0.059185028076171875, 0.06182861328125, 0.06447219848632812, 0.06711578369140625, 0.06975936889648438, 0.0724029541015625, 0.07504653930664062, 0.07769012451171875, 0.08033370971679688, 0.082977294921875, 0.08562088012695312, 0.08826446533203125, 0.09090805053710938, 0.0935516357421875, 0.09619522094726562, 0.09883880615234375, 0.10148239135742188, 0.1041259765625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 10.0, 15.0, 38.0, 113.0, 307.0, 385.0, 91.0, 30.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8249331712722778, -1.7238578796386719, -1.6227824687957764, -1.5217071771621704, -1.4206318855285645, -1.319556474685669, -1.218481183052063, -1.117405891418457, -1.0163304805755615, -0.9152551293373108, -0.8141798377037048, -0.7131044864654541, -0.6120291948318481, -0.5109538435935974, -0.4098784923553467, -0.3088032007217407, -0.20772790908813477, -0.10665258020162582, -0.005577251315116882, 0.09549808502197266, 0.196573406457901, 0.29764872789382935, 0.3987240791320801, 0.49979937076568604, 0.6008747220039368, 0.7019500732421875, 0.8030253648757935, 0.9041007161140442, 1.005176067352295, 1.1062513589859009, 1.2073266506195068, 1.3084020614624023, 1.4094774723052979, 1.5105527639389038, 1.6116281747817993, 1.7127034664154053, 1.8137787580490112, 1.9148540496826172, 2.0159294605255127, 2.117004871368408, 2.2180800437927246, 2.31915545463562, 2.4202306270599365, 2.521306037902832, 2.6223814487457275, 2.723456621170044, 2.8245320320129395, 2.925607204437256, 3.0266828536987305, 3.127758264541626, 3.2288334369659424, 3.329908847808838, 3.4309842586517334, 3.53205943107605, 3.6331348419189453, 3.7342100143432617, 3.8352854251861572, 3.9363608360290527, 4.037436008453369, 4.138511657714844, 4.23958683013916, 4.340662002563477, 4.441737174987793, 4.542812824249268, 4.643887996673584]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 7.0, 4.0, 8.0, 3.0, 9.0, 7.0, 13.0, 12.0, 12.0, 15.0, 15.0, 24.0, 16.0, 23.0, 34.0, 34.0, 38.0, 60.0, 87.0, 176.0, 75.0, 52.0, 39.0, 38.0, 27.0, 29.0, 25.0, 20.0, 18.0, 20.0, 13.0, 12.0, 7.0, 3.0, 8.0, 4.0, 9.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3344430923461914, -1.2888784408569336, -1.2433139085769653, -1.1977492570877075, -1.1521847248077393, -1.1066200733184814, -1.0610554218292236, -1.0154907703399658, -0.9699262380599976, -0.9243616461753845, -0.8787970542907715, -0.8332324028015137, -0.7876678109169006, -0.7421032190322876, -0.6965385675430298, -0.6509739756584167, -0.6054093837738037, -0.5598447918891907, -0.5142802000045776, -0.4687155485153198, -0.4231509566307068, -0.37758636474609375, -0.3320217430591583, -0.2864571213722229, -0.24089252948760986, -0.19532792270183563, -0.1497633159160614, -0.10419870913028717, -0.05863410234451294, -0.013069495558738708, 0.03249511122703552, 0.07805973291397095, 0.12362432479858398, 0.16918893158435822, 0.21475353837013245, 0.26031816005706787, 0.3058827519416809, 0.35144734382629395, 0.39701196551322937, 0.4425765872001648, 0.48814117908477783, 0.5337057709693909, 0.5792703628540039, 0.6248350143432617, 0.6703996062278748, 0.7159641981124878, 0.7615288496017456, 0.8070934414863586, 0.8526580333709717, 0.8982226252555847, 0.9437872171401978, 0.9893518686294556, 1.0349164009094238, 1.0804810523986816, 1.1260457038879395, 1.1716103553771973, 1.2171748876571655, 1.2627395391464233, 1.3083040714263916, 1.3538687229156494, 1.3994333744049072, 1.4449979066848755, 1.4905625581741333, 1.5361270904541016, 1.5816917419433594]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 8.0, 15.0, 17.0, 30.0, 42.0, 48.0, 67.0, 90.0, 121.0, 174.0, 308.0, 416.0, 593.0, 965.0, 1506.0, 2660.0, 5009.0, 10397.0, 26402.0, 82610.0, 289211.0, 883815.0, 1555223.0, 903211.0, 296483.0, 83515.0, 28229.0, 10936.0, 4981.0, 2793.0, 1554.0, 901.0, 626.0, 411.0, 264.0, 170.0, 144.0, 88.0, 75.0, 34.0, 33.0, 22.0, 22.0, 19.0, 16.0, 3.0, 3.0, 5.0, 0.0, 8.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0950927734375, -0.09216785430908203, -0.08924293518066406, -0.0863180160522461, -0.08339309692382812, -0.08046817779541016, -0.07754325866699219, -0.07461833953857422, -0.07169342041015625, -0.06876850128173828, -0.06584358215332031, -0.06291866302490234, -0.059993743896484375, -0.057068824768066406, -0.05414390563964844, -0.05121898651123047, -0.0482940673828125, -0.04536914825439453, -0.04244422912597656, -0.039519309997558594, -0.036594390869140625, -0.033669471740722656, -0.030744552612304688, -0.02781963348388672, -0.02489471435546875, -0.02196979522705078, -0.019044876098632812, -0.016119956970214844, -0.013195037841796875, -0.010270118713378906, -0.0073451995849609375, -0.004420280456542969, -0.001495361328125, 0.0014295578002929688, 0.0043544769287109375, 0.007279396057128906, 0.010204315185546875, 0.013129234313964844, 0.016054153442382812, 0.01897907257080078, 0.02190399169921875, 0.02482891082763672, 0.027753829956054688, 0.030678749084472656, 0.033603668212890625, 0.036528587341308594, 0.03945350646972656, 0.04237842559814453, 0.0453033447265625, 0.04822826385498047, 0.05115318298339844, 0.054078102111816406, 0.057003021240234375, 0.059927940368652344, 0.06285285949707031, 0.06577777862548828, 0.06870269775390625, 0.07162761688232422, 0.07455253601074219, 0.07747745513916016, 0.08040237426757812, 0.0833272933959961, 0.08625221252441406, 0.08917713165283203, 0.09210205078125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 13.0, 10.0, 12.0, 14.0, 19.0, 18.0, 30.0, 30.0, 36.0, 41.0, 45.0, 44.0, 48.0, 51.0, 50.0, 40.0, 55.0, 48.0, 49.0, 42.0, 41.0, 36.0, 37.0, 22.0, 32.0, 29.0, 14.0, 16.0, 18.0, 12.0, 10.0, 7.0, 4.0, 1.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0992431640625, -0.09629535675048828, -0.09334754943847656, -0.09039974212646484, -0.08745193481445312, -0.0845041275024414, -0.08155632019042969, -0.07860851287841797, -0.07566070556640625, -0.07271289825439453, -0.06976509094238281, -0.0668172836303711, -0.06386947631835938, -0.060921669006347656, -0.05797386169433594, -0.05502605438232422, -0.0520782470703125, -0.04913043975830078, -0.04618263244628906, -0.043234825134277344, -0.040287017822265625, -0.037339210510253906, -0.03439140319824219, -0.03144359588623047, -0.02849578857421875, -0.02554798126220703, -0.022600173950195312, -0.019652366638183594, -0.016704559326171875, -0.013756752014160156, -0.010808944702148438, -0.007861137390136719, -0.004913330078125, -0.0019655227661132812, 0.0009822845458984375, 0.003930091857910156, 0.006877899169921875, 0.009825706481933594, 0.012773513793945312, 0.01572132110595703, 0.01866912841796875, 0.02161693572998047, 0.024564743041992188, 0.027512550354003906, 0.030460357666015625, 0.033408164978027344, 0.03635597229003906, 0.03930377960205078, 0.0422515869140625, 0.04519939422607422, 0.04814720153808594, 0.051095008850097656, 0.054042816162109375, 0.056990623474121094, 0.05993843078613281, 0.06288623809814453, 0.06583404541015625, 0.06878185272216797, 0.07172966003417969, 0.0746774673461914, 0.07762527465820312, 0.08057308197021484, 0.08352088928222656, 0.08646869659423828, 0.08941650390625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 4.0, 8.0, 5.0, 10.0, 10.0, 6.0, 18.0, 19.0, 29.0, 46.0, 70.0, 89.0, 142.0, 227.0, 377.0, 520.0, 1035.0, 2095.0, 7221.0, 93610.0, 3971736.0, 104698.0, 7754.0, 2140.0, 969.0, 505.0, 318.0, 183.0, 139.0, 88.0, 54.0, 48.0, 22.0, 32.0, 16.0, 11.0, 11.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.51611328125, -0.5015792846679688, -0.4870452880859375, -0.47251129150390625, -0.457977294921875, -0.44344329833984375, -0.4289093017578125, -0.41437530517578125, -0.39984130859375, -0.38530731201171875, -0.3707733154296875, -0.35623931884765625, -0.341705322265625, -0.32717132568359375, -0.3126373291015625, -0.29810333251953125, -0.2835693359375, -0.26903533935546875, -0.2545013427734375, -0.23996734619140625, -0.225433349609375, -0.21089935302734375, -0.1963653564453125, -0.18183135986328125, -0.16729736328125, -0.15276336669921875, -0.1382293701171875, -0.12369537353515625, -0.109161376953125, -0.09462738037109375, -0.0800933837890625, -0.06555938720703125, -0.051025390625, -0.03649139404296875, -0.0219573974609375, -0.00742340087890625, 0.007110595703125, 0.02164459228515625, 0.0361785888671875, 0.05071258544921875, 0.06524658203125, 0.07978057861328125, 0.0943145751953125, 0.10884857177734375, 0.123382568359375, 0.13791656494140625, 0.1524505615234375, 0.16698455810546875, 0.1815185546875, 0.19605255126953125, 0.2105865478515625, 0.22512054443359375, 0.239654541015625, 0.25418853759765625, 0.2687225341796875, 0.28325653076171875, 0.29779052734375, 0.31232452392578125, 0.3268585205078125, 0.34139251708984375, 0.355926513671875, 0.37046051025390625, 0.3849945068359375, 0.39952850341796875, 0.4140625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 2.0, 12.0, 5.0, 8.0, 6.0, 11.0, 18.0, 20.0, 35.0, 33.0, 56.0, 93.0, 120.0, 194.0, 252.0, 357.0, 479.0, 609.0, 467.0, 367.0, 246.0, 188.0, 134.0, 87.0, 74.0, 48.0, 37.0, 30.0, 28.0, 16.0, 11.0, 4.0, 5.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.314697265625, -0.3062782287597656, -0.29785919189453125, -0.2894401550292969, -0.2810211181640625, -0.2726020812988281, -0.26418304443359375, -0.2557640075683594, -0.247344970703125, -0.23892593383789062, -0.23050689697265625, -0.22208786010742188, -0.2136688232421875, -0.20524978637695312, -0.19683074951171875, -0.18841171264648438, -0.17999267578125, -0.17157363891601562, -0.16315460205078125, -0.15473556518554688, -0.1463165283203125, -0.13789749145507812, -0.12947845458984375, -0.12105941772460938, -0.112640380859375, -0.10422134399414062, -0.09580230712890625, -0.08738327026367188, -0.0789642333984375, -0.07054519653320312, -0.06212615966796875, -0.053707122802734375, -0.0452880859375, -0.036869049072265625, -0.02845001220703125, -0.020030975341796875, -0.0116119384765625, -0.003192901611328125, 0.00522613525390625, 0.013645172119140625, 0.022064208984375, 0.030483245849609375, 0.03890228271484375, 0.047321319580078125, 0.0557403564453125, 0.06415939331054688, 0.07257843017578125, 0.08099746704101562, 0.08941650390625, 0.09783554077148438, 0.10625457763671875, 0.11467361450195312, 0.1230926513671875, 0.13151168823242188, 0.13993072509765625, 0.14834976196289062, 0.156768798828125, 0.16518783569335938, 0.17360687255859375, 0.18202590942382812, 0.1904449462890625, 0.19886398315429688, 0.20728302001953125, 0.21570205688476562, 0.22412109375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 11.0, 8.0, 24.0, 61.0, 142.0, 240.0, 260.0, 139.0, 64.0, 25.0, 15.0, 2.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.275860786437988, -6.118461608886719, -5.961061954498291, -5.8036627769470215, -5.646263122558594, -5.488863945007324, -5.3314642906188965, -5.174065113067627, -5.016665458679199, -4.85926628112793, -4.701866626739502, -4.544467449188232, -4.387067794799805, -4.229668617248535, -4.072268962860107, -3.914869785308838, -3.7574706077575684, -3.6000711917877197, -3.442671775817871, -3.2852723598480225, -3.127872943878174, -2.9704737663269043, -2.8130743503570557, -2.655674934387207, -2.4982755184173584, -2.3408761024475098, -2.183476686477661, -2.0260772705078125, -1.8686779737472534, -1.7112785577774048, -1.5538792610168457, -1.396479845046997, -1.2390809059143066, -1.081681489944458, -0.9242821335792542, -0.7668827772140503, -0.6094833612442017, -0.452083945274353, -0.29468458890914917, -0.1372852325439453, 0.02011418342590332, 0.17751356959342957, 0.3349129557609558, 0.49231234192848206, 0.6497117280960083, 0.8071111440658569, 0.9645105004310608, 1.1219098567962646, 1.2793092727661133, 1.436708688735962, 1.5941081047058105, 1.7515074014663696, 1.9089068174362183, 2.0663061141967773, 2.223705530166626, 2.3811049461364746, 2.5385043621063232, 2.695903778076172, 2.8533031940460205, 3.010702610015869, 3.1681017875671387, 3.3255014419555664, 3.482900619506836, 3.6403000354766846, 3.797699451446533]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 10.0, 10.0, 15.0, 20.0, 21.0, 46.0, 45.0, 45.0, 51.0, 84.0, 99.0, 92.0, 85.0, 54.0, 68.0, 51.0, 58.0, 32.0, 33.0, 28.0, 20.0, 13.0, 10.0, 6.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.195653200149536, -3.114492893218994, -3.033332586288452, -2.95217227935791, -2.871011734008789, -2.789851427078247, -2.708691120147705, -2.627530813217163, -2.546370506286621, -2.465210199356079, -2.384049892425537, -2.302889585494995, -2.221729278564453, -2.140568733215332, -2.05940842628479, -1.978248119354248, -1.897087812423706, -1.815927505493164, -1.734767198562622, -1.6536067724227905, -1.5724464654922485, -1.4912861585617065, -1.410125732421875, -1.328965425491333, -1.247805118560791, -1.166644811630249, -1.085484504699707, -1.0043240785598755, -0.9231637716293335, -0.8420034646987915, -0.7608430981636047, -0.679682731628418, -0.598522424697876, -0.517362117767334, -0.4362017512321472, -0.35504141449928284, -0.27388107776641846, -0.19272074103355408, -0.1115604043006897, -0.03040003776550293, 0.05076026916503906, 0.13192060589790344, 0.21308094263076782, 0.2942412793636322, 0.3754016160964966, 0.45656195282936096, 0.5377222895622253, 0.6188826560974121, 0.7000429630279541, 0.7812032699584961, 0.8623636364936829, 0.9435240030288696, 1.0246843099594116, 1.1058446168899536, 1.1870050430297852, 1.2681653499603271, 1.3493256568908691, 1.4304859638214111, 1.5116462707519531, 1.5928066968917847, 1.6739670038223267, 1.7551273107528687, 1.8362877368927002, 1.9174480438232422, 1.9986083507537842]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 3.0, 6.0, 10.0, 9.0, 15.0, 15.0, 26.0, 34.0, 58.0, 65.0, 122.0, 233.0, 546.0, 1515.0, 4814.0, 19845.0, 143181.0, 784774.0, 74868.0, 12923.0, 3391.0, 1120.0, 451.0, 205.0, 124.0, 53.0, 41.0, 36.0, 24.0, 11.0, 7.0, 8.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.270263671875, -0.2610588073730469, -0.25185394287109375, -0.24264907836914062, -0.2334442138671875, -0.22423934936523438, -0.21503448486328125, -0.20582962036132812, -0.196624755859375, -0.18741989135742188, -0.17821502685546875, -0.16901016235351562, -0.1598052978515625, -0.15060043334960938, -0.14139556884765625, -0.13219070434570312, -0.12298583984375, -0.11378097534179688, -0.10457611083984375, -0.09537124633789062, -0.0861663818359375, -0.07696151733398438, -0.06775665283203125, -0.058551788330078125, -0.049346923828125, -0.040142059326171875, -0.03093719482421875, -0.021732330322265625, -0.0125274658203125, -0.003322601318359375, 0.00588226318359375, 0.015087127685546875, 0.0242919921875, 0.033496856689453125, 0.04270172119140625, 0.051906585693359375, 0.0611114501953125, 0.07031631469726562, 0.07952117919921875, 0.08872604370117188, 0.097930908203125, 0.10713577270507812, 0.11634063720703125, 0.12554550170898438, 0.1347503662109375, 0.14395523071289062, 0.15316009521484375, 0.16236495971679688, 0.17156982421875, 0.18077468872070312, 0.18997955322265625, 0.19918441772460938, 0.2083892822265625, 0.21759414672851562, 0.22679901123046875, 0.23600387573242188, 0.245208740234375, 0.2544136047363281, 0.26361846923828125, 0.2728233337402344, 0.2820281982421875, 0.2912330627441406, 0.30043792724609375, 0.3096427917480469, 0.31884765625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 9.0, 10.0, 22.0, 40.0, 56.0, 56.0, 96.0, 119.0, 98.0, 118.0, 107.0, 87.0, 69.0, 42.0, 28.0, 18.0, 11.0, 11.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.329345703125, -0.3212776184082031, -0.31320953369140625, -0.3051414489746094, -0.2970733642578125, -0.2890052795410156, -0.28093719482421875, -0.2728691101074219, -0.264801025390625, -0.2567329406738281, -0.24866485595703125, -0.24059677124023438, -0.2325286865234375, -0.22446060180664062, -0.21639251708984375, -0.20832443237304688, -0.20025634765625, -0.19218826293945312, -0.18412017822265625, -0.17605209350585938, -0.1679840087890625, -0.15991592407226562, -0.15184783935546875, -0.14377975463867188, -0.135711669921875, -0.12764358520507812, -0.11957550048828125, -0.11150741577148438, -0.1034393310546875, -0.09537124633789062, -0.08730316162109375, -0.07923507690429688, -0.0711669921875, -0.06309890747070312, -0.05503082275390625, -0.046962738037109375, -0.0388946533203125, -0.030826568603515625, -0.02275848388671875, -0.014690399169921875, -0.006622314453125, 0.001445770263671875, 0.00951385498046875, 0.017581939697265625, 0.0256500244140625, 0.033718109130859375, 0.04178619384765625, 0.049854278564453125, 0.05792236328125, 0.06599044799804688, 0.07405853271484375, 0.08212661743164062, 0.0901947021484375, 0.09826278686523438, 0.10633087158203125, 0.11439895629882812, 0.122467041015625, 0.13053512573242188, 0.13860321044921875, 0.14667129516601562, 0.1547393798828125, 0.16280746459960938, 0.17087554931640625, 0.17894363403320312, 0.18701171875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 2.0, 10.0, 12.0, 12.0, 24.0, 26.0, 43.0, 42.0, 72.0, 151.0, 220.0, 395.0, 872.0, 2804.0, 17982.0, 854669.0, 158202.0, 9619.0, 1848.0, 700.0, 330.0, 169.0, 115.0, 75.0, 56.0, 29.0, 21.0, 16.0, 11.0, 13.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.371826171875, -0.36200714111328125, -0.3521881103515625, -0.34236907958984375, -0.332550048828125, -0.32273101806640625, -0.3129119873046875, -0.30309295654296875, -0.29327392578125, -0.28345489501953125, -0.2736358642578125, -0.26381683349609375, -0.253997802734375, -0.24417877197265625, -0.2343597412109375, -0.22454071044921875, -0.2147216796875, -0.20490264892578125, -0.1950836181640625, -0.18526458740234375, -0.175445556640625, -0.16562652587890625, -0.1558074951171875, -0.14598846435546875, -0.13616943359375, -0.12635040283203125, -0.1165313720703125, -0.10671234130859375, -0.096893310546875, -0.08707427978515625, -0.0772552490234375, -0.06743621826171875, -0.0576171875, -0.04779815673828125, -0.0379791259765625, -0.02816009521484375, -0.018341064453125, -0.00852203369140625, 0.0012969970703125, 0.01111602783203125, 0.02093505859375, 0.03075408935546875, 0.0405731201171875, 0.05039215087890625, 0.060211181640625, 0.07003021240234375, 0.0798492431640625, 0.08966827392578125, 0.0994873046875, 0.10930633544921875, 0.1191253662109375, 0.12894439697265625, 0.138763427734375, 0.14858245849609375, 0.1584014892578125, 0.16822052001953125, 0.17803955078125, 0.18785858154296875, 0.1976776123046875, 0.20749664306640625, 0.217315673828125, 0.22713470458984375, 0.2369537353515625, 0.24677276611328125, 0.256591796875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 9.0, 9.0, 9.0, 12.0, 10.0, 21.0, 21.0, 19.0, 33.0, 21.0, 32.0, 28.0, 37.0, 52.0, 66.0, 65.0, 73.0, 74.0, 75.0, 71.0, 34.0, 30.0, 34.0, 25.0, 20.0, 21.0, 21.0, 13.0, 12.0, 14.0, 8.0, 9.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.52294921875, -0.5094566345214844, -0.49596405029296875, -0.4824714660644531, -0.4689788818359375, -0.4554862976074219, -0.44199371337890625, -0.4285011291503906, -0.415008544921875, -0.4015159606933594, -0.38802337646484375, -0.3745307922363281, -0.3610382080078125, -0.3475456237792969, -0.33405303955078125, -0.3205604553222656, -0.30706787109375, -0.2935752868652344, -0.28008270263671875, -0.2665901184082031, -0.2530975341796875, -0.23960494995117188, -0.22611236572265625, -0.21261978149414062, -0.199127197265625, -0.18563461303710938, -0.17214202880859375, -0.15864944458007812, -0.1451568603515625, -0.13166427612304688, -0.11817169189453125, -0.10467910766601562, -0.0911865234375, -0.07769393920898438, -0.06420135498046875, -0.050708770751953125, -0.0372161865234375, -0.023723602294921875, -0.01023101806640625, 0.003261566162109375, 0.016754150390625, 0.030246734619140625, 0.04373931884765625, 0.057231903076171875, 0.0707244873046875, 0.08421707153320312, 0.09770965576171875, 0.11120223999023438, 0.12469482421875, 0.13818740844726562, 0.15167999267578125, 0.16517257690429688, 0.1786651611328125, 0.19215774536132812, 0.20565032958984375, 0.21914291381835938, 0.232635498046875, 0.24612808227539062, 0.25962066650390625, 0.2731132507324219, 0.2866058349609375, 0.3000984191894531, 0.31359100341796875, 0.3270835876464844, 0.340576171875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 6.0, 2.0, 15.0, 11.0, 26.0, 34.0, 48.0, 83.0, 133.0, 249.0, 535.0, 1297.0, 4425.0, 28282.0, 953441.0, 50663.0, 6317.0, 1592.0, 631.0, 329.0, 165.0, 89.0, 57.0, 41.0, 21.0, 20.0, 15.0, 7.0, 1.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0799560546875, -0.07750415802001953, -0.07505226135253906, -0.0726003646850586, -0.07014846801757812, -0.06769657135009766, -0.06524467468261719, -0.06279277801513672, -0.06034088134765625, -0.05788898468017578, -0.05543708801269531, -0.052985191345214844, -0.050533294677734375, -0.048081398010253906, -0.04562950134277344, -0.04317760467529297, -0.0407257080078125, -0.03827381134033203, -0.03582191467285156, -0.033370018005371094, -0.030918121337890625, -0.028466224670410156, -0.026014328002929688, -0.02356243133544922, -0.02111053466796875, -0.01865863800048828, -0.016206741333007812, -0.013754844665527344, -0.011302947998046875, -0.008851051330566406, -0.0063991546630859375, -0.003947257995605469, -0.001495361328125, 0.0009565353393554688, 0.0034084320068359375, 0.005860328674316406, 0.008312225341796875, 0.010764122009277344, 0.013216018676757812, 0.01566791534423828, 0.01811981201171875, 0.02057170867919922, 0.023023605346679688, 0.025475502014160156, 0.027927398681640625, 0.030379295349121094, 0.03283119201660156, 0.03528308868408203, 0.0377349853515625, 0.04018688201904297, 0.04263877868652344, 0.045090675354003906, 0.047542572021484375, 0.049994468688964844, 0.05244636535644531, 0.05489826202392578, 0.05735015869140625, 0.05980205535888672, 0.06225395202636719, 0.06470584869384766, 0.06715774536132812, 0.0696096420288086, 0.07206153869628906, 0.07451343536376953, 0.07696533203125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 4.0, 7.0, 9.0, 7.0, 20.0, 18.0, 26.0, 20.0, 32.0, 44.0, 50.0, 72.0, 90.0, 84.0, 78.0, 92.0, 72.0, 60.0, 43.0, 31.0, 23.0, 20.0, 17.0, 14.0, 17.0, 10.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.74913215637207e-05, -3.645382821559906e-05, -3.541633486747742e-05, -3.4378841519355774e-05, -3.334134817123413e-05, -3.230385482311249e-05, -3.1266361474990845e-05, -3.02288681268692e-05, -2.919137477874756e-05, -2.8153881430625916e-05, -2.7116388082504272e-05, -2.607889473438263e-05, -2.5041401386260986e-05, -2.4003908038139343e-05, -2.29664146900177e-05, -2.1928921341896057e-05, -2.0891427993774414e-05, -1.985393464565277e-05, -1.8816441297531128e-05, -1.7778947949409485e-05, -1.6741454601287842e-05, -1.57039612531662e-05, -1.4666467905044556e-05, -1.3628974556922913e-05, -1.259148120880127e-05, -1.1553987860679626e-05, -1.0516494512557983e-05, -9.47900116443634e-06, -8.441507816314697e-06, -7.404014468193054e-06, -6.366521120071411e-06, -5.329027771949768e-06, -4.291534423828125e-06, -3.254041075706482e-06, -2.216547727584839e-06, -1.1790543794631958e-06, -1.4156103134155273e-07, 8.959323167800903e-07, 1.9334256649017334e-06, 2.9709190130233765e-06, 4.0084123611450195e-06, 5.045905709266663e-06, 6.083399057388306e-06, 7.120892405509949e-06, 8.158385753631592e-06, 9.195879101753235e-06, 1.0233372449874878e-05, 1.1270865797996521e-05, 1.2308359146118164e-05, 1.3345852494239807e-05, 1.438334584236145e-05, 1.5420839190483093e-05, 1.6458332538604736e-05, 1.749582588672638e-05, 1.8533319234848022e-05, 1.9570812582969666e-05, 2.060830593109131e-05, 2.164579927921295e-05, 2.2683292627334595e-05, 2.3720785975456238e-05, 2.475827932357788e-05, 2.5795772671699524e-05, 2.6833266019821167e-05, 2.787075936794281e-05, 2.8908252716064453e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 2.0, 2.0, 7.0, 13.0, 23.0, 23.0, 37.0, 53.0, 93.0, 190.0, 288.0, 537.0, 1086.0, 2521.0, 6830.0, 23331.0, 249926.0, 725359.0, 25677.0, 7322.0, 2723.0, 1156.0, 564.0, 318.0, 170.0, 98.0, 62.0, 32.0, 29.0, 22.0, 15.0, 12.0, 2.0, 10.0, 5.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03973388671875, -0.03831624984741211, -0.03689861297607422, -0.03548097610473633, -0.03406333923339844, -0.03264570236206055, -0.031228065490722656, -0.029810428619384766, -0.028392791748046875, -0.026975154876708984, -0.025557518005371094, -0.024139881134033203, -0.022722244262695312, -0.021304607391357422, -0.01988697052001953, -0.01846933364868164, -0.01705169677734375, -0.01563405990600586, -0.014216423034667969, -0.012798786163330078, -0.011381149291992188, -0.009963512420654297, -0.008545875549316406, -0.007128238677978516, -0.005710601806640625, -0.004292964935302734, -0.0028753280639648438, -0.0014576911926269531, -4.00543212890625e-05, 0.0013775825500488281, 0.0027952194213867188, 0.004212856292724609, 0.0056304931640625, 0.007048130035400391, 0.008465766906738281, 0.009883403778076172, 0.011301040649414062, 0.012718677520751953, 0.014136314392089844, 0.015553951263427734, 0.016971588134765625, 0.018389225006103516, 0.019806861877441406, 0.021224498748779297, 0.022642135620117188, 0.024059772491455078, 0.02547740936279297, 0.02689504623413086, 0.02831268310546875, 0.02973031997680664, 0.03114795684814453, 0.03256559371948242, 0.03398323059082031, 0.0354008674621582, 0.036818504333496094, 0.038236141204833984, 0.039653778076171875, 0.041071414947509766, 0.042489051818847656, 0.04390668869018555, 0.04532432556152344, 0.04674196243286133, 0.04815959930419922, 0.04957723617553711, 0.050994873046875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 10.0, 8.0, 7.0, 12.0, 21.0, 20.0, 24.0, 26.0, 30.0, 34.0, 46.0, 84.0, 116.0, 141.0, 98.0, 66.0, 54.0, 37.0, 25.0, 23.0, 19.0, 11.0, 14.0, 15.0, 5.0, 7.0, 7.0, 7.0, 4.0, 2.0, 3.0, 7.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0382080078125, -0.03698539733886719, -0.035762786865234375, -0.03454017639160156, -0.03331756591796875, -0.03209495544433594, -0.030872344970703125, -0.029649734497070312, -0.0284271240234375, -0.027204513549804688, -0.025981903076171875, -0.024759292602539062, -0.02353668212890625, -0.022314071655273438, -0.021091461181640625, -0.019868850708007812, -0.018646240234375, -0.017423629760742188, -0.016201019287109375, -0.014978408813476562, -0.01375579833984375, -0.012533187866210938, -0.011310577392578125, -0.010087966918945312, -0.0088653564453125, -0.0076427459716796875, -0.006420135498046875, -0.0051975250244140625, -0.00397491455078125, -0.0027523040771484375, -0.001529693603515625, -0.0003070831298828125, 0.00091552734375, 0.0021381378173828125, 0.003360748291015625, 0.0045833587646484375, 0.00580596923828125, 0.0070285797119140625, 0.008251190185546875, 0.009473800659179688, 0.0106964111328125, 0.011919021606445312, 0.013141632080078125, 0.014364242553710938, 0.01558685302734375, 0.016809463500976562, 0.018032073974609375, 0.019254684448242188, 0.020477294921875, 0.021699905395507812, 0.022922515869140625, 0.024145126342773438, 0.02536773681640625, 0.026590347290039062, 0.027812957763671875, 0.029035568237304688, 0.0302581787109375, 0.03148078918457031, 0.032703399658203125, 0.03392601013183594, 0.03514862060546875, 0.03637123107910156, 0.037593841552734375, 0.03881645202636719, 0.0400390625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 8.0, 40.0, 86.0, 571.0, 194.0, 54.0, 25.0, 10.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.972259521484375, -3.8644375801086426, -3.75661563873291, -3.6487936973571777, -3.5409717559814453, -3.433149814605713, -3.3253278732299805, -3.217505931854248, -3.1096839904785156, -3.001862049102783, -2.894040107727051, -2.7862181663513184, -2.678396224975586, -2.5705742835998535, -2.462752342224121, -2.3549304008483887, -2.2471084594726562, -2.139286518096924, -2.0314645767211914, -1.923642635345459, -1.8158206939697266, -1.7079987525939941, -1.6001768112182617, -1.4923548698425293, -1.3845326900482178, -1.2767107486724854, -1.168888807296753, -1.0610668659210205, -0.9532449245452881, -0.8454229235649109, -0.7376009821891785, -0.629779040813446, -0.5219571590423584, -0.414135217666626, -0.30631327629089355, -0.19849130511283875, -0.09066936373710632, 0.017152607440948486, 0.12497454881668091, 0.23279649019241333, 0.34061843156814575, 0.4484403729438782, 0.5562623143196106, 0.6640843152999878, 0.7719062566757202, 0.8797281980514526, 0.9875501394271851, 1.0953720808029175, 1.20319402217865, 1.3110159635543823, 1.4188379049301147, 1.5266598463058472, 1.6344817876815796, 1.7423038482666016, 1.850125789642334, 1.9579477310180664, 2.065769672393799, 2.1735916137695312, 2.2814135551452637, 2.389235496520996, 2.4970574378967285, 2.604879379272461, 2.7127013206481934, 2.820523262023926, 2.928345203399658]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 8.0, 7.0, 9.0, 17.0, 13.0, 18.0, 20.0, 13.0, 27.0, 19.0, 26.0, 24.0, 34.0, 129.0, 316.0, 74.0, 26.0, 34.0, 22.0, 17.0, 16.0, 16.0, 12.0, 17.0, 9.0, 8.0, 7.0, 7.0, 10.0, 8.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2284584045410156, -1.1880301237106323, -1.147601842880249, -1.1071734428405762, -1.0667451620101929, -1.0263168811798096, -0.9858886003494263, -0.9454602599143982, -0.9050319194793701, -0.8646036386489868, -0.8241752982139587, -0.7837470173835754, -0.7433186769485474, -0.7028903961181641, -0.6624621152877808, -0.6220337748527527, -0.5816054940223694, -0.5411772131919861, -0.500748872756958, -0.4603205919265747, -0.41989225149154663, -0.37946397066116333, -0.33903566002845764, -0.29860734939575195, -0.25817903876304626, -0.21775072813034058, -0.1773224174976349, -0.1368941217660904, -0.0964658111333847, -0.056037500500679016, -0.015609204769134521, 0.024819105863571167, 0.06524741649627686, 0.10567572712898254, 0.14610403776168823, 0.18653233349323273, 0.22696064412593842, 0.2673889398574829, 0.3078172504901886, 0.3482455611228943, 0.3886738717556, 0.42910218238830566, 0.46953049302101135, 0.509958803653717, 0.5503870844841003, 0.5908154249191284, 0.6312437057495117, 0.671671986579895, 0.7121003270149231, 0.7525286078453064, 0.7929569482803345, 0.8333852291107178, 0.8738135695457458, 0.9142418503761292, 0.9546701908111572, 0.9950984716415405, 1.0355267524719238, 1.0759550333023071, 1.1163833141326904, 1.1568117141723633, 1.1972399950027466, 1.2376682758331299, 1.2780965566635132, 1.3185248374938965, 1.3589532375335693]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 6.0, 7.0, 6.0, 4.0, 8.0, 12.0, 14.0, 20.0, 16.0, 22.0, 24.0, 30.0, 38.0, 38.0, 85.0, 246.0, 95.0, 48.0, 49.0, 39.0, 37.0, 13.0, 21.0, 13.0, 20.0, 11.0, 13.0, 12.0, 3.0, 8.0, 6.0, 7.0, 3.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.10479736328125, -0.10167503356933594, -0.09855270385742188, -0.09543037414550781, -0.09230804443359375, -0.08918571472167969, -0.08606338500976562, -0.08294105529785156, -0.0798187255859375, -0.07669639587402344, -0.07357406616210938, -0.07045173645019531, -0.06732940673828125, -0.06420707702636719, -0.061084747314453125, -0.05796241760253906, -0.054840087890625, -0.05171775817871094, -0.048595428466796875, -0.04547309875488281, -0.04235076904296875, -0.03922843933105469, -0.036106109619140625, -0.03298377990722656, -0.0298614501953125, -0.026739120483398438, -0.023616790771484375, -0.020494461059570312, -0.01737213134765625, -0.014249801635742188, -0.011127471923828125, -0.008005142211914062, -0.0048828125, -0.0017604827880859375, 0.001361846923828125, 0.0044841766357421875, 0.00760650634765625, 0.010728836059570312, 0.013851165771484375, 0.016973495483398438, 0.0200958251953125, 0.023218154907226562, 0.026340484619140625, 0.029462814331054688, 0.03258514404296875, 0.03570747375488281, 0.038829803466796875, 0.04195213317871094, 0.045074462890625, 0.04819679260253906, 0.051319122314453125, 0.05444145202636719, 0.05756378173828125, 0.06068611145019531, 0.06380844116210938, 0.06693077087402344, 0.0700531005859375, 0.07317543029785156, 0.07629776000976562, 0.07942008972167969, 0.08254241943359375, 0.08566474914550781, 0.08878707885742188, 0.09190940856933594, 0.09503173828125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 2.0, 7.0, 7.0, 15.0, 18.0, 31.0, 52.0, 58.0, 127.0, 215.0, 585.0, 2083.0, 18128.0, 8355497.0, 9468.0, 1416.0, 363.0, 185.0, 109.0, 86.0, 47.0, 22.0, 16.0, 4.0, 6.0, 3.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 6.0, 7.0, 6.0], "bins": [-1.727432131767273, -1.6866792440414429, -1.6459263563156128, -1.6051735877990723, -1.5644207000732422, -1.523667812347412, -1.482914924621582, -1.442162036895752, -1.4014091491699219, -1.3606562614440918, -1.3199033737182617, -1.2791506052017212, -1.2383977174758911, -1.197644829750061, -1.156891942024231, -1.1161390542984009, -1.0753862857818604, -1.0346333980560303, -0.993880569934845, -0.9531276822090149, -0.9123748540878296, -0.8716219663619995, -0.8308690786361694, -0.7901161909103394, -0.749363362789154, -0.708610475063324, -0.6678576469421387, -0.6271047592163086, -0.5863518714904785, -0.5455990433692932, -0.5048461556434631, -0.46409329771995544, -0.423340380191803, -0.3825875222682953, -0.3418346643447876, -0.3010817766189575, -0.26032891869544983, -0.21957606077194214, -0.17882318794727325, -0.13807031512260437, -0.09731745719909668, -0.05656459182500839, -0.015811726450920105, 0.024941138923168182, 0.06569400429725647, 0.10644686222076416, 0.14719973504543304, 0.18795260787010193, 0.22870546579360962, 0.2694583237171173, 0.310211181640625, 0.3509640693664551, 0.39171692728996277, 0.43246978521347046, 0.47322267293930054, 0.5139755010604858, 0.5547283887863159, 0.595481276512146, 0.6362341046333313, 0.6769869923591614, 0.7177398204803467, 0.7584927082061768, 0.7992455959320068, 0.8399984836578369, 0.8807513117790222]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 2.0, 3.0, 6.0, 2.0, 3.0, 2.0, 5.0, 7.0, 3.0, 6.0, 9.0, 4.0, 7.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8476085662841797, -0.810314953327179, -0.7730213403701782, -0.7357277274131775, -0.6984341144561768, -0.6611405611038208, -0.6238469481468201, -0.5865533351898193, -0.5492597222328186, -0.5119661092758179, -0.47467249631881714, -0.4373789131641388, -0.40008530020713806, -0.36279168725013733, -0.325498104095459, -0.28820449113845825, -0.2509108781814575, -0.2136172652244568, -0.17632366716861725, -0.1390300691127777, -0.10173645615577698, -0.06444284319877625, -0.027149245142936707, 0.010144352912902832, 0.047437965869903564, 0.0847315713763237, 0.12202517688274384, 0.15931877493858337, 0.1966123878955841, 0.23390600085258484, 0.2711995840072632, 0.3084931969642639, 0.3457869291305542, 0.38308054208755493, 0.42037415504455566, 0.457667738199234, 0.49496135115623474, 0.5322549343109131, 0.5695485472679138, 0.6068421602249146, 0.6441357731819153, 0.681429386138916, 0.7187229990959167, 0.7560166120529175, 0.7933101654052734, 0.830603837966919, 0.8678973913192749, 0.9051910042762756, 0.9424846172332764, 0.9797782301902771, 1.0170718431472778, 1.0543653964996338, 1.0916590690612793, 1.1289526224136353, 1.1662462949752808, 1.2035398483276367, 1.2408335208892822, 1.2781270742416382, 1.3154207468032837, 1.3527143001556396, 1.3900079727172852, 1.4273015260696411, 1.4645951986312866, 1.5018887519836426, 1.5391823053359985]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 9.0, 3.0, 8.0, 6.0, 25.0, 29.0, 37.0, 71.0, 80.0, 117.0, 208.0, 352.0, 545.0, 932.0, 1781.0, 3639.0, 8081.0, 21462.0, 65313.0, 189003.0, 153837.0, 48876.0, 16877.0, 6587.0, 2838.0, 1500.0, 789.0, 445.0, 273.0, 188.0, 116.0, 83.0, 39.0, 37.0, 28.0, 19.0, 10.0, 7.0, 8.0, 1.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.93896484375, -0.9135055541992188, -0.8880462646484375, -0.8625869750976562, -0.837127685546875, -0.8116683959960938, -0.7862091064453125, -0.7607498168945312, -0.73529052734375, -0.7098312377929688, -0.6843719482421875, -0.6589126586914062, -0.633453369140625, -0.6079940795898438, -0.5825347900390625, -0.5570755004882812, -0.5316162109375, -0.5061569213867188, -0.4806976318359375, -0.45523834228515625, -0.429779052734375, -0.40431976318359375, -0.3788604736328125, -0.35340118408203125, -0.32794189453125, -0.30248260498046875, -0.2770233154296875, -0.25156402587890625, -0.226104736328125, -0.20064544677734375, -0.1751861572265625, -0.14972686767578125, -0.124267578125, -0.09880828857421875, -0.0733489990234375, -0.04788970947265625, -0.022430419921875, 0.00302886962890625, 0.0284881591796875, 0.05394744873046875, 0.07940673828125, 0.10486602783203125, 0.1303253173828125, 0.15578460693359375, 0.181243896484375, 0.20670318603515625, 0.2321624755859375, 0.25762176513671875, 0.2830810546875, 0.30854034423828125, 0.3339996337890625, 0.35945892333984375, 0.384918212890625, 0.41037750244140625, 0.4358367919921875, 0.46129608154296875, 0.48675537109375, 0.5122146606445312, 0.5376739501953125, 0.5631332397460938, 0.588592529296875, 0.6140518188476562, 0.6395111083984375, 0.6649703979492188, 0.6904296875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 10.0, 14.0, 26.0, 44.0, 57.0, 98.0, 148.0, 131.0, 130.0, 112.0, 63.0, 48.0, 39.0, 27.0, 26.0, 11.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322509765625, -0.3142223358154297, -0.3059349060058594, -0.29764747619628906, -0.28936004638671875, -0.28107261657714844, -0.2727851867675781, -0.2644977569580078, -0.2562103271484375, -0.2479228973388672, -0.23963546752929688, -0.23134803771972656, -0.22306060791015625, -0.21477317810058594, -0.20648574829101562, -0.1981983184814453, -0.189910888671875, -0.1816234588623047, -0.17333602905273438, -0.16504859924316406, -0.15676116943359375, -0.14847373962402344, -0.14018630981445312, -0.1318988800048828, -0.1236114501953125, -0.11532402038574219, -0.10703659057617188, -0.09874916076660156, -0.09046173095703125, -0.08217430114746094, -0.07388687133789062, -0.06559944152832031, -0.05731201171875, -0.04902458190917969, -0.040737152099609375, -0.03244972229003906, -0.02416229248046875, -0.015874862670898438, -0.007587432861328125, 0.0006999969482421875, 0.0089874267578125, 0.017274856567382812, 0.025562286376953125, 0.03384971618652344, 0.04213714599609375, 0.05042457580566406, 0.058712005615234375, 0.06699943542480469, 0.075286865234375, 0.08357429504394531, 0.09186172485351562, 0.10014915466308594, 0.10843658447265625, 0.11672401428222656, 0.12501144409179688, 0.1332988739013672, 0.1415863037109375, 0.1498737335205078, 0.15816116333007812, 0.16644859313964844, 0.17473602294921875, 0.18302345275878906, 0.19131088256835938, 0.1995983123779297, 0.2078857421875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 16.0, 31.0, 49.0, 117.0, 110.0, 64.0, 43.0, 11.0, 6.0, 5.0, 11.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6203757524490356, -1.5752099752426147, -1.5300440788269043, -1.4848783016204834, -1.439712405204773, -1.394546627998352, -1.3493807315826416, -1.3042149543762207, -1.2590491771697998, -1.213883399963379, -1.1687175035476685, -1.1235517263412476, -1.078385829925537, -1.0332200527191162, -0.9880542159080505, -0.9428883790969849, -0.8977224826812744, -0.8525566458702087, -0.8073908090591431, -0.7622250318527222, -0.7170591354370117, -0.6718933582305908, -0.6267275214195251, -0.5815616846084595, -0.5363958477973938, -0.4912300109863281, -0.44606417417526245, -0.40089836716651917, -0.3557325303554535, -0.3105666935443878, -0.26540088653564453, -0.22023504972457886, -0.17506933212280273, -0.12990349531173706, -0.08473767340183258, -0.0395718514919281, 0.005593985319137573, 0.05075982213020325, 0.09592562913894653, 0.1410914659500122, 0.18625730276107788, 0.23142313957214355, 0.27658897638320923, 0.3217547833919525, 0.3669206202030182, 0.41208645701408386, 0.45725226402282715, 0.5024181008338928, 0.5475839376449585, 0.5927497744560242, 0.6379156112670898, 0.6830813884735107, 0.7282472848892212, 0.7734130620956421, 0.8185788989067078, 0.8637447357177734, 0.9089105725288391, 0.9540764093399048, 0.9992422461509705, 1.0444080829620361, 1.089573860168457, 1.1347397565841675, 1.1799055337905884, 1.2250714302062988, 1.2702372074127197]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 4.0, 6.0, 15.0, 6.0, 21.0, 58.0, 117.0, 123.0, 55.0, 17.0, 13.0, 8.0, 1.0, 3.0, 2.0, 8.0, 8.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.1648681163787842, -1.1329078674316406, -1.100947618484497, -1.0689873695373535, -1.03702712059021, -1.0050668716430664, -0.9731065630912781, -0.9411463141441345, -0.909186065196991, -0.8772258162498474, -0.8452655673027039, -0.8133053183555603, -0.781345009803772, -0.7493847608566284, -0.7174245119094849, -0.6854642629623413, -0.6535040140151978, -0.6215437650680542, -0.5895835161209106, -0.5576232671737671, -0.5256630182266235, -0.4937027394771576, -0.46174246072769165, -0.4297822117805481, -0.39782196283340454, -0.365861713886261, -0.33390146493911743, -0.3019411861896515, -0.26998093724250793, -0.23802068829536438, -0.20606042444705963, -0.17410016059875488, -0.14213979244232178, -0.11017953604459763, -0.07821927964687347, -0.04625902324914932, -0.014298766851425171, 0.017661482095718384, 0.04962174594402313, 0.08158200979232788, 0.11354225873947144, 0.145502507686615, 0.17746277153491974, 0.2094230353832245, 0.24138328433036804, 0.2733435332775116, 0.30530381202697754, 0.3372640609741211, 0.36922430992126465, 0.4011845588684082, 0.43314480781555176, 0.4651050865650177, 0.49706533551216125, 0.5290255546569824, 0.5609858632087708, 0.5929461121559143, 0.6249063611030579, 0.6568666100502014, 0.688826858997345, 0.7207871079444885, 0.7527474164962769, 0.7847076654434204, 0.816667914390564, 0.8486281633377075, 0.8805884122848511]}, "eval/loss": 4.228886127471924, "eval/wer": 1.9632883776279255, "eval/runtime": 974.9232, "eval/samples_per_second": 2.71, "eval/steps_per_second": 0.34, "train/train_runtime": 6364.0567, "train/train_samples_per_second": 4.484, "train/train_steps_per_second": 0.14, "train/total_flos": 0.0, "train/train_loss": 4.297821357913081} \ No newline at end of file