diff --git "a/wandb/run-20220228_122826-3vepvy3m/files/wandb-summary.json" "b/wandb/run-20220228_122826-3vepvy3m/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220228_122826-3vepvy3m/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 4.3305, "train/learning_rate": 9.940000000000001e-06, "train/epoch": 0.56, "train/global_step": 500, "_runtime": 3904, "_timestamp": 1646055210, "_step": 500, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 1.0, 246.0, 762.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-66.11236572265625, -45.430301666259766, -24.74823760986328, -4.066173553466797, 16.615890502929688, 37.29795837402344, 57.980018615722656, 78.66207885742188, 99.34414672851562, 120.02621459960938, 140.70828247070312, 161.3903350830078, 182.07240295410156, 202.7544708251953, 223.4365234375, 244.11859130859375, 264.8006591796875, 285.48272705078125, 306.164794921875, 326.84686279296875, 347.5289306640625, 368.21099853515625, 388.8930358886719, 409.5751037597656, 430.2571716308594, 450.9392395019531, 471.6213073730469, 492.3033752441406, 512.9854125976562, 533.66748046875, 554.3495483398438, 575.0316162109375, 595.713623046875, 616.3956909179688, 637.0777587890625, 657.7598266601562, 678.44189453125, 699.1239624023438, 719.8060302734375, 740.488037109375, 761.170166015625, 781.8522338867188, 802.5343017578125, 823.2163696289062, 843.8984375, 864.5805053710938, 885.2625732421875, 905.944580078125, 926.6266479492188, 947.3087158203125, 967.9907836914062, 988.6728515625, 1009.3549194335938, 1030.0369873046875, 1050.718994140625, 1071.401123046875, 1092.0831298828125, 1112.76513671875, 1133.447265625, 1154.1292724609375, 1174.8114013671875, 1195.493408203125, 1216.175537109375, 1236.8575439453125, 1257.5396728515625]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 10.0, 3.0, 14.0, 13.0, 11.0, 24.0, 27.0, 32.0, 35.0, 50.0, 38.0, 43.0, 46.0, 68.0, 65.0, 54.0, 53.0, 45.0, 57.0, 51.0, 44.0, 45.0, 29.0, 32.0, 24.0, 28.0, 8.0, 14.0, 10.0, 8.0, 9.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.97714233398438, -89.7153091430664, -86.4534683227539, -83.19163513183594, -79.92979431152344, -76.66796112060547, -73.4061279296875, -70.144287109375, -66.88245391845703, -63.6206169128418, -60.35877990722656, -57.096946716308594, -53.83510971069336, -50.573272705078125, -47.311439514160156, -44.04960250854492, -40.78776550292969, -37.52592849731445, -34.26409149169922, -31.00225830078125, -27.740421295166016, -24.47858428955078, -21.21674919128418, -17.954914093017578, -14.693077087402344, -11.431241035461426, -8.169404983520508, -4.90756893157959, -1.6457328796386719, 1.6161041259765625, 4.877939224243164, 8.139774322509766, 11.401611328125, 14.663447380065918, 17.925283432006836, 21.187118530273438, 24.448955535888672, 27.710792541503906, 30.972627639770508, 34.23446273803711, 37.496299743652344, 40.75813674926758, 44.01997375488281, 47.28180694580078, 50.543643951416016, 53.80548095703125, 57.06731414794922, 60.32915115356445, 63.59098815917969, 66.85282135009766, 70.11466217041016, 73.37649536132812, 76.63833618164062, 79.9001693725586, 83.16200256347656, 86.42384338378906, 89.68567657470703, 92.947509765625, 96.2093505859375, 99.47118377685547, 102.73301696777344, 105.99485778808594, 109.2566909790039, 112.51852416992188, 115.78036499023438]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 3.0, 0.0, 6.0, 13.0, 11.0, 20.0, 16.0, 30.0, 38.0, 27.0, 48.0, 51.0, 52.0, 53.0, 69.0, 74.0, 85.0, 58.0, 66.0, 58.0, 37.0, 34.0, 35.0, 36.0, 24.0, 20.0, 14.0, 12.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1640625, -4.8896484375, -4.615234375, -4.3408203125, -4.06640625, -3.7919921875, -3.517578125, -3.2431640625, -2.96875, -2.6943359375, -2.419921875, -2.1455078125, -1.87109375, -1.5966796875, -1.322265625, -1.0478515625, -0.7734375, -0.4990234375, -0.224609375, 0.0498046875, 0.32421875, 0.5986328125, 0.873046875, 1.1474609375, 1.421875, 1.6962890625, 1.970703125, 2.2451171875, 2.51953125, 2.7939453125, 3.068359375, 3.3427734375, 3.6171875, 3.8916015625, 4.166015625, 4.4404296875, 4.71484375, 4.9892578125, 5.263671875, 5.5380859375, 5.8125, 6.0869140625, 6.361328125, 6.6357421875, 6.91015625, 7.1845703125, 7.458984375, 7.7333984375, 8.0078125, 8.2822265625, 8.556640625, 8.8310546875, 9.10546875, 9.3798828125, 9.654296875, 9.9287109375, 10.203125, 10.4775390625, 10.751953125, 11.0263671875, 11.30078125, 11.5751953125, 11.849609375, 12.1240234375, 12.3984375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 6.0, 5.0, 7.0, 16.0, 22.0, 29.0, 52.0, 54.0, 77.0, 133.0, 198.0, 321.0, 456.0, 717.0, 1150.0, 2223.0, 4863.0, 13667.0, 59172.0, 793809.0, 2888724.0, 374422.0, 35956.0, 9698.0, 3803.0, 1866.0, 1009.0, 649.0, 376.0, 280.0, 132.0, 117.0, 70.0, 54.0, 46.0, 29.0, 28.0, 16.0, 15.0, 11.0, 2.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.671875, -12.078857421875, -11.48583984375, -10.892822265625, -10.2998046875, -9.706787109375, -9.11376953125, -8.520751953125, -7.927734375, -7.334716796875, -6.74169921875, -6.148681640625, -5.5556640625, -4.962646484375, -4.36962890625, -3.776611328125, -3.18359375, -2.590576171875, -1.99755859375, -1.404541015625, -0.8115234375, -0.218505859375, 0.37451171875, 0.967529296875, 1.560546875, 2.153564453125, 2.74658203125, 3.339599609375, 3.9326171875, 4.525634765625, 5.11865234375, 5.711669921875, 6.3046875, 6.897705078125, 7.49072265625, 8.083740234375, 8.6767578125, 9.269775390625, 9.86279296875, 10.455810546875, 11.048828125, 11.641845703125, 12.23486328125, 12.827880859375, 13.4208984375, 14.013916015625, 14.60693359375, 15.199951171875, 15.79296875, 16.385986328125, 16.97900390625, 17.572021484375, 18.1650390625, 18.758056640625, 19.35107421875, 19.944091796875, 20.537109375, 21.130126953125, 21.72314453125, 22.316162109375, 22.9091796875, 23.502197265625, 24.09521484375, 24.688232421875, 25.28125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 1.0, 10.0, 13.0, 14.0, 18.0, 26.0, 45.0, 68.0, 72.0, 90.0, 155.0, 235.0, 329.0, 499.0, 536.0, 546.0, 387.0, 282.0, 211.0, 133.0, 116.0, 77.0, 50.0, 38.0, 29.0, 19.0, 15.0, 14.0, 13.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.296875, -19.6357421875, -18.974609375, -18.3134765625, -17.65234375, -16.9912109375, -16.330078125, -15.6689453125, -15.0078125, -14.3466796875, -13.685546875, -13.0244140625, -12.36328125, -11.7021484375, -11.041015625, -10.3798828125, -9.71875, -9.0576171875, -8.396484375, -7.7353515625, -7.07421875, -6.4130859375, -5.751953125, -5.0908203125, -4.4296875, -3.7685546875, -3.107421875, -2.4462890625, -1.78515625, -1.1240234375, -0.462890625, 0.1982421875, 0.859375, 1.5205078125, 2.181640625, 2.8427734375, 3.50390625, 4.1650390625, 4.826171875, 5.4873046875, 6.1484375, 6.8095703125, 7.470703125, 8.1318359375, 8.79296875, 9.4541015625, 10.115234375, 10.7763671875, 11.4375, 12.0986328125, 12.759765625, 13.4208984375, 14.08203125, 14.7431640625, 15.404296875, 16.0654296875, 16.7265625, 17.3876953125, 18.048828125, 18.7099609375, 19.37109375, 20.0322265625, 20.693359375, 21.3544921875, 22.015625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 6.0, 7.0, 12.0, 18.0, 13.0, 22.0, 20.0, 44.0, 54.0, 78.0, 95.0, 156.0, 239.0, 364.0, 620.0, 1211.0, 3232.0, 39383.0, 3811315.0, 326321.0, 6984.0, 1725.0, 842.0, 474.0, 310.0, 207.0, 136.0, 115.0, 85.0, 54.0, 42.0, 16.0, 17.0, 15.0, 10.0, 4.0, 4.0, 4.0, 5.0, 5.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-66.8125, -64.7060546875, -62.599609375, -60.4931640625, -58.38671875, -56.2802734375, -54.173828125, -52.0673828125, -49.9609375, -47.8544921875, -45.748046875, -43.6416015625, -41.53515625, -39.4287109375, -37.322265625, -35.2158203125, -33.109375, -31.0029296875, -28.896484375, -26.7900390625, -24.68359375, -22.5771484375, -20.470703125, -18.3642578125, -16.2578125, -14.1513671875, -12.044921875, -9.9384765625, -7.83203125, -5.7255859375, -3.619140625, -1.5126953125, 0.59375, 2.7001953125, 4.806640625, 6.9130859375, 9.01953125, 11.1259765625, 13.232421875, 15.3388671875, 17.4453125, 19.5517578125, 21.658203125, 23.7646484375, 25.87109375, 27.9775390625, 30.083984375, 32.1904296875, 34.296875, 36.4033203125, 38.509765625, 40.6162109375, 42.72265625, 44.8291015625, 46.935546875, 49.0419921875, 51.1484375, 53.2548828125, 55.361328125, 57.4677734375, 59.57421875, 61.6806640625, 63.787109375, 65.8935546875, 68.0]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 190.0, 730.0, 85.0, 4.0, 0.0, 0.0, 1.0], "bins": [-675.4635009765625, -663.8788452148438, -652.294189453125, -640.7095336914062, -629.1248779296875, -617.540283203125, -605.9556274414062, -594.3709716796875, -582.7863159179688, -571.20166015625, -559.6170043945312, -548.0323486328125, -536.4476928710938, -524.8630981445312, -513.2784423828125, -501.69378662109375, -490.109130859375, -478.52447509765625, -466.9398193359375, -455.3551940917969, -443.7705383300781, -432.1858825683594, -420.6012268066406, -409.0166015625, -397.4319152832031, -385.8472595214844, -374.2626037597656, -362.677978515625, -351.09332275390625, -339.5086669921875, -327.92401123046875, -316.33935546875, -304.75469970703125, -293.1700439453125, -281.58538818359375, -270.0007629394531, -258.4161071777344, -246.83145141601562, -235.24679565429688, -223.6621551513672, -212.0775146484375, -200.49285888671875, -188.90821838378906, -177.3235626220703, -165.73892211914062, -154.15426635742188, -142.56961059570312, -130.98497009277344, -119.40032196044922, -107.815673828125, -96.23102569580078, -84.64637756347656, -73.06172180175781, -61.47707748413086, -49.892425537109375, -38.307777404785156, -26.723129272460938, -15.138480186462402, -3.553831100463867, 8.030818939208984, 19.615467071533203, 31.200115203857422, 42.784767150878906, 54.369415283203125, 65.95406341552734]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 10.0, 5.0, 14.0, 19.0, 8.0, 19.0, 23.0, 26.0, 40.0, 46.0, 59.0, 43.0, 53.0, 58.0, 61.0, 58.0, 69.0, 53.0, 49.0, 50.0, 52.0, 38.0, 28.0, 33.0, 22.0, 26.0, 8.0, 11.0, 10.0, 2.0, 11.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.02938842773438, -121.90411376953125, -118.77884674072266, -115.65357208251953, -112.52830505371094, -109.40303039550781, -106.27775573730469, -103.1524887084961, -100.02721405029297, -96.90193939208984, -93.77667236328125, -90.65139770507812, -87.52613067626953, -84.4008560180664, -81.27558898925781, -78.15031433105469, -75.02503967285156, -71.89976501464844, -68.77449798583984, -65.64922332763672, -62.52395248413086, -59.398681640625, -56.27341079711914, -53.14813995361328, -50.02287292480469, -46.89760208129883, -43.77233123779297, -40.647056579589844, -37.521785736083984, -34.396514892578125, -31.271244049072266, -28.145971298217773, -25.02069854736328, -21.895427703857422, -18.77015495300293, -15.64488410949707, -12.519612312316895, -9.394340515136719, -6.269069671630859, -3.143796920776367, -0.018526077270507812, 3.106745481491089, 6.2320170402526855, 9.357288360595703, 12.482560157775879, 15.607831954956055, 18.733102798461914, 21.858375549316406, 24.983646392822266, 28.108917236328125, 31.234189987182617, 34.359458923339844, 37.48473358154297, 40.61000442504883, 43.73527526855469, 46.86054992675781, 49.985816955566406, 53.111087799072266, 56.236358642578125, 59.36163330078125, 62.48690414428711, 65.61217498779297, 68.73744201660156, 71.86271667480469, 74.98799133300781]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 10.0, 7.0, 9.0, 13.0, 16.0, 23.0, 13.0, 17.0, 27.0, 29.0, 27.0, 34.0, 35.0, 28.0, 46.0, 43.0, 47.0, 44.0, 51.0, 51.0, 47.0, 30.0, 37.0, 35.0, 43.0, 39.0, 27.0, 31.0, 20.0, 18.0, 21.0, 11.0, 14.0, 14.0, 6.0, 6.0, 13.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.16015625, -5.9569091796875, -5.753662109375, -5.5504150390625, -5.34716796875, -5.1439208984375, -4.940673828125, -4.7374267578125, -4.5341796875, -4.3309326171875, -4.127685546875, -3.9244384765625, -3.72119140625, -3.5179443359375, -3.314697265625, -3.1114501953125, -2.908203125, -2.7049560546875, -2.501708984375, -2.2984619140625, -2.09521484375, -1.8919677734375, -1.688720703125, -1.4854736328125, -1.2822265625, -1.0789794921875, -0.875732421875, -0.6724853515625, -0.46923828125, -0.2659912109375, -0.062744140625, 0.1405029296875, 0.34375, 0.5469970703125, 0.750244140625, 0.9534912109375, 1.15673828125, 1.3599853515625, 1.563232421875, 1.7664794921875, 1.9697265625, 2.1729736328125, 2.376220703125, 2.5794677734375, 2.78271484375, 2.9859619140625, 3.189208984375, 3.3924560546875, 3.595703125, 3.7989501953125, 4.002197265625, 4.2054443359375, 4.40869140625, 4.6119384765625, 4.815185546875, 5.0184326171875, 5.2216796875, 5.4249267578125, 5.628173828125, 5.8314208984375, 6.03466796875, 6.2379150390625, 6.441162109375, 6.6444091796875, 6.84765625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 1.0, 6.0, 16.0, 23.0, 18.0, 29.0, 47.0, 77.0, 90.0, 146.0, 252.0, 323.0, 565.0, 794.0, 1292.0, 1972.0, 3106.0, 5027.0, 7968.0, 13174.0, 21636.0, 37156.0, 65955.0, 128050.0, 357656.0, 195691.0, 87918.0, 48153.0, 27742.0, 16579.0, 10082.0, 6189.0, 3905.0, 2428.0, 1564.0, 971.0, 713.0, 401.0, 278.0, 190.0, 109.0, 81.0, 80.0, 28.0, 30.0, 20.0, 7.0, 6.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.38671875, -1.343017578125, -1.29931640625, -1.255615234375, -1.2119140625, -1.168212890625, -1.12451171875, -1.080810546875, -1.037109375, -0.993408203125, -0.94970703125, -0.906005859375, -0.8623046875, -0.818603515625, -0.77490234375, -0.731201171875, -0.6875, -0.643798828125, -0.60009765625, -0.556396484375, -0.5126953125, -0.468994140625, -0.42529296875, -0.381591796875, -0.337890625, -0.294189453125, -0.25048828125, -0.206787109375, -0.1630859375, -0.119384765625, -0.07568359375, -0.031982421875, 0.01171875, 0.055419921875, 0.09912109375, 0.142822265625, 0.1865234375, 0.230224609375, 0.27392578125, 0.317626953125, 0.361328125, 0.405029296875, 0.44873046875, 0.492431640625, 0.5361328125, 0.579833984375, 0.62353515625, 0.667236328125, 0.7109375, 0.754638671875, 0.79833984375, 0.842041015625, 0.8857421875, 0.929443359375, 0.97314453125, 1.016845703125, 1.060546875, 1.104248046875, 1.14794921875, 1.191650390625, 1.2353515625, 1.279052734375, 1.32275390625, 1.366455078125, 1.41015625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 6.0, 10.0, 4.0, 14.0, 7.0, 14.0, 11.0, 22.0, 16.0, 29.0, 28.0, 28.0, 35.0, 27.0, 25.0, 29.0, 41.0, 48.0, 44.0, 44.0, 1056.0, 33.0, 40.0, 39.0, 45.0, 32.0, 29.0, 38.0, 27.0, 25.0, 27.0, 21.0, 22.0, 14.0, 10.0, 9.0, 16.0, 14.0, 10.0, 11.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.927734375, -3.804046630859375, -3.68035888671875, -3.556671142578125, -3.4329833984375, -3.309295654296875, -3.18560791015625, -3.061920166015625, -2.938232421875, -2.814544677734375, -2.69085693359375, -2.567169189453125, -2.4434814453125, -2.319793701171875, -2.19610595703125, -2.072418212890625, -1.94873046875, -1.825042724609375, -1.70135498046875, -1.577667236328125, -1.4539794921875, -1.330291748046875, -1.20660400390625, -1.082916259765625, -0.959228515625, -0.835540771484375, -0.71185302734375, -0.588165283203125, -0.4644775390625, -0.340789794921875, -0.21710205078125, -0.093414306640625, 0.0302734375, 0.153961181640625, 0.27764892578125, 0.401336669921875, 0.5250244140625, 0.648712158203125, 0.77239990234375, 0.896087646484375, 1.019775390625, 1.143463134765625, 1.26715087890625, 1.390838623046875, 1.5145263671875, 1.638214111328125, 1.76190185546875, 1.885589599609375, 2.00927734375, 2.132965087890625, 2.25665283203125, 2.380340576171875, 2.5040283203125, 2.627716064453125, 2.75140380859375, 2.875091552734375, 2.998779296875, 3.122467041015625, 3.24615478515625, 3.369842529296875, 3.4935302734375, 3.617218017578125, 3.74090576171875, 3.864593505859375, 3.98828125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 9.0, 9.0, 10.0, 14.0, 15.0, 20.0, 25.0, 46.0, 57.0, 89.0, 127.0, 184.0, 288.0, 398.0, 589.0, 809.0, 1213.0, 1808.0, 2660.0, 4056.0, 5924.0, 9019.0, 13924.0, 21269.0, 33193.0, 52823.0, 93054.0, 208115.0, 1351021.0, 120413.0, 63897.0, 38826.0, 25131.0, 16407.0, 10751.0, 7031.0, 4706.0, 3069.0, 2059.0, 1317.0, 897.0, 612.0, 400.0, 256.0, 205.0, 137.0, 85.0, 45.0, 47.0, 26.0, 17.0, 14.0, 10.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.2001953125, -1.16290283203125, -1.1256103515625, -1.08831787109375, -1.051025390625, -1.01373291015625, -0.9764404296875, -0.93914794921875, -0.90185546875, -0.86456298828125, -0.8272705078125, -0.78997802734375, -0.752685546875, -0.71539306640625, -0.6781005859375, -0.64080810546875, -0.603515625, -0.56622314453125, -0.5289306640625, -0.49163818359375, -0.454345703125, -0.41705322265625, -0.3797607421875, -0.34246826171875, -0.30517578125, -0.26788330078125, -0.2305908203125, -0.19329833984375, -0.156005859375, -0.11871337890625, -0.0814208984375, -0.04412841796875, -0.0068359375, 0.03045654296875, 0.0677490234375, 0.10504150390625, 0.142333984375, 0.17962646484375, 0.2169189453125, 0.25421142578125, 0.29150390625, 0.32879638671875, 0.3660888671875, 0.40338134765625, 0.440673828125, 0.47796630859375, 0.5152587890625, 0.55255126953125, 0.58984375, 0.62713623046875, 0.6644287109375, 0.70172119140625, 0.739013671875, 0.77630615234375, 0.8135986328125, 0.85089111328125, 0.88818359375, 0.92547607421875, 0.9627685546875, 1.00006103515625, 1.037353515625, 1.07464599609375, 1.1119384765625, 1.14923095703125, 1.1865234375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 6.0, 9.0, 3.0, 8.0, 7.0, 15.0, 15.0, 20.0, 30.0, 29.0, 44.0, 59.0, 60.0, 62.0, 82.0, 96.0, 76.0, 68.0, 49.0, 52.0, 47.0, 36.0, 25.0, 19.0, 18.0, 11.0, 6.0, 7.0, 3.0, 9.0, 6.0, 4.0, 2.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0009889602661132812, -0.0009608566761016846, -0.0009327530860900879, -0.0009046494960784912, -0.0008765459060668945, -0.0008484423160552979, -0.0008203387260437012, -0.0007922351360321045, -0.0007641315460205078, -0.0007360279560089111, -0.0007079243659973145, -0.0006798207759857178, -0.0006517171859741211, -0.0006236135959625244, -0.0005955100059509277, -0.0005674064159393311, -0.0005393028259277344, -0.0005111992359161377, -0.000483095645904541, -0.00045499205589294434, -0.00042688846588134766, -0.000398784875869751, -0.0003706812858581543, -0.0003425776958465576, -0.00031447410583496094, -0.00028637051582336426, -0.0002582669258117676, -0.0002301633358001709, -0.00020205974578857422, -0.00017395615577697754, -0.00014585256576538086, -0.00011774897575378418, -8.96453857421875e-05, -6.154179573059082e-05, -3.343820571899414e-05, -5.334615707397461e-06, 2.276897430419922e-05, 5.08725643157959e-05, 7.897615432739258e-05, 0.00010707974433898926, 0.00013518333435058594, 0.00016328692436218262, 0.0001913905143737793, 0.00021949410438537598, 0.00024759769439697266, 0.00027570128440856934, 0.000303804874420166, 0.0003319084644317627, 0.0003600120544433594, 0.00038811564445495605, 0.00041621923446655273, 0.0004443228244781494, 0.0004724264144897461, 0.0005005300045013428, 0.0005286335945129395, 0.0005567371845245361, 0.0005848407745361328, 0.0006129443645477295, 0.0006410479545593262, 0.0006691515445709229, 0.0006972551345825195, 0.0007253587245941162, 0.0007534623146057129, 0.0007815659046173096, 0.0008096694946289062]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 5.0, 7.0, 11.0, 17.0, 12.0, 26.0, 19.0, 25.0, 30.0, 50.0, 76.0, 119.0, 172.0, 197.0, 297.0, 476.0, 835.0, 70687.0, 972687.0, 1090.0, 514.0, 339.0, 220.0, 175.0, 104.0, 78.0, 66.0, 49.0, 23.0, 19.0, 28.0, 17.0, 19.0, 11.0, 11.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0152435302734375, -0.014737367630004883, -0.014231204986572266, -0.013725042343139648, -0.013218879699707031, -0.012712717056274414, -0.012206554412841797, -0.01170039176940918, -0.011194229125976562, -0.010688066482543945, -0.010181903839111328, -0.009675741195678711, -0.009169578552246094, -0.008663415908813477, -0.00815725326538086, -0.007651090621948242, -0.007144927978515625, -0.006638765335083008, -0.006132602691650391, -0.0056264400482177734, -0.005120277404785156, -0.004614114761352539, -0.004107952117919922, -0.0036017894744873047, -0.0030956268310546875, -0.0025894641876220703, -0.002083301544189453, -0.001577138900756836, -0.0010709762573242188, -0.0005648136138916016, -5.8650970458984375e-05, 0.0004475116729736328, 0.00095367431640625, 0.0014598369598388672, 0.0019659996032714844, 0.0024721622467041016, 0.0029783248901367188, 0.003484487533569336, 0.003990650177001953, 0.00449681282043457, 0.0050029754638671875, 0.005509138107299805, 0.006015300750732422, 0.006521463394165039, 0.007027626037597656, 0.0075337886810302734, 0.00803995132446289, 0.008546113967895508, 0.009052276611328125, 0.009558439254760742, 0.01006460189819336, 0.010570764541625977, 0.011076927185058594, 0.011583089828491211, 0.012089252471923828, 0.012595415115356445, 0.013101577758789062, 0.01360774040222168, 0.014113903045654297, 0.014620065689086914, 0.015126228332519531, 0.01563239097595215, 0.016138553619384766, 0.016644716262817383, 0.01715087890625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 17.0, 68.0, 307.0, 456.0, 135.0, 21.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0017846140544861555, -0.001752868527546525, -0.0017211231170222163, -0.0016893777064979076, -0.0016576321795582771, -0.0016258866526186466, -0.001594141242094338, -0.0015623958315700293, -0.0015306503046303988, -0.0014989047776907682, -0.0014671593671664596, -0.0014354139566421509, -0.0014036684297025204, -0.0013719229027628899, -0.0013401774922385812, -0.0013084320817142725, -0.001276686554774642, -0.0012449410278350115, -0.0012131956173107028, -0.0011814502067863941, -0.0011497046798467636, -0.001117959152907133, -0.0010862137423828244, -0.0010544683318585157, -0.0010227228049188852, -0.0009909772779792547, -0.000959231867454946, -0.0009274863987229764, -0.0008957409299910069, -0.0008639954612590373, -0.0008322499925270677, -0.0008005045237950981, -0.0007687590550631285, -0.0007370135863311589, -0.0007052681175991893, -0.0006735226488672197, -0.0006417771801352501, -0.0006100317114032805, -0.0005782862426713109, -0.0005465407739393413, -0.0005147953052073717, -0.0004830498364754021, -0.0004513043677434325, -0.0004195588990114629, -0.00038781343027949333, -0.00035606796154752374, -0.00032432249281555414, -0.00029257702408358455, -0.0002608315844554454, -0.00022908611572347581, -0.00019734064699150622, -0.00016559517825953662, -0.00013384970952756703, -0.00010210424079559743, -7.035877206362784e-05, -3.8613303331658244e-05, -6.867834599688649e-06, 2.4877634132280946e-05, 5.662310286425054e-05, 8.836857159622014e-05, 0.00012011404032818973, 0.00015185950906015933, 0.00018360497779212892, 0.00021535044652409852, 0.0002470959152560681]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 9.0, 8.0, 7.0, 16.0, 19.0, 11.0, 17.0, 22.0, 16.0, 21.0, 30.0, 36.0, 39.0, 29.0, 41.0, 35.0, 29.0, 47.0, 33.0, 53.0, 36.0, 42.0, 42.0, 46.0, 30.0, 32.0, 25.0, 37.0, 26.0, 22.0, 19.0, 17.0, 19.0, 13.0, 18.0, 7.0, 12.0, 8.0, 8.0, 6.0, 8.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00038999319076538086, -0.00037722568958997726, -0.00036445818841457367, -0.0003516906872391701, -0.0003389231860637665, -0.0003261556848883629, -0.0003133881837129593, -0.0003006206825375557, -0.0002878531813621521, -0.0002750856801867485, -0.0002623181790113449, -0.0002495506778359413, -0.00023678317666053772, -0.00022401567548513412, -0.00021124817430973053, -0.00019848067313432693, -0.00018571317195892334, -0.00017294567078351974, -0.00016017816960811615, -0.00014741066843271255, -0.00013464316725730896, -0.00012187566608190536, -0.00010910816490650177, -9.634066373109818e-05, -8.357316255569458e-05, -7.080566138029099e-05, -5.803816020488739e-05, -4.5270659029483795e-05, -3.25031578540802e-05, -1.9735656678676605e-05, -6.96815550327301e-06, 5.799345672130585e-06, 1.856684684753418e-05, 3.1334348022937775e-05, 4.410184919834137e-05, 5.6869350373744965e-05, 6.963685154914856e-05, 8.240435272455215e-05, 9.517185389995575e-05, 0.00010793935507535934, 0.00012070685625076294, 0.00013347435742616653, 0.00014624185860157013, 0.00015900935977697372, 0.00017177686095237732, 0.00018454436212778091, 0.0001973118633031845, 0.0002100793644785881, 0.0002228468656539917, 0.0002356143668293953, 0.0002483818680047989, 0.0002611493691802025, 0.0002739168703556061, 0.0002866843715310097, 0.00029945187270641327, 0.00031221937388181686, 0.00032498687505722046, 0.00033775437623262405, 0.00035052187740802765, 0.00036328937858343124, 0.00037605687975883484, 0.00038882438093423843, 0.00040159188210964203, 0.0004143593832850456, 0.0004271268844604492]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 10.0, 7.0, 9.0, 13.0, 16.0, 23.0, 13.0, 17.0, 27.0, 29.0, 27.0, 34.0, 35.0, 28.0, 46.0, 43.0, 47.0, 44.0, 51.0, 51.0, 47.0, 30.0, 37.0, 35.0, 43.0, 39.0, 27.0, 31.0, 20.0, 18.0, 21.0, 11.0, 14.0, 14.0, 6.0, 6.0, 13.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.16015625, -5.9569091796875, -5.753662109375, -5.5504150390625, -5.34716796875, -5.1439208984375, -4.940673828125, -4.7374267578125, -4.5341796875, -4.3309326171875, -4.127685546875, -3.9244384765625, -3.72119140625, -3.5179443359375, -3.314697265625, -3.1114501953125, -2.908203125, -2.7049560546875, -2.501708984375, -2.2984619140625, -2.09521484375, -1.8919677734375, -1.688720703125, -1.4854736328125, -1.2822265625, -1.0789794921875, -0.875732421875, -0.6724853515625, -0.46923828125, -0.2659912109375, -0.062744140625, 0.1405029296875, 0.34375, 0.5469970703125, 0.750244140625, 0.9534912109375, 1.15673828125, 1.3599853515625, 1.563232421875, 1.7664794921875, 1.9697265625, 2.1729736328125, 2.376220703125, 2.5794677734375, 2.78271484375, 2.9859619140625, 3.189208984375, 3.3924560546875, 3.595703125, 3.7989501953125, 4.002197265625, 4.2054443359375, 4.40869140625, 4.6119384765625, 4.815185546875, 5.0184326171875, 5.2216796875, 5.4249267578125, 5.628173828125, 5.8314208984375, 6.03466796875, 6.2379150390625, 6.441162109375, 6.6444091796875, 6.84765625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 8.0, 15.0, 19.0, 35.0, 39.0, 41.0, 64.0, 72.0, 129.0, 151.0, 234.0, 307.0, 386.0, 582.0, 805.0, 1146.0, 1612.0, 2428.0, 3727.0, 6515.0, 13822.0, 48454.0, 844162.0, 86182.0, 16960.0, 7630.0, 4256.0, 2645.0, 1712.0, 1235.0, 920.0, 611.0, 427.0, 342.0, 232.0, 151.0, 159.0, 92.0, 60.0, 47.0, 36.0, 36.0, 17.0, 17.0, 8.0, 12.0, 5.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0], "bins": [-41.28125, -40.05322265625, -38.8251953125, -37.59716796875, -36.369140625, -35.14111328125, -33.9130859375, -32.68505859375, -31.45703125, -30.22900390625, -29.0009765625, -27.77294921875, -26.544921875, -25.31689453125, -24.0888671875, -22.86083984375, -21.6328125, -20.40478515625, -19.1767578125, -17.94873046875, -16.720703125, -15.49267578125, -14.2646484375, -13.03662109375, -11.80859375, -10.58056640625, -9.3525390625, -8.12451171875, -6.896484375, -5.66845703125, -4.4404296875, -3.21240234375, -1.984375, -0.75634765625, 0.4716796875, 1.69970703125, 2.927734375, 4.15576171875, 5.3837890625, 6.61181640625, 7.83984375, 9.06787109375, 10.2958984375, 11.52392578125, 12.751953125, 13.97998046875, 15.2080078125, 16.43603515625, 17.6640625, 18.89208984375, 20.1201171875, 21.34814453125, 22.576171875, 23.80419921875, 25.0322265625, 26.26025390625, 27.48828125, 28.71630859375, 29.9443359375, 31.17236328125, 32.400390625, 33.62841796875, 34.8564453125, 36.08447265625, 37.3125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 2.0, 3.0, 6.0, 5.0, 11.0, 8.0, 14.0, 18.0, 5.0, 18.0, 17.0, 35.0, 27.0, 28.0, 30.0, 56.0, 51.0, 61.0, 59.0, 181.0, 1723.0, 189.0, 68.0, 49.0, 51.0, 43.0, 38.0, 28.0, 31.0, 34.0, 36.0, 20.0, 11.0, 20.0, 17.0, 15.0, 9.0, 9.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.71875, -20.11865234375, -19.5185546875, -18.91845703125, -18.318359375, -17.71826171875, -17.1181640625, -16.51806640625, -15.91796875, -15.31787109375, -14.7177734375, -14.11767578125, -13.517578125, -12.91748046875, -12.3173828125, -11.71728515625, -11.1171875, -10.51708984375, -9.9169921875, -9.31689453125, -8.716796875, -8.11669921875, -7.5166015625, -6.91650390625, -6.31640625, -5.71630859375, -5.1162109375, -4.51611328125, -3.916015625, -3.31591796875, -2.7158203125, -2.11572265625, -1.515625, -0.91552734375, -0.3154296875, 0.28466796875, 0.884765625, 1.48486328125, 2.0849609375, 2.68505859375, 3.28515625, 3.88525390625, 4.4853515625, 5.08544921875, 5.685546875, 6.28564453125, 6.8857421875, 7.48583984375, 8.0859375, 8.68603515625, 9.2861328125, 9.88623046875, 10.486328125, 11.08642578125, 11.6865234375, 12.28662109375, 12.88671875, 13.48681640625, 14.0869140625, 14.68701171875, 15.287109375, 15.88720703125, 16.4873046875, 17.08740234375, 17.6875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 2.0, 8.0, 6.0, 6.0, 6.0, 12.0, 15.0, 17.0, 14.0, 15.0, 29.0, 30.0, 27.0, 33.0, 46.0, 51.0, 100.0, 156.0, 429.0, 2227.0, 3050671.0, 90119.0, 991.0, 242.0, 118.0, 82.0, 55.0, 31.0, 34.0, 22.0, 17.0, 15.0, 17.0, 10.0, 19.0, 4.0, 10.0, 6.0, 3.0, 5.0, 1.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.3125, -78.5849609375, -75.857421875, -73.1298828125, -70.40234375, -67.6748046875, -64.947265625, -62.2197265625, -59.4921875, -56.7646484375, -54.037109375, -51.3095703125, -48.58203125, -45.8544921875, -43.126953125, -40.3994140625, -37.671875, -34.9443359375, -32.216796875, -29.4892578125, -26.76171875, -24.0341796875, -21.306640625, -18.5791015625, -15.8515625, -13.1240234375, -10.396484375, -7.6689453125, -4.94140625, -2.2138671875, 0.513671875, 3.2412109375, 5.96875, 8.6962890625, 11.423828125, 14.1513671875, 16.87890625, 19.6064453125, 22.333984375, 25.0615234375, 27.7890625, 30.5166015625, 33.244140625, 35.9716796875, 38.69921875, 41.4267578125, 44.154296875, 46.8818359375, 49.609375, 52.3369140625, 55.064453125, 57.7919921875, 60.51953125, 63.2470703125, 65.974609375, 68.7021484375, 71.4296875, 74.1572265625, 76.884765625, 79.6123046875, 82.33984375, 85.0673828125, 87.794921875, 90.5224609375, 93.25]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 7.0, 84.0, 756.0, 163.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-235.33775329589844, -231.24969482421875, -227.16163635253906, -223.07359313964844, -218.98553466796875, -214.89747619628906, -210.80941772460938, -206.7213592529297, -202.63330078125, -198.5452423095703, -194.45718383789062, -190.369140625, -186.2810821533203, -182.19302368164062, -178.10496520996094, -174.01690673828125, -169.92886352539062, -165.84080505371094, -161.75274658203125, -157.66470336914062, -153.57664489746094, -149.48858642578125, -145.40052795410156, -141.31246948242188, -137.22442626953125, -133.13636779785156, -129.04830932617188, -124.96025848388672, -120.87220764160156, -116.78414916992188, -112.69609069824219, -108.6080322265625, -104.51998901367188, -100.43193054199219, -96.34387969970703, -92.25582122802734, -88.16777038574219, -84.0797119140625, -79.99165344238281, -75.90359497070312, -71.81554412841797, -67.72748565673828, -63.639434814453125, -59.55137634277344, -55.463321685791016, -51.375267028808594, -47.287208557128906, -43.199153900146484, -39.11109924316406, -35.02304458618164, -30.934988021850586, -26.84693145751953, -22.75887680053711, -18.670822143554688, -14.582765579223633, -10.494709014892578, -6.406652450561523, -2.318596839904785, 1.7694587707519531, 5.857514381408691, 9.94556999206543, 14.033624649047852, 18.121681213378906, 22.20973777770996, 26.297792434692383]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 4.0, 9.0, 10.0, 8.0, 10.0, 13.0, 13.0, 13.0, 16.0, 26.0, 20.0, 25.0, 25.0, 20.0, 28.0, 42.0, 33.0, 41.0, 37.0, 37.0, 41.0, 46.0, 46.0, 47.0, 39.0, 35.0, 34.0, 33.0, 35.0, 29.0, 30.0, 13.0, 23.0, 18.0, 15.0, 18.0, 11.0, 7.0, 14.0, 7.0, 8.0, 7.0, 8.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-62.762062072753906, -61.041603088378906, -59.321144104003906, -57.60068893432617, -55.88022994995117, -54.15977096557617, -52.43931198120117, -50.71885681152344, -48.99839782714844, -47.27793884277344, -45.55747985839844, -43.8370246887207, -42.1165657043457, -40.3961067199707, -38.6756477355957, -36.95519256591797, -35.23473358154297, -33.51427459716797, -31.7938175201416, -30.0733585357666, -28.352901458740234, -26.632442474365234, -24.911983489990234, -23.191526412963867, -21.471065521240234, -19.750606536865234, -18.030149459838867, -16.309690475463867, -14.5892333984375, -12.8687744140625, -11.148316383361816, -9.427858352661133, -7.707401275634766, -5.986943244934082, -4.266485214233398, -2.5460267066955566, -0.825568675994873, 0.8948898315429688, 2.6153478622436523, 4.335805892944336, 6.0562639236450195, 7.776721954345703, 9.497179985046387, 11.21763801574707, 12.93809700012207, 14.658555030822754, 16.379013061523438, 18.099472045898438, 19.819929122924805, 21.540388107299805, 23.260845184326172, 24.981304168701172, 26.70176124572754, 28.42222023010254, 30.142677307128906, 31.863136291503906, 33.583595275878906, 35.304054260253906, 37.024513244628906, 38.74496841430664, 40.46542739868164, 42.18588638305664, 43.90634536743164, 45.626800537109375, 47.347259521484375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 4.0, 4.0, 6.0, 4.0, 7.0, 9.0, 9.0, 22.0, 16.0, 18.0, 17.0, 18.0, 35.0, 27.0, 28.0, 30.0, 37.0, 40.0, 45.0, 38.0, 55.0, 44.0, 49.0, 44.0, 37.0, 33.0, 40.0, 35.0, 37.0, 40.0, 22.0, 27.0, 22.0, 17.0, 14.0, 12.0, 8.0, 17.0, 8.0, 8.0, 1.0, 8.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.3671875, -6.1588134765625, -5.950439453125, -5.7420654296875, -5.53369140625, -5.3253173828125, -5.116943359375, -4.9085693359375, -4.7001953125, -4.4918212890625, -4.283447265625, -4.0750732421875, -3.86669921875, -3.6583251953125, -3.449951171875, -3.2415771484375, -3.033203125, -2.8248291015625, -2.616455078125, -2.4080810546875, -2.19970703125, -1.9913330078125, -1.782958984375, -1.5745849609375, -1.3662109375, -1.1578369140625, -0.949462890625, -0.7410888671875, -0.53271484375, -0.3243408203125, -0.115966796875, 0.0924072265625, 0.30078125, 0.5091552734375, 0.717529296875, 0.9259033203125, 1.13427734375, 1.3426513671875, 1.551025390625, 1.7593994140625, 1.9677734375, 2.1761474609375, 2.384521484375, 2.5928955078125, 2.80126953125, 3.0096435546875, 3.218017578125, 3.4263916015625, 3.634765625, 3.8431396484375, 4.051513671875, 4.2598876953125, 4.46826171875, 4.6766357421875, 4.885009765625, 5.0933837890625, 5.3017578125, 5.5101318359375, 5.718505859375, 5.9268798828125, 6.13525390625, 6.3436279296875, 6.552001953125, 6.7603759765625, 6.96875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 6.0, 7.0, 10.0, 9.0, 11.0, 13.0, 20.0, 43.0, 45.0, 84.0, 86.0, 134.0, 217.0, 366.0, 612.0, 1151.0, 2111.0, 4404.0, 9380.0, 24076.0, 104128.0, 2981329.0, 982368.0, 54196.0, 16045.0, 6636.0, 3063.0, 1542.0, 857.0, 460.0, 289.0, 184.0, 115.0, 72.0, 52.0, 39.0, 35.0, 22.0, 11.0, 14.0, 6.0, 10.0, 8.0, 2.0, 5.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-35.84375, -34.6806640625, -33.517578125, -32.3544921875, -31.19140625, -30.0283203125, -28.865234375, -27.7021484375, -26.5390625, -25.3759765625, -24.212890625, -23.0498046875, -21.88671875, -20.7236328125, -19.560546875, -18.3974609375, -17.234375, -16.0712890625, -14.908203125, -13.7451171875, -12.58203125, -11.4189453125, -10.255859375, -9.0927734375, -7.9296875, -6.7666015625, -5.603515625, -4.4404296875, -3.27734375, -2.1142578125, -0.951171875, 0.2119140625, 1.375, 2.5380859375, 3.701171875, 4.8642578125, 6.02734375, 7.1904296875, 8.353515625, 9.5166015625, 10.6796875, 11.8427734375, 13.005859375, 14.1689453125, 15.33203125, 16.4951171875, 17.658203125, 18.8212890625, 19.984375, 21.1474609375, 22.310546875, 23.4736328125, 24.63671875, 25.7998046875, 26.962890625, 28.1259765625, 29.2890625, 30.4521484375, 31.615234375, 32.7783203125, 33.94140625, 35.1044921875, 36.267578125, 37.4306640625, 38.59375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 1.0, 2.0, 6.0, 6.0, 3.0, 12.0, 14.0, 20.0, 20.0, 30.0, 42.0, 54.0, 82.0, 87.0, 123.0, 169.0, 260.0, 371.0, 498.0, 587.0, 491.0, 361.0, 231.0, 144.0, 119.0, 82.0, 62.0, 54.0, 34.0, 24.0, 15.0, 24.0, 14.0, 5.0, 7.0, 5.0, 2.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-26.6875, -25.80908203125, -24.9306640625, -24.05224609375, -23.173828125, -22.29541015625, -21.4169921875, -20.53857421875, -19.66015625, -18.78173828125, -17.9033203125, -17.02490234375, -16.146484375, -15.26806640625, -14.3896484375, -13.51123046875, -12.6328125, -11.75439453125, -10.8759765625, -9.99755859375, -9.119140625, -8.24072265625, -7.3623046875, -6.48388671875, -5.60546875, -4.72705078125, -3.8486328125, -2.97021484375, -2.091796875, -1.21337890625, -0.3349609375, 0.54345703125, 1.421875, 2.30029296875, 3.1787109375, 4.05712890625, 4.935546875, 5.81396484375, 6.6923828125, 7.57080078125, 8.44921875, 9.32763671875, 10.2060546875, 11.08447265625, 11.962890625, 12.84130859375, 13.7197265625, 14.59814453125, 15.4765625, 16.35498046875, 17.2333984375, 18.11181640625, 18.990234375, 19.86865234375, 20.7470703125, 21.62548828125, 22.50390625, 23.38232421875, 24.2607421875, 25.13916015625, 26.017578125, 26.89599609375, 27.7744140625, 28.65283203125, 29.53125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 7.0, 7.0, 9.0, 22.0, 27.0, 16.0, 26.0, 52.0, 73.0, 84.0, 117.0, 195.0, 331.0, 729.0, 4906.0, 4082478.0, 102502.0, 1419.0, 442.0, 244.0, 156.0, 108.0, 77.0, 64.0, 43.0, 31.0, 24.0, 20.0, 15.0, 7.0, 6.0, 7.0, 4.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.875, -124.681640625, -120.48828125, -116.294921875, -112.1015625, -107.908203125, -103.71484375, -99.521484375, -95.328125, -91.134765625, -86.94140625, -82.748046875, -78.5546875, -74.361328125, -70.16796875, -65.974609375, -61.78125, -57.587890625, -53.39453125, -49.201171875, -45.0078125, -40.814453125, -36.62109375, -32.427734375, -28.234375, -24.041015625, -19.84765625, -15.654296875, -11.4609375, -7.267578125, -3.07421875, 1.119140625, 5.3125, 9.505859375, 13.69921875, 17.892578125, 22.0859375, 26.279296875, 30.47265625, 34.666015625, 38.859375, 43.052734375, 47.24609375, 51.439453125, 55.6328125, 59.826171875, 64.01953125, 68.212890625, 72.40625, 76.599609375, 80.79296875, 84.986328125, 89.1796875, 93.373046875, 97.56640625, 101.759765625, 105.953125, 110.146484375, 114.33984375, 118.533203125, 122.7265625, 126.919921875, 131.11328125, 135.306640625, 139.5]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 30.0, 106.0, 265.0, 347.0, 182.0, 61.0, 16.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.61618041992188, -123.90042877197266, -119.18467712402344, -114.46892547607422, -109.753173828125, -105.03741455078125, -100.32166290283203, -95.60591125488281, -90.8901596069336, -86.17440795898438, -81.45865631103516, -76.74290466308594, -72.02714538574219, -67.3114013671875, -62.59564208984375, -57.87989044189453, -53.16413879394531, -48.448387145996094, -43.732635498046875, -39.01688003540039, -34.30112838745117, -29.585376739501953, -24.8696231842041, -20.15386962890625, -15.438117980957031, -10.722365379333496, -6.006612777709961, -1.2908601760864258, 3.4248924255371094, 8.140644073486328, 12.85639762878418, 17.57215118408203, 22.28790283203125, 27.00365447998047, 31.71940803527832, 36.43516159057617, 41.15091323852539, 45.86666488647461, 50.582420349121094, 55.29817199707031, 60.01392364501953, 64.72967529296875, 69.44542694091797, 74.16117858886719, 78.87693786621094, 83.59268188476562, 88.30844116210938, 93.0241928100586, 97.73994445800781, 102.45569610595703, 107.17144775390625, 111.88719940185547, 116.60295104980469, 121.31871032714844, 126.03446197509766, 130.75021362304688, 135.46597290039062, 140.18173217773438, 144.89747619628906, 149.6132354736328, 154.3289794921875, 159.04473876953125, 163.76048278808594, 168.4762420654297, 173.19198608398438]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 5.0, 5.0, 7.0, 5.0, 7.0, 10.0, 18.0, 12.0, 14.0, 18.0, 20.0, 24.0, 30.0, 21.0, 44.0, 24.0, 32.0, 32.0, 36.0, 46.0, 42.0, 51.0, 42.0, 29.0, 52.0, 34.0, 38.0, 36.0, 33.0, 24.0, 38.0, 26.0, 23.0, 20.0, 17.0, 23.0, 15.0, 10.0, 6.0, 10.0, 7.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.61894226074219, -78.90320587158203, -76.18746948242188, -73.47174072265625, -70.7560043334961, -68.04026794433594, -65.32453918457031, -62.608802795410156, -59.89306640625, -57.177330017089844, -54.46159744262695, -51.74586486816406, -49.030128479003906, -46.31439208984375, -43.59865951538086, -40.88292694091797, -38.16719055175781, -35.451454162597656, -32.735721588134766, -30.019987106323242, -27.30425262451172, -24.588518142700195, -21.872783660888672, -19.15704917907715, -16.441314697265625, -13.725580215454102, -11.009845733642578, -8.294111251831055, -5.578376770019531, -2.862642288208008, -0.14690780639648438, 2.568826675415039, 5.284568786621094, 8.000303268432617, 10.71603775024414, 13.431772232055664, 16.147506713867188, 18.86324119567871, 21.578975677490234, 24.294710159301758, 27.01044464111328, 29.726179122924805, 32.44191360473633, 35.15764617919922, 37.873382568359375, 40.58911895751953, 43.30485153198242, 46.02058410644531, 48.73632049560547, 51.452056884765625, 54.167789459228516, 56.883522033691406, 59.59925842285156, 62.31499481201172, 65.03073120117188, 67.7464599609375, 70.46219635009766, 73.17793273925781, 75.89366149902344, 78.6093978881836, 81.32513427734375, 84.0408706665039, 86.75660705566406, 89.47233581542969, 92.18807220458984]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 1.0, 6.0, 1.0, 9.0, 9.0, 12.0, 13.0, 12.0, 13.0, 15.0, 24.0, 29.0, 37.0, 29.0, 34.0, 30.0, 30.0, 53.0, 48.0, 40.0, 44.0, 40.0, 44.0, 42.0, 47.0, 43.0, 37.0, 43.0, 34.0, 30.0, 24.0, 23.0, 15.0, 15.0, 16.0, 7.0, 12.0, 10.0, 6.0, 11.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.76953125, -6.5518798828125, -6.334228515625, -6.1165771484375, -5.89892578125, -5.6812744140625, -5.463623046875, -5.2459716796875, -5.0283203125, -4.8106689453125, -4.593017578125, -4.3753662109375, -4.15771484375, -3.9400634765625, -3.722412109375, -3.5047607421875, -3.287109375, -3.0694580078125, -2.851806640625, -2.6341552734375, -2.41650390625, -2.1988525390625, -1.981201171875, -1.7635498046875, -1.5458984375, -1.3282470703125, -1.110595703125, -0.8929443359375, -0.67529296875, -0.4576416015625, -0.239990234375, -0.0223388671875, 0.1953125, 0.4129638671875, 0.630615234375, 0.8482666015625, 1.06591796875, 1.2835693359375, 1.501220703125, 1.7188720703125, 1.9365234375, 2.1541748046875, 2.371826171875, 2.5894775390625, 2.80712890625, 3.0247802734375, 3.242431640625, 3.4600830078125, 3.677734375, 3.8953857421875, 4.113037109375, 4.3306884765625, 4.54833984375, 4.7659912109375, 4.983642578125, 5.2012939453125, 5.4189453125, 5.6365966796875, 5.854248046875, 6.0718994140625, 6.28955078125, 6.5072021484375, 6.724853515625, 6.9425048828125, 7.16015625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 8.0, 8.0, 7.0, 11.0, 22.0, 39.0, 62.0, 77.0, 99.0, 146.0, 208.0, 279.0, 414.0, 691.0, 1009.0, 1538.0, 2212.0, 3356.0, 5346.0, 8660.0, 13717.0, 22735.0, 38801.0, 68925.0, 130752.0, 322381.0, 202716.0, 94353.0, 51949.0, 29695.0, 17849.0, 11066.0, 6694.0, 4271.0, 2807.0, 1857.0, 1225.0, 808.0, 570.0, 392.0, 260.0, 159.0, 118.0, 91.0, 47.0, 38.0, 23.0, 19.0, 22.0, 14.0, 5.0, 3.0, 5.0, 2.0, 0.0, 4.0, 2.0], "bins": [-1.4755859375, -1.4305419921875, -1.385498046875, -1.3404541015625, -1.29541015625, -1.2503662109375, -1.205322265625, -1.1602783203125, -1.115234375, -1.0701904296875, -1.025146484375, -0.9801025390625, -0.93505859375, -0.8900146484375, -0.844970703125, -0.7999267578125, -0.7548828125, -0.7098388671875, -0.664794921875, -0.6197509765625, -0.57470703125, -0.5296630859375, -0.484619140625, -0.4395751953125, -0.39453125, -0.3494873046875, -0.304443359375, -0.2593994140625, -0.21435546875, -0.1693115234375, -0.124267578125, -0.0792236328125, -0.0341796875, 0.0108642578125, 0.055908203125, 0.1009521484375, 0.14599609375, 0.1910400390625, 0.236083984375, 0.2811279296875, 0.326171875, 0.3712158203125, 0.416259765625, 0.4613037109375, 0.50634765625, 0.5513916015625, 0.596435546875, 0.6414794921875, 0.6865234375, 0.7315673828125, 0.776611328125, 0.8216552734375, 0.86669921875, 0.9117431640625, 0.956787109375, 1.0018310546875, 1.046875, 1.0919189453125, 1.136962890625, 1.1820068359375, 1.22705078125, 1.2720947265625, 1.317138671875, 1.3621826171875, 1.4072265625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 9.0, 8.0, 13.0, 12.0, 17.0, 20.0, 18.0, 19.0, 20.0, 26.0, 23.0, 25.0, 33.0, 31.0, 42.0, 25.0, 36.0, 35.0, 25.0, 36.0, 1060.0, 47.0, 31.0, 43.0, 27.0, 32.0, 39.0, 24.0, 27.0, 26.0, 29.0, 31.0, 22.0, 15.0, 14.0, 15.0, 21.0, 10.0, 9.0, 7.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.9921875, -3.867767333984375, -3.74334716796875, -3.618927001953125, -3.4945068359375, -3.370086669921875, -3.24566650390625, -3.121246337890625, -2.996826171875, -2.872406005859375, -2.74798583984375, -2.623565673828125, -2.4991455078125, -2.374725341796875, -2.25030517578125, -2.125885009765625, -2.00146484375, -1.877044677734375, -1.75262451171875, -1.628204345703125, -1.5037841796875, -1.379364013671875, -1.25494384765625, -1.130523681640625, -1.006103515625, -0.881683349609375, -0.75726318359375, -0.632843017578125, -0.5084228515625, -0.384002685546875, -0.25958251953125, -0.135162353515625, -0.0107421875, 0.113677978515625, 0.23809814453125, 0.362518310546875, 0.4869384765625, 0.611358642578125, 0.73577880859375, 0.860198974609375, 0.984619140625, 1.109039306640625, 1.23345947265625, 1.357879638671875, 1.4822998046875, 1.606719970703125, 1.73114013671875, 1.855560302734375, 1.97998046875, 2.104400634765625, 2.22882080078125, 2.353240966796875, 2.4776611328125, 2.602081298828125, 2.72650146484375, 2.850921630859375, 2.975341796875, 3.099761962890625, 3.22418212890625, 3.348602294921875, 3.4730224609375, 3.597442626953125, 3.72186279296875, 3.846282958984375, 3.970703125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 11.0, 11.0, 14.0, 19.0, 28.0, 50.0, 59.0, 78.0, 126.0, 192.0, 303.0, 446.0, 627.0, 866.0, 1471.0, 2188.0, 3235.0, 4971.0, 7513.0, 11425.0, 17514.0, 26028.0, 40200.0, 63404.0, 111609.0, 1313707.0, 221852.0, 100957.0, 58973.0, 37436.0, 24451.0, 16099.0, 10780.0, 7109.0, 4608.0, 3057.0, 1966.0, 1232.0, 857.0, 534.0, 379.0, 236.0, 178.0, 127.0, 54.0, 44.0, 38.0, 20.0, 19.0, 12.0, 10.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.1904296875, -1.15313720703125, -1.1158447265625, -1.07855224609375, -1.041259765625, -1.00396728515625, -0.9666748046875, -0.92938232421875, -0.89208984375, -0.85479736328125, -0.8175048828125, -0.78021240234375, -0.742919921875, -0.70562744140625, -0.6683349609375, -0.63104248046875, -0.59375, -0.55645751953125, -0.5191650390625, -0.48187255859375, -0.444580078125, -0.40728759765625, -0.3699951171875, -0.33270263671875, -0.29541015625, -0.25811767578125, -0.2208251953125, -0.18353271484375, -0.146240234375, -0.10894775390625, -0.0716552734375, -0.03436279296875, 0.0029296875, 0.04022216796875, 0.0775146484375, 0.11480712890625, 0.152099609375, 0.18939208984375, 0.2266845703125, 0.26397705078125, 0.30126953125, 0.33856201171875, 0.3758544921875, 0.41314697265625, 0.450439453125, 0.48773193359375, 0.5250244140625, 0.56231689453125, 0.599609375, 0.63690185546875, 0.6741943359375, 0.71148681640625, 0.748779296875, 0.78607177734375, 0.8233642578125, 0.86065673828125, 0.89794921875, 0.93524169921875, 0.9725341796875, 1.00982666015625, 1.047119140625, 1.08441162109375, 1.1217041015625, 1.15899658203125, 1.1962890625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 9.0, 7.0, 9.0, 21.0, 14.0, 29.0, 43.0, 57.0, 64.0, 92.0, 110.0, 117.0, 118.0, 57.0, 59.0, 48.0, 47.0, 19.0, 18.0, 12.0, 8.0, 10.0, 7.0, 4.0, 5.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010967254638671875, -0.0010605454444885254, -0.0010243654251098633, -0.0009881854057312012, -0.0009520053863525391, -0.000915825366973877, -0.0008796453475952148, -0.0008434653282165527, -0.0008072853088378906, -0.0007711052894592285, -0.0007349252700805664, -0.0006987452507019043, -0.0006625652313232422, -0.0006263852119445801, -0.000590205192565918, -0.0005540251731872559, -0.0005178451538085938, -0.00048166513442993164, -0.00044548511505126953, -0.0004093050956726074, -0.0003731250762939453, -0.0003369450569152832, -0.0003007650375366211, -0.000264585018157959, -0.00022840499877929688, -0.00019222497940063477, -0.00015604496002197266, -0.00011986494064331055, -8.368492126464844e-05, -4.750490188598633e-05, -1.1324882507324219e-05, 2.485513687133789e-05, 6.103515625e-05, 9.721517562866211e-05, 0.00013339519500732422, 0.00016957521438598633, 0.00020575523376464844, 0.00024193525314331055, 0.00027811527252197266, 0.00031429529190063477, 0.0003504753112792969, 0.000386655330657959, 0.0004228353500366211, 0.0004590153694152832, 0.0004951953887939453, 0.0005313754081726074, 0.0005675554275512695, 0.0006037354469299316, 0.0006399154663085938, 0.0006760954856872559, 0.000712275505065918, 0.0007484555244445801, 0.0007846355438232422, 0.0008208155632019043, 0.0008569955825805664, 0.0008931756019592285, 0.0009293556213378906, 0.0009655356407165527, 0.0010017156600952148, 0.001037895679473877, 0.001074075698852539, 0.0011102557182312012, 0.0011464357376098633, 0.0011826157569885254, 0.0012187957763671875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 4.0, 8.0, 10.0, 15.0, 22.0, 41.0, 81.0, 134.0, 265.0, 583.0, 827419.0, 218846.0, 547.0, 260.0, 128.0, 67.0, 38.0, 22.0, 16.0, 10.0, 7.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03204345703125, -0.03107142448425293, -0.03009939193725586, -0.02912735939025879, -0.02815532684326172, -0.02718329429626465, -0.026211261749267578, -0.025239229202270508, -0.024267196655273438, -0.023295164108276367, -0.022323131561279297, -0.021351099014282227, -0.020379066467285156, -0.019407033920288086, -0.018435001373291016, -0.017462968826293945, -0.016490936279296875, -0.015518903732299805, -0.014546871185302734, -0.013574838638305664, -0.012602806091308594, -0.011630773544311523, -0.010658740997314453, -0.009686708450317383, -0.008714675903320312, -0.007742643356323242, -0.006770610809326172, -0.0057985782623291016, -0.004826545715332031, -0.003854513168334961, -0.0028824806213378906, -0.0019104480743408203, -0.00093841552734375, 3.361701965332031e-05, 0.0010056495666503906, 0.001977682113647461, 0.0029497146606445312, 0.0039217472076416016, 0.004893779754638672, 0.005865812301635742, 0.0068378448486328125, 0.007809877395629883, 0.008781909942626953, 0.009753942489624023, 0.010725975036621094, 0.011698007583618164, 0.012670040130615234, 0.013642072677612305, 0.014614105224609375, 0.015586137771606445, 0.016558170318603516, 0.017530202865600586, 0.018502235412597656, 0.019474267959594727, 0.020446300506591797, 0.021418333053588867, 0.022390365600585938, 0.023362398147583008, 0.024334430694580078, 0.02530646324157715, 0.02627849578857422, 0.02725052833557129, 0.02822256088256836, 0.02919459342956543, 0.0301666259765625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 951.0, 63.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.008962997235357761, -0.008796058595180511, -0.008629119955003262, -0.008462180383503437, -0.008295241743326187, -0.008128303103148937, -0.007961364462971687, -0.00779442535713315, -0.007627486251294613, -0.007460547611117363, -0.007293608505278826, -0.007126669865101576, -0.006959730759263039, -0.006792792119085789, -0.0066258530132472515, -0.006458914373070002, -0.006291975267231464, -0.0061250366270542145, -0.005958097521215677, -0.005791158881038427, -0.00562421977519989, -0.00545728113502264, -0.005290342029184103, -0.005123403389006853, -0.004956464748829603, -0.004789526108652353, -0.004622587002813816, -0.004455648362636566, -0.004288709256798029, -0.004121770616620779, -0.003954831510782242, -0.003787892870604992, -0.0036209532991051674, -0.003454014426097274, -0.0032870755530893803, -0.0031201366800814867, -0.002953197807073593, -0.0027862589340656996, -0.002619320061057806, -0.002452381420880556, -0.0022854425478726625, -0.002118503674864769, -0.0019515648018568754, -0.0017846259288489819, -0.0016176870558410883, -0.0014507481828331947, -0.001283809426240623, -0.0011168705532327294, -0.0009499316802248359, -0.0007829928072169423, -0.0006160539342090487, -0.0004491151194088161, -0.00028217624640092254, -0.00011523737339302897, 5.1701441407203674e-05, 0.00021864031441509724, 0.0003855791874229908, 0.0005525180604308844, 0.0007194569334387779, 0.0008863957482390106, 0.001053334679454565, 0.0012202735524624586, 0.0013872123090550303, 0.001554151182062924, 0.0017210900550708175]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 9.0, 2.0, 1.0, 5.0, 8.0, 10.0, 7.0, 8.0, 15.0, 8.0, 11.0, 16.0, 18.0, 7.0, 20.0, 20.0, 23.0, 31.0, 32.0, 36.0, 39.0, 36.0, 34.0, 39.0, 42.0, 40.0, 44.0, 38.0, 38.0, 41.0, 39.0, 29.0, 35.0, 39.0, 25.0, 17.0, 14.0, 21.0, 21.0, 14.0, 21.0, 16.0, 7.0, 9.0, 3.0, 8.0, 7.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0004317760467529297, -0.00041939225047826767, -0.00040700845420360565, -0.00039462465792894363, -0.0003822408616542816, -0.0003698570653796196, -0.0003574732691049576, -0.00034508947283029556, -0.00033270567655563354, -0.0003203218802809715, -0.0003079380840063095, -0.0002955542877316475, -0.0002831704914569855, -0.00027078669518232346, -0.00025840289890766144, -0.0002460191026329994, -0.0002336353063583374, -0.00022125151008367538, -0.00020886771380901337, -0.00019648391753435135, -0.00018410012125968933, -0.0001717163249850273, -0.0001593325287103653, -0.00014694873243570328, -0.00013456493616104126, -0.00012218113988637924, -0.00010979734361171722, -9.74135473370552e-05, -8.502975106239319e-05, -7.264595478773117e-05, -6.026215851306915e-05, -4.7878362238407135e-05, -3.549456596374512e-05, -2.31107696890831e-05, -1.0726973414421082e-05, 1.6568228602409363e-06, 1.4040619134902954e-05, 2.6424415409564972e-05, 3.880821168422699e-05, 5.119200795888901e-05, 6.357580423355103e-05, 7.595960050821304e-05, 8.834339678287506e-05, 0.00010072719305753708, 0.0001131109893321991, 0.00012549478560686111, 0.00013787858188152313, 0.00015026237815618515, 0.00016264617443084717, 0.00017502997070550919, 0.0001874137669801712, 0.00019979756325483322, 0.00021218135952949524, 0.00022456515580415726, 0.00023694895207881927, 0.0002493327483534813, 0.0002617165446281433, 0.00027410034090280533, 0.00028648413717746735, 0.00029886793345212936, 0.0003112517297267914, 0.0003236355260014534, 0.0003360193222761154, 0.00034840311855077744, 0.00036078691482543945]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 1.0, 6.0, 1.0, 9.0, 9.0, 12.0, 13.0, 12.0, 13.0, 15.0, 24.0, 29.0, 37.0, 29.0, 34.0, 30.0, 30.0, 53.0, 48.0, 40.0, 44.0, 40.0, 44.0, 42.0, 47.0, 43.0, 37.0, 43.0, 34.0, 30.0, 24.0, 23.0, 15.0, 15.0, 16.0, 7.0, 12.0, 10.0, 6.0, 11.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.76953125, -6.5518798828125, -6.334228515625, -6.1165771484375, -5.89892578125, -5.6812744140625, -5.463623046875, -5.2459716796875, -5.0283203125, -4.8106689453125, -4.593017578125, -4.3753662109375, -4.15771484375, -3.9400634765625, -3.722412109375, -3.5047607421875, -3.287109375, -3.0694580078125, -2.851806640625, -2.6341552734375, -2.41650390625, -2.1988525390625, -1.981201171875, -1.7635498046875, -1.5458984375, -1.3282470703125, -1.110595703125, -0.8929443359375, -0.67529296875, -0.4576416015625, -0.239990234375, -0.0223388671875, 0.1953125, 0.4129638671875, 0.630615234375, 0.8482666015625, 1.06591796875, 1.2835693359375, 1.501220703125, 1.7188720703125, 1.9365234375, 2.1541748046875, 2.371826171875, 2.5894775390625, 2.80712890625, 3.0247802734375, 3.242431640625, 3.4600830078125, 3.677734375, 3.8953857421875, 4.113037109375, 4.3306884765625, 4.54833984375, 4.7659912109375, 4.983642578125, 5.2012939453125, 5.4189453125, 5.6365966796875, 5.854248046875, 6.0718994140625, 6.28955078125, 6.5072021484375, 6.724853515625, 6.9425048828125, 7.16015625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 7.0, 4.0, 8.0, 13.0, 17.0, 27.0, 37.0, 39.0, 53.0, 78.0, 123.0, 147.0, 185.0, 286.0, 467.0, 741.0, 1199.0, 2281.0, 4784.0, 11037.0, 28636.0, 89084.0, 381128.0, 387001.0, 90260.0, 28911.0, 11328.0, 4849.0, 2386.0, 1282.0, 678.0, 413.0, 283.0, 250.0, 126.0, 94.0, 77.0, 71.0, 47.0, 34.0, 18.0, 26.0, 15.0, 4.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.2734375, -6.07110595703125, -5.8687744140625, -5.66644287109375, -5.464111328125, -5.26177978515625, -5.0594482421875, -4.85711669921875, -4.65478515625, -4.45245361328125, -4.2501220703125, -4.04779052734375, -3.845458984375, -3.64312744140625, -3.4407958984375, -3.23846435546875, -3.0361328125, -2.83380126953125, -2.6314697265625, -2.42913818359375, -2.226806640625, -2.02447509765625, -1.8221435546875, -1.61981201171875, -1.41748046875, -1.21514892578125, -1.0128173828125, -0.81048583984375, -0.608154296875, -0.40582275390625, -0.2034912109375, -0.00115966796875, 0.201171875, 0.40350341796875, 0.6058349609375, 0.80816650390625, 1.010498046875, 1.21282958984375, 1.4151611328125, 1.61749267578125, 1.81982421875, 2.02215576171875, 2.2244873046875, 2.42681884765625, 2.629150390625, 2.83148193359375, 3.0338134765625, 3.23614501953125, 3.4384765625, 3.64080810546875, 3.8431396484375, 4.04547119140625, 4.247802734375, 4.45013427734375, 4.6524658203125, 4.85479736328125, 5.05712890625, 5.25946044921875, 5.4617919921875, 5.66412353515625, 5.866455078125, 6.06878662109375, 6.2711181640625, 6.47344970703125, 6.67578125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 5.0, 3.0, 8.0, 12.0, 14.0, 14.0, 11.0, 13.0, 24.0, 35.0, 39.0, 36.0, 45.0, 53.0, 48.0, 67.0, 73.0, 148.0, 1841.0, 119.0, 51.0, 55.0, 51.0, 45.0, 42.0, 19.0, 35.0, 36.0, 11.0, 21.0, 15.0, 12.0, 13.0, 8.0, 7.0, 6.0, 4.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.171875, -26.3828125, -25.59375, -24.8046875, -24.015625, -23.2265625, -22.4375, -21.6484375, -20.859375, -20.0703125, -19.28125, -18.4921875, -17.703125, -16.9140625, -16.125, -15.3359375, -14.546875, -13.7578125, -12.96875, -12.1796875, -11.390625, -10.6015625, -9.8125, -9.0234375, -8.234375, -7.4453125, -6.65625, -5.8671875, -5.078125, -4.2890625, -3.5, -2.7109375, -1.921875, -1.1328125, -0.34375, 0.4453125, 1.234375, 2.0234375, 2.8125, 3.6015625, 4.390625, 5.1796875, 5.96875, 6.7578125, 7.546875, 8.3359375, 9.125, 9.9140625, 10.703125, 11.4921875, 12.28125, 13.0703125, 13.859375, 14.6484375, 15.4375, 16.2265625, 17.015625, 17.8046875, 18.59375, 19.3828125, 20.171875, 20.9609375, 21.75, 22.5390625, 23.328125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 1.0, 8.0, 7.0, 5.0, 18.0, 14.0, 14.0, 19.0, 15.0, 36.0, 38.0, 44.0, 64.0, 97.0, 160.0, 337.0, 1057.0, 15048.0, 3114014.0, 12839.0, 965.0, 325.0, 159.0, 96.0, 83.0, 43.0, 52.0, 38.0, 19.0, 18.0, 13.0, 14.0, 13.0, 9.0, 11.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-54.71875, -52.86279296875, -51.0068359375, -49.15087890625, -47.294921875, -45.43896484375, -43.5830078125, -41.72705078125, -39.87109375, -38.01513671875, -36.1591796875, -34.30322265625, -32.447265625, -30.59130859375, -28.7353515625, -26.87939453125, -25.0234375, -23.16748046875, -21.3115234375, -19.45556640625, -17.599609375, -15.74365234375, -13.8876953125, -12.03173828125, -10.17578125, -8.31982421875, -6.4638671875, -4.60791015625, -2.751953125, -0.89599609375, 0.9599609375, 2.81591796875, 4.671875, 6.52783203125, 8.3837890625, 10.23974609375, 12.095703125, 13.95166015625, 15.8076171875, 17.66357421875, 19.51953125, 21.37548828125, 23.2314453125, 25.08740234375, 26.943359375, 28.79931640625, 30.6552734375, 32.51123046875, 34.3671875, 36.22314453125, 38.0791015625, 39.93505859375, 41.791015625, 43.64697265625, 45.5029296875, 47.35888671875, 49.21484375, 51.07080078125, 52.9267578125, 54.78271484375, 56.638671875, 58.49462890625, 60.3505859375, 62.20654296875, 64.0625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 285.0, 731.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.956825256347656, -12.510163307189941, -1.0635013580322266, 10.383159637451172, 21.829822540283203, 33.276485443115234, 44.72314453125, 56.16980743408203, 67.61647033691406, 79.0631332397461, 90.50979614257812, 101.95645141601562, 113.40312194824219, 124.84977722167969, 136.29644775390625, 147.74310302734375, 159.18975830078125, 170.63641357421875, 182.0830841064453, 193.5297393798828, 204.97640991210938, 216.42306518554688, 227.86972045898438, 239.31639099121094, 250.7630615234375, 262.209716796875, 273.6563720703125, 285.1030578613281, 296.5497131347656, 307.9963684082031, 319.4430236816406, 330.88970947265625, 342.3363342285156, 353.7829895019531, 365.2296447753906, 376.67633056640625, 388.12298583984375, 399.56964111328125, 411.01629638671875, 422.46295166015625, 433.9096374511719, 445.3562927246094, 456.8029479980469, 468.2496337890625, 479.6962890625, 491.1429443359375, 502.589599609375, 514.0362548828125, 525.48291015625, 536.9295654296875, 548.376220703125, 559.8228759765625, 571.26953125, 582.7162475585938, 594.1629028320312, 605.6095581054688, 617.0562133789062, 628.5028686523438, 639.9495239257812, 651.3961791992188, 662.8428344726562, 674.28955078125, 685.7362060546875, 697.182861328125, 708.6295166015625]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 1.0, 7.0, 11.0, 8.0, 10.0, 11.0, 17.0, 17.0, 27.0, 22.0, 22.0, 13.0, 33.0, 37.0, 30.0, 34.0, 37.0, 33.0, 32.0, 39.0, 50.0, 43.0, 28.0, 33.0, 27.0, 34.0, 39.0, 42.0, 29.0, 36.0, 23.0, 24.0, 22.0, 28.0, 19.0, 18.0, 14.0, 11.0, 10.0, 9.0, 4.0, 6.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-70.2687759399414, -68.1363525390625, -66.0039291381836, -63.87150192260742, -61.739078521728516, -59.606651306152344, -57.47422790527344, -55.34180450439453, -53.209381103515625, -51.07695770263672, -48.94453048706055, -46.81210708618164, -44.679683685302734, -42.54725646972656, -40.414833068847656, -38.28240966796875, -36.14998245239258, -34.01755905151367, -31.885133743286133, -29.752708435058594, -27.620285034179688, -25.48785972595215, -23.35543441772461, -21.223011016845703, -19.090585708618164, -16.958160400390625, -14.825736999511719, -12.69331169128418, -10.560887336730957, -8.428462982177734, -6.296037673950195, -4.163613319396973, -2.03118896484375, 0.10123562812805176, 2.2336602210998535, 4.366085052490234, 6.498509407043457, 8.63093376159668, 10.763359069824219, 12.895783424377441, 15.028207778930664, 17.160633087158203, 19.29305648803711, 21.42548179626465, 23.557907104492188, 25.690330505371094, 27.822755813598633, 29.955181121826172, 32.08760452270508, 34.220027923583984, 36.352455139160156, 38.48487854003906, 40.61730194091797, 42.749725341796875, 44.88215255737305, 47.01457595825195, 49.147003173828125, 51.27942657470703, 53.4118537902832, 55.54427719116211, 57.676700592041016, 59.80912780761719, 61.941551208496094, 64.073974609375, 66.2063980102539]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 0.0, 2.0, 4.0, 10.0, 14.0, 9.0, 18.0, 8.0, 15.0, 23.0, 19.0, 35.0, 40.0, 35.0, 26.0, 33.0, 43.0, 47.0, 46.0, 47.0, 39.0, 49.0, 52.0, 37.0, 43.0, 40.0, 31.0, 42.0, 30.0, 27.0, 24.0, 19.0, 23.0, 7.0, 8.0, 14.0, 10.0, 1.0, 10.0, 12.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.046875, -6.82208251953125, -6.5972900390625, -6.37249755859375, -6.147705078125, -5.92291259765625, -5.6981201171875, -5.47332763671875, -5.24853515625, -5.02374267578125, -4.7989501953125, -4.57415771484375, -4.349365234375, -4.12457275390625, -3.8997802734375, -3.67498779296875, -3.4501953125, -3.22540283203125, -3.0006103515625, -2.77581787109375, -2.551025390625, -2.32623291015625, -2.1014404296875, -1.87664794921875, -1.65185546875, -1.42706298828125, -1.2022705078125, -0.97747802734375, -0.752685546875, -0.52789306640625, -0.3031005859375, -0.07830810546875, 0.146484375, 0.37127685546875, 0.5960693359375, 0.82086181640625, 1.045654296875, 1.27044677734375, 1.4952392578125, 1.72003173828125, 1.94482421875, 2.16961669921875, 2.3944091796875, 2.61920166015625, 2.843994140625, 3.06878662109375, 3.2935791015625, 3.51837158203125, 3.7431640625, 3.96795654296875, 4.1927490234375, 4.41754150390625, 4.642333984375, 4.86712646484375, 5.0919189453125, 5.31671142578125, 5.54150390625, 5.76629638671875, 5.9910888671875, 6.21588134765625, 6.440673828125, 6.66546630859375, 6.8902587890625, 7.11505126953125, 7.33984375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 3.0, 7.0, 10.0, 12.0, 9.0, 17.0, 22.0, 24.0, 34.0, 37.0, 58.0, 88.0, 126.0, 259.0, 567.0, 2302.0, 27078.0, 1343189.0, 2744764.0, 69807.0, 4206.0, 791.0, 347.0, 153.0, 91.0, 66.0, 48.0, 37.0, 27.0, 21.0, 21.0, 7.0, 10.0, 13.0, 7.0, 4.0, 2.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.171875, -26.270263671875, -25.36865234375, -24.467041015625, -23.5654296875, -22.663818359375, -21.76220703125, -20.860595703125, -19.958984375, -19.057373046875, -18.15576171875, -17.254150390625, -16.3525390625, -15.450927734375, -14.54931640625, -13.647705078125, -12.74609375, -11.844482421875, -10.94287109375, -10.041259765625, -9.1396484375, -8.238037109375, -7.33642578125, -6.434814453125, -5.533203125, -4.631591796875, -3.72998046875, -2.828369140625, -1.9267578125, -1.025146484375, -0.12353515625, 0.778076171875, 1.6796875, 2.581298828125, 3.48291015625, 4.384521484375, 5.2861328125, 6.187744140625, 7.08935546875, 7.990966796875, 8.892578125, 9.794189453125, 10.69580078125, 11.597412109375, 12.4990234375, 13.400634765625, 14.30224609375, 15.203857421875, 16.10546875, 17.007080078125, 17.90869140625, 18.810302734375, 19.7119140625, 20.613525390625, 21.51513671875, 22.416748046875, 23.318359375, 24.219970703125, 25.12158203125, 26.023193359375, 26.9248046875, 27.826416015625, 28.72802734375, 29.629638671875, 30.53125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 6.0, 13.0, 8.0, 16.0, 24.0, 44.0, 65.0, 107.0, 123.0, 224.0, 407.0, 578.0, 662.0, 624.0, 420.0, 262.0, 159.0, 118.0, 66.0, 46.0, 40.0, 19.0, 12.0, 9.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.03125, -33.987548828125, -32.94384765625, -31.900146484375, -30.8564453125, -29.812744140625, -28.76904296875, -27.725341796875, -26.681640625, -25.637939453125, -24.59423828125, -23.550537109375, -22.5068359375, -21.463134765625, -20.41943359375, -19.375732421875, -18.33203125, -17.288330078125, -16.24462890625, -15.200927734375, -14.1572265625, -13.113525390625, -12.06982421875, -11.026123046875, -9.982421875, -8.938720703125, -7.89501953125, -6.851318359375, -5.8076171875, -4.763916015625, -3.72021484375, -2.676513671875, -1.6328125, -0.589111328125, 0.45458984375, 1.498291015625, 2.5419921875, 3.585693359375, 4.62939453125, 5.673095703125, 6.716796875, 7.760498046875, 8.80419921875, 9.847900390625, 10.8916015625, 11.935302734375, 12.97900390625, 14.022705078125, 15.06640625, 16.110107421875, 17.15380859375, 18.197509765625, 19.2412109375, 20.284912109375, 21.32861328125, 22.372314453125, 23.416015625, 24.459716796875, 25.50341796875, 26.547119140625, 27.5908203125, 28.634521484375, 29.67822265625, 30.721923828125, 31.765625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 4.0, 8.0, 3.0, 12.0, 20.0, 46.0, 50.0, 98.0, 183.0, 346.0, 815.0, 9718.0, 4157125.0, 24060.0, 964.0, 379.0, 179.0, 106.0, 59.0, 35.0, 21.0, 19.0, 10.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-133.625, -129.392578125, -125.16015625, -120.927734375, -116.6953125, -112.462890625, -108.23046875, -103.998046875, -99.765625, -95.533203125, -91.30078125, -87.068359375, -82.8359375, -78.603515625, -74.37109375, -70.138671875, -65.90625, -61.673828125, -57.44140625, -53.208984375, -48.9765625, -44.744140625, -40.51171875, -36.279296875, -32.046875, -27.814453125, -23.58203125, -19.349609375, -15.1171875, -10.884765625, -6.65234375, -2.419921875, 1.8125, 6.044921875, 10.27734375, 14.509765625, 18.7421875, 22.974609375, 27.20703125, 31.439453125, 35.671875, 39.904296875, 44.13671875, 48.369140625, 52.6015625, 56.833984375, 61.06640625, 65.298828125, 69.53125, 73.763671875, 77.99609375, 82.228515625, 86.4609375, 90.693359375, 94.92578125, 99.158203125, 103.390625, 107.623046875, 111.85546875, 116.087890625, 120.3203125, 124.552734375, 128.78515625, 133.017578125, 137.25]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 93.0, 489.0, 388.0, 39.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-427.95977783203125, -417.21441650390625, -406.46905517578125, -395.72369384765625, -384.9783020019531, -374.2329406738281, -363.4875793457031, -352.7422180175781, -341.9968566894531, -331.2514953613281, -320.5061340332031, -309.7607421875, -299.015380859375, -288.27001953125, -277.524658203125, -266.779296875, -256.033935546875, -245.28857421875, -234.54319763183594, -223.79783630371094, -213.05247497558594, -202.30709838867188, -191.56173706054688, -180.81637573242188, -170.07098388671875, -159.32562255859375, -148.5802459716797, -137.8348846435547, -127.08952331542969, -116.34415435791016, -105.59878540039062, -94.85342407226562, -84.10806274414062, -73.3626937866211, -62.617332458496094, -51.87196350097656, -41.1265983581543, -30.38123321533203, -19.6358642578125, -8.8905029296875, 1.8548660278320312, 12.600232124328613, 23.345598220825195, 34.090965270996094, 44.83633041381836, 55.581695556640625, 66.32706451416016, 77.07242584228516, 87.81779479980469, 98.56316375732422, 109.30852508544922, 120.05389404296875, 130.79925537109375, 141.54461669921875, 152.2899932861328, 163.0353546142578, 173.78073120117188, 184.52609252929688, 195.27146911621094, 206.01683044433594, 216.76219177246094, 227.507568359375, 238.2529296875, 248.998291015625, 259.74365234375]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 2.0, 2.0, 10.0, 12.0, 4.0, 9.0, 12.0, 17.0, 11.0, 18.0, 24.0, 22.0, 19.0, 30.0, 33.0, 27.0, 43.0, 41.0, 40.0, 34.0, 40.0, 37.0, 39.0, 45.0, 38.0, 38.0, 34.0, 43.0, 20.0, 36.0, 23.0, 28.0, 20.0, 27.0, 17.0, 15.0, 22.0, 13.0, 8.0, 8.0, 6.0, 9.0, 8.0, 4.0, 4.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-83.39867401123047, -80.9155044555664, -78.43234252929688, -75.94917297363281, -73.46601104736328, -70.98284149169922, -68.49967956542969, -66.01651000976562, -63.53334426879883, -61.05017852783203, -58.567012786865234, -56.08384704589844, -53.600677490234375, -51.117515563964844, -48.63434600830078, -46.151180267333984, -43.66801452636719, -41.18484878540039, -38.701683044433594, -36.2185173034668, -33.7353515625, -31.25218391418457, -28.76901626586914, -26.285850524902344, -23.802684783935547, -21.31951904296875, -18.836353302001953, -16.353185653686523, -13.870019912719727, -11.38685417175293, -8.903687477111816, -6.420520782470703, -3.9373550415039062, -1.4541888236999512, 1.028977394104004, 3.512143611907959, 5.995309829711914, 8.478475570678711, 10.961642265319824, 13.444808959960938, 15.927974700927734, 18.41114044189453, 20.894306182861328, 23.377473831176758, 25.860639572143555, 28.34380531311035, 30.82697296142578, 33.31013870239258, 35.793304443359375, 38.27647018432617, 40.75963592529297, 43.242801666259766, 45.72596740722656, 48.209136962890625, 50.69230270385742, 53.17546844482422, 55.658634185791016, 58.14179992675781, 60.62496566772461, 63.108131408691406, 65.59130096435547, 68.074462890625, 70.55763244628906, 73.04080200195312, 75.52396392822266]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 3.0, 5.0, 9.0, 5.0, 8.0, 11.0, 12.0, 13.0, 27.0, 25.0, 32.0, 25.0, 28.0, 29.0, 31.0, 35.0, 43.0, 43.0, 59.0, 46.0, 50.0, 40.0, 45.0, 41.0, 40.0, 45.0, 36.0, 29.0, 33.0, 32.0, 21.0, 20.0, 14.0, 12.0, 11.0, 7.0, 7.0, 5.0, 12.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.63671875, -6.40802001953125, -6.1793212890625, -5.95062255859375, -5.721923828125, -5.49322509765625, -5.2645263671875, -5.03582763671875, -4.80712890625, -4.57843017578125, -4.3497314453125, -4.12103271484375, -3.892333984375, -3.66363525390625, -3.4349365234375, -3.20623779296875, -2.9775390625, -2.74884033203125, -2.5201416015625, -2.29144287109375, -2.062744140625, -1.83404541015625, -1.6053466796875, -1.37664794921875, -1.14794921875, -0.91925048828125, -0.6905517578125, -0.46185302734375, -0.233154296875, -0.00445556640625, 0.2242431640625, 0.45294189453125, 0.681640625, 0.91033935546875, 1.1390380859375, 1.36773681640625, 1.596435546875, 1.82513427734375, 2.0538330078125, 2.28253173828125, 2.51123046875, 2.73992919921875, 2.9686279296875, 3.19732666015625, 3.426025390625, 3.65472412109375, 3.8834228515625, 4.11212158203125, 4.3408203125, 4.56951904296875, 4.7982177734375, 5.02691650390625, 5.255615234375, 5.48431396484375, 5.7130126953125, 5.94171142578125, 6.17041015625, 6.39910888671875, 6.6278076171875, 6.85650634765625, 7.085205078125, 7.31390380859375, 7.5426025390625, 7.77130126953125, 8.0]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 8.0, 24.0, 21.0, 27.0, 57.0, 83.0, 130.0, 200.0, 299.0, 505.0, 870.0, 1522.0, 2466.0, 4316.0, 7781.0, 14582.0, 28074.0, 55665.0, 121605.0, 387125.0, 239193.0, 91332.0, 43710.0, 22129.0, 11602.0, 6533.0, 3565.0, 1981.0, 1152.0, 732.0, 471.0, 282.0, 180.0, 103.0, 67.0, 43.0, 41.0, 19.0, 19.0, 13.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.111328125, -2.0507049560546875, -1.990081787109375, -1.9294586181640625, -1.86883544921875, -1.8082122802734375, -1.747589111328125, -1.6869659423828125, -1.6263427734375, -1.5657196044921875, -1.505096435546875, -1.4444732666015625, -1.38385009765625, -1.3232269287109375, -1.262603759765625, -1.2019805908203125, -1.141357421875, -1.0807342529296875, -1.020111083984375, -0.9594879150390625, -0.89886474609375, -0.8382415771484375, -0.777618408203125, -0.7169952392578125, -0.6563720703125, -0.5957489013671875, -0.535125732421875, -0.4745025634765625, -0.41387939453125, -0.3532562255859375, -0.292633056640625, -0.2320098876953125, -0.17138671875, -0.1107635498046875, -0.050140380859375, 0.0104827880859375, 0.07110595703125, 0.1317291259765625, 0.192352294921875, 0.2529754638671875, 0.3135986328125, 0.3742218017578125, 0.434844970703125, 0.4954681396484375, 0.55609130859375, 0.6167144775390625, 0.677337646484375, 0.7379608154296875, 0.798583984375, 0.8592071533203125, 0.919830322265625, 0.9804534912109375, 1.04107666015625, 1.1016998291015625, 1.162322998046875, 1.2229461669921875, 1.2835693359375, 1.3441925048828125, 1.404815673828125, 1.4654388427734375, 1.52606201171875, 1.5866851806640625, 1.647308349609375, 1.7079315185546875, 1.7685546875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 6.0, 17.0, 9.0, 10.0, 15.0, 21.0, 25.0, 15.0, 26.0, 33.0, 18.0, 26.0, 30.0, 34.0, 25.0, 27.0, 44.0, 39.0, 38.0, 1065.0, 42.0, 40.0, 38.0, 30.0, 28.0, 43.0, 41.0, 33.0, 29.0, 16.0, 21.0, 16.0, 18.0, 21.0, 16.0, 13.0, 10.0, 7.0, 6.0, 9.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.75390625, -3.6300048828125, -3.506103515625, -3.3822021484375, -3.25830078125, -3.1343994140625, -3.010498046875, -2.8865966796875, -2.7626953125, -2.6387939453125, -2.514892578125, -2.3909912109375, -2.26708984375, -2.1431884765625, -2.019287109375, -1.8953857421875, -1.771484375, -1.6475830078125, -1.523681640625, -1.3997802734375, -1.27587890625, -1.1519775390625, -1.028076171875, -0.9041748046875, -0.7802734375, -0.6563720703125, -0.532470703125, -0.4085693359375, -0.28466796875, -0.1607666015625, -0.036865234375, 0.0870361328125, 0.2109375, 0.3348388671875, 0.458740234375, 0.5826416015625, 0.70654296875, 0.8304443359375, 0.954345703125, 1.0782470703125, 1.2021484375, 1.3260498046875, 1.449951171875, 1.5738525390625, 1.69775390625, 1.8216552734375, 1.945556640625, 2.0694580078125, 2.193359375, 2.3172607421875, 2.441162109375, 2.5650634765625, 2.68896484375, 2.8128662109375, 2.936767578125, 3.0606689453125, 3.1845703125, 3.3084716796875, 3.432373046875, 3.5562744140625, 3.68017578125, 3.8040771484375, 3.927978515625, 4.0518798828125, 4.17578125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 6.0, 14.0, 12.0, 19.0, 28.0, 32.0, 55.0, 72.0, 107.0, 160.0, 229.0, 321.0, 472.0, 687.0, 1032.0, 1436.0, 2217.0, 3348.0, 5038.0, 7602.0, 11536.0, 17220.0, 26723.0, 41439.0, 65789.0, 119141.0, 1351990.0, 196766.0, 90732.0, 53601.0, 33867.0, 22095.0, 14564.0, 9845.0, 6282.0, 4288.0, 2810.0, 1754.0, 1232.0, 847.0, 520.0, 372.0, 286.0, 170.0, 115.0, 92.0, 43.0, 37.0, 27.0, 18.0, 13.0, 8.0, 6.0, 9.0, 4.0, 2.0, 3.0], "bins": [-1.2529296875, -1.215850830078125, -1.17877197265625, -1.141693115234375, -1.1046142578125, -1.067535400390625, -1.03045654296875, -0.993377685546875, -0.956298828125, -0.919219970703125, -0.88214111328125, -0.845062255859375, -0.8079833984375, -0.770904541015625, -0.73382568359375, -0.696746826171875, -0.65966796875, -0.622589111328125, -0.58551025390625, -0.548431396484375, -0.5113525390625, -0.474273681640625, -0.43719482421875, -0.400115966796875, -0.363037109375, -0.325958251953125, -0.28887939453125, -0.251800537109375, -0.2147216796875, -0.177642822265625, -0.14056396484375, -0.103485107421875, -0.06640625, -0.029327392578125, 0.00775146484375, 0.044830322265625, 0.0819091796875, 0.118988037109375, 0.15606689453125, 0.193145751953125, 0.230224609375, 0.267303466796875, 0.30438232421875, 0.341461181640625, 0.3785400390625, 0.415618896484375, 0.45269775390625, 0.489776611328125, 0.52685546875, 0.563934326171875, 0.60101318359375, 0.638092041015625, 0.6751708984375, 0.712249755859375, 0.74932861328125, 0.786407470703125, 0.823486328125, 0.860565185546875, 0.89764404296875, 0.934722900390625, 0.9718017578125, 1.008880615234375, 1.04595947265625, 1.083038330078125, 1.1201171875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 7.0, 5.0, 5.0, 2.0, 9.0, 11.0, 14.0, 25.0, 20.0, 22.0, 35.0, 68.0, 60.0, 59.0, 58.0, 86.0, 92.0, 80.0, 67.0, 56.0, 43.0, 36.0, 44.0, 24.0, 26.0, 12.0, 4.0, 8.0, 10.0, 6.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007781982421875, -0.0007513165473937988, -0.0007244348526000977, -0.0006975531578063965, -0.0006706714630126953, -0.0006437897682189941, -0.000616908073425293, -0.0005900263786315918, -0.0005631446838378906, -0.0005362629890441895, -0.0005093812942504883, -0.0004824995994567871, -0.00045561790466308594, -0.00042873620986938477, -0.0004018545150756836, -0.0003749728202819824, -0.00034809112548828125, -0.0003212094306945801, -0.0002943277359008789, -0.00026744604110717773, -0.00024056434631347656, -0.0002136826515197754, -0.00018680095672607422, -0.00015991926193237305, -0.00013303756713867188, -0.0001061558723449707, -7.927417755126953e-05, -5.239248275756836e-05, -2.5510787963867188e-05, 1.3709068298339844e-06, 2.8252601623535156e-05, 5.513429641723633e-05, 8.20159912109375e-05, 0.00010889768600463867, 0.00013577938079833984, 0.00016266107559204102, 0.0001895427703857422, 0.00021642446517944336, 0.00024330615997314453, 0.0002701878547668457, 0.0002970695495605469, 0.00032395124435424805, 0.0003508329391479492, 0.0003777146339416504, 0.00040459632873535156, 0.00043147802352905273, 0.0004583597183227539, 0.0004852414131164551, 0.0005121231079101562, 0.0005390048027038574, 0.0005658864974975586, 0.0005927681922912598, 0.0006196498870849609, 0.0006465315818786621, 0.0006734132766723633, 0.0007002949714660645, 0.0007271766662597656, 0.0007540583610534668, 0.000780940055847168, 0.0008078217506408691, 0.0008347034454345703, 0.0008615851402282715, 0.0008884668350219727, 0.0009153485298156738, 0.000942230224609375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 5.0, 6.0, 8.0, 17.0, 22.0, 26.0, 41.0, 52.0, 95.0, 134.0, 240.0, 522.0, 13457.0, 1032175.0, 903.0, 347.0, 200.0, 99.0, 51.0, 35.0, 27.0, 20.0, 18.0, 16.0, 4.0, 6.0, 4.0, 4.0, 1.0, 8.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0267791748046875, -0.02604055404663086, -0.02530193328857422, -0.024563312530517578, -0.023824691772460938, -0.023086071014404297, -0.022347450256347656, -0.021608829498291016, -0.020870208740234375, -0.020131587982177734, -0.019392967224121094, -0.018654346466064453, -0.017915725708007812, -0.017177104949951172, -0.01643848419189453, -0.01569986343383789, -0.01496124267578125, -0.01422262191772461, -0.013484001159667969, -0.012745380401611328, -0.012006759643554688, -0.011268138885498047, -0.010529518127441406, -0.009790897369384766, -0.009052276611328125, -0.008313655853271484, -0.007575035095214844, -0.006836414337158203, -0.0060977935791015625, -0.005359172821044922, -0.004620552062988281, -0.0038819313049316406, -0.003143310546875, -0.0024046897888183594, -0.0016660690307617188, -0.0009274482727050781, -0.0001888275146484375, 0.0005497932434082031, 0.0012884140014648438, 0.0020270347595214844, 0.002765655517578125, 0.0035042762756347656, 0.004242897033691406, 0.004981517791748047, 0.0057201385498046875, 0.006458759307861328, 0.007197380065917969, 0.00793600082397461, 0.00867462158203125, 0.00941324234008789, 0.010151863098144531, 0.010890483856201172, 0.011629104614257812, 0.012367725372314453, 0.013106346130371094, 0.013844966888427734, 0.014583587646484375, 0.015322208404541016, 0.016060829162597656, 0.016799449920654297, 0.017538070678710938, 0.018276691436767578, 0.01901531219482422, 0.01975393295288086, 0.0204925537109375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 11.0, 141.0, 542.0, 293.0, 29.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00044134899508208036, -0.0003753548371605575, -0.00030936067923903465, -0.00024336649221368134, -0.00017737233429215848, -0.00011137817637063563, -4.5383989345282316e-05, 2.061016857624054e-05, 8.66043264977634e-05, 0.00015259848441928625, 0.00021859265689272434, 0.0002845868293661624, 0.0003505809872876853, 0.00041657514520920813, 0.00048256933223456144, 0.0005485634901560843, 0.0006145576480776072, 0.00068055180599913, 0.0007465459639206529, 0.0008125401800498366, 0.0008785342797636986, 0.0009445284958928823, 0.0010105227120220661, 0.001076516811735928, 0.00114251091144979, 0.0012085051275789738, 0.0012744992272928357, 0.0013404934434220195, 0.0014064875431358814, 0.0014724817592650652, 0.001538475975394249, 0.001604470075108111, 0.0016704641748219728, 0.0017364583909511566, 0.0018024524906650186, 0.0018684467067942023, 0.0019344408065080643, 0.002000435022637248, 0.002066429238766432, 0.002132423222064972, 0.0021984174381941557, 0.0022644116543233395, 0.0023304058704525232, 0.0023963998537510633, 0.002462394069880247, 0.002528388286009431, 0.0025943825021386147, 0.0026603764854371548, 0.002726370934396982, 0.002792365150526166, 0.0028583593666553497, 0.00292435334995389, 0.0029903475660830736, 0.0030563417822122574, 0.003122335998341441, 0.003188330214470625, 0.003254324197769165, 0.003320318413898349, 0.0033863126300275326, 0.0034523066133260727, 0.0035183008294552565, 0.0035842950455844402, 0.003650289261713624, 0.0037162834778428078, 0.003782277461141348]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 8.0, 8.0, 7.0, 15.0, 13.0, 15.0, 19.0, 17.0, 23.0, 20.0, 24.0, 21.0, 27.0, 42.0, 40.0, 36.0, 51.0, 34.0, 38.0, 39.0, 50.0, 50.0, 46.0, 40.0, 27.0, 32.0, 30.0, 35.0, 40.0, 19.0, 22.0, 21.0, 11.0, 20.0, 9.0, 9.0, 5.0, 9.0, 5.0, 6.0, 1.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003440380096435547, -0.00033304188400506973, -0.0003220457583665848, -0.0003110496327280998, -0.00030005350708961487, -0.0002890573814511299, -0.00027806125581264496, -0.00026706513017416, -0.00025606900453567505, -0.0002450728788971901, -0.00023407675325870514, -0.00022308062762022018, -0.00021208450198173523, -0.00020108837634325027, -0.00019009225070476532, -0.00017909612506628036, -0.0001680999994277954, -0.00015710387378931046, -0.0001461077481508255, -0.00013511162251234055, -0.0001241154968738556, -0.00011311937123537064, -0.00010212324559688568, -9.112711995840073e-05, -8.013099431991577e-05, -6.913486868143082e-05, -5.813874304294586e-05, -4.714261740446091e-05, -3.614649176597595e-05, -2.5150366127490997e-05, -1.4154240489006042e-05, -3.1581148505210876e-06, 7.838010787963867e-06, 1.8834136426448822e-05, 2.9830262064933777e-05, 4.082638770341873e-05, 5.1822513341903687e-05, 6.281863898038864e-05, 7.38147646188736e-05, 8.481089025735855e-05, 9.58070158958435e-05, 0.00010680314153432846, 0.00011779926717281342, 0.00012879539281129837, 0.00013979151844978333, 0.00015078764408826828, 0.00016178376972675323, 0.0001727798953652382, 0.00018377602100372314, 0.0001947721466422081, 0.00020576827228069305, 0.000216764397919178, 0.00022776052355766296, 0.00023875664919614792, 0.0002497527748346329, 0.00026074890047311783, 0.0002717450261116028, 0.00028274115175008774, 0.0002937372773885727, 0.00030473340302705765, 0.0003157295286655426, 0.00032672565430402756, 0.0003377217799425125, 0.00034871790558099747, 0.0003597140312194824]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 3.0, 5.0, 9.0, 5.0, 8.0, 11.0, 12.0, 13.0, 27.0, 25.0, 32.0, 25.0, 28.0, 29.0, 31.0, 35.0, 43.0, 43.0, 59.0, 46.0, 50.0, 40.0, 46.0, 40.0, 40.0, 45.0, 36.0, 29.0, 33.0, 32.0, 21.0, 20.0, 14.0, 12.0, 11.0, 7.0, 7.0, 5.0, 12.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.63671875, -6.40802001953125, -6.1793212890625, -5.95062255859375, -5.721923828125, -5.49322509765625, -5.2645263671875, -5.03582763671875, -4.80712890625, -4.57843017578125, -4.3497314453125, -4.12103271484375, -3.892333984375, -3.66363525390625, -3.4349365234375, -3.20623779296875, -2.9775390625, -2.74884033203125, -2.5201416015625, -2.29144287109375, -2.062744140625, -1.83404541015625, -1.6053466796875, -1.37664794921875, -1.14794921875, -0.91925048828125, -0.6905517578125, -0.46185302734375, -0.233154296875, -0.00445556640625, 0.2242431640625, 0.45294189453125, 0.681640625, 0.91033935546875, 1.1390380859375, 1.36773681640625, 1.596435546875, 1.82513427734375, 2.0538330078125, 2.28253173828125, 2.51123046875, 2.73992919921875, 2.9686279296875, 3.19732666015625, 3.426025390625, 3.65472412109375, 3.8834228515625, 4.11212158203125, 4.3408203125, 4.56951904296875, 4.7982177734375, 5.02691650390625, 5.255615234375, 5.48431396484375, 5.7130126953125, 5.94171142578125, 6.17041015625, 6.39910888671875, 6.6278076171875, 6.85650634765625, 7.085205078125, 7.31390380859375, 7.5426025390625, 7.77130126953125, 8.0]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 6.0, 22.0, 16.0, 31.0, 27.0, 45.0, 62.0, 90.0, 128.0, 204.0, 297.0, 457.0, 689.0, 1226.0, 1940.0, 3679.0, 7024.0, 15121.0, 36158.0, 97834.0, 329411.0, 373157.0, 107849.0, 39597.0, 16362.0, 7709.0, 3851.0, 2201.0, 1165.0, 720.0, 484.0, 315.0, 206.0, 149.0, 89.0, 72.0, 52.0, 27.0, 19.0, 20.0, 12.0, 11.0, 5.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41796875, -4.265869140625, -4.11376953125, -3.961669921875, -3.8095703125, -3.657470703125, -3.50537109375, -3.353271484375, -3.201171875, -3.049072265625, -2.89697265625, -2.744873046875, -2.5927734375, -2.440673828125, -2.28857421875, -2.136474609375, -1.984375, -1.832275390625, -1.68017578125, -1.528076171875, -1.3759765625, -1.223876953125, -1.07177734375, -0.919677734375, -0.767578125, -0.615478515625, -0.46337890625, -0.311279296875, -0.1591796875, -0.007080078125, 0.14501953125, 0.297119140625, 0.44921875, 0.601318359375, 0.75341796875, 0.905517578125, 1.0576171875, 1.209716796875, 1.36181640625, 1.513916015625, 1.666015625, 1.818115234375, 1.97021484375, 2.122314453125, 2.2744140625, 2.426513671875, 2.57861328125, 2.730712890625, 2.8828125, 3.034912109375, 3.18701171875, 3.339111328125, 3.4912109375, 3.643310546875, 3.79541015625, 3.947509765625, 4.099609375, 4.251708984375, 4.40380859375, 4.555908203125, 4.7080078125, 4.860107421875, 5.01220703125, 5.164306640625, 5.31640625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 7.0, 7.0, 8.0, 12.0, 17.0, 15.0, 23.0, 23.0, 26.0, 27.0, 34.0, 36.0, 39.0, 45.0, 52.0, 66.0, 176.0, 1851.0, 133.0, 62.0, 52.0, 49.0, 44.0, 37.0, 37.0, 30.0, 25.0, 24.0, 19.0, 15.0, 8.0, 13.0, 14.0, 6.0, 9.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.390625, -27.5146484375, -26.638671875, -25.7626953125, -24.88671875, -24.0107421875, -23.134765625, -22.2587890625, -21.3828125, -20.5068359375, -19.630859375, -18.7548828125, -17.87890625, -17.0029296875, -16.126953125, -15.2509765625, -14.375, -13.4990234375, -12.623046875, -11.7470703125, -10.87109375, -9.9951171875, -9.119140625, -8.2431640625, -7.3671875, -6.4912109375, -5.615234375, -4.7392578125, -3.86328125, -2.9873046875, -2.111328125, -1.2353515625, -0.359375, 0.5166015625, 1.392578125, 2.2685546875, 3.14453125, 4.0205078125, 4.896484375, 5.7724609375, 6.6484375, 7.5244140625, 8.400390625, 9.2763671875, 10.15234375, 11.0283203125, 11.904296875, 12.7802734375, 13.65625, 14.5322265625, 15.408203125, 16.2841796875, 17.16015625, 18.0361328125, 18.912109375, 19.7880859375, 20.6640625, 21.5400390625, 22.416015625, 23.2919921875, 24.16796875, 25.0439453125, 25.919921875, 26.7958984375, 27.671875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 7.0, 12.0, 14.0, 9.0, 9.0, 16.0, 21.0, 22.0, 22.0, 38.0, 55.0, 55.0, 104.0, 174.0, 295.0, 822.0, 6493.0, 2874184.0, 259279.0, 2786.0, 548.0, 254.0, 141.0, 90.0, 40.0, 45.0, 36.0, 23.0, 24.0, 21.0, 16.0, 12.0, 10.0, 8.0, 8.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.3125, -44.8583984375, -43.404296875, -41.9501953125, -40.49609375, -39.0419921875, -37.587890625, -36.1337890625, -34.6796875, -33.2255859375, -31.771484375, -30.3173828125, -28.86328125, -27.4091796875, -25.955078125, -24.5009765625, -23.046875, -21.5927734375, -20.138671875, -18.6845703125, -17.23046875, -15.7763671875, -14.322265625, -12.8681640625, -11.4140625, -9.9599609375, -8.505859375, -7.0517578125, -5.59765625, -4.1435546875, -2.689453125, -1.2353515625, 0.21875, 1.6728515625, 3.126953125, 4.5810546875, 6.03515625, 7.4892578125, 8.943359375, 10.3974609375, 11.8515625, 13.3056640625, 14.759765625, 16.2138671875, 17.66796875, 19.1220703125, 20.576171875, 22.0302734375, 23.484375, 24.9384765625, 26.392578125, 27.8466796875, 29.30078125, 30.7548828125, 32.208984375, 33.6630859375, 35.1171875, 36.5712890625, 38.025390625, 39.4794921875, 40.93359375, 42.3876953125, 43.841796875, 45.2958984375, 46.75]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [25.0, 677.0, 315.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.908289909362793, -5.010406017303467, 0.8874778747558594, 6.785361289978027, 12.683245658874512, 18.581130981445312, 24.47901153564453, 30.376895904541016, 36.2747802734375, 42.172664642333984, 48.07054901123047, 53.96842956542969, 59.86631774902344, 65.76419830322266, 71.66207885742188, 77.55996704101562, 83.45785522460938, 89.3557357788086, 95.25362396240234, 101.15150451660156, 107.04939270019531, 112.94727325439453, 118.84515380859375, 124.7430419921875, 130.64093017578125, 136.538818359375, 142.4366912841797, 148.33457946777344, 154.2324676513672, 160.13035583496094, 166.02822875976562, 171.92611694335938, 177.82398986816406, 183.7218780517578, 189.6197509765625, 195.51763916015625, 201.41552734375, 207.31341552734375, 213.21128845214844, 219.1091766357422, 225.00706481933594, 230.9049530029297, 236.80282592773438, 242.70071411132812, 248.59860229492188, 254.49649047851562, 260.3943786621094, 266.292236328125, 272.19012451171875, 278.0880126953125, 283.98590087890625, 289.8837890625, 295.7816467285156, 301.6795349121094, 307.5774230957031, 313.4753112792969, 319.3731994628906, 325.2710876464844, 331.1689758300781, 337.0668640136719, 342.9647216796875, 348.86260986328125, 354.760498046875, 360.65838623046875, 366.5562744140625]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 10.0, 7.0, 15.0, 8.0, 13.0, 16.0, 13.0, 32.0, 17.0, 33.0, 24.0, 25.0, 28.0, 32.0, 31.0, 31.0, 36.0, 39.0, 56.0, 38.0, 39.0, 43.0, 36.0, 49.0, 32.0, 29.0, 32.0, 34.0, 25.0, 27.0, 21.0, 19.0, 21.0, 16.0, 14.0, 12.0, 7.0, 8.0, 3.0, 2.0, 5.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-71.33573150634766, -68.8845443725586, -66.433349609375, -63.98215866088867, -61.530967712402344, -59.079776763916016, -56.62858581542969, -54.177398681640625, -51.72620391845703, -49.2750129699707, -46.823822021484375, -44.37263107299805, -41.92144012451172, -39.47024917602539, -37.01905822753906, -34.56787109375, -32.11668014526367, -29.665489196777344, -27.214298248291016, -24.763107299804688, -22.31191635131836, -19.86072540283203, -17.409536361694336, -14.958345413208008, -12.50715446472168, -10.055963516235352, -7.604773044586182, -5.153582572937012, -2.7023916244506836, -0.25120067596435547, 2.1999893188476562, 4.651180267333984, 7.1023712158203125, 9.55356216430664, 12.004753112792969, 14.45594310760498, 16.907135009765625, 19.358325958251953, 21.80951499938965, 24.260705947875977, 26.711896896362305, 29.163087844848633, 31.61427879333496, 34.065467834472656, 36.516658782958984, 38.96784973144531, 41.41904067993164, 43.87023162841797, 46.3214225769043, 48.772613525390625, 51.22380447387695, 53.67499542236328, 56.12618637084961, 58.57737731933594, 61.028564453125, 63.479759216308594, 65.93094635009766, 68.38213348388672, 70.83332824707031, 73.28451538085938, 75.73571014404297, 78.18689727783203, 80.63809204101562, 83.08927917480469, 85.54047393798828]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 7.0, 4.0, 5.0, 7.0, 9.0, 14.0, 10.0, 28.0, 22.0, 26.0, 25.0, 24.0, 31.0, 35.0, 29.0, 45.0, 47.0, 46.0, 49.0, 45.0, 46.0, 39.0, 51.0, 39.0, 47.0, 42.0, 26.0, 39.0, 26.0, 28.0, 22.0, 18.0, 9.0, 13.0, 7.0, 7.0, 7.0, 13.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.79296875, -6.55511474609375, -6.3172607421875, -6.07940673828125, -5.841552734375, -5.60369873046875, -5.3658447265625, -5.12799072265625, -4.89013671875, -4.65228271484375, -4.4144287109375, -4.17657470703125, -3.938720703125, -3.70086669921875, -3.4630126953125, -3.22515869140625, -2.9873046875, -2.74945068359375, -2.5115966796875, -2.27374267578125, -2.035888671875, -1.79803466796875, -1.5601806640625, -1.32232666015625, -1.08447265625, -0.84661865234375, -0.6087646484375, -0.37091064453125, -0.133056640625, 0.10479736328125, 0.3426513671875, 0.58050537109375, 0.818359375, 1.05621337890625, 1.2940673828125, 1.53192138671875, 1.769775390625, 2.00762939453125, 2.2454833984375, 2.48333740234375, 2.72119140625, 2.95904541015625, 3.1968994140625, 3.43475341796875, 3.672607421875, 3.91046142578125, 4.1483154296875, 4.38616943359375, 4.6240234375, 4.86187744140625, 5.0997314453125, 5.33758544921875, 5.575439453125, 5.81329345703125, 6.0511474609375, 6.28900146484375, 6.52685546875, 6.76470947265625, 7.0025634765625, 7.24041748046875, 7.478271484375, 7.71612548828125, 7.9539794921875, 8.19183349609375, 8.4296875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 4.0, 5.0, 7.0, 14.0, 10.0, 12.0, 20.0, 28.0, 17.0, 30.0, 34.0, 24.0, 33.0, 50.0, 77.0, 209.0, 1232.0, 105644.0, 4037595.0, 47708.0, 961.0, 174.0, 84.0, 42.0, 40.0, 40.0, 36.0, 27.0, 21.0, 16.0, 12.0, 16.0, 11.0, 11.0, 8.0, 10.0, 7.0, 7.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.78125, -43.20654296875, -41.6318359375, -40.05712890625, -38.482421875, -36.90771484375, -35.3330078125, -33.75830078125, -32.18359375, -30.60888671875, -29.0341796875, -27.45947265625, -25.884765625, -24.31005859375, -22.7353515625, -21.16064453125, -19.5859375, -18.01123046875, -16.4365234375, -14.86181640625, -13.287109375, -11.71240234375, -10.1376953125, -8.56298828125, -6.98828125, -5.41357421875, -3.8388671875, -2.26416015625, -0.689453125, 0.88525390625, 2.4599609375, 4.03466796875, 5.609375, 7.18408203125, 8.7587890625, 10.33349609375, 11.908203125, 13.48291015625, 15.0576171875, 16.63232421875, 18.20703125, 19.78173828125, 21.3564453125, 22.93115234375, 24.505859375, 26.08056640625, 27.6552734375, 29.22998046875, 30.8046875, 32.37939453125, 33.9541015625, 35.52880859375, 37.103515625, 38.67822265625, 40.2529296875, 41.82763671875, 43.40234375, 44.97705078125, 46.5517578125, 48.12646484375, 49.701171875, 51.27587890625, 52.8505859375, 54.42529296875, 56.0]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 5.0, 4.0, 9.0, 14.0, 19.0, 33.0, 37.0, 65.0, 88.0, 124.0, 162.0, 209.0, 369.0, 481.0, 610.0, 539.0, 429.0, 279.0, 194.0, 125.0, 90.0, 60.0, 41.0, 37.0, 23.0, 10.0, 7.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.359375, -24.55908203125, -23.7587890625, -22.95849609375, -22.158203125, -21.35791015625, -20.5576171875, -19.75732421875, -18.95703125, -18.15673828125, -17.3564453125, -16.55615234375, -15.755859375, -14.95556640625, -14.1552734375, -13.35498046875, -12.5546875, -11.75439453125, -10.9541015625, -10.15380859375, -9.353515625, -8.55322265625, -7.7529296875, -6.95263671875, -6.15234375, -5.35205078125, -4.5517578125, -3.75146484375, -2.951171875, -2.15087890625, -1.3505859375, -0.55029296875, 0.25, 1.05029296875, 1.8505859375, 2.65087890625, 3.451171875, 4.25146484375, 5.0517578125, 5.85205078125, 6.65234375, 7.45263671875, 8.2529296875, 9.05322265625, 9.853515625, 10.65380859375, 11.4541015625, 12.25439453125, 13.0546875, 13.85498046875, 14.6552734375, 15.45556640625, 16.255859375, 17.05615234375, 17.8564453125, 18.65673828125, 19.45703125, 20.25732421875, 21.0576171875, 21.85791015625, 22.658203125, 23.45849609375, 24.2587890625, 25.05908203125, 25.859375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 5.0, 8.0, 13.0, 12.0, 25.0, 40.0, 64.0, 98.0, 125.0, 153.0, 296.0, 673.0, 7922.0, 4113725.0, 68962.0, 1061.0, 423.0, 215.0, 149.0, 107.0, 69.0, 57.0, 31.0, 15.0, 15.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.6875, -114.939453125, -111.19140625, -107.443359375, -103.6953125, -99.947265625, -96.19921875, -92.451171875, -88.703125, -84.955078125, -81.20703125, -77.458984375, -73.7109375, -69.962890625, -66.21484375, -62.466796875, -58.71875, -54.970703125, -51.22265625, -47.474609375, -43.7265625, -39.978515625, -36.23046875, -32.482421875, -28.734375, -24.986328125, -21.23828125, -17.490234375, -13.7421875, -9.994140625, -6.24609375, -2.498046875, 1.25, 4.998046875, 8.74609375, 12.494140625, 16.2421875, 19.990234375, 23.73828125, 27.486328125, 31.234375, 34.982421875, 38.73046875, 42.478515625, 46.2265625, 49.974609375, 53.72265625, 57.470703125, 61.21875, 64.966796875, 68.71484375, 72.462890625, 76.2109375, 79.958984375, 83.70703125, 87.455078125, 91.203125, 94.951171875, 98.69921875, 102.447265625, 106.1953125, 109.943359375, 113.69140625, 117.439453125, 121.1875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 7.0, 50.0, 243.0, 398.0, 239.0, 76.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.334232330322266, -26.81269645690918, -19.291160583496094, -11.769622802734375, -4.248086929321289, 3.273448944091797, 10.794986724853516, 18.31652069091797, 25.838058471679688, 33.359596252441406, 40.88113021850586, 48.40266799926758, 55.92420196533203, 63.44573974609375, 70.96727752685547, 78.48881530761719, 86.01034545898438, 93.5318832397461, 101.05342102050781, 108.574951171875, 116.09648895263672, 123.61802673339844, 131.13955688476562, 138.66110229492188, 146.18264770507812, 153.7041778564453, 161.22572326660156, 168.74725341796875, 176.268798828125, 183.7903289794922, 191.31185913085938, 198.83340454101562, 206.3549346923828, 213.87646484375, 221.39801025390625, 228.91954040527344, 236.4410858154297, 243.96261596679688, 251.48416137695312, 259.00567626953125, 266.5272216796875, 274.04876708984375, 281.5702819824219, 289.0918273925781, 296.6133728027344, 304.1348876953125, 311.65643310546875, 319.177978515625, 326.69952392578125, 334.2210693359375, 341.7425842285156, 349.2641296386719, 356.7856750488281, 364.30718994140625, 371.8287353515625, 379.35028076171875, 386.8717956542969, 394.3933410644531, 401.91485595703125, 409.4364013671875, 416.95794677734375, 424.4794921875, 432.0010070800781, 439.5225524902344, 447.0440979003906]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 8.0, 9.0, 8.0, 10.0, 13.0, 23.0, 16.0, 21.0, 25.0, 33.0, 36.0, 42.0, 32.0, 34.0, 48.0, 55.0, 43.0, 47.0, 43.0, 59.0, 45.0, 32.0, 52.0, 38.0, 33.0, 24.0, 30.0, 29.0, 18.0, 21.0, 17.0, 11.0, 12.0, 8.0, 8.0, 4.0, 7.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.67984008789062, -78.16622924804688, -75.6526107788086, -73.13899993896484, -70.62538146972656, -68.11177062988281, -65.59815979003906, -63.08454513549805, -60.57093048095703, -58.057315826416016, -55.543701171875, -53.03009033203125, -50.516475677490234, -48.00286102294922, -45.48925018310547, -42.97563552856445, -40.46202087402344, -37.94840621948242, -35.434791564941406, -32.921180725097656, -30.40756607055664, -27.893951416015625, -25.380338668823242, -22.86672592163086, -20.353111267089844, -17.839496612548828, -15.325883865356445, -12.812270164489746, -10.298656463623047, -7.785042762756348, -5.271429061889648, -2.7578163146972656, -0.24420166015625, 2.269412040710449, 4.783025741577148, 7.296639442443848, 9.810253143310547, 12.323866844177246, 14.837480545043945, 17.351093292236328, 19.864707946777344, 22.37832260131836, 24.891935348510742, 27.405548095703125, 29.91916275024414, 32.432777404785156, 34.946388244628906, 37.46000289916992, 39.97361755371094, 42.48723220825195, 45.00084686279297, 47.51445770263672, 50.028072357177734, 52.54168701171875, 55.0552978515625, 57.568912506103516, 60.08252716064453, 62.59614181518555, 65.10975646972656, 67.62336730957031, 70.13697814941406, 72.65059661865234, 75.1642074584961, 77.67782592773438, 80.19143676757812]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 1.0, 3.0, 5.0, 1.0, 2.0, 5.0, 5.0, 6.0, 8.0, 16.0, 25.0, 17.0, 18.0, 26.0, 24.0, 25.0, 31.0, 34.0, 39.0, 36.0, 38.0, 32.0, 53.0, 56.0, 51.0, 45.0, 53.0, 37.0, 42.0, 40.0, 31.0, 24.0, 26.0, 38.0, 20.0, 18.0, 13.0, 17.0, 11.0, 12.0, 8.0, 4.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.51171875, -7.26715087890625, -7.0225830078125, -6.77801513671875, -6.533447265625, -6.28887939453125, -6.0443115234375, -5.79974365234375, -5.55517578125, -5.31060791015625, -5.0660400390625, -4.82147216796875, -4.576904296875, -4.33233642578125, -4.0877685546875, -3.84320068359375, -3.5986328125, -3.35406494140625, -3.1094970703125, -2.86492919921875, -2.620361328125, -2.37579345703125, -2.1312255859375, -1.88665771484375, -1.64208984375, -1.39752197265625, -1.1529541015625, -0.90838623046875, -0.663818359375, -0.41925048828125, -0.1746826171875, 0.06988525390625, 0.314453125, 0.55902099609375, 0.8035888671875, 1.04815673828125, 1.292724609375, 1.53729248046875, 1.7818603515625, 2.02642822265625, 2.27099609375, 2.51556396484375, 2.7601318359375, 3.00469970703125, 3.249267578125, 3.49383544921875, 3.7384033203125, 3.98297119140625, 4.2275390625, 4.47210693359375, 4.7166748046875, 4.96124267578125, 5.205810546875, 5.45037841796875, 5.6949462890625, 5.93951416015625, 6.18408203125, 6.42864990234375, 6.6732177734375, 6.91778564453125, 7.162353515625, 7.40692138671875, 7.6514892578125, 7.89605712890625, 8.140625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 9.0, 7.0, 22.0, 26.0, 29.0, 53.0, 104.0, 133.0, 193.0, 267.0, 432.0, 706.0, 1060.0, 1687.0, 2667.0, 4313.0, 7242.0, 11720.0, 19212.0, 32732.0, 55794.0, 101187.0, 241158.0, 302030.0, 113499.0, 61926.0, 35551.0, 21373.0, 12805.0, 7790.0, 4815.0, 2894.0, 1874.0, 1142.0, 757.0, 471.0, 313.0, 190.0, 132.0, 86.0, 49.0, 42.0, 19.0, 14.0, 13.0, 8.0, 4.0, 3.0, 8.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.6923828125, -1.6412353515625, -1.590087890625, -1.5389404296875, -1.48779296875, -1.4366455078125, -1.385498046875, -1.3343505859375, -1.283203125, -1.2320556640625, -1.180908203125, -1.1297607421875, -1.07861328125, -1.0274658203125, -0.976318359375, -0.9251708984375, -0.8740234375, -0.8228759765625, -0.771728515625, -0.7205810546875, -0.66943359375, -0.6182861328125, -0.567138671875, -0.5159912109375, -0.46484375, -0.4136962890625, -0.362548828125, -0.3114013671875, -0.26025390625, -0.2091064453125, -0.157958984375, -0.1068115234375, -0.0556640625, -0.0045166015625, 0.046630859375, 0.0977783203125, 0.14892578125, 0.2000732421875, 0.251220703125, 0.3023681640625, 0.353515625, 0.4046630859375, 0.455810546875, 0.5069580078125, 0.55810546875, 0.6092529296875, 0.660400390625, 0.7115478515625, 0.7626953125, 0.8138427734375, 0.864990234375, 0.9161376953125, 0.96728515625, 1.0184326171875, 1.069580078125, 1.1207275390625, 1.171875, 1.2230224609375, 1.274169921875, 1.3253173828125, 1.37646484375, 1.4276123046875, 1.478759765625, 1.5299072265625, 1.5810546875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 4.0, 6.0, 3.0, 16.0, 14.0, 16.0, 14.0, 15.0, 19.0, 17.0, 23.0, 31.0, 33.0, 24.0, 47.0, 39.0, 48.0, 50.0, 41.0, 30.0, 1059.0, 46.0, 45.0, 42.0, 48.0, 35.0, 43.0, 31.0, 18.0, 22.0, 19.0, 26.0, 26.0, 14.0, 15.0, 11.0, 8.0, 7.0, 5.0, 1.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.5523681640625, -4.401611328125, -4.2508544921875, -4.10009765625, -3.9493408203125, -3.798583984375, -3.6478271484375, -3.4970703125, -3.3463134765625, -3.195556640625, -3.0447998046875, -2.89404296875, -2.7432861328125, -2.592529296875, -2.4417724609375, -2.291015625, -2.1402587890625, -1.989501953125, -1.8387451171875, -1.68798828125, -1.5372314453125, -1.386474609375, -1.2357177734375, -1.0849609375, -0.9342041015625, -0.783447265625, -0.6326904296875, -0.48193359375, -0.3311767578125, -0.180419921875, -0.0296630859375, 0.12109375, 0.2718505859375, 0.422607421875, 0.5733642578125, 0.72412109375, 0.8748779296875, 1.025634765625, 1.1763916015625, 1.3271484375, 1.4779052734375, 1.628662109375, 1.7794189453125, 1.93017578125, 2.0809326171875, 2.231689453125, 2.3824462890625, 2.533203125, 2.6839599609375, 2.834716796875, 2.9854736328125, 3.13623046875, 3.2869873046875, 3.437744140625, 3.5885009765625, 3.7392578125, 3.8900146484375, 4.040771484375, 4.1915283203125, 4.34228515625, 4.4930419921875, 4.643798828125, 4.7945556640625, 4.9453125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 5.0, 10.0, 21.0, 20.0, 32.0, 63.0, 70.0, 102.0, 166.0, 256.0, 381.0, 556.0, 856.0, 1356.0, 2098.0, 3220.0, 5162.0, 8163.0, 12801.0, 19909.0, 32079.0, 54170.0, 101795.0, 243446.0, 1340452.0, 115369.0, 59608.0, 35108.0, 21575.0, 13675.0, 8746.0, 5634.0, 3654.0, 2258.0, 1481.0, 973.0, 604.0, 409.0, 298.0, 179.0, 108.0, 78.0, 60.0, 43.0, 25.0, 18.0, 14.0, 5.0, 8.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-1.5048828125, -1.4593963623046875, -1.413909912109375, -1.3684234619140625, -1.32293701171875, -1.2774505615234375, -1.231964111328125, -1.1864776611328125, -1.1409912109375, -1.0955047607421875, -1.050018310546875, -1.0045318603515625, -0.95904541015625, -0.9135589599609375, -0.868072509765625, -0.8225860595703125, -0.777099609375, -0.7316131591796875, -0.686126708984375, -0.6406402587890625, -0.59515380859375, -0.5496673583984375, -0.504180908203125, -0.4586944580078125, -0.4132080078125, -0.3677215576171875, -0.322235107421875, -0.2767486572265625, -0.23126220703125, -0.1857757568359375, -0.140289306640625, -0.0948028564453125, -0.04931640625, -0.0038299560546875, 0.041656494140625, 0.0871429443359375, 0.13262939453125, 0.1781158447265625, 0.223602294921875, 0.2690887451171875, 0.3145751953125, 0.3600616455078125, 0.405548095703125, 0.4510345458984375, 0.49652099609375, 0.5420074462890625, 0.587493896484375, 0.6329803466796875, 0.678466796875, 0.7239532470703125, 0.769439697265625, 0.8149261474609375, 0.86041259765625, 0.9058990478515625, 0.951385498046875, 0.9968719482421875, 1.0423583984375, 1.0878448486328125, 1.133331298828125, 1.1788177490234375, 1.22430419921875, 1.2697906494140625, 1.315277099609375, 1.3607635498046875, 1.40625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 5.0, 6.0, 5.0, 8.0, 11.0, 9.0, 6.0, 7.0, 11.0, 20.0, 20.0, 22.0, 28.0, 32.0, 37.0, 54.0, 54.0, 63.0, 58.0, 78.0, 68.0, 74.0, 61.0, 44.0, 42.0, 31.0, 28.0, 17.0, 19.0, 12.0, 10.0, 5.0, 9.0, 10.0, 7.0, 8.0, 9.0, 3.0, 4.0, 2.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007925033569335938, -0.0007638037204742432, -0.0007351040840148926, -0.000706404447555542, -0.0006777048110961914, -0.0006490051746368408, -0.0006203055381774902, -0.0005916059017181396, -0.0005629062652587891, -0.0005342066287994385, -0.0005055069923400879, -0.0004768073558807373, -0.0004481077194213867, -0.00041940808296203613, -0.00039070844650268555, -0.00036200881004333496, -0.0003333091735839844, -0.0003046095371246338, -0.0002759099006652832, -0.0002472102642059326, -0.00021851062774658203, -0.00018981099128723145, -0.00016111135482788086, -0.00013241171836853027, -0.00010371208190917969, -7.50124454498291e-05, -4.6312808990478516e-05, -1.761317253112793e-05, 1.1086463928222656e-05, 3.978610038757324e-05, 6.848573684692383e-05, 9.718537330627441e-05, 0.000125885009765625, 0.00015458464622497559, 0.00018328428268432617, 0.00021198391914367676, 0.00024068355560302734, 0.00026938319206237793, 0.0002980828285217285, 0.0003267824649810791, 0.0003554821014404297, 0.0003841817378997803, 0.00041288137435913086, 0.00044158101081848145, 0.00047028064727783203, 0.0004989802837371826, 0.0005276799201965332, 0.0005563795566558838, 0.0005850791931152344, 0.000613778829574585, 0.0006424784660339355, 0.0006711781024932861, 0.0006998777389526367, 0.0007285773754119873, 0.0007572770118713379, 0.0007859766483306885, 0.0008146762847900391, 0.0008433759212493896, 0.0008720755577087402, 0.0009007751941680908, 0.0009294748306274414, 0.000958174467086792, 0.0009868741035461426, 0.0010155737400054932, 0.0010442733764648438]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 6.0, 1.0, 3.0, 3.0, 3.0, 8.0, 8.0, 13.0, 11.0, 15.0, 15.0, 25.0, 31.0, 60.0, 90.0, 153.0, 206.0, 398.0, 1301.0, 1034390.0, 10475.0, 563.0, 299.0, 156.0, 84.0, 49.0, 40.0, 34.0, 28.0, 12.0, 11.0, 13.0, 12.0, 8.0, 7.0, 7.0, 9.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.02764892578125, -0.026874303817749023, -0.026099681854248047, -0.02532505989074707, -0.024550437927246094, -0.023775815963745117, -0.02300119400024414, -0.022226572036743164, -0.021451950073242188, -0.02067732810974121, -0.019902706146240234, -0.019128084182739258, -0.01835346221923828, -0.017578840255737305, -0.016804218292236328, -0.01602959632873535, -0.015254974365234375, -0.014480352401733398, -0.013705730438232422, -0.012931108474731445, -0.012156486511230469, -0.011381864547729492, -0.010607242584228516, -0.009832620620727539, -0.009057998657226562, -0.008283376693725586, -0.007508754730224609, -0.006734132766723633, -0.005959510803222656, -0.00518488883972168, -0.004410266876220703, -0.0036356449127197266, -0.00286102294921875, -0.0020864009857177734, -0.0013117790222167969, -0.0005371570587158203, 0.00023746490478515625, 0.0010120868682861328, 0.0017867088317871094, 0.002561330795288086, 0.0033359527587890625, 0.004110574722290039, 0.004885196685791016, 0.005659818649291992, 0.006434440612792969, 0.007209062576293945, 0.007983684539794922, 0.008758306503295898, 0.009532928466796875, 0.010307550430297852, 0.011082172393798828, 0.011856794357299805, 0.012631416320800781, 0.013406038284301758, 0.014180660247802734, 0.014955282211303711, 0.015729904174804688, 0.016504526138305664, 0.01727914810180664, 0.018053770065307617, 0.018828392028808594, 0.01960301399230957, 0.020377635955810547, 0.021152257919311523, 0.0219268798828125]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 25.0, 126.0, 361.0, 370.0, 102.0, 22.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010926652466878295, -0.0010429599788039923, -0.0009932545945048332, -0.000943549326620996, -0.0008938440587371588, -0.0008441387326456606, -0.0007944334065541625, -0.0007447281386703253, -0.0006950228125788271, -0.000645317486487329, -0.0005956122186034918, -0.0005459068925119936, -0.0004962015664204955, -0.0004464962985366583, -0.00039679097244516015, -0.00034708567545749247, -0.0002973803784698248, -0.0002476750814821571, -0.0001979697699425742, -0.0001482644584029913, -9.855916141532362e-05, -4.8853864427655935e-05, 8.514616638422012e-07, 5.055675865150988e-05, 0.00010026205563917756, 0.00014996735262684524, 0.00019967266416642815, 0.00024937797570601106, 0.00029908327269367874, 0.0003487885696813464, 0.00039849389577284455, 0.00044819919276051223, 0.0004979046061635017, 0.0005476099322549999, 0.0005973152001388371, 0.0006470205262303352, 0.0006967257941141725, 0.0007464311202056706, 0.0007961364462971687, 0.000845841714181006, 0.0008955470402725041, 0.0009452523663640022, 0.0009949576342478395, 0.0010446629021316767, 0.0010943682864308357, 0.001144073554314673, 0.0011937788221985102, 0.0012434842064976692, 0.0012931894743815064, 0.0013428947422653437, 0.0013926001265645027, 0.00144230539444834, 0.0014920106623321772, 0.0015417160466313362, 0.0015914213145151734, 0.0016411265823990107, 0.0016908319666981697, 0.001740537234582007, 0.001790242618881166, 0.0018399478867650032, 0.0018896531546488404, 0.0019393584225326777, 0.0019890638068318367, 0.0020387691911309958, 0.002088474342599511]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 6.0, 8.0, 6.0, 7.0, 10.0, 16.0, 14.0, 18.0, 23.0, 29.0, 28.0, 23.0, 38.0, 34.0, 38.0, 30.0, 37.0, 41.0, 35.0, 49.0, 29.0, 42.0, 45.0, 37.0, 32.0, 35.0, 44.0, 30.0, 20.0, 28.0, 25.0, 14.0, 23.0, 12.0, 15.0, 9.0, 10.0, 9.0, 8.0, 2.0, 9.0, 7.0, 6.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00045108795166015625, -0.0004370715469121933, -0.00042305514216423035, -0.0004090387374162674, -0.00039502233266830444, -0.0003810059279203415, -0.00036698952317237854, -0.0003529731184244156, -0.00033895671367645264, -0.0003249403089284897, -0.00031092390418052673, -0.0002969074994325638, -0.00028289109468460083, -0.0002688746899366379, -0.0002548582851886749, -0.00024084188044071198, -0.00022682547569274902, -0.00021280907094478607, -0.00019879266619682312, -0.00018477626144886017, -0.00017075985670089722, -0.00015674345195293427, -0.0001427270472049713, -0.00012871064245700836, -0.00011469423770904541, -0.00010067783296108246, -8.666142821311951e-05, -7.264502346515656e-05, -5.8628618717193604e-05, -4.461221396923065e-05, -3.05958092212677e-05, -1.657940447330475e-05, -2.562999725341797e-06, 1.1453405022621155e-05, 2.5469809770584106e-05, 3.948621451854706e-05, 5.350261926651001e-05, 6.751902401447296e-05, 8.153542876243591e-05, 9.555183351039886e-05, 0.00010956823825836182, 0.00012358464300632477, 0.00013760104775428772, 0.00015161745250225067, 0.00016563385725021362, 0.00017965026199817657, 0.00019366666674613953, 0.00020768307149410248, 0.00022169947624206543, 0.00023571588099002838, 0.00024973228573799133, 0.0002637486904859543, 0.00027776509523391724, 0.0002917814999818802, 0.00030579790472984314, 0.0003198143094778061, 0.00033383071422576904, 0.000347847118973732, 0.00036186352372169495, 0.0003758799284696579, 0.00038989633321762085, 0.0004039127379655838, 0.00041792914271354675, 0.0004319455474615097, 0.00044596195220947266]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 1.0, 3.0, 5.0, 1.0, 2.0, 5.0, 5.0, 6.0, 8.0, 16.0, 25.0, 17.0, 18.0, 26.0, 24.0, 25.0, 31.0, 34.0, 39.0, 36.0, 38.0, 32.0, 53.0, 56.0, 51.0, 46.0, 52.0, 37.0, 42.0, 40.0, 31.0, 24.0, 26.0, 38.0, 20.0, 18.0, 13.0, 17.0, 11.0, 12.0, 8.0, 4.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.51171875, -7.26715087890625, -7.0225830078125, -6.77801513671875, -6.533447265625, -6.28887939453125, -6.0443115234375, -5.79974365234375, -5.55517578125, -5.31060791015625, -5.0660400390625, -4.82147216796875, -4.576904296875, -4.33233642578125, -4.0877685546875, -3.84320068359375, -3.5986328125, -3.35406494140625, -3.1094970703125, -2.86492919921875, -2.620361328125, -2.37579345703125, -2.1312255859375, -1.88665771484375, -1.64208984375, -1.39752197265625, -1.1529541015625, -0.90838623046875, -0.663818359375, -0.41925048828125, -0.1746826171875, 0.06988525390625, 0.314453125, 0.55902099609375, 0.8035888671875, 1.04815673828125, 1.292724609375, 1.53729248046875, 1.7818603515625, 2.02642822265625, 2.27099609375, 2.51556396484375, 2.7601318359375, 3.00469970703125, 3.249267578125, 3.49383544921875, 3.7384033203125, 3.98297119140625, 4.2275390625, 4.47210693359375, 4.7166748046875, 4.96124267578125, 5.205810546875, 5.45037841796875, 5.6949462890625, 5.93951416015625, 6.18408203125, 6.42864990234375, 6.6732177734375, 6.91778564453125, 7.162353515625, 7.40692138671875, 7.6514892578125, 7.89605712890625, 8.140625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 14.0, 8.0, 11.0, 19.0, 33.0, 32.0, 48.0, 57.0, 90.0, 134.0, 195.0, 336.0, 504.0, 752.0, 1282.0, 2255.0, 4323.0, 9113.0, 22236.0, 74943.0, 407461.0, 408919.0, 74233.0, 22378.0, 9089.0, 4228.0, 2302.0, 1276.0, 761.0, 512.0, 306.0, 213.0, 138.0, 103.0, 66.0, 55.0, 44.0, 23.0, 23.0, 8.0, 6.0, 9.0, 3.0, 3.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.08984375, -5.8995361328125, -5.709228515625, -5.5189208984375, -5.32861328125, -5.1383056640625, -4.947998046875, -4.7576904296875, -4.5673828125, -4.3770751953125, -4.186767578125, -3.9964599609375, -3.80615234375, -3.6158447265625, -3.425537109375, -3.2352294921875, -3.044921875, -2.8546142578125, -2.664306640625, -2.4739990234375, -2.28369140625, -2.0933837890625, -1.903076171875, -1.7127685546875, -1.5224609375, -1.3321533203125, -1.141845703125, -0.9515380859375, -0.76123046875, -0.5709228515625, -0.380615234375, -0.1903076171875, 0.0, 0.1903076171875, 0.380615234375, 0.5709228515625, 0.76123046875, 0.9515380859375, 1.141845703125, 1.3321533203125, 1.5224609375, 1.7127685546875, 1.903076171875, 2.0933837890625, 2.28369140625, 2.4739990234375, 2.664306640625, 2.8546142578125, 3.044921875, 3.2352294921875, 3.425537109375, 3.6158447265625, 3.80615234375, 3.9964599609375, 4.186767578125, 4.3770751953125, 4.5673828125, 4.7576904296875, 4.947998046875, 5.1383056640625, 5.32861328125, 5.5189208984375, 5.709228515625, 5.8995361328125, 6.08984375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 6.0, 10.0, 14.0, 11.0, 9.0, 12.0, 22.0, 29.0, 23.0, 25.0, 31.0, 34.0, 38.0, 29.0, 52.0, 47.0, 98.0, 1726.0, 308.0, 73.0, 62.0, 49.0, 53.0, 40.0, 35.0, 27.0, 33.0, 23.0, 20.0, 17.0, 17.0, 11.0, 5.0, 13.0, 9.0, 7.0, 5.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-27.0625, -26.262451171875, -25.46240234375, -24.662353515625, -23.8623046875, -23.062255859375, -22.26220703125, -21.462158203125, -20.662109375, -19.862060546875, -19.06201171875, -18.261962890625, -17.4619140625, -16.661865234375, -15.86181640625, -15.061767578125, -14.26171875, -13.461669921875, -12.66162109375, -11.861572265625, -11.0615234375, -10.261474609375, -9.46142578125, -8.661376953125, -7.861328125, -7.061279296875, -6.26123046875, -5.461181640625, -4.6611328125, -3.861083984375, -3.06103515625, -2.260986328125, -1.4609375, -0.660888671875, 0.13916015625, 0.939208984375, 1.7392578125, 2.539306640625, 3.33935546875, 4.139404296875, 4.939453125, 5.739501953125, 6.53955078125, 7.339599609375, 8.1396484375, 8.939697265625, 9.73974609375, 10.539794921875, 11.33984375, 12.139892578125, 12.93994140625, 13.739990234375, 14.5400390625, 15.340087890625, 16.14013671875, 16.940185546875, 17.740234375, 18.540283203125, 19.34033203125, 20.140380859375, 20.9404296875, 21.740478515625, 22.54052734375, 23.340576171875, 24.140625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 5.0, 5.0, 5.0, 13.0, 13.0, 5.0, 13.0, 14.0, 19.0, 24.0, 30.0, 46.0, 52.0, 73.0, 109.0, 166.0, 240.0, 605.0, 3074.0, 225950.0, 2907865.0, 5649.0, 784.0, 335.0, 159.0, 118.0, 76.0, 49.0, 37.0, 30.0, 30.0, 26.0, 16.0, 13.0, 10.0, 13.0, 9.0, 5.0, 7.0, 6.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.1875, -38.853515625, -37.51953125, -36.185546875, -34.8515625, -33.517578125, -32.18359375, -30.849609375, -29.515625, -28.181640625, -26.84765625, -25.513671875, -24.1796875, -22.845703125, -21.51171875, -20.177734375, -18.84375, -17.509765625, -16.17578125, -14.841796875, -13.5078125, -12.173828125, -10.83984375, -9.505859375, -8.171875, -6.837890625, -5.50390625, -4.169921875, -2.8359375, -1.501953125, -0.16796875, 1.166015625, 2.5, 3.833984375, 5.16796875, 6.501953125, 7.8359375, 9.169921875, 10.50390625, 11.837890625, 13.171875, 14.505859375, 15.83984375, 17.173828125, 18.5078125, 19.841796875, 21.17578125, 22.509765625, 23.84375, 25.177734375, 26.51171875, 27.845703125, 29.1796875, 30.513671875, 31.84765625, 33.181640625, 34.515625, 35.849609375, 37.18359375, 38.517578125, 39.8515625, 41.185546875, 42.51953125, 43.853515625, 45.1875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 10.0, 20.0, 33.0, 63.0, 92.0, 173.0, 220.0, 165.0, 119.0, 58.0, 33.0, 15.0, 5.0, 2.0, 0.0, 0.0, 3.0], "bins": [-42.61725997924805, -41.82050323486328, -41.023746490478516, -40.22698974609375, -39.430233001708984, -38.63347625732422, -37.83671951293945, -37.03996276855469, -36.24320602416992, -35.446449279785156, -34.64969253540039, -33.852935791015625, -33.05617904663086, -32.259422302246094, -31.462665557861328, -30.665908813476562, -29.86915397644043, -29.072397232055664, -28.2756404876709, -27.478883743286133, -26.682126998901367, -25.8853702545166, -25.08861541748047, -24.291858673095703, -23.495101928710938, -22.698345184326172, -21.901588439941406, -21.10483169555664, -20.308074951171875, -19.51131820678711, -18.714561462402344, -17.917804718017578, -17.121047973632812, -16.324291229248047, -15.527534484863281, -14.730777740478516, -13.93402099609375, -13.137264251708984, -12.340508460998535, -11.54375171661377, -10.74699592590332, -9.950239181518555, -9.153482437133789, -8.356725692749023, -7.559969425201416, -6.76321268081665, -5.966456413269043, -5.169699668884277, -4.372942924499512, -3.576186180114746, -2.7794296741485596, -1.982673168182373, -1.1859164237976074, -0.3891596794128418, 0.4075965881347656, 1.2043533325195312, 2.001110076904297, 2.7978668212890625, 3.594623327255249, 4.3913798332214355, 5.188136577606201, 5.984893321990967, 6.781649589538574, 7.57840633392334, 8.375163078308105]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 5.0, 5.0, 11.0, 11.0, 12.0, 15.0, 15.0, 18.0, 21.0, 15.0, 26.0, 23.0, 32.0, 30.0, 28.0, 27.0, 42.0, 38.0, 42.0, 26.0, 33.0, 36.0, 44.0, 43.0, 42.0, 38.0, 30.0, 36.0, 31.0, 20.0, 21.0, 23.0, 28.0, 18.0, 22.0, 13.0, 15.0, 13.0, 13.0, 7.0, 7.0, 6.0, 1.0, 3.0, 3.0, 7.0, 3.0, 3.0, 0.0, 1.0], "bins": [-80.3304443359375, -78.02043151855469, -75.7104263305664, -73.4004135131836, -71.09040069580078, -68.7803955078125, -66.47038269042969, -64.16036987304688, -61.85036087036133, -59.54035186767578, -57.23033905029297, -54.92033004760742, -52.610321044921875, -50.30030822753906, -47.990299224853516, -45.68029022216797, -43.370277404785156, -41.06026840209961, -38.7502555847168, -36.44024658203125, -34.13023376464844, -31.82022476196289, -29.510215759277344, -27.200204849243164, -24.890193939208984, -22.580183029174805, -20.270172119140625, -17.960163116455078, -15.650152206420898, -13.340141296386719, -11.030131340026855, -8.720121383666992, -6.410118103027344, -4.100107669830322, -1.7900972366333008, 0.5199131965637207, 2.829923629760742, 5.139934539794922, 7.449944496154785, 9.759954452514648, 12.069965362548828, 14.379976272583008, 16.689987182617188, 18.999996185302734, 21.310007095336914, 23.620018005371094, 25.93002700805664, 28.24003791809082, 30.550048828125, 32.86005783081055, 35.17007064819336, 37.480079650878906, 39.79009246826172, 42.100101470947266, 44.41011047363281, 46.720123291015625, 49.03013229370117, 51.34014129638672, 53.65015411376953, 55.96016311645508, 58.270172119140625, 60.58018493652344, 62.890193939208984, 65.20020294189453, 67.51021575927734]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 7.0, 7.0, 12.0, 16.0, 19.0, 25.0, 27.0, 25.0, 14.0, 34.0, 35.0, 32.0, 33.0, 40.0, 39.0, 41.0, 49.0, 59.0, 50.0, 46.0, 51.0, 36.0, 43.0, 40.0, 29.0, 21.0, 32.0, 25.0, 23.0, 10.0, 19.0, 12.0, 15.0, 10.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.60546875, -7.35418701171875, -7.1029052734375, -6.85162353515625, -6.600341796875, -6.34906005859375, -6.0977783203125, -5.84649658203125, -5.59521484375, -5.34393310546875, -5.0926513671875, -4.84136962890625, -4.590087890625, -4.33880615234375, -4.0875244140625, -3.83624267578125, -3.5849609375, -3.33367919921875, -3.0823974609375, -2.83111572265625, -2.579833984375, -2.32855224609375, -2.0772705078125, -1.82598876953125, -1.57470703125, -1.32342529296875, -1.0721435546875, -0.82086181640625, -0.569580078125, -0.31829833984375, -0.0670166015625, 0.18426513671875, 0.435546875, 0.68682861328125, 0.9381103515625, 1.18939208984375, 1.440673828125, 1.69195556640625, 1.9432373046875, 2.19451904296875, 2.44580078125, 2.69708251953125, 2.9483642578125, 3.19964599609375, 3.450927734375, 3.70220947265625, 3.9534912109375, 4.20477294921875, 4.4560546875, 4.70733642578125, 4.9586181640625, 5.20989990234375, 5.461181640625, 5.71246337890625, 5.9637451171875, 6.21502685546875, 6.46630859375, 6.71759033203125, 6.9688720703125, 7.22015380859375, 7.471435546875, 7.72271728515625, 7.9739990234375, 8.22528076171875, 8.4765625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 2.0, 1.0, 8.0, 7.0, 9.0, 13.0, 22.0, 27.0, 32.0, 33.0, 65.0, 105.0, 192.0, 312.0, 772.0, 2565.0, 13217.0, 108481.0, 1381685.0, 2365755.0, 288430.0, 25970.0, 4423.0, 1090.0, 463.0, 209.0, 127.0, 75.0, 48.0, 37.0, 29.0, 25.0, 18.0, 10.0, 10.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.859375, -16.30078125, -15.7421875, -15.18359375, -14.625, -14.06640625, -13.5078125, -12.94921875, -12.390625, -11.83203125, -11.2734375, -10.71484375, -10.15625, -9.59765625, -9.0390625, -8.48046875, -7.921875, -7.36328125, -6.8046875, -6.24609375, -5.6875, -5.12890625, -4.5703125, -4.01171875, -3.453125, -2.89453125, -2.3359375, -1.77734375, -1.21875, -0.66015625, -0.1015625, 0.45703125, 1.015625, 1.57421875, 2.1328125, 2.69140625, 3.25, 3.80859375, 4.3671875, 4.92578125, 5.484375, 6.04296875, 6.6015625, 7.16015625, 7.71875, 8.27734375, 8.8359375, 9.39453125, 9.953125, 10.51171875, 11.0703125, 11.62890625, 12.1875, 12.74609375, 13.3046875, 13.86328125, 14.421875, 14.98046875, 15.5390625, 16.09765625, 16.65625, 17.21484375, 17.7734375, 18.33203125, 18.890625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 4.0, 5.0, 14.0, 21.0, 41.0, 58.0, 66.0, 84.0, 154.0, 245.0, 406.0, 590.0, 690.0, 559.0, 412.0, 275.0, 156.0, 110.0, 64.0, 46.0, 19.0, 14.0, 13.0, 12.0, 7.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.59375, -27.654296875, -26.71484375, -25.775390625, -24.8359375, -23.896484375, -22.95703125, -22.017578125, -21.078125, -20.138671875, -19.19921875, -18.259765625, -17.3203125, -16.380859375, -15.44140625, -14.501953125, -13.5625, -12.623046875, -11.68359375, -10.744140625, -9.8046875, -8.865234375, -7.92578125, -6.986328125, -6.046875, -5.107421875, -4.16796875, -3.228515625, -2.2890625, -1.349609375, -0.41015625, 0.529296875, 1.46875, 2.408203125, 3.34765625, 4.287109375, 5.2265625, 6.166015625, 7.10546875, 8.044921875, 8.984375, 9.923828125, 10.86328125, 11.802734375, 12.7421875, 13.681640625, 14.62109375, 15.560546875, 16.5, 17.439453125, 18.37890625, 19.318359375, 20.2578125, 21.197265625, 22.13671875, 23.076171875, 24.015625, 24.955078125, 25.89453125, 26.833984375, 27.7734375, 28.712890625, 29.65234375, 30.591796875, 31.53125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 3.0, 5.0, 8.0, 11.0, 12.0, 29.0, 42.0, 54.0, 97.0, 114.0, 216.0, 373.0, 1573.0, 93694.0, 4085363.0, 11001.0, 843.0, 298.0, 171.0, 128.0, 69.0, 55.0, 30.0, 26.0, 16.0, 19.0, 10.0, 7.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.0625, -78.5439453125, -75.025390625, -71.5068359375, -67.98828125, -64.4697265625, -60.951171875, -57.4326171875, -53.9140625, -50.3955078125, -46.876953125, -43.3583984375, -39.83984375, -36.3212890625, -32.802734375, -29.2841796875, -25.765625, -22.2470703125, -18.728515625, -15.2099609375, -11.69140625, -8.1728515625, -4.654296875, -1.1357421875, 2.3828125, 5.9013671875, 9.419921875, 12.9384765625, 16.45703125, 19.9755859375, 23.494140625, 27.0126953125, 30.53125, 34.0498046875, 37.568359375, 41.0869140625, 44.60546875, 48.1240234375, 51.642578125, 55.1611328125, 58.6796875, 62.1982421875, 65.716796875, 69.2353515625, 72.75390625, 76.2724609375, 79.791015625, 83.3095703125, 86.828125, 90.3466796875, 93.865234375, 97.3837890625, 100.90234375, 104.4208984375, 107.939453125, 111.4580078125, 114.9765625, 118.4951171875, 122.013671875, 125.5322265625, 129.05078125, 132.5693359375, 136.087890625, 139.6064453125, 143.125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 9.0, 36.0, 166.0, 303.0, 299.0, 157.0, 34.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-284.6612854003906, -277.87799072265625, -271.0946960449219, -264.3114013671875, -257.5281066894531, -250.74481201171875, -243.96151733398438, -237.17823791503906, -230.3949432373047, -223.6116485595703, -216.82835388183594, -210.04505920410156, -203.2617645263672, -196.47848510742188, -189.6951904296875, -182.91189575195312, -176.12860107421875, -169.34530639648438, -162.56201171875, -155.77871704101562, -148.99542236328125, -142.21212768554688, -135.4288330078125, -128.6455535888672, -121.86224365234375, -115.07894897460938, -108.295654296875, -101.51235961914062, -94.72907257080078, -87.9457778930664, -81.16248321533203, -74.37919616699219, -67.59590148925781, -60.81260681152344, -54.02931594848633, -47.24602127075195, -40.462730407714844, -33.67943572998047, -26.896141052246094, -20.112850189208984, -13.32955551147461, -6.546262264251709, 0.2370309829711914, 7.02032470703125, 13.803617477416992, 20.586910247802734, 27.37020492553711, 34.15349578857422, 40.936790466308594, 47.72008514404297, 54.50337600708008, 61.28667068481445, 68.06996154785156, 74.85325622558594, 81.63655090332031, 88.41984558105469, 95.20314025878906, 101.98643493652344, 108.76972961425781, 115.55302429199219, 122.33631134033203, 129.11959838867188, 135.90289306640625, 142.68618774414062, 149.469482421875]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 10.0, 13.0, 17.0, 15.0, 17.0, 17.0, 24.0, 24.0, 37.0, 29.0, 31.0, 48.0, 38.0, 49.0, 51.0, 47.0, 44.0, 38.0, 35.0, 46.0, 39.0, 34.0, 47.0, 33.0, 40.0, 27.0, 32.0, 29.0, 14.0, 21.0, 9.0, 5.0, 10.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-91.22701263427734, -88.80516815185547, -86.3833236694336, -83.96147155761719, -81.53962707519531, -79.11778259277344, -76.69593811035156, -74.27409362792969, -71.85224914550781, -69.43040466308594, -67.00856018066406, -64.58671569824219, -62.16486740112305, -59.743019104003906, -57.32117462158203, -54.899330139160156, -52.477481842041016, -50.05563735961914, -47.6337890625, -45.211944580078125, -42.79010009765625, -40.368255615234375, -37.946407318115234, -35.52456283569336, -33.10271453857422, -30.68086814880371, -28.259023666381836, -25.837177276611328, -23.415332794189453, -20.993486404418945, -18.571640014648438, -16.149795532226562, -13.727951049804688, -11.306105613708496, -8.884260177612305, -6.462413787841797, -4.0405683517456055, -1.618722915649414, 0.8031234741210938, 3.2249679565429688, 5.646814346313477, 8.068659782409668, 10.49050521850586, 12.912351608276367, 15.334197044372559, 17.75604248046875, 20.177888870239258, 22.599733352661133, 25.02157974243164, 27.44342613220215, 29.865270614624023, 32.28711700439453, 34.708961486816406, 37.13080596923828, 39.55265426635742, 41.9744987487793, 44.39634704589844, 46.81819152832031, 49.24003982543945, 51.66188430786133, 54.0837287902832, 56.505577087402344, 58.92742156982422, 61.349266052246094, 63.77111053466797]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 5.0, 7.0, 3.0, 2.0, 6.0, 9.0, 11.0, 16.0, 27.0, 26.0, 14.0, 33.0, 25.0, 35.0, 31.0, 40.0, 52.0, 47.0, 55.0, 45.0, 45.0, 62.0, 37.0, 43.0, 46.0, 47.0, 46.0, 30.0, 33.0, 28.0, 13.0, 15.0, 17.0, 16.0, 10.0, 6.0, 8.0, 8.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.703125, -7.42919921875, -7.1552734375, -6.88134765625, -6.607421875, -6.33349609375, -6.0595703125, -5.78564453125, -5.51171875, -5.23779296875, -4.9638671875, -4.68994140625, -4.416015625, -4.14208984375, -3.8681640625, -3.59423828125, -3.3203125, -3.04638671875, -2.7724609375, -2.49853515625, -2.224609375, -1.95068359375, -1.6767578125, -1.40283203125, -1.12890625, -0.85498046875, -0.5810546875, -0.30712890625, -0.033203125, 0.24072265625, 0.5146484375, 0.78857421875, 1.0625, 1.33642578125, 1.6103515625, 1.88427734375, 2.158203125, 2.43212890625, 2.7060546875, 2.97998046875, 3.25390625, 3.52783203125, 3.8017578125, 4.07568359375, 4.349609375, 4.62353515625, 4.8974609375, 5.17138671875, 5.4453125, 5.71923828125, 5.9931640625, 6.26708984375, 6.541015625, 6.81494140625, 7.0888671875, 7.36279296875, 7.63671875, 7.91064453125, 8.1845703125, 8.45849609375, 8.732421875, 9.00634765625, 9.2802734375, 9.55419921875, 9.828125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 12.0, 16.0, 27.0, 37.0, 46.0, 84.0, 133.0, 159.0, 270.0, 447.0, 650.0, 988.0, 1656.0, 2750.0, 4489.0, 7191.0, 12203.0, 20791.0, 35994.0, 65373.0, 132256.0, 368613.0, 197883.0, 85469.0, 45865.0, 26001.0, 15525.0, 9176.0, 5330.0, 3413.0, 2061.0, 1249.0, 852.0, 521.0, 370.0, 219.0, 149.0, 87.0, 64.0, 41.0, 29.0, 18.0, 14.0, 6.0, 6.0, 7.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.8837890625, -1.827911376953125, -1.77203369140625, -1.716156005859375, -1.6602783203125, -1.604400634765625, -1.54852294921875, -1.492645263671875, -1.436767578125, -1.380889892578125, -1.32501220703125, -1.269134521484375, -1.2132568359375, -1.157379150390625, -1.10150146484375, -1.045623779296875, -0.98974609375, -0.933868408203125, -0.87799072265625, -0.822113037109375, -0.7662353515625, -0.710357666015625, -0.65447998046875, -0.598602294921875, -0.542724609375, -0.486846923828125, -0.43096923828125, -0.375091552734375, -0.3192138671875, -0.263336181640625, -0.20745849609375, -0.151580810546875, -0.095703125, -0.039825439453125, 0.01605224609375, 0.071929931640625, 0.1278076171875, 0.183685302734375, 0.23956298828125, 0.295440673828125, 0.351318359375, 0.407196044921875, 0.46307373046875, 0.518951416015625, 0.5748291015625, 0.630706787109375, 0.68658447265625, 0.742462158203125, 0.79833984375, 0.854217529296875, 0.91009521484375, 0.965972900390625, 1.0218505859375, 1.077728271484375, 1.13360595703125, 1.189483642578125, 1.245361328125, 1.301239013671875, 1.35711669921875, 1.412994384765625, 1.4688720703125, 1.524749755859375, 1.58062744140625, 1.636505126953125, 1.6923828125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 8.0, 6.0, 6.0, 10.0, 17.0, 11.0, 15.0, 19.0, 23.0, 21.0, 26.0, 23.0, 23.0, 25.0, 38.0, 38.0, 43.0, 40.0, 29.0, 37.0, 1055.0, 38.0, 42.0, 43.0, 43.0, 30.0, 35.0, 24.0, 40.0, 29.0, 16.0, 30.0, 27.0, 13.0, 22.0, 14.0, 12.0, 10.0, 7.0, 8.0, 2.0, 5.0, 1.0, 3.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.359375, -4.2208251953125, -4.082275390625, -3.9437255859375, -3.80517578125, -3.6666259765625, -3.528076171875, -3.3895263671875, -3.2509765625, -3.1124267578125, -2.973876953125, -2.8353271484375, -2.69677734375, -2.5582275390625, -2.419677734375, -2.2811279296875, -2.142578125, -2.0040283203125, -1.865478515625, -1.7269287109375, -1.58837890625, -1.4498291015625, -1.311279296875, -1.1727294921875, -1.0341796875, -0.8956298828125, -0.757080078125, -0.6185302734375, -0.47998046875, -0.3414306640625, -0.202880859375, -0.0643310546875, 0.07421875, 0.2127685546875, 0.351318359375, 0.4898681640625, 0.62841796875, 0.7669677734375, 0.905517578125, 1.0440673828125, 1.1826171875, 1.3211669921875, 1.459716796875, 1.5982666015625, 1.73681640625, 1.8753662109375, 2.013916015625, 2.1524658203125, 2.291015625, 2.4295654296875, 2.568115234375, 2.7066650390625, 2.84521484375, 2.9837646484375, 3.122314453125, 3.2608642578125, 3.3994140625, 3.5379638671875, 3.676513671875, 3.8150634765625, 3.95361328125, 4.0921630859375, 4.230712890625, 4.3692626953125, 4.5078125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 10.0, 14.0, 11.0, 25.0, 28.0, 44.0, 37.0, 60.0, 114.0, 157.0, 223.0, 320.0, 478.0, 719.0, 1032.0, 1408.0, 2129.0, 3213.0, 4718.0, 7243.0, 10911.0, 16769.0, 25382.0, 39024.0, 64038.0, 117750.0, 1333149.0, 214576.0, 97440.0, 55618.0, 34478.0, 22270.0, 14597.0, 9714.0, 6374.0, 4329.0, 2717.0, 1946.0, 1300.0, 862.0, 590.0, 426.0, 279.0, 191.0, 135.0, 81.0, 57.0, 45.0, 30.0, 26.0, 13.0, 12.0, 8.0, 4.0, 6.0, 4.0, 1.0, 1.0], "bins": [-1.3623046875, -1.3208465576171875, -1.279388427734375, -1.2379302978515625, -1.19647216796875, -1.1550140380859375, -1.113555908203125, -1.0720977783203125, -1.0306396484375, -0.9891815185546875, -0.947723388671875, -0.9062652587890625, -0.86480712890625, -0.8233489990234375, -0.781890869140625, -0.7404327392578125, -0.698974609375, -0.6575164794921875, -0.616058349609375, -0.5746002197265625, -0.53314208984375, -0.4916839599609375, -0.450225830078125, -0.4087677001953125, -0.3673095703125, -0.3258514404296875, -0.284393310546875, -0.2429351806640625, -0.20147705078125, -0.1600189208984375, -0.118560791015625, -0.0771026611328125, -0.03564453125, 0.0058135986328125, 0.047271728515625, 0.0887298583984375, 0.13018798828125, 0.1716461181640625, 0.213104248046875, 0.2545623779296875, 0.2960205078125, 0.3374786376953125, 0.378936767578125, 0.4203948974609375, 0.46185302734375, 0.5033111572265625, 0.544769287109375, 0.5862274169921875, 0.627685546875, 0.6691436767578125, 0.710601806640625, 0.7520599365234375, 0.79351806640625, 0.8349761962890625, 0.876434326171875, 0.9178924560546875, 0.9593505859375, 1.0008087158203125, 1.042266845703125, 1.0837249755859375, 1.12518310546875, 1.1666412353515625, 1.208099365234375, 1.2495574951171875, 1.291015625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 13.0, 20.0, 20.0, 34.0, 48.0, 53.0, 77.0, 114.0, 110.0, 135.0, 112.0, 65.0, 43.0, 45.0, 21.0, 19.0, 18.0, 11.0, 7.0, 7.0, 3.0, 7.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00148773193359375, -0.0014438778162002563, -0.0014000236988067627, -0.001356169581413269, -0.0013123154640197754, -0.0012684613466262817, -0.001224607229232788, -0.0011807531118392944, -0.0011368989944458008, -0.0010930448770523071, -0.0010491907596588135, -0.0010053366422653198, -0.0009614825248718262, -0.0009176284074783325, -0.0008737742900848389, -0.0008299201726913452, -0.0007860660552978516, -0.0007422119379043579, -0.0006983578205108643, -0.0006545037031173706, -0.000610649585723877, -0.0005667954683303833, -0.0005229413509368896, -0.000479087233543396, -0.00043523311614990234, -0.0003913789987564087, -0.00034752488136291504, -0.0003036707639694214, -0.00025981664657592773, -0.00021596252918243408, -0.00017210841178894043, -0.00012825429439544678, -8.440017700195312e-05, -4.054605960845947e-05, 3.3080577850341797e-06, 4.716217517852783e-05, 9.101629257202148e-05, 0.00013487040996551514, 0.0001787245273590088, 0.00022257864475250244, 0.0002664327621459961, 0.00031028687953948975, 0.0003541409969329834, 0.00039799511432647705, 0.0004418492317199707, 0.00048570334911346436, 0.000529557466506958, 0.0005734115839004517, 0.0006172657012939453, 0.000661119818687439, 0.0007049739360809326, 0.0007488280534744263, 0.0007926821708679199, 0.0008365362882614136, 0.0008803904056549072, 0.0009242445230484009, 0.0009680986404418945, 0.0010119527578353882, 0.0010558068752288818, 0.0010996609926223755, 0.0011435151100158691, 0.0011873692274093628, 0.0012312233448028564, 0.00127507746219635, 0.0013189315795898438]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 3.0, 11.0, 8.0, 14.0, 17.0, 20.0, 30.0, 54.0, 76.0, 166.0, 307.0, 777.0, 628817.0, 416846.0, 689.0, 278.0, 161.0, 85.0, 58.0, 41.0, 19.0, 13.0, 18.0, 10.0, 14.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026947021484375, -0.0260772705078125, -0.02520751953125, -0.0243377685546875, -0.023468017578125, -0.0225982666015625, -0.021728515625, -0.0208587646484375, -0.019989013671875, -0.0191192626953125, -0.01824951171875, -0.0173797607421875, -0.016510009765625, -0.0156402587890625, -0.0147705078125, -0.0139007568359375, -0.013031005859375, -0.0121612548828125, -0.01129150390625, -0.0104217529296875, -0.009552001953125, -0.0086822509765625, -0.0078125, -0.0069427490234375, -0.006072998046875, -0.0052032470703125, -0.00433349609375, -0.0034637451171875, -0.002593994140625, -0.0017242431640625, -0.0008544921875, 1.52587890625e-05, 0.000885009765625, 0.0017547607421875, 0.00262451171875, 0.0034942626953125, 0.004364013671875, 0.0052337646484375, 0.006103515625, 0.0069732666015625, 0.007843017578125, 0.0087127685546875, 0.00958251953125, 0.0104522705078125, 0.011322021484375, 0.0121917724609375, 0.0130615234375, 0.0139312744140625, 0.014801025390625, 0.0156707763671875, 0.01654052734375, 0.0174102783203125, 0.018280029296875, 0.0191497802734375, 0.02001953125, 0.0208892822265625, 0.021759033203125, 0.0226287841796875, 0.02349853515625, 0.0243682861328125, 0.025238037109375, 0.0261077880859375, 0.0269775390625, 0.0278472900390625, 0.028717041015625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 112.0, 829.0, 75.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006324330344796181, -0.00618203729391098, -0.006039744708687067, -0.0058974516578018665, -0.005755158606916666, -0.005612866021692753, -0.005470572970807552, -0.005328279919922352, -0.005185986869037151, -0.005043693818151951, -0.004901401232928038, -0.004759108182042837, -0.004616815131157637, -0.0044745225459337234, -0.004332229495048523, -0.0041899364441633224, -0.004047643858939409, -0.0039053510408848524, -0.003763057989999652, -0.003620765171945095, -0.0034784721210598946, -0.0033361793030053377, -0.003193886484950781, -0.0030515934340655804, -0.0029093006160110235, -0.0027670077979564667, -0.002624714747071266, -0.0024824219290167093, -0.0023401291109621525, -0.002197836060076952, -0.002055543242022395, -0.0019132503075525165, -0.0017709576059132814, -0.0016286646714434028, -0.001486371736973524, -0.0013440789189189672, -0.0012017859844490886, -0.00105949304997921, -0.0009172001737169921, -0.0007749072974547744, -0.0006326143629848957, -0.000490321428515017, -0.00034802855225279927, -0.00020573564688675106, -6.344274152070284e-05, 7.885019294917583e-05, 0.0002211430692113936, 0.00036343594547361135, 0.00050572887994349, 0.0006480218144133687, 0.0007903146906755865, 0.0009326075669378042, 0.001074900501407683, 0.0012171934358775616, 0.0013594862539321184, 0.001501779188401997, 0.0016440721228718758, 0.0017863650573417544, 0.0019286579918116331, 0.00207095080986619, 0.0022132438607513905, 0.0023555366788059473, 0.002497829496860504, 0.0026401225477457047, 0.0027824153658002615]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 10.0, 9.0, 9.0, 8.0, 15.0, 19.0, 18.0, 27.0, 17.0, 35.0, 32.0, 42.0, 26.0, 36.0, 40.0, 47.0, 48.0, 54.0, 38.0, 37.0, 44.0, 48.0, 31.0, 20.0, 30.0, 50.0, 29.0, 26.0, 28.0, 21.0, 15.0, 15.0, 15.0, 18.0, 8.0, 8.0, 12.0, 4.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0004774928092956543, -0.0004622172564268112, -0.00044694170355796814, -0.00043166615068912506, -0.000416390597820282, -0.0004011150449514389, -0.0003858394920825958, -0.00037056393921375275, -0.00035528838634490967, -0.0003400128334760666, -0.0003247372806072235, -0.00030946172773838043, -0.00029418617486953735, -0.0002789106220006943, -0.0002636350691318512, -0.0002483595162630081, -0.00023308396339416504, -0.00021780841052532196, -0.00020253285765647888, -0.0001872573047876358, -0.00017198175191879272, -0.00015670619904994965, -0.00014143064618110657, -0.0001261550933122635, -0.00011087954044342041, -9.560398757457733e-05, -8.032843470573425e-05, -6.505288183689117e-05, -4.9777328968048096e-05, -3.450177609920502e-05, -1.922622323036194e-05, -3.95067036151886e-06, 1.1324882507324219e-05, 2.6600435376167297e-05, 4.1875988245010376e-05, 5.7151541113853455e-05, 7.242709398269653e-05, 8.770264685153961e-05, 0.00010297819972038269, 0.00011825375258922577, 0.00013352930545806885, 0.00014880485832691193, 0.000164080411195755, 0.00017935596406459808, 0.00019463151693344116, 0.00020990706980228424, 0.00022518262267112732, 0.0002404581755399704, 0.0002557337284088135, 0.00027100928127765656, 0.00028628483414649963, 0.0003015603870153427, 0.0003168359398841858, 0.00033211149275302887, 0.00034738704562187195, 0.000362662598490715, 0.0003779381513595581, 0.0003932137042284012, 0.00040848925709724426, 0.00042376480996608734, 0.0004390403628349304, 0.0004543159157037735, 0.0004695914685726166, 0.00048486702144145966, 0.0005001425743103027]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 5.0, 7.0, 3.0, 2.0, 6.0, 9.0, 11.0, 16.0, 27.0, 26.0, 14.0, 33.0, 25.0, 35.0, 31.0, 40.0, 52.0, 47.0, 55.0, 45.0, 45.0, 62.0, 37.0, 43.0, 46.0, 47.0, 46.0, 30.0, 33.0, 28.0, 13.0, 15.0, 17.0, 16.0, 10.0, 6.0, 8.0, 8.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.703125, -7.42919921875, -7.1552734375, -6.88134765625, -6.607421875, -6.33349609375, -6.0595703125, -5.78564453125, -5.51171875, -5.23779296875, -4.9638671875, -4.68994140625, -4.416015625, -4.14208984375, -3.8681640625, -3.59423828125, -3.3203125, -3.04638671875, -2.7724609375, -2.49853515625, -2.224609375, -1.95068359375, -1.6767578125, -1.40283203125, -1.12890625, -0.85498046875, -0.5810546875, -0.30712890625, -0.033203125, 0.24072265625, 0.5146484375, 0.78857421875, 1.0625, 1.33642578125, 1.6103515625, 1.88427734375, 2.158203125, 2.43212890625, 2.7060546875, 2.97998046875, 3.25390625, 3.52783203125, 3.8017578125, 4.07568359375, 4.349609375, 4.62353515625, 4.8974609375, 5.17138671875, 5.4453125, 5.71923828125, 5.9931640625, 6.26708984375, 6.541015625, 6.81494140625, 7.0888671875, 7.36279296875, 7.63671875, 7.91064453125, 8.1845703125, 8.45849609375, 8.732421875, 9.00634765625, 9.2802734375, 9.55419921875, 9.828125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 5.0, 7.0, 4.0, 3.0, 6.0, 10.0, 18.0, 31.0, 40.0, 62.0, 83.0, 168.0, 290.0, 571.0, 1206.0, 2522.0, 6231.0, 17154.0, 58874.0, 263566.0, 523713.0, 123974.0, 32001.0, 10401.0, 4003.0, 1722.0, 882.0, 424.0, 241.0, 141.0, 56.0, 40.0, 36.0, 22.0, 17.0, 9.0, 9.0, 9.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.80078125, -4.63092041015625, -4.4610595703125, -4.29119873046875, -4.121337890625, -3.95147705078125, -3.7816162109375, -3.61175537109375, -3.44189453125, -3.27203369140625, -3.1021728515625, -2.93231201171875, -2.762451171875, -2.59259033203125, -2.4227294921875, -2.25286865234375, -2.0830078125, -1.91314697265625, -1.7432861328125, -1.57342529296875, -1.403564453125, -1.23370361328125, -1.0638427734375, -0.89398193359375, -0.72412109375, -0.55426025390625, -0.3843994140625, -0.21453857421875, -0.044677734375, 0.12518310546875, 0.2950439453125, 0.46490478515625, 0.634765625, 0.80462646484375, 0.9744873046875, 1.14434814453125, 1.314208984375, 1.48406982421875, 1.6539306640625, 1.82379150390625, 1.99365234375, 2.16351318359375, 2.3333740234375, 2.50323486328125, 2.673095703125, 2.84295654296875, 3.0128173828125, 3.18267822265625, 3.3525390625, 3.52239990234375, 3.6922607421875, 3.86212158203125, 4.031982421875, 4.20184326171875, 4.3717041015625, 4.54156494140625, 4.71142578125, 4.88128662109375, 5.0511474609375, 5.22100830078125, 5.390869140625, 5.56072998046875, 5.7305908203125, 5.90045166015625, 6.0703125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 6.0, 2.0, 9.0, 10.0, 13.0, 15.0, 23.0, 17.0, 23.0, 27.0, 29.0, 30.0, 32.0, 34.0, 42.0, 43.0, 52.0, 94.0, 1561.0, 469.0, 90.0, 51.0, 50.0, 45.0, 27.0, 34.0, 30.0, 21.0, 25.0, 26.0, 19.0, 13.0, 11.0, 15.0, 14.0, 9.0, 5.0, 4.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-24.1875, -23.32275390625, -22.4580078125, -21.59326171875, -20.728515625, -19.86376953125, -18.9990234375, -18.13427734375, -17.26953125, -16.40478515625, -15.5400390625, -14.67529296875, -13.810546875, -12.94580078125, -12.0810546875, -11.21630859375, -10.3515625, -9.48681640625, -8.6220703125, -7.75732421875, -6.892578125, -6.02783203125, -5.1630859375, -4.29833984375, -3.43359375, -2.56884765625, -1.7041015625, -0.83935546875, 0.025390625, 0.89013671875, 1.7548828125, 2.61962890625, 3.484375, 4.34912109375, 5.2138671875, 6.07861328125, 6.943359375, 7.80810546875, 8.6728515625, 9.53759765625, 10.40234375, 11.26708984375, 12.1318359375, 12.99658203125, 13.861328125, 14.72607421875, 15.5908203125, 16.45556640625, 17.3203125, 18.18505859375, 19.0498046875, 19.91455078125, 20.779296875, 21.64404296875, 22.5087890625, 23.37353515625, 24.23828125, 25.10302734375, 25.9677734375, 26.83251953125, 27.697265625, 28.56201171875, 29.4267578125, 30.29150390625, 31.15625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 8.0, 8.0, 11.0, 18.0, 18.0, 16.0, 24.0, 34.0, 32.0, 34.0, 62.0, 59.0, 109.0, 180.0, 342.0, 709.0, 4385.0, 2581564.0, 553358.0, 3175.0, 620.0, 293.0, 179.0, 118.0, 74.0, 49.0, 44.0, 37.0, 26.0, 18.0, 16.0, 21.0, 11.0, 11.0, 7.0, 2.0, 6.0, 6.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-52.71875, -51.251953125, -49.78515625, -48.318359375, -46.8515625, -45.384765625, -43.91796875, -42.451171875, -40.984375, -39.517578125, -38.05078125, -36.583984375, -35.1171875, -33.650390625, -32.18359375, -30.716796875, -29.25, -27.783203125, -26.31640625, -24.849609375, -23.3828125, -21.916015625, -20.44921875, -18.982421875, -17.515625, -16.048828125, -14.58203125, -13.115234375, -11.6484375, -10.181640625, -8.71484375, -7.248046875, -5.78125, -4.314453125, -2.84765625, -1.380859375, 0.0859375, 1.552734375, 3.01953125, 4.486328125, 5.953125, 7.419921875, 8.88671875, 10.353515625, 11.8203125, 13.287109375, 14.75390625, 16.220703125, 17.6875, 19.154296875, 20.62109375, 22.087890625, 23.5546875, 25.021484375, 26.48828125, 27.955078125, 29.421875, 30.888671875, 32.35546875, 33.822265625, 35.2890625, 36.755859375, 38.22265625, 39.689453125, 41.15625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 30.0, 432.0, 509.0, 43.0, 2.0, 0.0, 1.0], "bins": [-249.012939453125, -244.79678344726562, -240.5806121826172, -236.3644561767578, -232.14828491210938, -227.93212890625, -223.71597290039062, -219.4998016357422, -215.2836456298828, -211.06748962402344, -206.851318359375, -202.63516235351562, -198.4189910888672, -194.2028350830078, -189.98666381835938, -185.7705078125, -181.55435180664062, -177.33819580078125, -173.1220245361328, -168.90586853027344, -164.689697265625, -160.47354125976562, -156.25738525390625, -152.0412139892578, -147.82504272460938, -143.60888671875, -139.39271545410156, -135.1765594482422, -130.96038818359375, -126.74423217773438, -122.52806854248047, -118.31190490722656, -114.09574890136719, -109.87958526611328, -105.66342163085938, -101.447265625, -97.2311019897461, -93.01493835449219, -88.79877471923828, -84.58261108398438, -80.36644744873047, -76.15028381347656, -71.93412017822266, -67.71795654296875, -63.501800537109375, -59.28563690185547, -55.06947326660156, -50.853309631347656, -46.63715362548828, -42.420989990234375, -38.204830169677734, -33.98866653442383, -29.772504806518555, -25.55634307861328, -21.340179443359375, -17.1240177154541, -12.907854080200195, -8.691692352294922, -4.475529670715332, -0.2593669891357422, 3.9567947387695312, 8.172956466674805, 12.389120101928711, 16.605281829833984, 20.821443557739258]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 11.0, 9.0, 8.0, 12.0, 9.0, 6.0, 15.0, 21.0, 23.0, 23.0, 24.0, 24.0, 36.0, 37.0, 37.0, 39.0, 41.0, 37.0, 43.0, 29.0, 38.0, 31.0, 41.0, 40.0, 34.0, 31.0, 31.0, 36.0, 40.0, 32.0, 17.0, 19.0, 18.0, 19.0, 19.0, 14.0, 22.0, 8.0, 6.0, 6.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-80.9436264038086, -78.33077239990234, -75.71792602539062, -73.10507202148438, -70.49221801757812, -67.87936401367188, -65.26651763916016, -62.653663635253906, -60.04081344604492, -57.42796325683594, -54.81510925292969, -52.2022590637207, -49.58940887451172, -46.97655487060547, -44.363704681396484, -41.7508544921875, -39.13800048828125, -36.525150299072266, -33.912296295166016, -31.29944610595703, -28.686594009399414, -26.073741912841797, -23.460891723632812, -20.848039627075195, -18.235187530517578, -15.622335433959961, -13.00948429107666, -10.39663314819336, -7.783781051635742, -5.170928955078125, -2.558077812194824, 0.05477333068847656, 2.6676254272460938, 5.280477046966553, 7.893328666687012, 10.506179809570312, 13.11903190612793, 15.731884002685547, 18.34473419189453, 20.95758628845215, 23.570438385009766, 26.183290481567383, 28.796142578125, 31.408992767333984, 34.02184295654297, 36.63469696044922, 39.2475471496582, 41.86039733886719, 44.47325134277344, 47.08610153198242, 49.69895553588867, 52.311805725097656, 54.924659729003906, 57.53750991821289, 60.150360107421875, 62.763214111328125, 65.37606811523438, 67.98892211914062, 70.60176849365234, 73.2146224975586, 75.82747650146484, 78.44032287597656, 81.05317687988281, 83.66603088378906, 86.27887725830078]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 5.0, 2.0, 5.0, 4.0, 5.0, 2.0, 10.0, 14.0, 19.0, 15.0, 27.0, 25.0, 24.0, 36.0, 29.0, 32.0, 35.0, 51.0, 62.0, 41.0, 58.0, 41.0, 62.0, 31.0, 43.0, 54.0, 47.0, 41.0, 31.0, 28.0, 31.0, 14.0, 14.0, 21.0, 14.0, 8.0, 7.0, 8.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.90234375, -7.62066650390625, -7.3389892578125, -7.05731201171875, -6.775634765625, -6.49395751953125, -6.2122802734375, -5.93060302734375, -5.64892578125, -5.36724853515625, -5.0855712890625, -4.80389404296875, -4.522216796875, -4.24053955078125, -3.9588623046875, -3.67718505859375, -3.3955078125, -3.11383056640625, -2.8321533203125, -2.55047607421875, -2.268798828125, -1.98712158203125, -1.7054443359375, -1.42376708984375, -1.14208984375, -0.86041259765625, -0.5787353515625, -0.29705810546875, -0.015380859375, 0.26629638671875, 0.5479736328125, 0.82965087890625, 1.111328125, 1.39300537109375, 1.6746826171875, 1.95635986328125, 2.238037109375, 2.51971435546875, 2.8013916015625, 3.08306884765625, 3.36474609375, 3.64642333984375, 3.9281005859375, 4.20977783203125, 4.491455078125, 4.77313232421875, 5.0548095703125, 5.33648681640625, 5.6181640625, 5.89984130859375, 6.1815185546875, 6.46319580078125, 6.744873046875, 7.02655029296875, 7.3082275390625, 7.58990478515625, 7.87158203125, 8.15325927734375, 8.4349365234375, 8.71661376953125, 8.998291015625, 9.27996826171875, 9.5616455078125, 9.84332275390625, 10.125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 6.0, 10.0, 19.0, 11.0, 18.0, 25.0, 23.0, 24.0, 48.0, 76.0, 73.0, 148.0, 414.0, 1548.0, 15832.0, 523551.0, 3454944.0, 188055.0, 7724.0, 952.0, 296.0, 158.0, 77.0, 46.0, 47.0, 23.0, 26.0, 21.0, 12.0, 16.0, 14.0, 10.0, 9.0, 6.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.015625, -27.09326171875, -26.1708984375, -25.24853515625, -24.326171875, -23.40380859375, -22.4814453125, -21.55908203125, -20.63671875, -19.71435546875, -18.7919921875, -17.86962890625, -16.947265625, -16.02490234375, -15.1025390625, -14.18017578125, -13.2578125, -12.33544921875, -11.4130859375, -10.49072265625, -9.568359375, -8.64599609375, -7.7236328125, -6.80126953125, -5.87890625, -4.95654296875, -4.0341796875, -3.11181640625, -2.189453125, -1.26708984375, -0.3447265625, 0.57763671875, 1.5, 2.42236328125, 3.3447265625, 4.26708984375, 5.189453125, 6.11181640625, 7.0341796875, 7.95654296875, 8.87890625, 9.80126953125, 10.7236328125, 11.64599609375, 12.568359375, 13.49072265625, 14.4130859375, 15.33544921875, 16.2578125, 17.18017578125, 18.1025390625, 19.02490234375, 19.947265625, 20.86962890625, 21.7919921875, 22.71435546875, 23.63671875, 24.55908203125, 25.4814453125, 26.40380859375, 27.326171875, 28.24853515625, 29.1708984375, 30.09326171875, 31.015625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 5.0, 13.0, 6.0, 7.0, 9.0, 20.0, 23.0, 47.0, 46.0, 72.0, 74.0, 145.0, 175.0, 266.0, 357.0, 493.0, 598.0, 486.0, 367.0, 243.0, 183.0, 136.0, 77.0, 70.0, 45.0, 40.0, 25.0, 22.0, 7.0, 7.0, 5.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-31.140625, -30.3896484375, -29.638671875, -28.8876953125, -28.13671875, -27.3857421875, -26.634765625, -25.8837890625, -25.1328125, -24.3818359375, -23.630859375, -22.8798828125, -22.12890625, -21.3779296875, -20.626953125, -19.8759765625, -19.125, -18.3740234375, -17.623046875, -16.8720703125, -16.12109375, -15.3701171875, -14.619140625, -13.8681640625, -13.1171875, -12.3662109375, -11.615234375, -10.8642578125, -10.11328125, -9.3623046875, -8.611328125, -7.8603515625, -7.109375, -6.3583984375, -5.607421875, -4.8564453125, -4.10546875, -3.3544921875, -2.603515625, -1.8525390625, -1.1015625, -0.3505859375, 0.400390625, 1.1513671875, 1.90234375, 2.6533203125, 3.404296875, 4.1552734375, 4.90625, 5.6572265625, 6.408203125, 7.1591796875, 7.91015625, 8.6611328125, 9.412109375, 10.1630859375, 10.9140625, 11.6650390625, 12.416015625, 13.1669921875, 13.91796875, 14.6689453125, 15.419921875, 16.1708984375, 16.921875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 6.0, 5.0, 14.0, 16.0, 22.0, 29.0, 48.0, 59.0, 132.0, 183.0, 311.0, 582.0, 3509.0, 3543556.0, 642581.0, 2003.0, 482.0, 240.0, 161.0, 113.0, 66.0, 45.0, 39.0, 27.0, 18.0, 13.0, 8.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.6875, -96.1142578125, -92.541015625, -88.9677734375, -85.39453125, -81.8212890625, -78.248046875, -74.6748046875, -71.1015625, -67.5283203125, -63.955078125, -60.3818359375, -56.80859375, -53.2353515625, -49.662109375, -46.0888671875, -42.515625, -38.9423828125, -35.369140625, -31.7958984375, -28.22265625, -24.6494140625, -21.076171875, -17.5029296875, -13.9296875, -10.3564453125, -6.783203125, -3.2099609375, 0.36328125, 3.9365234375, 7.509765625, 11.0830078125, 14.65625, 18.2294921875, 21.802734375, 25.3759765625, 28.94921875, 32.5224609375, 36.095703125, 39.6689453125, 43.2421875, 46.8154296875, 50.388671875, 53.9619140625, 57.53515625, 61.1083984375, 64.681640625, 68.2548828125, 71.828125, 75.4013671875, 78.974609375, 82.5478515625, 86.12109375, 89.6943359375, 93.267578125, 96.8408203125, 100.4140625, 103.9873046875, 107.560546875, 111.1337890625, 114.70703125, 118.2802734375, 121.853515625, 125.4267578125, 129.0]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 17.0, 110.0, 313.0, 376.0, 156.0, 36.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-252.63304138183594, -244.53671264648438, -236.4403839111328, -228.34405517578125, -220.24771118164062, -212.15139770507812, -204.0550537109375, -195.95872497558594, -187.86239624023438, -179.7660675048828, -171.66973876953125, -163.5734100341797, -155.47708129882812, -147.3807373046875, -139.28440856933594, -131.18807983398438, -123.09175109863281, -114.99542236328125, -106.89909362792969, -98.8027572631836, -90.70642852783203, -82.61009979248047, -74.51376342773438, -66.41743469238281, -58.32110595703125, -50.22477722167969, -42.12844467163086, -34.03211212158203, -25.93578338623047, -17.839454650878906, -9.743122100830078, -1.64678955078125, 6.449554443359375, 14.54588508605957, 22.642215728759766, 30.73854637145996, 38.834877014160156, 46.93120574951172, 55.02753829956055, 63.123870849609375, 71.22019958496094, 79.3165283203125, 87.41285705566406, 95.50919342041016, 103.60552215576172, 111.70185089111328, 119.79818725585938, 127.89451599121094, 135.9908447265625, 144.08717346191406, 152.18350219726562, 160.2798309326172, 168.37615966796875, 176.47250366210938, 184.56883239746094, 192.6651611328125, 200.76148986816406, 208.85781860351562, 216.9541473388672, 225.05047607421875, 233.14682006835938, 241.24313354492188, 249.3394775390625, 257.435791015625, 265.5321350097656]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 7.0, 13.0, 12.0, 18.0, 21.0, 11.0, 22.0, 17.0, 31.0, 36.0, 32.0, 39.0, 36.0, 29.0, 48.0, 38.0, 35.0, 45.0, 34.0, 49.0, 40.0, 32.0, 40.0, 32.0, 25.0, 30.0, 37.0, 28.0, 28.0, 19.0, 20.0, 12.0, 13.0, 7.0, 12.0, 7.0, 8.0, 2.0, 6.0, 4.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0], "bins": [-80.74872589111328, -78.43477630615234, -76.12081909179688, -73.80686950683594, -71.492919921875, -69.17897033691406, -66.8650131225586, -64.55106353759766, -62.23711013793945, -59.92315673828125, -57.60920715332031, -55.29525375366211, -52.981300354003906, -50.66735076904297, -48.353397369384766, -46.03944396972656, -43.725494384765625, -41.41154098510742, -39.097591400146484, -36.78363800048828, -34.469688415527344, -32.15573501586914, -29.841781616210938, -27.527830123901367, -25.213878631591797, -22.899927139282227, -20.585975646972656, -18.272022247314453, -15.958070755004883, -13.644119262695312, -11.330166816711426, -9.016214370727539, -6.7022552490234375, -4.388303279876709, -2.0743513107299805, 0.23960065841674805, 2.5535526275634766, 4.867504119873047, 7.181456565856934, 9.49540901184082, 11.80936050415039, 14.123311996459961, 16.43726348876953, 18.751216888427734, 21.065168380737305, 23.379119873046875, 25.693073272705078, 28.00702476501465, 30.32097625732422, 32.63492965698242, 34.94887924194336, 37.26283264160156, 39.5767822265625, 41.8907356262207, 44.204689025878906, 46.518638610839844, 48.83259201049805, 51.14654541015625, 53.46049499511719, 55.77444839477539, 58.088401794433594, 60.40235137939453, 62.716304779052734, 65.03025817871094, 67.34420776367188]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 3.0, 9.0, 12.0, 12.0, 16.0, 19.0, 27.0, 23.0, 33.0, 43.0, 35.0, 32.0, 45.0, 45.0, 53.0, 46.0, 52.0, 55.0, 54.0, 46.0, 44.0, 36.0, 34.0, 42.0, 38.0, 26.0, 24.0, 15.0, 12.0, 15.0, 11.0, 12.0, 8.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1640625, -7.8782958984375, -7.592529296875, -7.3067626953125, -7.02099609375, -6.7352294921875, -6.449462890625, -6.1636962890625, -5.8779296875, -5.5921630859375, -5.306396484375, -5.0206298828125, -4.73486328125, -4.4490966796875, -4.163330078125, -3.8775634765625, -3.591796875, -3.3060302734375, -3.020263671875, -2.7344970703125, -2.44873046875, -2.1629638671875, -1.877197265625, -1.5914306640625, -1.3056640625, -1.0198974609375, -0.734130859375, -0.4483642578125, -0.16259765625, 0.1231689453125, 0.408935546875, 0.6947021484375, 0.98046875, 1.2662353515625, 1.552001953125, 1.8377685546875, 2.12353515625, 2.4093017578125, 2.695068359375, 2.9808349609375, 3.2666015625, 3.5523681640625, 3.838134765625, 4.1239013671875, 4.40966796875, 4.6954345703125, 4.981201171875, 5.2669677734375, 5.552734375, 5.8385009765625, 6.124267578125, 6.4100341796875, 6.69580078125, 6.9815673828125, 7.267333984375, 7.5531005859375, 7.8388671875, 8.1246337890625, 8.410400390625, 8.6961669921875, 8.98193359375, 9.2677001953125, 9.553466796875, 9.8392333984375, 10.125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 0.0, 8.0, 7.0, 11.0, 20.0, 25.0, 26.0, 42.0, 68.0, 87.0, 109.0, 182.0, 227.0, 327.0, 476.0, 733.0, 1097.0, 1608.0, 2330.0, 3581.0, 5507.0, 8824.0, 14379.0, 23695.0, 40481.0, 71717.0, 138492.0, 344952.0, 181402.0, 86274.0, 48311.0, 27891.0, 16367.0, 10510.0, 6391.0, 4123.0, 2607.0, 1756.0, 1243.0, 815.0, 580.0, 387.0, 278.0, 187.0, 124.0, 106.0, 51.0, 49.0, 24.0, 21.0, 19.0, 11.0, 9.0, 7.0, 1.0, 5.0, 2.0, 3.0, 2.0, 1.0], "bins": [-1.748046875, -1.6928253173828125, -1.637603759765625, -1.5823822021484375, -1.52716064453125, -1.4719390869140625, -1.416717529296875, -1.3614959716796875, -1.3062744140625, -1.2510528564453125, -1.195831298828125, -1.1406097412109375, -1.08538818359375, -1.0301666259765625, -0.974945068359375, -0.9197235107421875, -0.864501953125, -0.8092803955078125, -0.754058837890625, -0.6988372802734375, -0.64361572265625, -0.5883941650390625, -0.533172607421875, -0.4779510498046875, -0.4227294921875, -0.3675079345703125, -0.312286376953125, -0.2570648193359375, -0.20184326171875, -0.1466217041015625, -0.091400146484375, -0.0361785888671875, 0.01904296875, 0.0742645263671875, 0.129486083984375, 0.1847076416015625, 0.23992919921875, 0.2951507568359375, 0.350372314453125, 0.4055938720703125, 0.4608154296875, 0.5160369873046875, 0.571258544921875, 0.6264801025390625, 0.68170166015625, 0.7369232177734375, 0.792144775390625, 0.8473663330078125, 0.902587890625, 0.9578094482421875, 1.013031005859375, 1.0682525634765625, 1.12347412109375, 1.1786956787109375, 1.233917236328125, 1.2891387939453125, 1.3443603515625, 1.3995819091796875, 1.454803466796875, 1.5100250244140625, 1.56524658203125, 1.6204681396484375, 1.675689697265625, 1.7309112548828125, 1.7861328125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 4.0, 7.0, 7.0, 7.0, 14.0, 16.0, 16.0, 13.0, 25.0, 18.0, 26.0, 30.0, 40.0, 35.0, 28.0, 50.0, 31.0, 48.0, 29.0, 33.0, 1067.0, 32.0, 43.0, 30.0, 38.0, 38.0, 38.0, 39.0, 30.0, 27.0, 21.0, 25.0, 23.0, 22.0, 15.0, 11.0, 6.0, 8.0, 6.0, 5.0, 4.0, 9.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-5.30078125, -5.14373779296875, -4.9866943359375, -4.82965087890625, -4.672607421875, -4.51556396484375, -4.3585205078125, -4.20147705078125, -4.04443359375, -3.88739013671875, -3.7303466796875, -3.57330322265625, -3.416259765625, -3.25921630859375, -3.1021728515625, -2.94512939453125, -2.7880859375, -2.63104248046875, -2.4739990234375, -2.31695556640625, -2.159912109375, -2.00286865234375, -1.8458251953125, -1.68878173828125, -1.53173828125, -1.37469482421875, -1.2176513671875, -1.06060791015625, -0.903564453125, -0.74652099609375, -0.5894775390625, -0.43243408203125, -0.275390625, -0.11834716796875, 0.0386962890625, 0.19573974609375, 0.352783203125, 0.50982666015625, 0.6668701171875, 0.82391357421875, 0.98095703125, 1.13800048828125, 1.2950439453125, 1.45208740234375, 1.609130859375, 1.76617431640625, 1.9232177734375, 2.08026123046875, 2.2373046875, 2.39434814453125, 2.5513916015625, 2.70843505859375, 2.865478515625, 3.02252197265625, 3.1795654296875, 3.33660888671875, 3.49365234375, 3.65069580078125, 3.8077392578125, 3.96478271484375, 4.121826171875, 4.27886962890625, 4.4359130859375, 4.59295654296875, 4.75]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 6.0, 6.0, 6.0, 8.0, 14.0, 15.0, 43.0, 51.0, 68.0, 90.0, 129.0, 214.0, 300.0, 473.0, 651.0, 1034.0, 1575.0, 2375.0, 3502.0, 5463.0, 8500.0, 13369.0, 21011.0, 33592.0, 55175.0, 95893.0, 201875.0, 1349092.0, 122989.0, 67952.0, 40652.0, 25376.0, 15901.0, 10227.0, 6663.0, 4400.0, 2779.0, 1915.0, 1219.0, 862.0, 528.0, 361.0, 251.0, 154.0, 111.0, 100.0, 52.0, 39.0, 24.0, 15.0, 15.0, 7.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4208984375, -1.37384033203125, -1.3267822265625, -1.27972412109375, -1.232666015625, -1.18560791015625, -1.1385498046875, -1.09149169921875, -1.04443359375, -0.99737548828125, -0.9503173828125, -0.90325927734375, -0.856201171875, -0.80914306640625, -0.7620849609375, -0.71502685546875, -0.66796875, -0.62091064453125, -0.5738525390625, -0.52679443359375, -0.479736328125, -0.43267822265625, -0.3856201171875, -0.33856201171875, -0.29150390625, -0.24444580078125, -0.1973876953125, -0.15032958984375, -0.103271484375, -0.05621337890625, -0.0091552734375, 0.03790283203125, 0.0849609375, 0.13201904296875, 0.1790771484375, 0.22613525390625, 0.273193359375, 0.32025146484375, 0.3673095703125, 0.41436767578125, 0.46142578125, 0.50848388671875, 0.5555419921875, 0.60260009765625, 0.649658203125, 0.69671630859375, 0.7437744140625, 0.79083251953125, 0.837890625, 0.88494873046875, 0.9320068359375, 0.97906494140625, 1.026123046875, 1.07318115234375, 1.1202392578125, 1.16729736328125, 1.21435546875, 1.26141357421875, 1.3084716796875, 1.35552978515625, 1.402587890625, 1.44964599609375, 1.4967041015625, 1.54376220703125, 1.5908203125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 5.0, 3.0, 5.0, 4.0, 8.0, 7.0, 8.0, 4.0, 15.0, 11.0, 14.0, 21.0, 23.0, 27.0, 30.0, 41.0, 37.0, 51.0, 57.0, 61.0, 68.0, 50.0, 72.0, 56.0, 43.0, 39.0, 32.0, 26.0, 21.0, 29.0, 30.0, 13.0, 20.0, 13.0, 10.0, 13.0, 6.0, 6.0, 7.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0008687973022460938, -0.0008419007062911987, -0.0008150041103363037, -0.0007881075143814087, -0.0007612109184265137, -0.0007343143224716187, -0.0007074177265167236, -0.0006805211305618286, -0.0006536245346069336, -0.0006267279386520386, -0.0005998313426971436, -0.0005729347467422485, -0.0005460381507873535, -0.0005191415548324585, -0.0004922449588775635, -0.00046534836292266846, -0.00043845176696777344, -0.0004115551710128784, -0.0003846585750579834, -0.0003577619791030884, -0.00033086538314819336, -0.00030396878719329834, -0.0002770721912384033, -0.0002501755952835083, -0.00022327899932861328, -0.00019638240337371826, -0.00016948580741882324, -0.00014258921146392822, -0.0001156926155090332, -8.879601955413818e-05, -6.189942359924316e-05, -3.5002827644348145e-05, -8.106231689453125e-06, 1.8790364265441895e-05, 4.5686960220336914e-05, 7.258355617523193e-05, 9.948015213012695e-05, 0.00012637674808502197, 0.000153273344039917, 0.000180169939994812, 0.00020706653594970703, 0.00023396313190460205, 0.00026085972785949707, 0.0002877563238143921, 0.0003146529197692871, 0.00034154951572418213, 0.00036844611167907715, 0.00039534270763397217, 0.0004222393035888672, 0.0004491358995437622, 0.0004760324954986572, 0.0005029290914535522, 0.0005298256874084473, 0.0005567222833633423, 0.0005836188793182373, 0.0006105154752731323, 0.0006374120712280273, 0.0006643086671829224, 0.0006912052631378174, 0.0007181018590927124, 0.0007449984550476074, 0.0007718950510025024, 0.0007987916469573975, 0.0008256882429122925, 0.0008525848388671875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 2.0, 5.0, 15.0, 9.0, 14.0, 8.0, 21.0, 18.0, 25.0, 31.0, 44.0, 50.0, 63.0, 119.0, 182.0, 371.0, 1163.0, 866085.0, 178564.0, 804.0, 342.0, 170.0, 110.0, 70.0, 61.0, 28.0, 30.0, 23.0, 18.0, 14.0, 20.0, 5.0, 12.0, 8.0, 10.0, 9.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0208587646484375, -0.020204782485961914, -0.019550800323486328, -0.018896818161010742, -0.018242835998535156, -0.01758885383605957, -0.016934871673583984, -0.0162808895111084, -0.015626907348632812, -0.014972925186157227, -0.01431894302368164, -0.013664960861206055, -0.013010978698730469, -0.012356996536254883, -0.011703014373779297, -0.011049032211303711, -0.010395050048828125, -0.009741067886352539, -0.009087085723876953, -0.008433103561401367, -0.007779121398925781, -0.007125139236450195, -0.006471157073974609, -0.0058171749114990234, -0.0051631927490234375, -0.0045092105865478516, -0.0038552284240722656, -0.0032012462615966797, -0.0025472640991210938, -0.0018932819366455078, -0.0012392997741699219, -0.0005853176116943359, 6.866455078125e-05, 0.0007226467132568359, 0.0013766288757324219, 0.002030611038208008, 0.0026845932006835938, 0.0033385753631591797, 0.003992557525634766, 0.0046465396881103516, 0.0053005218505859375, 0.0059545040130615234, 0.006608486175537109, 0.007262468338012695, 0.007916450500488281, 0.008570432662963867, 0.009224414825439453, 0.009878396987915039, 0.010532379150390625, 0.011186361312866211, 0.011840343475341797, 0.012494325637817383, 0.013148307800292969, 0.013802289962768555, 0.01445627212524414, 0.015110254287719727, 0.015764236450195312, 0.0164182186126709, 0.017072200775146484, 0.01772618293762207, 0.018380165100097656, 0.019034147262573242, 0.019688129425048828, 0.020342111587524414, 0.02099609375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 19.0, 249.0, 555.0, 169.0, 22.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016488254768773913, -0.0015681134536862373, -0.0014874013140797615, -0.0014066892908886075, -0.0013259772676974535, -0.0012452651280909777, -0.0011645531048998237, -0.0010838410817086697, -0.0010031289421021938, -0.0009224168607033789, -0.0008417048375122249, -0.00076099275611341, -0.000680280732922256, -0.0005995686515234411, -0.0005188565701246262, -0.00043814454693347216, -0.00035743252374231815, -0.0002767204714473337, -0.000196008404600434, -0.00011529633775353432, -3.458428545854986e-05, 4.61277668364346e-05, 0.00012683984823524952, 0.00020755187142640352, 0.00028826395282521844, 0.0003689760051202029, 0.00044968805741518736, 0.0005304001388140023, 0.0006111122202128172, 0.0006918242434039712, 0.0007725363248027861, 0.0008532483479939401, 0.0009339605458080769, 0.0010146725689992309, 0.0010953847086057067, 0.0011760967317968607, 0.0012568087549880147, 0.0013375207781791687, 0.0014182329177856445, 0.0014989449409767985, 0.0015796569641679525, 0.0016603689873591065, 0.0017410811269655824, 0.0018217931501567364, 0.0019025051733478904, 0.0019832171965390444, 0.00206392933614552, 0.0021446412429213524, 0.002225353382527828, 0.002306065522134304, 0.0023867774289101362, 0.002467489568516612, 0.002548201708123088, 0.00262891361489892, 0.002709625754505396, 0.0027903378941118717, 0.0028710500337183475, 0.0029517621733248234, 0.0030324740801006556, 0.0031131862197071314, 0.003193898359313607, 0.0032746102660894394, 0.0033553224056959152, 0.003436034545302391, 0.0035167464520782232]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 9.0, 9.0, 15.0, 13.0, 22.0, 16.0, 25.0, 27.0, 23.0, 32.0, 33.0, 36.0, 35.0, 45.0, 39.0, 45.0, 40.0, 32.0, 36.0, 45.0, 45.0, 43.0, 37.0, 34.0, 38.0, 24.0, 31.0, 23.0, 19.0, 24.0, 28.0, 12.0, 11.0, 11.0, 11.0, 6.0, 4.0, 4.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0004642605781555176, -0.00044866278767585754, -0.0004330649971961975, -0.0004174672067165375, -0.00040186941623687744, -0.0003862716257572174, -0.0003706738352775574, -0.00035507604479789734, -0.0003394782543182373, -0.00032388046383857727, -0.00030828267335891724, -0.0002926848828792572, -0.00027708709239959717, -0.00026148930191993713, -0.0002458915114402771, -0.00023029372096061707, -0.00021469593048095703, -0.000199098140001297, -0.00018350034952163696, -0.00016790255904197693, -0.0001523047685623169, -0.00013670697808265686, -0.00012110918760299683, -0.00010551139712333679, -8.991360664367676e-05, -7.431581616401672e-05, -5.871802568435669e-05, -4.3120235204696655e-05, -2.752244472503662e-05, -1.1924654245376587e-05, 3.6731362342834473e-06, 1.927092671394348e-05, 3.4868717193603516e-05, 5.046650767326355e-05, 6.606429815292358e-05, 8.166208863258362e-05, 9.725987911224365e-05, 0.00011285766959190369, 0.00012845546007156372, 0.00014405325055122375, 0.0001596510410308838, 0.00017524883151054382, 0.00019084662199020386, 0.0002064444124698639, 0.00022204220294952393, 0.00023763999342918396, 0.000253237783908844, 0.00026883557438850403, 0.00028443336486816406, 0.0003000311553478241, 0.00031562894582748413, 0.00033122673630714417, 0.0003468245267868042, 0.00036242231726646423, 0.00037802010774612427, 0.0003936178982257843, 0.00040921568870544434, 0.00042481347918510437, 0.0004404112696647644, 0.00045600906014442444, 0.00047160685062408447, 0.0004872046411037445, 0.0005028024315834045, 0.0005184002220630646, 0.0005339980125427246]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 3.0, 9.0, 12.0, 12.0, 16.0, 19.0, 27.0, 23.0, 33.0, 43.0, 35.0, 32.0, 45.0, 45.0, 53.0, 46.0, 52.0, 55.0, 54.0, 46.0, 44.0, 36.0, 34.0, 42.0, 38.0, 26.0, 24.0, 15.0, 12.0, 15.0, 11.0, 12.0, 8.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1640625, -7.8782958984375, -7.592529296875, -7.3067626953125, -7.02099609375, -6.7352294921875, -6.449462890625, -6.1636962890625, -5.8779296875, -5.5921630859375, -5.306396484375, -5.0206298828125, -4.73486328125, -4.4490966796875, -4.163330078125, -3.8775634765625, -3.591796875, -3.3060302734375, -3.020263671875, -2.7344970703125, -2.44873046875, -2.1629638671875, -1.877197265625, -1.5914306640625, -1.3056640625, -1.0198974609375, -0.734130859375, -0.4483642578125, -0.16259765625, 0.1231689453125, 0.408935546875, 0.6947021484375, 0.98046875, 1.2662353515625, 1.552001953125, 1.8377685546875, 2.12353515625, 2.4093017578125, 2.695068359375, 2.9808349609375, 3.2666015625, 3.5523681640625, 3.838134765625, 4.1239013671875, 4.40966796875, 4.6954345703125, 4.981201171875, 5.2669677734375, 5.552734375, 5.8385009765625, 6.124267578125, 6.4100341796875, 6.69580078125, 6.9815673828125, 7.267333984375, 7.5531005859375, 7.8388671875, 8.1246337890625, 8.410400390625, 8.6961669921875, 8.98193359375, 9.2677001953125, 9.553466796875, 9.8392333984375, 10.125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 6.0, 3.0, 7.0, 8.0, 18.0, 21.0, 26.0, 37.0, 46.0, 72.0, 95.0, 135.0, 211.0, 272.0, 386.0, 622.0, 848.0, 1189.0, 1856.0, 2774.0, 4187.0, 6789.0, 11578.0, 21715.0, 49457.0, 159915.0, 498707.0, 178773.0, 53400.0, 23070.0, 12025.0, 6897.0, 4459.0, 2912.0, 1951.0, 1248.0, 868.0, 604.0, 421.0, 304.0, 211.0, 127.0, 94.0, 67.0, 40.0, 29.0, 26.0, 18.0, 12.0, 8.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.4609375, -4.30462646484375, -4.1483154296875, -3.99200439453125, -3.835693359375, -3.67938232421875, -3.5230712890625, -3.36676025390625, -3.21044921875, -3.05413818359375, -2.8978271484375, -2.74151611328125, -2.585205078125, -2.42889404296875, -2.2725830078125, -2.11627197265625, -1.9599609375, -1.80364990234375, -1.6473388671875, -1.49102783203125, -1.334716796875, -1.17840576171875, -1.0220947265625, -0.86578369140625, -0.70947265625, -0.55316162109375, -0.3968505859375, -0.24053955078125, -0.084228515625, 0.07208251953125, 0.2283935546875, 0.38470458984375, 0.541015625, 0.69732666015625, 0.8536376953125, 1.00994873046875, 1.166259765625, 1.32257080078125, 1.4788818359375, 1.63519287109375, 1.79150390625, 1.94781494140625, 2.1041259765625, 2.26043701171875, 2.416748046875, 2.57305908203125, 2.7293701171875, 2.88568115234375, 3.0419921875, 3.19830322265625, 3.3546142578125, 3.51092529296875, 3.667236328125, 3.82354736328125, 3.9798583984375, 4.13616943359375, 4.29248046875, 4.44879150390625, 4.6051025390625, 4.76141357421875, 4.917724609375, 5.07403564453125, 5.2303466796875, 5.38665771484375, 5.54296875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 6.0, 11.0, 6.0, 6.0, 18.0, 16.0, 29.0, 19.0, 23.0, 38.0, 40.0, 26.0, 46.0, 46.0, 55.0, 84.0, 243.0, 1742.0, 119.0, 54.0, 65.0, 57.0, 48.0, 31.0, 40.0, 31.0, 20.0, 28.0, 21.0, 16.0, 11.0, 14.0, 7.0, 11.0, 4.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.171875, -30.175537109375, -29.17919921875, -28.182861328125, -27.1865234375, -26.190185546875, -25.19384765625, -24.197509765625, -23.201171875, -22.204833984375, -21.20849609375, -20.212158203125, -19.2158203125, -18.219482421875, -17.22314453125, -16.226806640625, -15.23046875, -14.234130859375, -13.23779296875, -12.241455078125, -11.2451171875, -10.248779296875, -9.25244140625, -8.256103515625, -7.259765625, -6.263427734375, -5.26708984375, -4.270751953125, -3.2744140625, -2.278076171875, -1.28173828125, -0.285400390625, 0.7109375, 1.707275390625, 2.70361328125, 3.699951171875, 4.6962890625, 5.692626953125, 6.68896484375, 7.685302734375, 8.681640625, 9.677978515625, 10.67431640625, 11.670654296875, 12.6669921875, 13.663330078125, 14.65966796875, 15.656005859375, 16.65234375, 17.648681640625, 18.64501953125, 19.641357421875, 20.6376953125, 21.634033203125, 22.63037109375, 23.626708984375, 24.623046875, 25.619384765625, 26.61572265625, 27.612060546875, 28.6083984375, 29.604736328125, 30.60107421875, 31.597412109375, 32.59375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 7.0, 1.0, 7.0, 6.0, 12.0, 11.0, 19.0, 15.0, 24.0, 20.0, 31.0, 38.0, 68.0, 76.0, 95.0, 177.0, 240.0, 504.0, 1419.0, 17883.0, 3076164.0, 45421.0, 2008.0, 571.0, 273.0, 160.0, 100.0, 90.0, 72.0, 40.0, 35.0, 29.0, 26.0, 14.0, 8.0, 12.0, 10.0, 9.0, 5.0, 6.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.78125, -56.978515625, -55.17578125, -53.373046875, -51.5703125, -49.767578125, -47.96484375, -46.162109375, -44.359375, -42.556640625, -40.75390625, -38.951171875, -37.1484375, -35.345703125, -33.54296875, -31.740234375, -29.9375, -28.134765625, -26.33203125, -24.529296875, -22.7265625, -20.923828125, -19.12109375, -17.318359375, -15.515625, -13.712890625, -11.91015625, -10.107421875, -8.3046875, -6.501953125, -4.69921875, -2.896484375, -1.09375, 0.708984375, 2.51171875, 4.314453125, 6.1171875, 7.919921875, 9.72265625, 11.525390625, 13.328125, 15.130859375, 16.93359375, 18.736328125, 20.5390625, 22.341796875, 24.14453125, 25.947265625, 27.75, 29.552734375, 31.35546875, 33.158203125, 34.9609375, 36.763671875, 38.56640625, 40.369140625, 42.171875, 43.974609375, 45.77734375, 47.580078125, 49.3828125, 51.185546875, 52.98828125, 54.791015625, 56.59375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 11.0, 22.0, 53.0, 122.0, 208.0, 199.0, 173.0, 109.0, 59.0, 21.0, 20.0, 7.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.68754959106445, -34.22761917114258, -32.7676887512207, -31.307756423950195, -29.84782600402832, -28.387895584106445, -26.927963256835938, -25.468032836914062, -24.008102416992188, -22.548171997070312, -21.088241577148438, -19.62830924987793, -18.168378829956055, -16.70844841003418, -15.248517036437988, -13.788585662841797, -12.328655242919922, -10.868724822998047, -9.408793449401855, -7.948862552642822, -6.488931655883789, -5.029000759124756, -3.5690698623657227, -2.1091384887695312, -0.6492080688476562, 0.810722827911377, 2.27065372467041, 3.7305846214294434, 5.190515518188477, 6.65044641494751, 8.110377311706543, 9.570308685302734, 11.030242919921875, 12.49017333984375, 13.950104713439941, 15.410036087036133, 16.869966506958008, 18.329896926879883, 19.78982925415039, 21.249759674072266, 22.70969009399414, 24.169620513916016, 25.62955093383789, 27.0894832611084, 28.549413681030273, 30.00934410095215, 31.469276428222656, 32.92920684814453, 34.389137268066406, 35.84906768798828, 37.308998107910156, 38.76892852783203, 40.228858947753906, 41.68879318237305, 43.14872360229492, 44.6086540222168, 46.06858444213867, 47.52851486206055, 48.98844528198242, 50.4483757019043, 51.90830993652344, 53.36824035644531, 54.82817077636719, 56.28810119628906, 57.74803161621094]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 9.0, 4.0, 5.0, 5.0, 12.0, 6.0, 17.0, 18.0, 9.0, 11.0, 22.0, 19.0, 26.0, 20.0, 44.0, 47.0, 44.0, 39.0, 40.0, 26.0, 38.0, 47.0, 40.0, 40.0, 37.0, 39.0, 31.0, 33.0, 33.0, 43.0, 31.0, 26.0, 17.0, 20.0, 22.0, 23.0, 12.0, 9.0, 14.0, 4.0, 5.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.5935287475586, -85.85505676269531, -83.11659240722656, -80.37812042236328, -77.6396484375, -74.90118408203125, -72.16271209716797, -69.42424011230469, -66.68577575683594, -63.94730758666992, -61.20883560180664, -58.470367431640625, -55.731895446777344, -52.99342727661133, -50.25495910644531, -47.51648712158203, -44.77801513671875, -42.039546966552734, -39.30107498168945, -36.56260681152344, -33.824134826660156, -31.08566665649414, -28.347198486328125, -25.608728408813477, -22.870258331298828, -20.13178825378418, -17.39331817626953, -14.654850006103516, -11.916379928588867, -9.177909851074219, -6.439441680908203, -3.7009716033935547, -0.9625091552734375, 1.7759604454040527, 4.514430046081543, 7.252899169921875, 9.991369247436523, 12.729839324951172, 15.468307495117188, 18.206777572631836, 20.945247650146484, 23.683717727661133, 26.42218780517578, 29.160655975341797, 31.899126052856445, 34.637596130371094, 37.37606430053711, 40.114532470703125, 42.853004455566406, 45.59147262573242, 48.3299446105957, 51.06841278076172, 53.806884765625, 56.545352935791016, 59.28382110595703, 62.02229309082031, 64.76075744628906, 67.49922943115234, 70.2376937866211, 72.97616577148438, 75.71463775634766, 78.45310974121094, 81.19157409667969, 83.93004608154297, 86.66851806640625]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 0.0, 6.0, 10.0, 10.0, 17.0, 21.0, 16.0, 27.0, 37.0, 28.0, 43.0, 32.0, 43.0, 40.0, 48.0, 45.0, 54.0, 59.0, 53.0, 51.0, 44.0, 43.0, 32.0, 40.0, 33.0, 38.0, 27.0, 18.0, 10.0, 17.0, 10.0, 15.0, 9.0, 4.0, 6.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4921875, -8.2005615234375, -7.908935546875, -7.6173095703125, -7.32568359375, -7.0340576171875, -6.742431640625, -6.4508056640625, -6.1591796875, -5.8675537109375, -5.575927734375, -5.2843017578125, -4.99267578125, -4.7010498046875, -4.409423828125, -4.1177978515625, -3.826171875, -3.5345458984375, -3.242919921875, -2.9512939453125, -2.65966796875, -2.3680419921875, -2.076416015625, -1.7847900390625, -1.4931640625, -1.2015380859375, -0.909912109375, -0.6182861328125, -0.32666015625, -0.0350341796875, 0.256591796875, 0.5482177734375, 0.83984375, 1.1314697265625, 1.423095703125, 1.7147216796875, 2.00634765625, 2.2979736328125, 2.589599609375, 2.8812255859375, 3.1728515625, 3.4644775390625, 3.756103515625, 4.0477294921875, 4.33935546875, 4.6309814453125, 4.922607421875, 5.2142333984375, 5.505859375, 5.7974853515625, 6.089111328125, 6.3807373046875, 6.67236328125, 6.9639892578125, 7.255615234375, 7.5472412109375, 7.8388671875, 8.1304931640625, 8.422119140625, 8.7137451171875, 9.00537109375, 9.2969970703125, 9.588623046875, 9.8802490234375, 10.171875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 7.0, 10.0, 15.0, 19.0, 30.0, 44.0, 55.0, 100.0, 144.0, 327.0, 522.0, 1000.0, 2058.0, 4838.0, 11836.0, 33825.0, 125036.0, 558639.0, 1600166.0, 1343766.0, 379135.0, 90931.0, 25894.0, 8774.0, 3621.0, 1610.0, 829.0, 428.0, 216.0, 131.0, 92.0, 66.0, 37.0, 23.0, 23.0, 11.0, 10.0, 5.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.953125, -10.6297607421875, -10.306396484375, -9.9830322265625, -9.65966796875, -9.3363037109375, -9.012939453125, -8.6895751953125, -8.3662109375, -8.0428466796875, -7.719482421875, -7.3961181640625, -7.07275390625, -6.7493896484375, -6.426025390625, -6.1026611328125, -5.779296875, -5.4559326171875, -5.132568359375, -4.8092041015625, -4.48583984375, -4.1624755859375, -3.839111328125, -3.5157470703125, -3.1923828125, -2.8690185546875, -2.545654296875, -2.2222900390625, -1.89892578125, -1.5755615234375, -1.252197265625, -0.9288330078125, -0.60546875, -0.2821044921875, 0.041259765625, 0.3646240234375, 0.68798828125, 1.0113525390625, 1.334716796875, 1.6580810546875, 1.9814453125, 2.3048095703125, 2.628173828125, 2.9515380859375, 3.27490234375, 3.5982666015625, 3.921630859375, 4.2449951171875, 4.568359375, 4.8917236328125, 5.215087890625, 5.5384521484375, 5.86181640625, 6.1851806640625, 6.508544921875, 6.8319091796875, 7.1552734375, 7.4786376953125, 7.802001953125, 8.1253662109375, 8.44873046875, 8.7720947265625, 9.095458984375, 9.4188232421875, 9.7421875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 7.0, 14.0, 16.0, 38.0, 35.0, 60.0, 78.0, 100.0, 162.0, 243.0, 287.0, 391.0, 520.0, 487.0, 411.0, 340.0, 250.0, 179.0, 132.0, 102.0, 64.0, 48.0, 30.0, 27.0, 20.0, 3.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.59375, -20.900146484375, -20.20654296875, -19.512939453125, -18.8193359375, -18.125732421875, -17.43212890625, -16.738525390625, -16.044921875, -15.351318359375, -14.65771484375, -13.964111328125, -13.2705078125, -12.576904296875, -11.88330078125, -11.189697265625, -10.49609375, -9.802490234375, -9.10888671875, -8.415283203125, -7.7216796875, -7.028076171875, -6.33447265625, -5.640869140625, -4.947265625, -4.253662109375, -3.56005859375, -2.866455078125, -2.1728515625, -1.479248046875, -0.78564453125, -0.092041015625, 0.6015625, 1.295166015625, 1.98876953125, 2.682373046875, 3.3759765625, 4.069580078125, 4.76318359375, 5.456787109375, 6.150390625, 6.843994140625, 7.53759765625, 8.231201171875, 8.9248046875, 9.618408203125, 10.31201171875, 11.005615234375, 11.69921875, 12.392822265625, 13.08642578125, 13.780029296875, 14.4736328125, 15.167236328125, 15.86083984375, 16.554443359375, 17.248046875, 17.941650390625, 18.63525390625, 19.328857421875, 20.0224609375, 20.716064453125, 21.40966796875, 22.103271484375, 22.796875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 9.0, 13.0, 18.0, 30.0, 44.0, 71.0, 93.0, 140.0, 258.0, 599.0, 4449.0, 3961132.0, 225208.0, 1300.0, 380.0, 192.0, 104.0, 77.0, 52.0, 30.0, 32.0, 14.0, 10.0, 7.0, 8.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.75, -103.04296875, -99.3359375, -95.62890625, -91.921875, -88.21484375, -84.5078125, -80.80078125, -77.09375, -73.38671875, -69.6796875, -65.97265625, -62.265625, -58.55859375, -54.8515625, -51.14453125, -47.4375, -43.73046875, -40.0234375, -36.31640625, -32.609375, -28.90234375, -25.1953125, -21.48828125, -17.78125, -14.07421875, -10.3671875, -6.66015625, -2.953125, 0.75390625, 4.4609375, 8.16796875, 11.875, 15.58203125, 19.2890625, 22.99609375, 26.703125, 30.41015625, 34.1171875, 37.82421875, 41.53125, 45.23828125, 48.9453125, 52.65234375, 56.359375, 60.06640625, 63.7734375, 67.48046875, 71.1875, 74.89453125, 78.6015625, 82.30859375, 86.015625, 89.72265625, 93.4296875, 97.13671875, 100.84375, 104.55078125, 108.2578125, 111.96484375, 115.671875, 119.37890625, 123.0859375, 126.79296875, 130.5]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 32.0, 125.0, 382.0, 339.0, 101.0, 27.0, 4.0, 0.0, 2.0], "bins": [-505.6151428222656, -496.8895263671875, -488.16387939453125, -479.4382629394531, -470.712646484375, -461.98699951171875, -453.2613830566406, -444.5357666015625, -435.81011962890625, -427.0845031738281, -418.3588562011719, -409.63323974609375, -400.9076232910156, -392.1820068359375, -383.45635986328125, -374.7307434082031, -366.005126953125, -357.2795104980469, -348.5538635253906, -339.8282470703125, -331.1026306152344, -322.37701416015625, -313.6513671875, -304.9257507324219, -296.20013427734375, -287.4745178222656, -278.7488708496094, -270.02325439453125, -261.2976379394531, -252.57200622558594, -243.84637451171875, -235.12075805664062, -226.3950958251953, -217.66946411132812, -208.94384765625, -200.2182159423828, -191.49258422851562, -182.7669677734375, -174.0413360595703, -165.31570434570312, -156.590087890625, -147.8644561767578, -139.1388397216797, -130.4132080078125, -121.68758392333984, -112.96195983886719, -104.236328125, -95.51070404052734, -86.78507995605469, -78.05945587158203, -69.33383178710938, -60.60820007324219, -51.88257598876953, -43.156951904296875, -34.43132400512695, -25.70569610595703, -16.98006820678711, -8.25444221496582, 0.47118377685546875, 9.196809768676758, 17.922435760498047, 26.648059844970703, 35.373687744140625, 44.09931564331055, 52.8249397277832]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 15.0, 12.0, 8.0, 16.0, 19.0, 28.0, 18.0, 25.0, 26.0, 32.0, 33.0, 45.0, 37.0, 48.0, 44.0, 40.0, 47.0, 47.0, 43.0, 49.0, 54.0, 39.0, 36.0, 31.0, 30.0, 26.0, 22.0, 27.0, 21.0, 15.0, 17.0, 15.0, 9.0, 8.0, 4.0, 4.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-76.72566223144531, -74.46015167236328, -72.19464111328125, -69.92913055419922, -67.66361999511719, -65.39810943603516, -63.13259506225586, -60.86708450317383, -58.6015739440918, -56.336063385009766, -54.070552825927734, -51.8050422668457, -49.539527893066406, -47.274017333984375, -45.008506774902344, -42.74299621582031, -40.47748565673828, -38.21197509765625, -35.94646453857422, -33.68095397949219, -31.415441513061523, -29.149930953979492, -26.884418487548828, -24.618907928466797, -22.353397369384766, -20.087886810302734, -17.822376251220703, -15.556863784790039, -13.291353225708008, -11.025842666625977, -8.760331153869629, -6.494819641113281, -4.229301452636719, -1.9637904167175293, 0.30172061920166016, 2.5672316551208496, 4.832742691040039, 7.09825325012207, 9.363764762878418, 11.629276275634766, 13.894786834716797, 16.160297393798828, 18.42580795288086, 20.691320419311523, 22.956830978393555, 25.222341537475586, 27.48785400390625, 29.75336456298828, 32.01887512207031, 34.284385681152344, 36.549896240234375, 38.815406799316406, 41.08091735839844, 43.34642791748047, 45.611942291259766, 47.8774528503418, 50.14296340942383, 52.40847396850586, 54.67398452758789, 56.93949508666992, 59.20500946044922, 61.47052001953125, 63.73603057861328, 66.00154113769531, 68.26705169677734]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 9.0, 8.0, 11.0, 13.0, 19.0, 36.0, 40.0, 32.0, 25.0, 40.0, 31.0, 40.0, 40.0, 52.0, 48.0, 54.0, 39.0, 50.0, 43.0, 52.0, 44.0, 50.0, 35.0, 30.0, 35.0, 17.0, 20.0, 14.0, 17.0, 16.0, 5.0, 5.0, 10.0, 4.0, 1.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6640625, -8.372314453125, -8.08056640625, -7.788818359375, -7.4970703125, -7.205322265625, -6.91357421875, -6.621826171875, -6.330078125, -6.038330078125, -5.74658203125, -5.454833984375, -5.1630859375, -4.871337890625, -4.57958984375, -4.287841796875, -3.99609375, -3.704345703125, -3.41259765625, -3.120849609375, -2.8291015625, -2.537353515625, -2.24560546875, -1.953857421875, -1.662109375, -1.370361328125, -1.07861328125, -0.786865234375, -0.4951171875, -0.203369140625, 0.08837890625, 0.380126953125, 0.671875, 0.963623046875, 1.25537109375, 1.547119140625, 1.8388671875, 2.130615234375, 2.42236328125, 2.714111328125, 3.005859375, 3.297607421875, 3.58935546875, 3.881103515625, 4.1728515625, 4.464599609375, 4.75634765625, 5.048095703125, 5.33984375, 5.631591796875, 5.92333984375, 6.215087890625, 6.5068359375, 6.798583984375, 7.09033203125, 7.382080078125, 7.673828125, 7.965576171875, 8.25732421875, 8.549072265625, 8.8408203125, 9.132568359375, 9.42431640625, 9.716064453125, 10.0078125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 9.0, 7.0, 11.0, 18.0, 36.0, 50.0, 65.0, 87.0, 139.0, 226.0, 289.0, 428.0, 636.0, 879.0, 1351.0, 2120.0, 3040.0, 4973.0, 7672.0, 12197.0, 19816.0, 32203.0, 53255.0, 95600.0, 220588.0, 316554.0, 115541.0, 62481.0, 36819.0, 22474.0, 14011.0, 8845.0, 5527.0, 3599.0, 2270.0, 1549.0, 983.0, 683.0, 455.0, 321.0, 233.0, 161.0, 113.0, 67.0, 50.0, 43.0, 27.0, 21.0, 14.0, 6.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0], "bins": [-1.7177734375, -1.6659393310546875, -1.614105224609375, -1.5622711181640625, -1.51043701171875, -1.4586029052734375, -1.406768798828125, -1.3549346923828125, -1.3031005859375, -1.2512664794921875, -1.199432373046875, -1.1475982666015625, -1.09576416015625, -1.0439300537109375, -0.992095947265625, -0.9402618408203125, -0.888427734375, -0.8365936279296875, -0.784759521484375, -0.7329254150390625, -0.68109130859375, -0.6292572021484375, -0.577423095703125, -0.5255889892578125, -0.4737548828125, -0.4219207763671875, -0.370086669921875, -0.3182525634765625, -0.26641845703125, -0.2145843505859375, -0.162750244140625, -0.1109161376953125, -0.05908203125, -0.0072479248046875, 0.044586181640625, 0.0964202880859375, 0.14825439453125, 0.2000885009765625, 0.251922607421875, 0.3037567138671875, 0.3555908203125, 0.4074249267578125, 0.459259033203125, 0.5110931396484375, 0.56292724609375, 0.6147613525390625, 0.666595458984375, 0.7184295654296875, 0.770263671875, 0.8220977783203125, 0.873931884765625, 0.9257659912109375, 0.97760009765625, 1.0294342041015625, 1.081268310546875, 1.1331024169921875, 1.1849365234375, 1.2367706298828125, 1.288604736328125, 1.3404388427734375, 1.39227294921875, 1.4441070556640625, 1.495941162109375, 1.5477752685546875, 1.599609375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 0.0, 2.0, 3.0, 5.0, 2.0, 3.0, 11.0, 12.0, 9.0, 16.0, 13.0, 12.0, 15.0, 33.0, 25.0, 27.0, 31.0, 34.0, 31.0, 35.0, 45.0, 39.0, 33.0, 34.0, 1069.0, 42.0, 44.0, 38.0, 29.0, 36.0, 32.0, 33.0, 23.0, 24.0, 21.0, 18.0, 12.0, 15.0, 22.0, 12.0, 19.0, 10.0, 13.0, 13.0, 9.0, 14.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0], "bins": [-4.65234375, -4.506591796875, -4.36083984375, -4.215087890625, -4.0693359375, -3.923583984375, -3.77783203125, -3.632080078125, -3.486328125, -3.340576171875, -3.19482421875, -3.049072265625, -2.9033203125, -2.757568359375, -2.61181640625, -2.466064453125, -2.3203125, -2.174560546875, -2.02880859375, -1.883056640625, -1.7373046875, -1.591552734375, -1.44580078125, -1.300048828125, -1.154296875, -1.008544921875, -0.86279296875, -0.717041015625, -0.5712890625, -0.425537109375, -0.27978515625, -0.134033203125, 0.01171875, 0.157470703125, 0.30322265625, 0.448974609375, 0.5947265625, 0.740478515625, 0.88623046875, 1.031982421875, 1.177734375, 1.323486328125, 1.46923828125, 1.614990234375, 1.7607421875, 1.906494140625, 2.05224609375, 2.197998046875, 2.34375, 2.489501953125, 2.63525390625, 2.781005859375, 2.9267578125, 3.072509765625, 3.21826171875, 3.364013671875, 3.509765625, 3.655517578125, 3.80126953125, 3.947021484375, 4.0927734375, 4.238525390625, 4.38427734375, 4.530029296875, 4.67578125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 11.0, 8.0, 9.0, 29.0, 35.0, 48.0, 66.0, 104.0, 160.0, 208.0, 335.0, 454.0, 679.0, 970.0, 1484.0, 2313.0, 3409.0, 5057.0, 7339.0, 10759.0, 16020.0, 24156.0, 38063.0, 61746.0, 111538.0, 1337385.0, 220575.0, 96741.0, 55013.0, 34500.0, 22721.0, 15085.0, 9954.0, 6691.0, 4460.0, 3049.0, 1894.0, 1332.0, 882.0, 582.0, 399.0, 266.0, 203.0, 132.0, 91.0, 37.0, 40.0, 29.0, 27.0, 11.0, 5.0, 11.0, 8.0, 2.0, 3.0, 3.0, 0.0, 2.0], "bins": [-1.4013671875, -1.357421875, -1.3134765625, -1.26953125, -1.2255859375, -1.181640625, -1.1376953125, -1.09375, -1.0498046875, -1.005859375, -0.9619140625, -0.91796875, -0.8740234375, -0.830078125, -0.7861328125, -0.7421875, -0.6982421875, -0.654296875, -0.6103515625, -0.56640625, -0.5224609375, -0.478515625, -0.4345703125, -0.390625, -0.3466796875, -0.302734375, -0.2587890625, -0.21484375, -0.1708984375, -0.126953125, -0.0830078125, -0.0390625, 0.0048828125, 0.048828125, 0.0927734375, 0.13671875, 0.1806640625, 0.224609375, 0.2685546875, 0.3125, 0.3564453125, 0.400390625, 0.4443359375, 0.48828125, 0.5322265625, 0.576171875, 0.6201171875, 0.6640625, 0.7080078125, 0.751953125, 0.7958984375, 0.83984375, 0.8837890625, 0.927734375, 0.9716796875, 1.015625, 1.0595703125, 1.103515625, 1.1474609375, 1.19140625, 1.2353515625, 1.279296875, 1.3232421875, 1.3671875, 1.4111328125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 6.0, 3.0, 7.0, 6.0, 13.0, 13.0, 14.0, 25.0, 24.0, 32.0, 37.0, 37.0, 52.0, 87.0, 71.0, 91.0, 73.0, 83.0, 64.0, 48.0, 37.0, 38.0, 28.0, 25.0, 18.0, 12.0, 8.0, 15.0, 10.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0009341239929199219, -0.0009048283100128174, -0.0008755326271057129, -0.0008462369441986084, -0.0008169412612915039, -0.0007876455783843994, -0.0007583498954772949, -0.0007290542125701904, -0.0006997585296630859, -0.0006704628467559814, -0.000641167163848877, -0.0006118714809417725, -0.000582575798034668, -0.0005532801151275635, -0.000523984432220459, -0.0004946887493133545, -0.00046539306640625, -0.0004360973834991455, -0.000406801700592041, -0.0003775060176849365, -0.00034821033477783203, -0.00031891465187072754, -0.00028961896896362305, -0.00026032328605651855, -0.00023102760314941406, -0.00020173192024230957, -0.00017243623733520508, -0.00014314055442810059, -0.0001138448715209961, -8.45491886138916e-05, -5.525350570678711e-05, -2.5957822799682617e-05, 3.337860107421875e-06, 3.263354301452637e-05, 6.192922592163086e-05, 9.122490882873535e-05, 0.00012052059173583984, 0.00014981627464294434, 0.00017911195755004883, 0.00020840764045715332, 0.0002377033233642578, 0.0002669990062713623, 0.0002962946891784668, 0.0003255903720855713, 0.0003548860549926758, 0.0003841817378997803, 0.00041347742080688477, 0.00044277310371398926, 0.00047206878662109375, 0.0005013644695281982, 0.0005306601524353027, 0.0005599558353424072, 0.0005892515182495117, 0.0006185472011566162, 0.0006478428840637207, 0.0006771385669708252, 0.0007064342498779297, 0.0007357299327850342, 0.0007650256156921387, 0.0007943212985992432, 0.0008236169815063477, 0.0008529126644134521, 0.0008822083473205566, 0.0009115040302276611, 0.0009407997131347656]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 10.0, 7.0, 12.0, 17.0, 24.0, 38.0, 50.0, 71.0, 120.0, 210.0, 438.0, 1368.0, 938913.0, 105617.0, 838.0, 348.0, 178.0, 96.0, 53.0, 39.0, 23.0, 22.0, 14.0, 15.0, 7.0, 4.0, 4.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0251312255859375, -0.024366140365600586, -0.023601055145263672, -0.022835969924926758, -0.022070884704589844, -0.02130579948425293, -0.020540714263916016, -0.0197756290435791, -0.019010543823242188, -0.018245458602905273, -0.01748037338256836, -0.016715288162231445, -0.01595020294189453, -0.015185117721557617, -0.014420032501220703, -0.013654947280883789, -0.012889862060546875, -0.012124776840209961, -0.011359691619873047, -0.010594606399536133, -0.009829521179199219, -0.009064435958862305, -0.00829935073852539, -0.0075342655181884766, -0.0067691802978515625, -0.0060040950775146484, -0.005239009857177734, -0.00447392463684082, -0.0037088394165039062, -0.002943754196166992, -0.002178668975830078, -0.001413583755493164, -0.00064849853515625, 0.00011658668518066406, 0.0008816719055175781, 0.0016467571258544922, 0.0024118423461914062, 0.0031769275665283203, 0.003942012786865234, 0.0047070980072021484, 0.0054721832275390625, 0.0062372684478759766, 0.007002353668212891, 0.007767438888549805, 0.008532524108886719, 0.009297609329223633, 0.010062694549560547, 0.010827779769897461, 0.011592864990234375, 0.012357950210571289, 0.013123035430908203, 0.013888120651245117, 0.014653205871582031, 0.015418291091918945, 0.01618337631225586, 0.016948461532592773, 0.017713546752929688, 0.0184786319732666, 0.019243717193603516, 0.02000880241394043, 0.020773887634277344, 0.021538972854614258, 0.022304058074951172, 0.023069143295288086, 0.023834228515625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 8.0, 23.0, 170.0, 421.0, 285.0, 88.0, 19.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00039740331703796983, -0.00032775328145362437, -0.0002581032458692789, -0.00018845321028493345, -0.00011880317470058799, -4.915313911624253e-05, 2.0496896468102932e-05, 9.014693205244839e-05, 0.00015979696763679385, 0.0002294470032211393, 0.00029909703880548477, 0.00036874707438983023, 0.0004383971099741757, 0.0005080471746623516, 0.0005776971811428666, 0.0006473471876233816, 0.0007169972523115575, 0.0007866473169997334, 0.0008562973234802485, 0.0009259473299607635, 0.0009955973364412785, 0.0010652474593371153, 0.0011348974658176303, 0.0012045474722981453, 0.0012741975951939821, 0.0013438476016744971, 0.0014134976081550121, 0.001483147731050849, 0.001552797737531364, 0.001622447744011879, 0.0016920978669077158, 0.0017617478733882308, 0.0018313978798687458, 0.0019010478863492608, 0.001970697892829776, 0.0020403480157256126, 0.002109997905790806, 0.0021796480286866426, 0.0022492981515824795, 0.0023189480416476727, 0.0023885981645435095, 0.0024582482874393463, 0.0025278981775045395, 0.0025975483004003763, 0.002667198423296213, 0.0027368483133614063, 0.002806498436257243, 0.0028761483263224363, 0.002945798449218273, 0.00301544857211411, 0.003085098462179303, 0.00315474858507514, 0.003224398475140333, 0.00329404859803617, 0.003363698720932007, 0.0034333486109972, 0.003502998733893037, 0.0035726488567888737, 0.003642298746854067, 0.0037119488697499037, 0.0037815989926457405, 0.0038512488827109337, 0.003920898772776127, 0.003990549128502607, 0.0040601990185678005]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 12.0, 12.0, 16.0, 14.0, 21.0, 21.0, 30.0, 24.0, 32.0, 28.0, 30.0, 30.0, 41.0, 32.0, 31.0, 37.0, 41.0, 47.0, 29.0, 43.0, 43.0, 37.0, 41.0, 30.0, 32.0, 30.0, 20.0, 31.0, 18.0, 23.0, 17.0, 19.0, 16.0, 15.0, 9.0, 4.0, 4.0, 8.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.00044715404510498047, -0.0004346594214439392, -0.00042216479778289795, -0.0004096701741218567, -0.00039717555046081543, -0.00038468092679977417, -0.0003721863031387329, -0.00035969167947769165, -0.0003471970558166504, -0.00033470243215560913, -0.00032220780849456787, -0.0003097131848335266, -0.00029721856117248535, -0.0002847239375114441, -0.00027222931385040283, -0.00025973469018936157, -0.0002472400665283203, -0.00023474544286727905, -0.0002222508192062378, -0.00020975619554519653, -0.00019726157188415527, -0.00018476694822311401, -0.00017227232456207275, -0.0001597777009010315, -0.00014728307723999023, -0.00013478845357894897, -0.00012229382991790771, -0.00010979920625686646, -9.73045825958252e-05, -8.480995893478394e-05, -7.231533527374268e-05, -5.9820711612701416e-05, -4.7326087951660156e-05, -3.4831464290618896e-05, -2.2336840629577637e-05, -9.842216968536377e-06, 2.652406692504883e-06, 1.5147030353546143e-05, 2.7641654014587402e-05, 4.013627767562866e-05, 5.263090133666992e-05, 6.512552499771118e-05, 7.762014865875244e-05, 9.01147723197937e-05, 0.00010260939598083496, 0.00011510401964187622, 0.00012759864330291748, 0.00014009326696395874, 0.000152587890625, 0.00016508251428604126, 0.00017757713794708252, 0.00019007176160812378, 0.00020256638526916504, 0.0002150610089302063, 0.00022755563259124756, 0.00024005025625228882, 0.0002525448799133301, 0.00026503950357437134, 0.0002775341272354126, 0.00029002875089645386, 0.0003025233745574951, 0.0003150179982185364, 0.00032751262187957764, 0.0003400072455406189, 0.00035250186920166016]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 9.0, 8.0, 11.0, 13.0, 19.0, 36.0, 40.0, 32.0, 25.0, 40.0, 31.0, 40.0, 40.0, 52.0, 48.0, 54.0, 39.0, 50.0, 43.0, 52.0, 44.0, 50.0, 35.0, 30.0, 35.0, 17.0, 20.0, 14.0, 17.0, 16.0, 5.0, 5.0, 10.0, 4.0, 1.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6640625, -8.372314453125, -8.08056640625, -7.788818359375, -7.4970703125, -7.205322265625, -6.91357421875, -6.621826171875, -6.330078125, -6.038330078125, -5.74658203125, -5.454833984375, -5.1630859375, -4.871337890625, -4.57958984375, -4.287841796875, -3.99609375, -3.704345703125, -3.41259765625, -3.120849609375, -2.8291015625, -2.537353515625, -2.24560546875, -1.953857421875, -1.662109375, -1.370361328125, -1.07861328125, -0.786865234375, -0.4951171875, -0.203369140625, 0.08837890625, 0.380126953125, 0.671875, 0.963623046875, 1.25537109375, 1.547119140625, 1.8388671875, 2.130615234375, 2.42236328125, 2.714111328125, 3.005859375, 3.297607421875, 3.58935546875, 3.881103515625, 4.1728515625, 4.464599609375, 4.75634765625, 5.048095703125, 5.33984375, 5.631591796875, 5.92333984375, 6.215087890625, 6.5068359375, 6.798583984375, 7.09033203125, 7.382080078125, 7.673828125, 7.965576171875, 8.25732421875, 8.549072265625, 8.8408203125, 9.132568359375, 9.42431640625, 9.716064453125, 10.0078125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 8.0, 12.0, 8.0, 20.0, 29.0, 38.0, 58.0, 106.0, 140.0, 225.0, 446.0, 775.0, 1564.0, 3091.0, 6929.0, 18139.0, 51951.0, 189971.0, 534639.0, 164897.0, 46672.0, 16265.0, 6500.0, 2944.0, 1389.0, 691.0, 369.0, 254.0, 133.0, 88.0, 66.0, 49.0, 28.0, 17.0, 15.0, 4.0, 6.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.26171875, -6.05609130859375, -5.8504638671875, -5.64483642578125, -5.439208984375, -5.23358154296875, -5.0279541015625, -4.82232666015625, -4.61669921875, -4.41107177734375, -4.2054443359375, -3.99981689453125, -3.794189453125, -3.58856201171875, -3.3829345703125, -3.17730712890625, -2.9716796875, -2.76605224609375, -2.5604248046875, -2.35479736328125, -2.149169921875, -1.94354248046875, -1.7379150390625, -1.53228759765625, -1.32666015625, -1.12103271484375, -0.9154052734375, -0.70977783203125, -0.504150390625, -0.29852294921875, -0.0928955078125, 0.11273193359375, 0.318359375, 0.52398681640625, 0.7296142578125, 0.93524169921875, 1.140869140625, 1.34649658203125, 1.5521240234375, 1.75775146484375, 1.96337890625, 2.16900634765625, 2.3746337890625, 2.58026123046875, 2.785888671875, 2.99151611328125, 3.1971435546875, 3.40277099609375, 3.6083984375, 3.81402587890625, 4.0196533203125, 4.22528076171875, 4.430908203125, 4.63653564453125, 4.8421630859375, 5.04779052734375, 5.25341796875, 5.45904541015625, 5.6646728515625, 5.87030029296875, 6.075927734375, 6.28155517578125, 6.4871826171875, 6.69281005859375, 6.8984375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 10.0, 8.0, 11.0, 9.0, 9.0, 13.0, 16.0, 14.0, 28.0, 18.0, 20.0, 28.0, 42.0, 35.0, 55.0, 45.0, 55.0, 78.0, 174.0, 1669.0, 174.0, 84.0, 70.0, 43.0, 45.0, 41.0, 42.0, 28.0, 28.0, 26.0, 21.0, 22.0, 12.0, 11.0, 15.0, 12.0, 5.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.140625, -24.257568359375, -23.37451171875, -22.491455078125, -21.6083984375, -20.725341796875, -19.84228515625, -18.959228515625, -18.076171875, -17.193115234375, -16.31005859375, -15.427001953125, -14.5439453125, -13.660888671875, -12.77783203125, -11.894775390625, -11.01171875, -10.128662109375, -9.24560546875, -8.362548828125, -7.4794921875, -6.596435546875, -5.71337890625, -4.830322265625, -3.947265625, -3.064208984375, -2.18115234375, -1.298095703125, -0.4150390625, 0.468017578125, 1.35107421875, 2.234130859375, 3.1171875, 4.000244140625, 4.88330078125, 5.766357421875, 6.6494140625, 7.532470703125, 8.41552734375, 9.298583984375, 10.181640625, 11.064697265625, 11.94775390625, 12.830810546875, 13.7138671875, 14.596923828125, 15.47998046875, 16.363037109375, 17.24609375, 18.129150390625, 19.01220703125, 19.895263671875, 20.7783203125, 21.661376953125, 22.54443359375, 23.427490234375, 24.310546875, 25.193603515625, 26.07666015625, 26.959716796875, 27.8427734375, 28.725830078125, 29.60888671875, 30.491943359375, 31.375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 14.0, 26.0, 39.0, 60.0, 104.0, 215.0, 450.0, 1935.0, 3080681.0, 60441.0, 1058.0, 313.0, 150.0, 71.0, 47.0, 36.0, 28.0, 15.0, 13.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-175.375, -171.0810546875, -166.787109375, -162.4931640625, -158.19921875, -153.9052734375, -149.611328125, -145.3173828125, -141.0234375, -136.7294921875, -132.435546875, -128.1416015625, -123.84765625, -119.5537109375, -115.259765625, -110.9658203125, -106.671875, -102.3779296875, -98.083984375, -93.7900390625, -89.49609375, -85.2021484375, -80.908203125, -76.6142578125, -72.3203125, -68.0263671875, -63.732421875, -59.4384765625, -55.14453125, -50.8505859375, -46.556640625, -42.2626953125, -37.96875, -33.6748046875, -29.380859375, -25.0869140625, -20.79296875, -16.4990234375, -12.205078125, -7.9111328125, -3.6171875, 0.6767578125, 4.970703125, 9.2646484375, 13.55859375, 17.8525390625, 22.146484375, 26.4404296875, 30.734375, 35.0283203125, 39.322265625, 43.6162109375, 47.91015625, 52.2041015625, 56.498046875, 60.7919921875, 65.0859375, 69.3798828125, 73.673828125, 77.9677734375, 82.26171875, 86.5556640625, 90.849609375, 95.1435546875, 99.4375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 6.0, 578.0, 431.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.53816223144531, -52.896820068359375, -42.25547790527344, -31.614131927490234, -20.972789764404297, -10.33144760131836, 0.30989837646484375, 10.951240539550781, 21.59258270263672, 32.233924865722656, 42.875267028808594, 53.5166130065918, 64.157958984375, 74.79930114746094, 85.44064331054688, 96.08198547363281, 106.72332763671875, 117.36466979980469, 128.00601196289062, 138.64735412597656, 149.2886962890625, 159.93003845214844, 170.57138061523438, 181.21273803710938, 191.85406494140625, 202.4954071044922, 213.13674926757812, 223.77809143066406, 234.41943359375, 245.06077575683594, 255.70211791992188, 266.3434753417969, 276.9848327636719, 287.6261901855469, 298.26751708984375, 308.90887451171875, 319.5502014160156, 330.1915588378906, 340.8328857421875, 351.4742431640625, 362.1155700683594, 372.7569274902344, 383.39825439453125, 394.03961181640625, 404.6809387207031, 415.3222961425781, 425.963623046875, 436.60498046875, 447.246337890625, 457.8876953125, 468.5290222167969, 479.1703796386719, 489.81170654296875, 500.45306396484375, 511.0943908691406, 521.7357177734375, 532.3770751953125, 543.0184326171875, 553.6597900390625, 564.3010864257812, 574.9424438476562, 585.5838012695312, 596.2251586914062, 606.866455078125, 617.5078125]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 9.0, 9.0, 9.0, 8.0, 8.0, 16.0, 9.0, 14.0, 11.0, 16.0, 23.0, 28.0, 23.0, 20.0, 21.0, 35.0, 29.0, 38.0, 29.0, 45.0, 31.0, 53.0, 34.0, 42.0, 29.0, 38.0, 38.0, 32.0, 30.0, 32.0, 38.0, 19.0, 25.0, 25.0, 19.0, 17.0, 15.0, 17.0, 18.0, 16.0, 6.0, 3.0, 10.0, 3.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-71.00201416015625, -68.90438842773438, -66.8067626953125, -64.70913696289062, -62.61151123046875, -60.513885498046875, -58.416255950927734, -56.31863021850586, -54.221004486083984, -52.12337875366211, -50.025753021240234, -47.92812728881836, -45.83049774169922, -43.732872009277344, -41.63524627685547, -39.537620544433594, -37.43999481201172, -35.342369079589844, -33.24474334716797, -31.14711570739746, -29.049489974975586, -26.95186424255371, -24.854236602783203, -22.756610870361328, -20.658985137939453, -18.561359405517578, -16.463733673095703, -14.366106033325195, -12.26848030090332, -10.170854568481445, -8.073227882385254, -5.9756011962890625, -3.877979278564453, -1.78035306930542, 0.3172731399536133, 2.4148993492126465, 4.51252555847168, 6.610151290893555, 8.707777976989746, 10.805404663085938, 12.903030395507812, 15.000656127929688, 17.098281860351562, 19.19590950012207, 21.293535232543945, 23.39116096496582, 25.488788604736328, 27.586414337158203, 29.684040069580078, 31.781665802001953, 33.87929153442383, 35.9769172668457, 38.074546813964844, 40.17217254638672, 42.269798278808594, 44.36742401123047, 46.465049743652344, 48.56267547607422, 50.660301208496094, 52.75792694091797, 54.855552673339844, 56.95317840576172, 59.05080795288086, 61.148433685302734, 63.24605941772461]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 6.0, 8.0, 4.0, 13.0, 14.0, 30.0, 26.0, 29.0, 31.0, 30.0, 25.0, 41.0, 40.0, 36.0, 54.0, 35.0, 46.0, 45.0, 48.0, 46.0, 44.0, 51.0, 44.0, 37.0, 33.0, 35.0, 19.0, 28.0, 22.0, 12.0, 16.0, 7.0, 11.0, 7.0, 8.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.406494140625, -8.11767578125, -7.828857421875, -7.5400390625, -7.251220703125, -6.96240234375, -6.673583984375, -6.384765625, -6.095947265625, -5.80712890625, -5.518310546875, -5.2294921875, -4.940673828125, -4.65185546875, -4.363037109375, -4.07421875, -3.785400390625, -3.49658203125, -3.207763671875, -2.9189453125, -2.630126953125, -2.34130859375, -2.052490234375, -1.763671875, -1.474853515625, -1.18603515625, -0.897216796875, -0.6083984375, -0.319580078125, -0.03076171875, 0.258056640625, 0.546875, 0.835693359375, 1.12451171875, 1.413330078125, 1.7021484375, 1.990966796875, 2.27978515625, 2.568603515625, 2.857421875, 3.146240234375, 3.43505859375, 3.723876953125, 4.0126953125, 4.301513671875, 4.59033203125, 4.879150390625, 5.16796875, 5.456787109375, 5.74560546875, 6.034423828125, 6.3232421875, 6.612060546875, 6.90087890625, 7.189697265625, 7.478515625, 7.767333984375, 8.05615234375, 8.344970703125, 8.6337890625, 8.922607421875, 9.21142578125, 9.500244140625, 9.7890625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 8.0, 11.0, 11.0, 11.0, 15.0, 28.0, 30.0, 39.0, 27.0, 40.0, 56.0, 102.0, 131.0, 244.0, 926.0, 27546.0, 3866458.0, 295240.0, 2354.0, 339.0, 185.0, 133.0, 83.0, 55.0, 26.0, 31.0, 28.0, 27.0, 15.0, 16.0, 10.0, 9.0, 10.0, 8.0, 4.0, 6.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.0, -45.4169921875, -43.833984375, -42.2509765625, -40.66796875, -39.0849609375, -37.501953125, -35.9189453125, -34.3359375, -32.7529296875, -31.169921875, -29.5869140625, -28.00390625, -26.4208984375, -24.837890625, -23.2548828125, -21.671875, -20.0888671875, -18.505859375, -16.9228515625, -15.33984375, -13.7568359375, -12.173828125, -10.5908203125, -9.0078125, -7.4248046875, -5.841796875, -4.2587890625, -2.67578125, -1.0927734375, 0.490234375, 2.0732421875, 3.65625, 5.2392578125, 6.822265625, 8.4052734375, 9.98828125, 11.5712890625, 13.154296875, 14.7373046875, 16.3203125, 17.9033203125, 19.486328125, 21.0693359375, 22.65234375, 24.2353515625, 25.818359375, 27.4013671875, 28.984375, 30.5673828125, 32.150390625, 33.7333984375, 35.31640625, 36.8994140625, 38.482421875, 40.0654296875, 41.6484375, 43.2314453125, 44.814453125, 46.3974609375, 47.98046875, 49.5634765625, 51.146484375, 52.7294921875, 54.3125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 9.0, 8.0, 10.0, 10.0, 18.0, 38.0, 51.0, 86.0, 94.0, 172.0, 241.0, 413.0, 532.0, 632.0, 505.0, 431.0, 273.0, 213.0, 120.0, 69.0, 49.0, 39.0, 22.0, 18.0, 12.0, 6.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.796875, -22.026123046875, -21.25537109375, -20.484619140625, -19.7138671875, -18.943115234375, -18.17236328125, -17.401611328125, -16.630859375, -15.860107421875, -15.08935546875, -14.318603515625, -13.5478515625, -12.777099609375, -12.00634765625, -11.235595703125, -10.46484375, -9.694091796875, -8.92333984375, -8.152587890625, -7.3818359375, -6.611083984375, -5.84033203125, -5.069580078125, -4.298828125, -3.528076171875, -2.75732421875, -1.986572265625, -1.2158203125, -0.445068359375, 0.32568359375, 1.096435546875, 1.8671875, 2.637939453125, 3.40869140625, 4.179443359375, 4.9501953125, 5.720947265625, 6.49169921875, 7.262451171875, 8.033203125, 8.803955078125, 9.57470703125, 10.345458984375, 11.1162109375, 11.886962890625, 12.65771484375, 13.428466796875, 14.19921875, 14.969970703125, 15.74072265625, 16.511474609375, 17.2822265625, 18.052978515625, 18.82373046875, 19.594482421875, 20.365234375, 21.135986328125, 21.90673828125, 22.677490234375, 23.4482421875, 24.218994140625, 24.98974609375, 25.760498046875, 26.53125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 10.0, 13.0, 6.0, 3.0, 20.0, 29.0, 28.0, 44.0, 53.0, 57.0, 84.0, 103.0, 162.0, 243.0, 362.0, 683.0, 1838.0, 38526.0, 4005184.0, 141776.0, 2969.0, 772.0, 388.0, 230.0, 161.0, 123.0, 71.0, 70.0, 54.0, 47.0, 43.0, 28.0, 22.0, 18.0, 16.0, 15.0, 7.0, 4.0, 5.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-77.125, -74.8310546875, -72.537109375, -70.2431640625, -67.94921875, -65.6552734375, -63.361328125, -61.0673828125, -58.7734375, -56.4794921875, -54.185546875, -51.8916015625, -49.59765625, -47.3037109375, -45.009765625, -42.7158203125, -40.421875, -38.1279296875, -35.833984375, -33.5400390625, -31.24609375, -28.9521484375, -26.658203125, -24.3642578125, -22.0703125, -19.7763671875, -17.482421875, -15.1884765625, -12.89453125, -10.6005859375, -8.306640625, -6.0126953125, -3.71875, -1.4248046875, 0.869140625, 3.1630859375, 5.45703125, 7.7509765625, 10.044921875, 12.3388671875, 14.6328125, 16.9267578125, 19.220703125, 21.5146484375, 23.80859375, 26.1025390625, 28.396484375, 30.6904296875, 32.984375, 35.2783203125, 37.572265625, 39.8662109375, 42.16015625, 44.4541015625, 46.748046875, 49.0419921875, 51.3359375, 53.6298828125, 55.923828125, 58.2177734375, 60.51171875, 62.8056640625, 65.099609375, 67.3935546875, 69.6875]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 16.0, 55.0, 144.0, 208.0, 243.0, 186.0, 106.0, 28.0, 14.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-202.00889587402344, -197.00038146972656, -191.99188232421875, -186.98336791992188, -181.974853515625, -176.9663543701172, -171.9578399658203, -166.9493408203125, -161.94082641601562, -156.93231201171875, -151.92381286621094, -146.91529846191406, -141.9067840576172, -136.89828491210938, -131.8897705078125, -126.88126373291016, -121.87274932861328, -116.86424255371094, -111.85572814941406, -106.84722137451172, -101.83871459960938, -96.8302001953125, -91.82169342041016, -86.81318664550781, -81.80467224121094, -76.7961654663086, -71.78765106201172, -66.77914428710938, -61.77063751220703, -56.76212692260742, -51.75361633300781, -46.74510955810547, -41.736595153808594, -36.728084564208984, -31.71957778930664, -26.71106719970703, -21.702558517456055, -16.694049835205078, -11.685539245605469, -6.677032470703125, -1.6685218811035156, 3.339987277984619, 8.348496437072754, 13.357006072998047, 18.365514755249023, 23.3740234375, 28.38253402709961, 33.39104080200195, 38.39955139160156, 43.40806198120117, 48.416568756103516, 53.425079345703125, 58.43358612060547, 63.44209671020508, 68.45060729980469, 73.45911407470703, 78.46762084960938, 83.47612762451172, 88.4846420288086, 93.49314880371094, 98.50165557861328, 103.51016235351562, 108.5186767578125, 113.52718353271484, 118.53569793701172]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 3.0, 5.0, 15.0, 9.0, 11.0, 14.0, 13.0, 13.0, 16.0, 19.0, 25.0, 28.0, 32.0, 25.0, 40.0, 29.0, 36.0, 52.0, 34.0, 43.0, 39.0, 40.0, 41.0, 36.0, 44.0, 46.0, 38.0, 29.0, 21.0, 31.0, 21.0, 20.0, 12.0, 16.0, 14.0, 20.0, 7.0, 16.0, 10.0, 12.0, 4.0, 2.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.48942184448242, -53.6074104309082, -51.72539520263672, -49.8433837890625, -47.96137237548828, -46.0793571472168, -44.19734573364258, -42.315330505371094, -40.433319091796875, -38.551307678222656, -36.66929244995117, -34.78728103637695, -32.90526580810547, -31.02325439453125, -29.14124298095703, -27.25922966003418, -25.377216339111328, -23.495203018188477, -21.613189697265625, -19.731178283691406, -17.849164962768555, -15.967151641845703, -14.085139274597168, -12.203126907348633, -10.321113586425781, -8.43910026550293, -6.5570878982543945, -4.675075054168701, -2.793062210083008, -0.9110488891601562, 0.9709634780883789, 2.852975845336914, 4.734992980957031, 6.617005825042725, 8.499018669128418, 10.381031036376953, 12.263044357299805, 14.145057678222656, 16.027069091796875, 17.909082412719727, 19.791095733642578, 21.67310905456543, 23.55512237548828, 25.4371337890625, 27.31914710998535, 29.201160430908203, 31.083171844482422, 32.965187072753906, 34.847198486328125, 36.729209899902344, 38.61122512817383, 40.49323654174805, 42.37525177001953, 44.25726318359375, 46.13927459716797, 48.02128601074219, 49.90330123901367, 51.78531265258789, 53.667327880859375, 55.549339294433594, 57.43135070800781, 59.3133659362793, 61.195377349853516, 63.077392578125, 64.95940399169922]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 1.0, 5.0, 6.0, 5.0, 2.0, 7.0, 10.0, 9.0, 14.0, 23.0, 24.0, 33.0, 29.0, 31.0, 35.0, 46.0, 29.0, 34.0, 43.0, 44.0, 42.0, 41.0, 55.0, 53.0, 44.0, 45.0, 31.0, 26.0, 40.0, 40.0, 35.0, 19.0, 18.0, 16.0, 15.0, 9.0, 10.0, 11.0, 9.0, 2.0, 6.0, 3.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0078125, -8.7197265625, -8.431640625, -8.1435546875, -7.85546875, -7.5673828125, -7.279296875, -6.9912109375, -6.703125, -6.4150390625, -6.126953125, -5.8388671875, -5.55078125, -5.2626953125, -4.974609375, -4.6865234375, -4.3984375, -4.1103515625, -3.822265625, -3.5341796875, -3.24609375, -2.9580078125, -2.669921875, -2.3818359375, -2.09375, -1.8056640625, -1.517578125, -1.2294921875, -0.94140625, -0.6533203125, -0.365234375, -0.0771484375, 0.2109375, 0.4990234375, 0.787109375, 1.0751953125, 1.36328125, 1.6513671875, 1.939453125, 2.2275390625, 2.515625, 2.8037109375, 3.091796875, 3.3798828125, 3.66796875, 3.9560546875, 4.244140625, 4.5322265625, 4.8203125, 5.1083984375, 5.396484375, 5.6845703125, 5.97265625, 6.2607421875, 6.548828125, 6.8369140625, 7.125, 7.4130859375, 7.701171875, 7.9892578125, 8.27734375, 8.5654296875, 8.853515625, 9.1416015625, 9.4296875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 10.0, 10.0, 17.0, 26.0, 24.0, 40.0, 73.0, 118.0, 212.0, 292.0, 474.0, 730.0, 1171.0, 1767.0, 2886.0, 4775.0, 8304.0, 14491.0, 25577.0, 46705.0, 87048.0, 195216.0, 369666.0, 135523.0, 67616.0, 36678.0, 20462.0, 11431.0, 6690.0, 4048.0, 2486.0, 1441.0, 920.0, 557.0, 381.0, 238.0, 159.0, 88.0, 59.0, 54.0, 32.0, 29.0, 14.0, 6.0, 4.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9970703125, -1.9332733154296875, -1.869476318359375, -1.8056793212890625, -1.74188232421875, -1.6780853271484375, -1.614288330078125, -1.5504913330078125, -1.4866943359375, -1.4228973388671875, -1.359100341796875, -1.2953033447265625, -1.23150634765625, -1.1677093505859375, -1.103912353515625, -1.0401153564453125, -0.976318359375, -0.9125213623046875, -0.848724365234375, -0.7849273681640625, -0.72113037109375, -0.6573333740234375, -0.593536376953125, -0.5297393798828125, -0.4659423828125, -0.4021453857421875, -0.338348388671875, -0.2745513916015625, -0.21075439453125, -0.1469573974609375, -0.083160400390625, -0.0193634033203125, 0.04443359375, 0.1082305908203125, 0.172027587890625, 0.2358245849609375, 0.29962158203125, 0.3634185791015625, 0.427215576171875, 0.4910125732421875, 0.5548095703125, 0.6186065673828125, 0.682403564453125, 0.7462005615234375, 0.80999755859375, 0.8737945556640625, 0.937591552734375, 1.0013885498046875, 1.065185546875, 1.1289825439453125, 1.192779541015625, 1.2565765380859375, 1.32037353515625, 1.3841705322265625, 1.447967529296875, 1.5117645263671875, 1.5755615234375, 1.6393585205078125, 1.703155517578125, 1.7669525146484375, 1.83074951171875, 1.8945465087890625, 1.958343505859375, 2.0221405029296875, 2.0859375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 2.0, 5.0, 5.0, 3.0, 8.0, 10.0, 12.0, 9.0, 16.0, 8.0, 17.0, 18.0, 19.0, 34.0, 30.0, 19.0, 30.0, 29.0, 35.0, 34.0, 34.0, 35.0, 40.0, 1065.0, 48.0, 41.0, 46.0, 37.0, 34.0, 22.0, 33.0, 32.0, 28.0, 19.0, 21.0, 24.0, 15.0, 15.0, 13.0, 17.0, 10.0, 12.0, 9.0, 7.0, 8.0, 6.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-5.1875, -5.03265380859375, -4.8778076171875, -4.72296142578125, -4.568115234375, -4.41326904296875, -4.2584228515625, -4.10357666015625, -3.94873046875, -3.79388427734375, -3.6390380859375, -3.48419189453125, -3.329345703125, -3.17449951171875, -3.0196533203125, -2.86480712890625, -2.7099609375, -2.55511474609375, -2.4002685546875, -2.24542236328125, -2.090576171875, -1.93572998046875, -1.7808837890625, -1.62603759765625, -1.47119140625, -1.31634521484375, -1.1614990234375, -1.00665283203125, -0.851806640625, -0.69696044921875, -0.5421142578125, -0.38726806640625, -0.232421875, -0.07757568359375, 0.0772705078125, 0.23211669921875, 0.386962890625, 0.54180908203125, 0.6966552734375, 0.85150146484375, 1.00634765625, 1.16119384765625, 1.3160400390625, 1.47088623046875, 1.625732421875, 1.78057861328125, 1.9354248046875, 2.09027099609375, 2.2451171875, 2.39996337890625, 2.5548095703125, 2.70965576171875, 2.864501953125, 3.01934814453125, 3.1741943359375, 3.32904052734375, 3.48388671875, 3.63873291015625, 3.7935791015625, 3.94842529296875, 4.103271484375, 4.25811767578125, 4.4129638671875, 4.56781005859375, 4.72265625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 1.0, 6.0, 6.0, 9.0, 7.0, 10.0, 15.0, 29.0, 43.0, 70.0, 97.0, 117.0, 165.0, 274.0, 399.0, 570.0, 780.0, 1220.0, 1841.0, 2712.0, 3951.0, 5889.0, 8495.0, 12649.0, 18979.0, 28800.0, 45098.0, 74651.0, 146406.0, 1383790.0, 150377.0, 75895.0, 45578.0, 29302.0, 19488.0, 12859.0, 8347.0, 5823.0, 3953.0, 2661.0, 1787.0, 1275.0, 839.0, 577.0, 396.0, 275.0, 181.0, 141.0, 94.0, 53.0, 44.0, 43.0, 17.0, 19.0, 12.0, 10.0, 8.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0], "bins": [-1.4267578125, -1.3800048828125, -1.333251953125, -1.2864990234375, -1.23974609375, -1.1929931640625, -1.146240234375, -1.0994873046875, -1.052734375, -1.0059814453125, -0.959228515625, -0.9124755859375, -0.86572265625, -0.8189697265625, -0.772216796875, -0.7254638671875, -0.6787109375, -0.6319580078125, -0.585205078125, -0.5384521484375, -0.49169921875, -0.4449462890625, -0.398193359375, -0.3514404296875, -0.3046875, -0.2579345703125, -0.211181640625, -0.1644287109375, -0.11767578125, -0.0709228515625, -0.024169921875, 0.0225830078125, 0.0693359375, 0.1160888671875, 0.162841796875, 0.2095947265625, 0.25634765625, 0.3031005859375, 0.349853515625, 0.3966064453125, 0.443359375, 0.4901123046875, 0.536865234375, 0.5836181640625, 0.63037109375, 0.6771240234375, 0.723876953125, 0.7706298828125, 0.8173828125, 0.8641357421875, 0.910888671875, 0.9576416015625, 1.00439453125, 1.0511474609375, 1.097900390625, 1.1446533203125, 1.19140625, 1.2381591796875, 1.284912109375, 1.3316650390625, 1.37841796875, 1.4251708984375, 1.471923828125, 1.5186767578125, 1.5654296875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 3.0, 2.0, 4.0, 8.0, 6.0, 10.0, 7.0, 20.0, 18.0, 23.0, 50.0, 39.0, 62.0, 65.0, 81.0, 97.0, 79.0, 90.0, 73.0, 63.0, 66.0, 28.0, 28.0, 20.0, 8.0, 10.0, 4.0, 6.0, 4.0, 6.0, 5.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00136566162109375, -0.0013307034969329834, -0.0012957453727722168, -0.0012607872486114502, -0.0012258291244506836, -0.001190871000289917, -0.0011559128761291504, -0.0011209547519683838, -0.0010859966278076172, -0.0010510385036468506, -0.001016080379486084, -0.0009811222553253174, -0.0009461641311645508, -0.0009112060070037842, -0.0008762478828430176, -0.000841289758682251, -0.0008063316345214844, -0.0007713735103607178, -0.0007364153861999512, -0.0007014572620391846, -0.000666499137878418, -0.0006315410137176514, -0.0005965828895568848, -0.0005616247653961182, -0.0005266666412353516, -0.000491708517074585, -0.00045675039291381836, -0.00042179226875305176, -0.00038683414459228516, -0.00035187602043151855, -0.00031691789627075195, -0.00028195977210998535, -0.00024700164794921875, -0.00021204352378845215, -0.00017708539962768555, -0.00014212727546691895, -0.00010716915130615234, -7.221102714538574e-05, -3.725290298461914e-05, -2.294778823852539e-06, 3.266334533691406e-05, 6.762146949768066e-05, 0.00010257959365844727, 0.00013753771781921387, 0.00017249584197998047, 0.00020745396614074707, 0.00024241209030151367, 0.0002773702144622803, 0.0003123283386230469, 0.0003472864627838135, 0.0003822445869445801, 0.0004172027111053467, 0.0004521608352661133, 0.0004871189594268799, 0.0005220770835876465, 0.0005570352077484131, 0.0005919933319091797, 0.0006269514560699463, 0.0006619095802307129, 0.0006968677043914795, 0.0007318258285522461, 0.0007667839527130127, 0.0008017420768737793, 0.0008367002010345459, 0.0008716583251953125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 2.0, 6.0, 3.0, 6.0, 4.0, 12.0, 16.0, 22.0, 26.0, 34.0, 49.0, 97.0, 169.0, 354.0, 1432.0, 974412.0, 70495.0, 757.0, 266.0, 120.0, 71.0, 47.0, 39.0, 29.0, 14.0, 10.0, 10.0, 11.0, 4.0, 5.0, 4.0, 7.0, 2.0, 3.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0213623046875, -0.02056574821472168, -0.01976919174194336, -0.01897263526916504, -0.01817607879638672, -0.0173795223236084, -0.016582965850830078, -0.015786409378051758, -0.014989852905273438, -0.014193296432495117, -0.013396739959716797, -0.012600183486938477, -0.011803627014160156, -0.011007070541381836, -0.010210514068603516, -0.009413957595825195, -0.008617401123046875, -0.007820844650268555, -0.007024288177490234, -0.006227731704711914, -0.005431175231933594, -0.0046346187591552734, -0.003838062286376953, -0.003041505813598633, -0.0022449493408203125, -0.0014483928680419922, -0.0006518363952636719, 0.00014472007751464844, 0.0009412765502929688, 0.001737833023071289, 0.0025343894958496094, 0.0033309459686279297, 0.00412750244140625, 0.00492405891418457, 0.005720615386962891, 0.006517171859741211, 0.007313728332519531, 0.008110284805297852, 0.008906841278076172, 0.009703397750854492, 0.010499954223632812, 0.011296510696411133, 0.012093067169189453, 0.012889623641967773, 0.013686180114746094, 0.014482736587524414, 0.015279293060302734, 0.016075849533081055, 0.016872406005859375, 0.017668962478637695, 0.018465518951416016, 0.019262075424194336, 0.020058631896972656, 0.020855188369750977, 0.021651744842529297, 0.022448301315307617, 0.023244857788085938, 0.024041414260864258, 0.024837970733642578, 0.0256345272064209, 0.02643108367919922, 0.02722764015197754, 0.02802419662475586, 0.02882075309753418, 0.0296173095703125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 11.0, 222.0, 615.0, 154.0, 15.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003652448358479887, -0.0002585456822998822, -0.00015184655785560608, -4.514740430749953e-05, 6.155172013677657e-05, 0.00016825084458105266, 0.00027495002723298967, 0.00038164915167726576, 0.0004883483052253723, 0.0005950474296696484, 0.0007017465541139245, 0.0008084457367658615, 0.0009151448612101376, 0.0010218439856544137, 0.0011285431683063507, 0.0012352422345429659, 0.001341941417194903, 0.00144864059984684, 0.001555339666083455, 0.001662038848735392, 0.001768738031387329, 0.0018754370976239443, 0.0019821361638605595, 0.0020888354629278183, 0.0021955345291644335, 0.0023022335954010487, 0.0024089328944683075, 0.0025156319607049227, 0.002622331026941538, 0.0027290303260087967, 0.002835729392245412, 0.002942428458482027, 0.003049127757549286, 0.003155826823785901, 0.00326252612285316, 0.003369225189089775, 0.0034759242553263903, 0.0035826233215630054, 0.0036893226206302643, 0.0037960216868668795, 0.0039027207531034946, 0.0040094200521707535, 0.004116118885576725, 0.004222818184643984, 0.004329517483711243, 0.004436216317117214, 0.004542915616184473, 0.004649614915251732, 0.004756313748657703, 0.004863013047724962, 0.004969711881130934, 0.005076411180198193, 0.005183110479265451, 0.005289809312671423, 0.005396508611738682, 0.005503207910805941, 0.0056099072098731995, 0.005716606508940458, 0.00582330534234643, 0.005930004641413689, 0.0060367039404809475, 0.006143402773886919, 0.006250102072954178, 0.006356801372021437, 0.006463500205427408]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 3.0, 6.0, 7.0, 15.0, 15.0, 13.0, 14.0, 18.0, 27.0, 25.0, 24.0, 27.0, 26.0, 34.0, 37.0, 40.0, 52.0, 43.0, 42.0, 40.0, 55.0, 42.0, 31.0, 41.0, 41.0, 42.0, 42.0, 25.0, 27.0, 21.0, 20.0, 17.0, 15.0, 12.0, 16.0, 11.0, 4.0, 5.0, 1.0, 6.0, 3.0, 7.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0004323720932006836, -0.00041732750833034515, -0.0004022829234600067, -0.0003872383385896683, -0.00037219375371932983, -0.0003571491688489914, -0.00034210458397865295, -0.0003270599991083145, -0.0003120154142379761, -0.00029697082936763763, -0.0002819262444972992, -0.00026688165962696075, -0.0002518370747566223, -0.00023679248988628387, -0.00022174790501594543, -0.000206703320145607, -0.00019165873527526855, -0.00017661415040493011, -0.00016156956553459167, -0.00014652498066425323, -0.0001314803957939148, -0.00011643581092357635, -0.00010139122605323792, -8.634664118289948e-05, -7.130205631256104e-05, -5.6257471442222595e-05, -4.1212886571884155e-05, -2.6168301701545715e-05, -1.1123716831207275e-05, 3.9208680391311646e-06, 1.8965452909469604e-05, 3.4010037779808044e-05, 4.9054622650146484e-05, 6.409920752048492e-05, 7.914379239082336e-05, 9.41883772611618e-05, 0.00010923296213150024, 0.00012427754700183868, 0.00013932213187217712, 0.00015436671674251556, 0.000169411301612854, 0.00018445588648319244, 0.00019950047135353088, 0.00021454505622386932, 0.00022958964109420776, 0.0002446342259645462, 0.00025967881083488464, 0.0002747233957052231, 0.0002897679805755615, 0.00030481256544589996, 0.0003198571503162384, 0.00033490173518657684, 0.0003499463200569153, 0.0003649909049272537, 0.00038003548979759216, 0.0003950800746679306, 0.00041012465953826904, 0.0004251692444086075, 0.0004402138292789459, 0.00045525841414928436, 0.0004703029990196228, 0.00048534758388996124, 0.0005003921687602997, 0.0005154367536306381, 0.0005304813385009766]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 1.0, 5.0, 6.0, 5.0, 2.0, 7.0, 10.0, 9.0, 14.0, 23.0, 24.0, 33.0, 30.0, 30.0, 35.0, 46.0, 29.0, 34.0, 43.0, 44.0, 42.0, 41.0, 55.0, 53.0, 44.0, 45.0, 31.0, 26.0, 40.0, 40.0, 35.0, 19.0, 18.0, 16.0, 15.0, 9.0, 10.0, 11.0, 9.0, 2.0, 6.0, 3.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0078125, -8.7197265625, -8.431640625, -8.1435546875, -7.85546875, -7.5673828125, -7.279296875, -6.9912109375, -6.703125, -6.4150390625, -6.126953125, -5.8388671875, -5.55078125, -5.2626953125, -4.974609375, -4.6865234375, -4.3984375, -4.1103515625, -3.822265625, -3.5341796875, -3.24609375, -2.9580078125, -2.669921875, -2.3818359375, -2.09375, -1.8056640625, -1.517578125, -1.2294921875, -0.94140625, -0.6533203125, -0.365234375, -0.0771484375, 0.2109375, 0.4990234375, 0.787109375, 1.0751953125, 1.36328125, 1.6513671875, 1.939453125, 2.2275390625, 2.515625, 2.8037109375, 3.091796875, 3.3798828125, 3.66796875, 3.9560546875, 4.244140625, 4.5322265625, 4.8203125, 5.1083984375, 5.396484375, 5.6845703125, 5.97265625, 6.2607421875, 6.548828125, 6.8369140625, 7.125, 7.4130859375, 7.701171875, 7.9892578125, 8.27734375, 8.5654296875, 8.853515625, 9.1416015625, 9.4296875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 10.0, 14.0, 16.0, 30.0, 51.0, 57.0, 109.0, 178.0, 275.0, 443.0, 715.0, 1280.0, 2338.0, 4209.0, 8152.0, 15846.0, 34129.0, 83173.0, 266996.0, 423070.0, 118751.0, 45743.0, 20684.0, 10177.0, 5258.0, 2937.0, 1653.0, 896.0, 508.0, 293.0, 218.0, 129.0, 70.0, 46.0, 31.0, 21.0, 13.0, 13.0, 10.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1640625, -4.987060546875, -4.81005859375, -4.633056640625, -4.4560546875, -4.279052734375, -4.10205078125, -3.925048828125, -3.748046875, -3.571044921875, -3.39404296875, -3.217041015625, -3.0400390625, -2.863037109375, -2.68603515625, -2.509033203125, -2.33203125, -2.155029296875, -1.97802734375, -1.801025390625, -1.6240234375, -1.447021484375, -1.27001953125, -1.093017578125, -0.916015625, -0.739013671875, -0.56201171875, -0.385009765625, -0.2080078125, -0.031005859375, 0.14599609375, 0.322998046875, 0.5, 0.677001953125, 0.85400390625, 1.031005859375, 1.2080078125, 1.385009765625, 1.56201171875, 1.739013671875, 1.916015625, 2.093017578125, 2.27001953125, 2.447021484375, 2.6240234375, 2.801025390625, 2.97802734375, 3.155029296875, 3.33203125, 3.509033203125, 3.68603515625, 3.863037109375, 4.0400390625, 4.217041015625, 4.39404296875, 4.571044921875, 4.748046875, 4.925048828125, 5.10205078125, 5.279052734375, 5.4560546875, 5.633056640625, 5.81005859375, 5.987060546875, 6.1640625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 2.0, 4.0, 6.0, 9.0, 16.0, 11.0, 6.0, 20.0, 22.0, 29.0, 39.0, 42.0, 37.0, 43.0, 53.0, 68.0, 107.0, 229.0, 1710.0, 148.0, 61.0, 55.0, 51.0, 45.0, 32.0, 40.0, 30.0, 14.0, 29.0, 14.0, 14.0, 12.0, 14.0, 9.0, 8.0, 2.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.0625, -36.8857421875, -35.708984375, -34.5322265625, -33.35546875, -32.1787109375, -31.001953125, -29.8251953125, -28.6484375, -27.4716796875, -26.294921875, -25.1181640625, -23.94140625, -22.7646484375, -21.587890625, -20.4111328125, -19.234375, -18.0576171875, -16.880859375, -15.7041015625, -14.52734375, -13.3505859375, -12.173828125, -10.9970703125, -9.8203125, -8.6435546875, -7.466796875, -6.2900390625, -5.11328125, -3.9365234375, -2.759765625, -1.5830078125, -0.40625, 0.7705078125, 1.947265625, 3.1240234375, 4.30078125, 5.4775390625, 6.654296875, 7.8310546875, 9.0078125, 10.1845703125, 11.361328125, 12.5380859375, 13.71484375, 14.8916015625, 16.068359375, 17.2451171875, 18.421875, 19.5986328125, 20.775390625, 21.9521484375, 23.12890625, 24.3056640625, 25.482421875, 26.6591796875, 27.8359375, 29.0126953125, 30.189453125, 31.3662109375, 32.54296875, 33.7197265625, 34.896484375, 36.0732421875, 37.25]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 10.0, 10.0, 23.0, 41.0, 34.0, 69.0, 79.0, 148.0, 252.0, 506.0, 2306.0, 2981924.0, 157833.0, 1398.0, 446.0, 216.0, 131.0, 88.0, 47.0, 34.0, 34.0, 21.0, 16.0, 9.0, 6.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-126.9375, -123.3994140625, -119.861328125, -116.3232421875, -112.78515625, -109.2470703125, -105.708984375, -102.1708984375, -98.6328125, -95.0947265625, -91.556640625, -88.0185546875, -84.48046875, -80.9423828125, -77.404296875, -73.8662109375, -70.328125, -66.7900390625, -63.251953125, -59.7138671875, -56.17578125, -52.6376953125, -49.099609375, -45.5615234375, -42.0234375, -38.4853515625, -34.947265625, -31.4091796875, -27.87109375, -24.3330078125, -20.794921875, -17.2568359375, -13.71875, -10.1806640625, -6.642578125, -3.1044921875, 0.43359375, 3.9716796875, 7.509765625, 11.0478515625, 14.5859375, 18.1240234375, 21.662109375, 25.2001953125, 28.73828125, 32.2763671875, 35.814453125, 39.3525390625, 42.890625, 46.4287109375, 49.966796875, 53.5048828125, 57.04296875, 60.5810546875, 64.119140625, 67.6572265625, 71.1953125, 74.7333984375, 78.271484375, 81.8095703125, 85.34765625, 88.8857421875, 92.423828125, 95.9619140625, 99.5]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 12.0, 96.0, 408.0, 416.0, 68.0, 10.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-253.13516235351562, -248.52536010742188, -243.91555786132812, -239.30577087402344, -234.6959686279297, -230.08616638183594, -225.4763641357422, -220.86656188964844, -216.25677490234375, -211.64697265625, -207.03717041015625, -202.42738342285156, -197.8175811767578, -193.20777893066406, -188.5979766845703, -183.98817443847656, -179.3783721923828, -174.76856994628906, -170.1587677001953, -165.54898071289062, -160.93917846679688, -156.32937622070312, -151.71957397460938, -147.10977172851562, -142.49996948242188, -137.89016723632812, -133.28036499023438, -128.6705780029297, -124.06077575683594, -119.45097351074219, -114.84117126464844, -110.23136901855469, -105.62156677246094, -101.01176452636719, -96.40196990966797, -91.79216766357422, -87.182373046875, -82.57257080078125, -77.9627685546875, -73.35296630859375, -68.74317169189453, -64.13336944580078, -59.52357482910156, -54.91377258300781, -50.30397415161133, -45.694175720214844, -41.084373474121094, -36.47457504272461, -31.864776611328125, -27.25497817993164, -22.645177841186523, -18.035377502441406, -13.425579071044922, -8.815780639648438, -4.20598030090332, 0.4038200378417969, 5.013618469238281, 9.623417854309082, 14.233217239379883, 18.843017578125, 23.452816009521484, 28.06261444091797, 32.67241668701172, 37.2822151184082, 41.89201354980469]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 8.0, 0.0, 2.0, 1.0, 10.0, 5.0, 18.0, 13.0, 14.0, 10.0, 14.0, 15.0, 15.0, 22.0, 24.0, 27.0, 40.0, 32.0, 60.0, 31.0, 35.0, 39.0, 53.0, 35.0, 47.0, 53.0, 39.0, 41.0, 43.0, 33.0, 28.0, 29.0, 28.0, 29.0, 14.0, 15.0, 15.0, 13.0, 14.0, 12.0, 10.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.61297607421875, -79.75787353515625, -76.90277099609375, -74.04766082763672, -71.19255828857422, -68.33745574951172, -65.48234558105469, -62.62724304199219, -59.77214050292969, -56.91703796386719, -54.06193161010742, -51.206825256347656, -48.351722717285156, -45.496620178222656, -42.64151382446289, -39.786407470703125, -36.931304931640625, -34.076202392578125, -31.22109603881836, -28.365991592407227, -25.510887145996094, -22.65578269958496, -19.800678253173828, -16.945573806762695, -14.090469360351562, -11.23536491394043, -8.380260467529297, -5.525156021118164, -2.6700515747070312, 0.18505287170410156, 3.0401573181152344, 5.895261764526367, 8.750358581542969, 11.605463027954102, 14.460567474365234, 17.315671920776367, 20.1707763671875, 23.025880813598633, 25.880985260009766, 28.7360897064209, 31.59119415283203, 34.44629669189453, 37.3014030456543, 40.15650939941406, 43.01161193847656, 45.86671447753906, 48.72182083129883, 51.576927185058594, 54.432029724121094, 57.287132263183594, 60.14223861694336, 62.997344970703125, 65.85244750976562, 68.70755004882812, 71.56265258789062, 74.41776275634766, 77.27286529541016, 80.12796783447266, 82.98307800292969, 85.83818054199219, 88.69328308105469, 91.54838562011719, 94.40348815917969, 97.25859832763672, 100.11370086669922]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 6.0, 9.0, 5.0, 6.0, 6.0, 16.0, 16.0, 20.0, 29.0, 19.0, 30.0, 40.0, 46.0, 36.0, 27.0, 38.0, 44.0, 47.0, 33.0, 44.0, 48.0, 49.0, 41.0, 44.0, 32.0, 43.0, 24.0, 30.0, 40.0, 25.0, 13.0, 18.0, 15.0, 16.0, 12.0, 10.0, 2.0, 5.0, 5.0, 4.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.296875, -8.99853515625, -8.7001953125, -8.40185546875, -8.103515625, -7.80517578125, -7.5068359375, -7.20849609375, -6.91015625, -6.61181640625, -6.3134765625, -6.01513671875, -5.716796875, -5.41845703125, -5.1201171875, -4.82177734375, -4.5234375, -4.22509765625, -3.9267578125, -3.62841796875, -3.330078125, -3.03173828125, -2.7333984375, -2.43505859375, -2.13671875, -1.83837890625, -1.5400390625, -1.24169921875, -0.943359375, -0.64501953125, -0.3466796875, -0.04833984375, 0.25, 0.54833984375, 0.8466796875, 1.14501953125, 1.443359375, 1.74169921875, 2.0400390625, 2.33837890625, 2.63671875, 2.93505859375, 3.2333984375, 3.53173828125, 3.830078125, 4.12841796875, 4.4267578125, 4.72509765625, 5.0234375, 5.32177734375, 5.6201171875, 5.91845703125, 6.216796875, 6.51513671875, 6.8134765625, 7.11181640625, 7.41015625, 7.70849609375, 8.0068359375, 8.30517578125, 8.603515625, 8.90185546875, 9.2001953125, 9.49853515625, 9.796875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 6.0, 8.0, 13.0, 10.0, 16.0, 34.0, 41.0, 44.0, 56.0, 81.0, 123.0, 198.0, 307.0, 544.0, 986.0, 1899.0, 4598.0, 12102.0, 40938.0, 203893.0, 947451.0, 1758420.0, 943003.0, 213865.0, 44962.0, 12064.0, 4393.0, 1911.0, 885.0, 493.0, 293.0, 184.0, 133.0, 96.0, 57.0, 39.0, 39.0, 22.0, 24.0, 12.0, 16.0, 5.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.421875, -12.0618896484375, -11.701904296875, -11.3419189453125, -10.98193359375, -10.6219482421875, -10.261962890625, -9.9019775390625, -9.5419921875, -9.1820068359375, -8.822021484375, -8.4620361328125, -8.10205078125, -7.7420654296875, -7.382080078125, -7.0220947265625, -6.662109375, -6.3021240234375, -5.942138671875, -5.5821533203125, -5.22216796875, -4.8621826171875, -4.502197265625, -4.1422119140625, -3.7822265625, -3.4222412109375, -3.062255859375, -2.7022705078125, -2.34228515625, -1.9822998046875, -1.622314453125, -1.2623291015625, -0.90234375, -0.5423583984375, -0.182373046875, 0.1776123046875, 0.53759765625, 0.8975830078125, 1.257568359375, 1.6175537109375, 1.9775390625, 2.3375244140625, 2.697509765625, 3.0574951171875, 3.41748046875, 3.7774658203125, 4.137451171875, 4.4974365234375, 4.857421875, 5.2174072265625, 5.577392578125, 5.9373779296875, 6.29736328125, 6.6573486328125, 7.017333984375, 7.3773193359375, 7.7373046875, 8.0972900390625, 8.457275390625, 8.8172607421875, 9.17724609375, 9.5372314453125, 9.897216796875, 10.2572021484375, 10.6171875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 7.0, 11.0, 19.0, 25.0, 47.0, 73.0, 129.0, 210.0, 369.0, 650.0, 912.0, 662.0, 392.0, 266.0, 129.0, 76.0, 45.0, 24.0, 15.0, 10.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.578125, -21.481201171875, -20.38427734375, -19.287353515625, -18.1904296875, -17.093505859375, -15.99658203125, -14.899658203125, -13.802734375, -12.705810546875, -11.60888671875, -10.511962890625, -9.4150390625, -8.318115234375, -7.22119140625, -6.124267578125, -5.02734375, -3.930419921875, -2.83349609375, -1.736572265625, -0.6396484375, 0.457275390625, 1.55419921875, 2.651123046875, 3.748046875, 4.844970703125, 5.94189453125, 7.038818359375, 8.1357421875, 9.232666015625, 10.32958984375, 11.426513671875, 12.5234375, 13.620361328125, 14.71728515625, 15.814208984375, 16.9111328125, 18.008056640625, 19.10498046875, 20.201904296875, 21.298828125, 22.395751953125, 23.49267578125, 24.589599609375, 25.6865234375, 26.783447265625, 27.88037109375, 28.977294921875, 30.07421875, 31.171142578125, 32.26806640625, 33.364990234375, 34.4619140625, 35.558837890625, 36.65576171875, 37.752685546875, 38.849609375, 39.946533203125, 41.04345703125, 42.140380859375, 43.2373046875, 44.334228515625, 45.43115234375, 46.528076171875, 47.625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 4.0, 12.0, 15.0, 22.0, 17.0, 29.0, 41.0, 58.0, 65.0, 89.0, 158.0, 202.0, 395.0, 863.0, 4303.0, 2090806.0, 2090764.0, 4388.0, 858.0, 427.0, 216.0, 152.0, 94.0, 69.0, 52.0, 44.0, 33.0, 20.0, 16.0, 11.0, 12.0, 9.0, 10.0, 8.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-89.75, -86.9453125, -84.140625, -81.3359375, -78.53125, -75.7265625, -72.921875, -70.1171875, -67.3125, -64.5078125, -61.703125, -58.8984375, -56.09375, -53.2890625, -50.484375, -47.6796875, -44.875, -42.0703125, -39.265625, -36.4609375, -33.65625, -30.8515625, -28.046875, -25.2421875, -22.4375, -19.6328125, -16.828125, -14.0234375, -11.21875, -8.4140625, -5.609375, -2.8046875, 0.0, 2.8046875, 5.609375, 8.4140625, 11.21875, 14.0234375, 16.828125, 19.6328125, 22.4375, 25.2421875, 28.046875, 30.8515625, 33.65625, 36.4609375, 39.265625, 42.0703125, 44.875, 47.6796875, 50.484375, 53.2890625, 56.09375, 58.8984375, 61.703125, 64.5078125, 67.3125, 70.1171875, 72.921875, 75.7265625, 78.53125, 81.3359375, 84.140625, 86.9453125, 89.75]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 12.0, 41.0, 112.0, 229.0, 302.0, 190.0, 92.0, 22.0, 6.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-283.7770080566406, -277.78961181640625, -271.8022155761719, -265.8148193359375, -259.8274230957031, -253.8400421142578, -247.85264587402344, -241.86524963378906, -235.87786865234375, -229.89047241210938, -223.903076171875, -217.91567993164062, -211.9282989501953, -205.94090270996094, -199.95350646972656, -193.9661102294922, -187.9787139892578, -181.99131774902344, -176.00392150878906, -170.01654052734375, -164.02914428710938, -158.041748046875, -152.05435180664062, -146.06695556640625, -140.07955932617188, -134.0921630859375, -128.10476684570312, -122.11737823486328, -116.12998962402344, -110.14259338378906, -104.15519714355469, -98.16780090332031, -92.180419921875, -86.19302368164062, -80.20563507080078, -74.2182388305664, -68.23085021972656, -62.24345397949219, -56.25605773925781, -50.2686653137207, -44.281272888183594, -38.293880462646484, -32.306488037109375, -26.319091796875, -20.33169937133789, -14.344306945800781, -8.356910705566406, -2.369518280029297, 3.6178741455078125, 9.605267524719238, 15.592660903930664, 21.580055236816406, 27.567447662353516, 33.554840087890625, 39.542236328125, 45.52962875366211, 51.51702117919922, 57.50441360473633, 63.49180603027344, 69.47920227050781, 75.46659851074219, 81.45398712158203, 87.4413833618164, 93.42877197265625, 99.41616821289062]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 7.0, 10.0, 15.0, 8.0, 14.0, 16.0, 13.0, 19.0, 27.0, 32.0, 20.0, 35.0, 22.0, 36.0, 40.0, 45.0, 41.0, 44.0, 46.0, 42.0, 39.0, 45.0, 35.0, 36.0, 33.0, 26.0, 38.0, 30.0, 25.0, 16.0, 22.0, 17.0, 20.0, 18.0, 20.0, 10.0, 6.0, 7.0, 5.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-66.99694061279297, -64.9664535522461, -62.93596267700195, -60.90547180175781, -58.87498474121094, -56.84449768066406, -54.81400680541992, -52.78351593017578, -50.753028869628906, -48.72254180908203, -46.69205093383789, -44.66156005859375, -42.631072998046875, -40.6005859375, -38.57009506225586, -36.53960418701172, -34.509117126464844, -32.47863006591797, -30.448139190673828, -28.41765022277832, -26.387161254882812, -24.356672286987305, -22.326183319091797, -20.29569435119629, -18.26520538330078, -16.234716415405273, -14.204227447509766, -12.173738479614258, -10.14324951171875, -8.112760543823242, -6.082271575927734, -4.051782608032227, -2.02130126953125, 0.009187698364257812, 2.0396766662597656, 4.070165634155273, 6.100654602050781, 8.131143569946289, 10.161632537841797, 12.192121505737305, 14.222610473632812, 16.25309944152832, 18.283588409423828, 20.314077377319336, 22.344566345214844, 24.37505531311035, 26.40554428100586, 28.436033248901367, 30.466522216796875, 32.49700927734375, 34.52750015258789, 36.55799102783203, 38.588478088378906, 40.61896514892578, 42.64945602416992, 44.67994689941406, 46.71043395996094, 48.74092102050781, 50.77141189575195, 52.801902770996094, 54.83238983154297, 56.862876892089844, 58.893367767333984, 60.923858642578125, 62.954345703125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 9.0, 3.0, 7.0, 7.0, 10.0, 12.0, 12.0, 21.0, 22.0, 32.0, 30.0, 32.0, 36.0, 37.0, 41.0, 52.0, 46.0, 41.0, 42.0, 51.0, 38.0, 38.0, 35.0, 42.0, 35.0, 35.0, 35.0, 31.0, 36.0, 28.0, 21.0, 20.0, 9.0, 13.0, 5.0, 9.0, 7.0, 4.0, 9.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.140625, -9.83349609375, -9.5263671875, -9.21923828125, -8.912109375, -8.60498046875, -8.2978515625, -7.99072265625, -7.68359375, -7.37646484375, -7.0693359375, -6.76220703125, -6.455078125, -6.14794921875, -5.8408203125, -5.53369140625, -5.2265625, -4.91943359375, -4.6123046875, -4.30517578125, -3.998046875, -3.69091796875, -3.3837890625, -3.07666015625, -2.76953125, -2.46240234375, -2.1552734375, -1.84814453125, -1.541015625, -1.23388671875, -0.9267578125, -0.61962890625, -0.3125, -0.00537109375, 0.3017578125, 0.60888671875, 0.916015625, 1.22314453125, 1.5302734375, 1.83740234375, 2.14453125, 2.45166015625, 2.7587890625, 3.06591796875, 3.373046875, 3.68017578125, 3.9873046875, 4.29443359375, 4.6015625, 4.90869140625, 5.2158203125, 5.52294921875, 5.830078125, 6.13720703125, 6.4443359375, 6.75146484375, 7.05859375, 7.36572265625, 7.6728515625, 7.97998046875, 8.287109375, 8.59423828125, 8.9013671875, 9.20849609375, 9.515625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 11.0, 13.0, 7.0, 19.0, 21.0, 34.0, 36.0, 69.0, 81.0, 151.0, 225.0, 276.0, 396.0, 573.0, 770.0, 1154.0, 1659.0, 2542.0, 3754.0, 5651.0, 8781.0, 13451.0, 21377.0, 34288.0, 54795.0, 94117.0, 190947.0, 299592.0, 125666.0, 70376.0, 42477.0, 26684.0, 16631.0, 10762.0, 6933.0, 4597.0, 3097.0, 2065.0, 1356.0, 935.0, 623.0, 469.0, 292.0, 271.0, 164.0, 104.0, 81.0, 51.0, 36.0, 29.0, 21.0, 14.0, 9.0, 5.0, 7.0, 10.0, 2.0, 2.0], "bins": [-1.7734375, -1.7200775146484375, -1.666717529296875, -1.6133575439453125, -1.55999755859375, -1.5066375732421875, -1.453277587890625, -1.3999176025390625, -1.3465576171875, -1.2931976318359375, -1.239837646484375, -1.1864776611328125, -1.13311767578125, -1.0797576904296875, -1.026397705078125, -0.9730377197265625, -0.919677734375, -0.8663177490234375, -0.812957763671875, -0.7595977783203125, -0.70623779296875, -0.6528778076171875, -0.599517822265625, -0.5461578369140625, -0.4927978515625, -0.4394378662109375, -0.386077880859375, -0.3327178955078125, -0.27935791015625, -0.2259979248046875, -0.172637939453125, -0.1192779541015625, -0.06591796875, -0.0125579833984375, 0.040802001953125, 0.0941619873046875, 0.14752197265625, 0.2008819580078125, 0.254241943359375, 0.3076019287109375, 0.3609619140625, 0.4143218994140625, 0.467681884765625, 0.5210418701171875, 0.57440185546875, 0.6277618408203125, 0.681121826171875, 0.7344818115234375, 0.787841796875, 0.8412017822265625, 0.894561767578125, 0.9479217529296875, 1.00128173828125, 1.0546417236328125, 1.108001708984375, 1.1613616943359375, 1.2147216796875, 1.2680816650390625, 1.321441650390625, 1.3748016357421875, 1.42816162109375, 1.4815216064453125, 1.534881591796875, 1.5882415771484375, 1.6416015625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 2.0, 7.0, 10.0, 6.0, 14.0, 5.0, 16.0, 13.0, 17.0, 23.0, 29.0, 39.0, 34.0, 40.0, 32.0, 33.0, 40.0, 42.0, 46.0, 31.0, 36.0, 1056.0, 36.0, 43.0, 35.0, 24.0, 41.0, 30.0, 35.0, 31.0, 21.0, 19.0, 17.0, 19.0, 20.0, 8.0, 15.0, 17.0, 10.0, 10.0, 8.0, 5.0, 3.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.36328125, -6.18707275390625, -6.0108642578125, -5.83465576171875, -5.658447265625, -5.48223876953125, -5.3060302734375, -5.12982177734375, -4.95361328125, -4.77740478515625, -4.6011962890625, -4.42498779296875, -4.248779296875, -4.07257080078125, -3.8963623046875, -3.72015380859375, -3.5439453125, -3.36773681640625, -3.1915283203125, -3.01531982421875, -2.839111328125, -2.66290283203125, -2.4866943359375, -2.31048583984375, -2.13427734375, -1.95806884765625, -1.7818603515625, -1.60565185546875, -1.429443359375, -1.25323486328125, -1.0770263671875, -0.90081787109375, -0.724609375, -0.54840087890625, -0.3721923828125, -0.19598388671875, -0.019775390625, 0.15643310546875, 0.3326416015625, 0.50885009765625, 0.68505859375, 0.86126708984375, 1.0374755859375, 1.21368408203125, 1.389892578125, 1.56610107421875, 1.7423095703125, 1.91851806640625, 2.0947265625, 2.27093505859375, 2.4471435546875, 2.62335205078125, 2.799560546875, 2.97576904296875, 3.1519775390625, 3.32818603515625, 3.50439453125, 3.68060302734375, 3.8568115234375, 4.03302001953125, 4.209228515625, 4.38543701171875, 4.5616455078125, 4.73785400390625, 4.9140625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 10.0, 13.0, 22.0, 33.0, 41.0, 55.0, 79.0, 160.0, 222.0, 316.0, 521.0, 840.0, 1398.0, 2082.0, 3439.0, 5281.0, 8230.0, 12889.0, 20801.0, 33989.0, 57017.0, 101922.0, 235413.0, 1334386.0, 115926.0, 62701.0, 37552.0, 23094.0, 14408.0, 8922.0, 5683.0, 3541.0, 2328.0, 1414.0, 890.0, 528.0, 348.0, 210.0, 156.0, 88.0, 61.0, 49.0, 31.0, 19.0, 13.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.69921875, -1.6427459716796875, -1.586273193359375, -1.5298004150390625, -1.47332763671875, -1.4168548583984375, -1.360382080078125, -1.3039093017578125, -1.2474365234375, -1.1909637451171875, -1.134490966796875, -1.0780181884765625, -1.02154541015625, -0.9650726318359375, -0.908599853515625, -0.8521270751953125, -0.795654296875, -0.7391815185546875, -0.682708740234375, -0.6262359619140625, -0.56976318359375, -0.5132904052734375, -0.456817626953125, -0.4003448486328125, -0.3438720703125, -0.2873992919921875, -0.230926513671875, -0.1744537353515625, -0.11798095703125, -0.0615081787109375, -0.005035400390625, 0.0514373779296875, 0.10791015625, 0.1643829345703125, 0.220855712890625, 0.2773284912109375, 0.33380126953125, 0.3902740478515625, 0.446746826171875, 0.5032196044921875, 0.5596923828125, 0.6161651611328125, 0.672637939453125, 0.7291107177734375, 0.78558349609375, 0.8420562744140625, 0.898529052734375, 0.9550018310546875, 1.011474609375, 1.0679473876953125, 1.124420166015625, 1.1808929443359375, 1.23736572265625, 1.2938385009765625, 1.350311279296875, 1.4067840576171875, 1.4632568359375, 1.5197296142578125, 1.576202392578125, 1.6326751708984375, 1.68914794921875, 1.7456207275390625, 1.802093505859375, 1.8585662841796875, 1.9150390625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 6.0, 9.0, 9.0, 8.0, 11.0, 10.0, 17.0, 31.0, 30.0, 25.0, 40.0, 43.0, 73.0, 53.0, 75.0, 86.0, 78.0, 75.0, 59.0, 57.0, 39.0, 33.0, 24.0, 21.0, 17.0, 13.0, 7.0, 8.0, 9.0, 6.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0011854171752929688, -0.0011502355337142944, -0.0011150538921356201, -0.0010798722505569458, -0.0010446906089782715, -0.0010095089673995972, -0.0009743273258209229, -0.0009391456842422485, -0.0009039640426635742, -0.0008687824010848999, -0.0008336007595062256, -0.0007984191179275513, -0.000763237476348877, -0.0007280558347702026, -0.0006928741931915283, -0.000657692551612854, -0.0006225109100341797, -0.0005873292684555054, -0.0005521476268768311, -0.0005169659852981567, -0.0004817843437194824, -0.0004466027021408081, -0.0004114210605621338, -0.00037623941898345947, -0.00034105777740478516, -0.00030587613582611084, -0.0002706944942474365, -0.0002355128526687622, -0.0002003312110900879, -0.00016514956951141357, -0.00012996792793273926, -9.478628635406494e-05, -5.9604644775390625e-05, -2.442300319671631e-05, 1.0758638381958008e-05, 4.5940279960632324e-05, 8.112192153930664e-05, 0.00011630356311798096, 0.00015148520469665527, 0.0001866668462753296, 0.0002218484878540039, 0.0002570301294326782, 0.00029221177101135254, 0.00032739341259002686, 0.00036257505416870117, 0.0003977566957473755, 0.0004329383373260498, 0.0004681199789047241, 0.0005033016204833984, 0.0005384832620620728, 0.0005736649036407471, 0.0006088465452194214, 0.0006440281867980957, 0.00067920982837677, 0.0007143914699554443, 0.0007495731115341187, 0.000784754753112793, 0.0008199363946914673, 0.0008551180362701416, 0.0008902996778488159, 0.0009254813194274902, 0.0009606629610061646, 0.0009958446025848389, 0.0010310262441635132, 0.0010662078857421875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 0.0, 3.0, 4.0, 10.0, 7.0, 11.0, 10.0, 14.0, 21.0, 23.0, 39.0, 56.0, 94.0, 139.0, 264.0, 729.0, 16963.0, 1026766.0, 2271.0, 527.0, 202.0, 111.0, 72.0, 47.0, 38.0, 32.0, 25.0, 12.0, 15.0, 11.0, 7.0, 8.0, 5.0, 7.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.027557373046875, -0.026704788208007812, -0.025852203369140625, -0.024999618530273438, -0.02414703369140625, -0.023294448852539062, -0.022441864013671875, -0.021589279174804688, -0.0207366943359375, -0.019884109497070312, -0.019031524658203125, -0.018178939819335938, -0.01732635498046875, -0.016473770141601562, -0.015621185302734375, -0.014768600463867188, -0.013916015625, -0.013063430786132812, -0.012210845947265625, -0.011358261108398438, -0.01050567626953125, -0.009653091430664062, -0.008800506591796875, -0.007947921752929688, -0.0070953369140625, -0.0062427520751953125, -0.005390167236328125, -0.0045375823974609375, -0.00368499755859375, -0.0028324127197265625, -0.001979827880859375, -0.0011272430419921875, -0.000274658203125, 0.0005779266357421875, 0.001430511474609375, 0.0022830963134765625, 0.00313568115234375, 0.0039882659912109375, 0.004840850830078125, 0.0056934356689453125, 0.0065460205078125, 0.0073986053466796875, 0.008251190185546875, 0.009103775024414062, 0.00995635986328125, 0.010808944702148438, 0.011661529541015625, 0.012514114379882812, 0.01336669921875, 0.014219284057617188, 0.015071868896484375, 0.015924453735351562, 0.01677703857421875, 0.017629623413085938, 0.018482208251953125, 0.019334793090820312, 0.0201873779296875, 0.021039962768554688, 0.021892547607421875, 0.022745132446289062, 0.02359771728515625, 0.024450302124023438, 0.025302886962890625, 0.026155471801757812, 0.027008056640625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 17.0, 125.0, 431.0, 340.0, 91.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015701367519795895, -0.0014949573669582605, -0.0014197780983522534, -0.0013445987133309245, -0.0012694194447249174, -0.0011942400597035885, -0.0011190606746822596, -0.0010438812896609306, -0.0009687020210549235, -0.0008935226942412555, -0.0008183433674275875, -0.0007431639824062586, -0.0006679846555925906, -0.0005928053287789226, -0.0005176259437575936, -0.0004424466169439256, -0.0003672672901302576, -0.0002920879633165896, -0.00021690860739909112, -0.00014172926603350788, -6.654992466792464e-05, 8.62940214574337e-06, 8.380875806324184e-05, 0.0001589881139807403, 0.00023416744079440832, 0.00030934676760807633, 0.0003845261235255748, 0.00045970547944307327, 0.0005348848062567413, 0.0006100641330704093, 0.0006852435180917382, 0.0007604228449054062, 0.0008356024045497179, 0.0009107817313633859, 0.000985961058177054, 0.0010611404431983829, 0.00113631971180439, 0.0012114990968257189, 0.0012866784818470478, 0.0013618578668683767, 0.0014370371354743838, 0.0015122165204957128, 0.0015873957891017199, 0.0016625751741230488, 0.0017377545591443777, 0.0018129338277503848, 0.0018881132127717137, 0.001963292481377721, 0.0020384718663990498, 0.0021136512514203787, 0.0021888306364417076, 0.002264009788632393, 0.002339189173653722, 0.0024143685586750507, 0.0024895479436963797, 0.0025647273287177086, 0.002639906480908394, 0.002715085865929723, 0.0027902652509510517, 0.002865444403141737, 0.002940623788163066, 0.003015803173184395, 0.0030909825582057238, 0.0031661619432270527, 0.0032413413282483816]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 9.0, 5.0, 5.0, 8.0, 6.0, 7.0, 8.0, 15.0, 13.0, 13.0, 11.0, 15.0, 18.0, 22.0, 32.0, 37.0, 32.0, 44.0, 37.0, 35.0, 41.0, 32.0, 47.0, 42.0, 36.0, 37.0, 39.0, 27.0, 32.0, 34.0, 31.0, 32.0, 29.0, 27.0, 24.0, 20.0, 12.0, 16.0, 14.0, 10.0, 7.0, 8.0, 9.0, 6.0, 5.0, 9.0, 4.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0], "bins": [-0.0005207657814025879, -0.0005055731162428856, -0.0004903804510831833, -0.000475187785923481, -0.0004599951207637787, -0.0004448024556040764, -0.0004296097904443741, -0.0004144171252846718, -0.0003992244601249695, -0.0003840317949652672, -0.0003688391298055649, -0.0003536464646458626, -0.0003384537994861603, -0.000323261134326458, -0.0003080684691667557, -0.0002928758040070534, -0.0002776831388473511, -0.0002624904736876488, -0.00024729780852794647, -0.00023210514336824417, -0.00021691247820854187, -0.00020171981304883957, -0.00018652714788913727, -0.00017133448272943497, -0.00015614181756973267, -0.00014094915241003036, -0.00012575648725032806, -0.00011056382209062576, -9.537115693092346e-05, -8.017849177122116e-05, -6.498582661151886e-05, -4.979316145181656e-05, -3.460049629211426e-05, -1.9407831132411957e-05, -4.215165972709656e-06, 1.0977499186992645e-05, 2.6170164346694946e-05, 4.136282950639725e-05, 5.655549466609955e-05, 7.174815982580185e-05, 8.694082498550415e-05, 0.00010213349014520645, 0.00011732615530490875, 0.00013251882046461105, 0.00014771148562431335, 0.00016290415078401566, 0.00017809681594371796, 0.00019328948110342026, 0.00020848214626312256, 0.00022367481142282486, 0.00023886747658252716, 0.00025406014174222946, 0.00026925280690193176, 0.00028444547206163406, 0.00029963813722133636, 0.00031483080238103867, 0.00033002346754074097, 0.00034521613270044327, 0.00036040879786014557, 0.00037560146301984787, 0.00039079412817955017, 0.00040598679333925247, 0.0004211794584989548, 0.0004363721236586571, 0.0004515647888183594]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 9.0, 3.0, 7.0, 7.0, 10.0, 12.0, 12.0, 21.0, 22.0, 32.0, 30.0, 32.0, 36.0, 37.0, 41.0, 52.0, 46.0, 41.0, 42.0, 51.0, 38.0, 38.0, 35.0, 42.0, 35.0, 35.0, 35.0, 31.0, 36.0, 28.0, 21.0, 20.0, 9.0, 13.0, 5.0, 9.0, 7.0, 4.0, 9.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.140625, -9.83349609375, -9.5263671875, -9.21923828125, -8.912109375, -8.60498046875, -8.2978515625, -7.99072265625, -7.68359375, -7.37646484375, -7.0693359375, -6.76220703125, -6.455078125, -6.14794921875, -5.8408203125, -5.53369140625, -5.2265625, -4.91943359375, -4.6123046875, -4.30517578125, -3.998046875, -3.69091796875, -3.3837890625, -3.07666015625, -2.76953125, -2.46240234375, -2.1552734375, -1.84814453125, -1.541015625, -1.23388671875, -0.9267578125, -0.61962890625, -0.3125, -0.00537109375, 0.3017578125, 0.60888671875, 0.916015625, 1.22314453125, 1.5302734375, 1.83740234375, 2.14453125, 2.45166015625, 2.7587890625, 3.06591796875, 3.373046875, 3.68017578125, 3.9873046875, 4.29443359375, 4.6015625, 4.90869140625, 5.2158203125, 5.52294921875, 5.830078125, 6.13720703125, 6.4443359375, 6.75146484375, 7.05859375, 7.36572265625, 7.6728515625, 7.97998046875, 8.287109375, 8.59423828125, 8.9013671875, 9.20849609375, 9.515625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 7.0, 11.0, 18.0, 23.0, 35.0, 33.0, 50.0, 85.0, 120.0, 191.0, 303.0, 459.0, 749.0, 1241.0, 2518.0, 4722.0, 10694.0, 24673.0, 63423.0, 203431.0, 480439.0, 162107.0, 53682.0, 20886.0, 9206.0, 4238.0, 2064.0, 1154.0, 730.0, 442.0, 271.0, 190.0, 127.0, 61.0, 51.0, 31.0, 31.0, 21.0, 20.0, 4.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0], "bins": [-7.6015625, -7.38690185546875, -7.1722412109375, -6.95758056640625, -6.742919921875, -6.52825927734375, -6.3135986328125, -6.09893798828125, -5.88427734375, -5.66961669921875, -5.4549560546875, -5.24029541015625, -5.025634765625, -4.81097412109375, -4.5963134765625, -4.38165283203125, -4.1669921875, -3.95233154296875, -3.7376708984375, -3.52301025390625, -3.308349609375, -3.09368896484375, -2.8790283203125, -2.66436767578125, -2.44970703125, -2.23504638671875, -2.0203857421875, -1.80572509765625, -1.591064453125, -1.37640380859375, -1.1617431640625, -0.94708251953125, -0.732421875, -0.51776123046875, -0.3031005859375, -0.08843994140625, 0.126220703125, 0.34088134765625, 0.5555419921875, 0.77020263671875, 0.98486328125, 1.19952392578125, 1.4141845703125, 1.62884521484375, 1.843505859375, 2.05816650390625, 2.2728271484375, 2.48748779296875, 2.7021484375, 2.91680908203125, 3.1314697265625, 3.34613037109375, 3.560791015625, 3.77545166015625, 3.9901123046875, 4.20477294921875, 4.41943359375, 4.63409423828125, 4.8487548828125, 5.06341552734375, 5.278076171875, 5.49273681640625, 5.7073974609375, 5.92205810546875, 6.13671875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 9.0, 7.0, 11.0, 11.0, 11.0, 20.0, 13.0, 12.0, 30.0, 28.0, 32.0, 35.0, 38.0, 64.0, 59.0, 81.0, 188.0, 1685.0, 181.0, 74.0, 67.0, 58.0, 44.0, 33.0, 41.0, 31.0, 21.0, 25.0, 25.0, 18.0, 13.0, 14.0, 7.0, 8.0, 6.0, 12.0, 4.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-35.84375, -34.77294921875, -33.7021484375, -32.63134765625, -31.560546875, -30.48974609375, -29.4189453125, -28.34814453125, -27.27734375, -26.20654296875, -25.1357421875, -24.06494140625, -22.994140625, -21.92333984375, -20.8525390625, -19.78173828125, -18.7109375, -17.64013671875, -16.5693359375, -15.49853515625, -14.427734375, -13.35693359375, -12.2861328125, -11.21533203125, -10.14453125, -9.07373046875, -8.0029296875, -6.93212890625, -5.861328125, -4.79052734375, -3.7197265625, -2.64892578125, -1.578125, -0.50732421875, 0.5634765625, 1.63427734375, 2.705078125, 3.77587890625, 4.8466796875, 5.91748046875, 6.98828125, 8.05908203125, 9.1298828125, 10.20068359375, 11.271484375, 12.34228515625, 13.4130859375, 14.48388671875, 15.5546875, 16.62548828125, 17.6962890625, 18.76708984375, 19.837890625, 20.90869140625, 21.9794921875, 23.05029296875, 24.12109375, 25.19189453125, 26.2626953125, 27.33349609375, 28.404296875, 29.47509765625, 30.5458984375, 31.61669921875, 32.6875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 6.0, 12.0, 9.0, 6.0, 14.0, 22.0, 23.0, 28.0, 40.0, 65.0, 63.0, 117.0, 142.0, 162.0, 274.0, 461.0, 1464.0, 65576.0, 3069811.0, 5552.0, 761.0, 304.0, 194.0, 132.0, 99.0, 85.0, 69.0, 39.0, 40.0, 36.0, 13.0, 17.0, 14.0, 14.0, 10.0, 2.0, 11.0, 3.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-87.4375, -84.80859375, -82.1796875, -79.55078125, -76.921875, -74.29296875, -71.6640625, -69.03515625, -66.40625, -63.77734375, -61.1484375, -58.51953125, -55.890625, -53.26171875, -50.6328125, -48.00390625, -45.375, -42.74609375, -40.1171875, -37.48828125, -34.859375, -32.23046875, -29.6015625, -26.97265625, -24.34375, -21.71484375, -19.0859375, -16.45703125, -13.828125, -11.19921875, -8.5703125, -5.94140625, -3.3125, -0.68359375, 1.9453125, 4.57421875, 7.203125, 9.83203125, 12.4609375, 15.08984375, 17.71875, 20.34765625, 22.9765625, 25.60546875, 28.234375, 30.86328125, 33.4921875, 36.12109375, 38.75, 41.37890625, 44.0078125, 46.63671875, 49.265625, 51.89453125, 54.5234375, 57.15234375, 59.78125, 62.41015625, 65.0390625, 67.66796875, 70.296875, 72.92578125, 75.5546875, 78.18359375, 80.8125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [4.0, 747.0, 267.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.430574417114258, -10.227721214294434, 1.9751319885253906, 14.177984237670898, 26.38083839416504, 38.58369445800781, 50.78654479980469, 62.989402770996094, 75.19225311279297, 87.39510345458984, 99.59796142578125, 111.80081176757812, 124.003662109375, 136.20651245117188, 148.40936279296875, 160.6122283935547, 172.81507873535156, 185.01792907714844, 197.2207794189453, 209.42364501953125, 221.62649536132812, 233.829345703125, 246.03219604492188, 258.23504638671875, 270.4378967285156, 282.6407470703125, 294.8435974121094, 307.04644775390625, 319.2492980957031, 331.4521484375, 343.655029296875, 355.8578796386719, 368.0606994628906, 380.2635498046875, 392.4664001464844, 404.66925048828125, 416.8721008300781, 429.074951171875, 441.27783203125, 453.4806823730469, 465.68353271484375, 477.8863830566406, 490.0892333984375, 502.2920837402344, 514.4949340820312, 526.6978149414062, 538.900634765625, 551.103515625, 563.3063354492188, 575.5092163085938, 587.7120361328125, 599.9149169921875, 612.1177368164062, 624.3206176757812, 636.5234375, 648.726318359375, 660.92919921875, 673.132080078125, 685.3348999023438, 697.5377807617188, 709.7406005859375, 721.9434814453125, 734.1463012695312, 746.3491821289062, 758.552001953125]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 8.0, 7.0, 1.0, 7.0, 9.0, 4.0, 13.0, 16.0, 20.0, 22.0, 29.0, 29.0, 39.0, 39.0, 34.0, 38.0, 51.0, 41.0, 46.0, 45.0, 57.0, 52.0, 34.0, 45.0, 45.0, 41.0, 28.0, 34.0, 25.0, 28.0, 19.0, 24.0, 20.0, 9.0, 9.0, 11.0, 6.0, 7.0, 3.0, 5.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.43708038330078, -93.23727416992188, -90.03746032714844, -86.83765411376953, -83.6378402709961, -80.43803405761719, -77.23822021484375, -74.03841400146484, -70.83860778808594, -67.63880157470703, -64.4389877319336, -61.23918151855469, -58.03936767578125, -54.839561462402344, -51.63975143432617, -48.43994140625, -45.24012756347656, -42.04031753540039, -38.84050750732422, -35.64070129394531, -32.440887451171875, -29.241079330444336, -26.041271209716797, -22.841461181640625, -19.641651153564453, -16.44184112548828, -13.242032051086426, -10.04222297668457, -6.842412948608398, -3.6426029205322266, -0.4427947998046875, 2.7570152282714844, 5.9568328857421875, 9.15664291381836, 12.356451988220215, 15.55626106262207, 18.756071090698242, 21.955881118774414, 25.155689239501953, 28.355499267578125, 31.555309295654297, 34.75511932373047, 37.95492935180664, 41.15473937988281, 44.35454559326172, 47.554359436035156, 50.75416564941406, 53.953975677490234, 57.153785705566406, 60.35359573364258, 63.55340576171875, 66.75321197509766, 69.9530258178711, 73.15283203125, 76.35264587402344, 79.55245208740234, 82.75225830078125, 85.95206451416016, 89.1518783569336, 92.3516845703125, 95.55149841308594, 98.75130462646484, 101.95111083984375, 105.15092468261719, 108.35073852539062]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 5.0, 1.0, 4.0, 6.0, 11.0, 10.0, 9.0, 20.0, 13.0, 20.0, 19.0, 25.0, 30.0, 19.0, 32.0, 47.0, 40.0, 39.0, 44.0, 33.0, 58.0, 35.0, 30.0, 37.0, 43.0, 34.0, 34.0, 38.0, 34.0, 23.0, 33.0, 28.0, 23.0, 22.0, 22.0, 14.0, 15.0, 10.0, 7.0, 5.0, 11.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.1875, -9.8929443359375, -9.598388671875, -9.3038330078125, -9.00927734375, -8.7147216796875, -8.420166015625, -8.1256103515625, -7.8310546875, -7.5364990234375, -7.241943359375, -6.9473876953125, -6.65283203125, -6.3582763671875, -6.063720703125, -5.7691650390625, -5.474609375, -5.1800537109375, -4.885498046875, -4.5909423828125, -4.29638671875, -4.0018310546875, -3.707275390625, -3.4127197265625, -3.1181640625, -2.8236083984375, -2.529052734375, -2.2344970703125, -1.93994140625, -1.6453857421875, -1.350830078125, -1.0562744140625, -0.76171875, -0.4671630859375, -0.172607421875, 0.1219482421875, 0.41650390625, 0.7110595703125, 1.005615234375, 1.3001708984375, 1.5947265625, 1.8892822265625, 2.183837890625, 2.4783935546875, 2.77294921875, 3.0675048828125, 3.362060546875, 3.6566162109375, 3.951171875, 4.2457275390625, 4.540283203125, 4.8348388671875, 5.12939453125, 5.4239501953125, 5.718505859375, 6.0130615234375, 6.3076171875, 6.6021728515625, 6.896728515625, 7.1912841796875, 7.48583984375, 7.7803955078125, 8.074951171875, 8.3695068359375, 8.6640625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 9.0, 8.0, 10.0, 13.0, 13.0, 19.0, 17.0, 15.0, 24.0, 20.0, 46.0, 57.0, 97.0, 110.0, 192.0, 352.0, 1008.0, 5421.0, 133264.0, 3558221.0, 483347.0, 9475.0, 1385.0, 421.0, 191.0, 132.0, 101.0, 59.0, 48.0, 31.0, 21.0, 25.0, 23.0, 22.0, 15.0, 11.0, 7.0, 8.0, 7.0, 6.0, 7.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-38.71875, -37.6005859375, -36.482421875, -35.3642578125, -34.24609375, -33.1279296875, -32.009765625, -30.8916015625, -29.7734375, -28.6552734375, -27.537109375, -26.4189453125, -25.30078125, -24.1826171875, -23.064453125, -21.9462890625, -20.828125, -19.7099609375, -18.591796875, -17.4736328125, -16.35546875, -15.2373046875, -14.119140625, -13.0009765625, -11.8828125, -10.7646484375, -9.646484375, -8.5283203125, -7.41015625, -6.2919921875, -5.173828125, -4.0556640625, -2.9375, -1.8193359375, -0.701171875, 0.4169921875, 1.53515625, 2.6533203125, 3.771484375, 4.8896484375, 6.0078125, 7.1259765625, 8.244140625, 9.3623046875, 10.48046875, 11.5986328125, 12.716796875, 13.8349609375, 14.953125, 16.0712890625, 17.189453125, 18.3076171875, 19.42578125, 20.5439453125, 21.662109375, 22.7802734375, 23.8984375, 25.0166015625, 26.134765625, 27.2529296875, 28.37109375, 29.4892578125, 30.607421875, 31.7255859375, 32.84375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 6.0, 5.0, 8.0, 16.0, 24.0, 22.0, 46.0, 67.0, 89.0, 119.0, 195.0, 279.0, 460.0, 604.0, 608.0, 504.0, 345.0, 221.0, 152.0, 93.0, 64.0, 49.0, 31.0, 23.0, 9.0, 7.0, 10.0, 10.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-33.09375, -32.3271484375, -31.560546875, -30.7939453125, -30.02734375, -29.2607421875, -28.494140625, -27.7275390625, -26.9609375, -26.1943359375, -25.427734375, -24.6611328125, -23.89453125, -23.1279296875, -22.361328125, -21.5947265625, -20.828125, -20.0615234375, -19.294921875, -18.5283203125, -17.76171875, -16.9951171875, -16.228515625, -15.4619140625, -14.6953125, -13.9287109375, -13.162109375, -12.3955078125, -11.62890625, -10.8623046875, -10.095703125, -9.3291015625, -8.5625, -7.7958984375, -7.029296875, -6.2626953125, -5.49609375, -4.7294921875, -3.962890625, -3.1962890625, -2.4296875, -1.6630859375, -0.896484375, -0.1298828125, 0.63671875, 1.4033203125, 2.169921875, 2.9365234375, 3.703125, 4.4697265625, 5.236328125, 6.0029296875, 6.76953125, 7.5361328125, 8.302734375, 9.0693359375, 9.8359375, 10.6025390625, 11.369140625, 12.1357421875, 12.90234375, 13.6689453125, 14.435546875, 15.2021484375, 15.96875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 9.0, 7.0, 11.0, 14.0, 16.0, 25.0, 34.0, 68.0, 76.0, 78.0, 124.0, 234.0, 412.0, 1263.0, 43551.0, 4134332.0, 12045.0, 923.0, 385.0, 208.0, 129.0, 97.0, 62.0, 47.0, 39.0, 23.0, 15.0, 12.0, 9.0, 9.0, 7.0, 5.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.625, -93.22265625, -89.8203125, -86.41796875, -83.015625, -79.61328125, -76.2109375, -72.80859375, -69.40625, -66.00390625, -62.6015625, -59.19921875, -55.796875, -52.39453125, -48.9921875, -45.58984375, -42.1875, -38.78515625, -35.3828125, -31.98046875, -28.578125, -25.17578125, -21.7734375, -18.37109375, -14.96875, -11.56640625, -8.1640625, -4.76171875, -1.359375, 2.04296875, 5.4453125, 8.84765625, 12.25, 15.65234375, 19.0546875, 22.45703125, 25.859375, 29.26171875, 32.6640625, 36.06640625, 39.46875, 42.87109375, 46.2734375, 49.67578125, 53.078125, 56.48046875, 59.8828125, 63.28515625, 66.6875, 70.08984375, 73.4921875, 76.89453125, 80.296875, 83.69921875, 87.1015625, 90.50390625, 93.90625, 97.30859375, 100.7109375, 104.11328125, 107.515625, 110.91796875, 114.3203125, 117.72265625, 121.125]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 67.0, 159.0, 326.0, 292.0, 110.0, 38.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.42677307128906, -134.02392578125, -127.6210708618164, -121.21821594238281, -114.81536865234375, -108.41252136230469, -102.0096664428711, -95.6068115234375, -89.20396423339844, -82.80111694335938, -76.39826202392578, -69.99540710449219, -63.592559814453125, -57.1897087097168, -50.78685760498047, -44.38400650024414, -37.98115539550781, -31.578304290771484, -25.175453186035156, -18.772602081298828, -12.3697509765625, -5.966899871826172, 0.43595123291015625, 6.838802337646484, 13.241653442382812, 19.64450454711914, 26.04735565185547, 32.4502067565918, 38.853057861328125, 45.25590896606445, 51.65876007080078, 58.06161117553711, 64.46444702148438, 70.86729431152344, 77.27014923095703, 83.67300415039062, 90.07585144042969, 96.47869873046875, 102.88155364990234, 109.28440856933594, 115.687255859375, 122.09010314941406, 128.49295043945312, 134.89581298828125, 141.2986602783203, 147.70150756835938, 154.1043701171875, 160.50721740722656, 166.91006469726562, 173.3129119873047, 179.71575927734375, 186.11862182617188, 192.52146911621094, 198.92431640625, 205.32717895507812, 211.7300262451172, 218.13287353515625, 224.5357208251953, 230.93856811523438, 237.3414306640625, 243.74427795410156, 250.14712524414062, 256.54998779296875, 262.95281982421875, 269.3556823730469]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 7.0, 6.0, 10.0, 7.0, 12.0, 7.0, 12.0, 11.0, 13.0, 16.0, 19.0, 13.0, 17.0, 26.0, 19.0, 28.0, 30.0, 28.0, 31.0, 25.0, 24.0, 24.0, 34.0, 39.0, 38.0, 24.0, 27.0, 38.0, 35.0, 41.0, 30.0, 35.0, 23.0, 27.0, 25.0, 19.0, 20.0, 24.0, 24.0, 23.0, 16.0, 12.0, 10.0, 14.0, 11.0, 11.0, 8.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-59.25963592529297, -57.50947570800781, -55.759315490722656, -54.0091552734375, -52.25899887084961, -50.50883865356445, -48.7586784362793, -47.00851821899414, -45.25836181640625, -43.508201599121094, -41.75804138183594, -40.00788116455078, -38.25772476196289, -36.507564544677734, -34.75740432739258, -33.00724411010742, -31.257083892822266, -29.50692367553711, -27.756765365600586, -26.00660514831543, -24.256446838378906, -22.50628662109375, -20.756126403808594, -19.005966186523438, -17.255807876586914, -15.505648612976074, -13.755489349365234, -12.005329132080078, -10.255169868469238, -8.505010604858398, -6.754850387573242, -5.004691123962402, -3.254535675048828, -1.5043761730194092, 0.24578332901000977, 1.9959430694580078, 3.7461023330688477, 5.4962615966796875, 7.246421813964844, 8.996581077575684, 10.746740341186523, 12.496899604797363, 14.247058868408203, 15.99721908569336, 17.747379302978516, 19.49753761291504, 21.247697830200195, 22.99785614013672, 24.748016357421875, 26.49817657470703, 28.248334884643555, 29.99849510192871, 31.748653411865234, 33.49881362915039, 35.24897384643555, 36.9991340637207, 38.749290466308594, 40.49945068359375, 42.249610900878906, 43.99977111816406, 45.74992752075195, 47.50008773803711, 49.250247955322266, 51.00040817260742, 52.75056838989258]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 6.0, 8.0, 7.0, 9.0, 14.0, 15.0, 14.0, 23.0, 30.0, 26.0, 29.0, 43.0, 39.0, 49.0, 45.0, 46.0, 44.0, 42.0, 41.0, 47.0, 37.0, 51.0, 34.0, 43.0, 41.0, 41.0, 32.0, 25.0, 30.0, 18.0, 12.0, 10.0, 13.0, 8.0, 13.0, 4.0, 4.0, 0.0, 2.0, 6.0], "bins": [-14.34375, -14.00152587890625, -13.6593017578125, -13.31707763671875, -12.974853515625, -12.63262939453125, -12.2904052734375, -11.94818115234375, -11.60595703125, -11.26373291015625, -10.9215087890625, -10.57928466796875, -10.237060546875, -9.89483642578125, -9.5526123046875, -9.21038818359375, -8.8681640625, -8.52593994140625, -8.1837158203125, -7.84149169921875, -7.499267578125, -7.15704345703125, -6.8148193359375, -6.47259521484375, -6.13037109375, -5.78814697265625, -5.4459228515625, -5.10369873046875, -4.761474609375, -4.41925048828125, -4.0770263671875, -3.73480224609375, -3.392578125, -3.05035400390625, -2.7081298828125, -2.36590576171875, -2.023681640625, -1.68145751953125, -1.3392333984375, -0.99700927734375, -0.65478515625, -0.31256103515625, 0.0296630859375, 0.37188720703125, 0.714111328125, 1.05633544921875, 1.3985595703125, 1.74078369140625, 2.0830078125, 2.42523193359375, 2.7674560546875, 3.10968017578125, 3.451904296875, 3.79412841796875, 4.1363525390625, 4.47857666015625, 4.82080078125, 5.16302490234375, 5.5052490234375, 5.84747314453125, 6.189697265625, 6.53192138671875, 6.8741455078125, 7.21636962890625, 7.55859375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 9.0, 11.0, 13.0, 14.0, 21.0, 46.0, 79.0, 112.0, 187.0, 306.0, 526.0, 1055.0, 1753.0, 3056.0, 5695.0, 10583.0, 20432.0, 40585.0, 85994.0, 215270.0, 410357.0, 131673.0, 59362.0, 29183.0, 14761.0, 7851.0, 4193.0, 2283.0, 1307.0, 753.0, 448.0, 223.0, 140.0, 101.0, 65.0, 34.0, 28.0, 9.0, 8.0, 10.0, 8.0, 8.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.73046875, -2.640228271484375, -2.54998779296875, -2.459747314453125, -2.3695068359375, -2.279266357421875, -2.18902587890625, -2.098785400390625, -2.008544921875, -1.918304443359375, -1.82806396484375, -1.737823486328125, -1.6475830078125, -1.557342529296875, -1.46710205078125, -1.376861572265625, -1.28662109375, -1.196380615234375, -1.10614013671875, -1.015899658203125, -0.9256591796875, -0.835418701171875, -0.74517822265625, -0.654937744140625, -0.564697265625, -0.474456787109375, -0.38421630859375, -0.293975830078125, -0.2037353515625, -0.113494873046875, -0.02325439453125, 0.066986083984375, 0.1572265625, 0.247467041015625, 0.33770751953125, 0.427947998046875, 0.5181884765625, 0.608428955078125, 0.69866943359375, 0.788909912109375, 0.879150390625, 0.969390869140625, 1.05963134765625, 1.149871826171875, 1.2401123046875, 1.330352783203125, 1.42059326171875, 1.510833740234375, 1.60107421875, 1.691314697265625, 1.78155517578125, 1.871795654296875, 1.9620361328125, 2.052276611328125, 2.14251708984375, 2.232757568359375, 2.322998046875, 2.413238525390625, 2.50347900390625, 2.593719482421875, 2.6839599609375, 2.774200439453125, 2.86444091796875, 2.954681396484375, 3.044921875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 10.0, 6.0, 3.0, 7.0, 12.0, 7.0, 9.0, 22.0, 14.0, 19.0, 17.0, 19.0, 18.0, 30.0, 30.0, 28.0, 32.0, 37.0, 33.0, 44.0, 26.0, 1063.0, 38.0, 43.0, 44.0, 36.0, 29.0, 38.0, 42.0, 48.0, 21.0, 28.0, 26.0, 16.0, 23.0, 15.0, 16.0, 20.0, 9.0, 14.0, 6.0, 8.0, 10.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.67578125, -5.4913330078125, -5.306884765625, -5.1224365234375, -4.93798828125, -4.7535400390625, -4.569091796875, -4.3846435546875, -4.2001953125, -4.0157470703125, -3.831298828125, -3.6468505859375, -3.46240234375, -3.2779541015625, -3.093505859375, -2.9090576171875, -2.724609375, -2.5401611328125, -2.355712890625, -2.1712646484375, -1.98681640625, -1.8023681640625, -1.617919921875, -1.4334716796875, -1.2490234375, -1.0645751953125, -0.880126953125, -0.6956787109375, -0.51123046875, -0.3267822265625, -0.142333984375, 0.0421142578125, 0.2265625, 0.4110107421875, 0.595458984375, 0.7799072265625, 0.96435546875, 1.1488037109375, 1.333251953125, 1.5177001953125, 1.7021484375, 1.8865966796875, 2.071044921875, 2.2554931640625, 2.43994140625, 2.6243896484375, 2.808837890625, 2.9932861328125, 3.177734375, 3.3621826171875, 3.546630859375, 3.7310791015625, 3.91552734375, 4.0999755859375, 4.284423828125, 4.4688720703125, 4.6533203125, 4.8377685546875, 5.022216796875, 5.2066650390625, 5.39111328125, 5.5755615234375, 5.760009765625, 5.9444580078125, 6.12890625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 6.0, 12.0, 10.0, 19.0, 16.0, 27.0, 44.0, 52.0, 106.0, 135.0, 182.0, 268.0, 419.0, 609.0, 908.0, 1234.0, 1935.0, 2926.0, 4306.0, 6573.0, 9635.0, 14558.0, 22070.0, 34580.0, 55524.0, 96282.0, 211056.0, 1339627.0, 116784.0, 64762.0, 39346.0, 24741.0, 16155.0, 10723.0, 7191.0, 4722.0, 3223.0, 2067.0, 1426.0, 967.0, 575.0, 425.0, 298.0, 178.0, 137.0, 99.0, 63.0, 40.0, 33.0, 19.0, 11.0, 12.0, 4.0, 7.0, 5.0, 3.0, 1.0, 2.0], "bins": [-1.8408203125, -1.7852935791015625, -1.729766845703125, -1.6742401123046875, -1.61871337890625, -1.5631866455078125, -1.507659912109375, -1.4521331787109375, -1.3966064453125, -1.3410797119140625, -1.285552978515625, -1.2300262451171875, -1.17449951171875, -1.1189727783203125, -1.063446044921875, -1.0079193115234375, -0.952392578125, -0.8968658447265625, -0.841339111328125, -0.7858123779296875, -0.73028564453125, -0.6747589111328125, -0.619232177734375, -0.5637054443359375, -0.5081787109375, -0.4526519775390625, -0.397125244140625, -0.3415985107421875, -0.28607177734375, -0.2305450439453125, -0.175018310546875, -0.1194915771484375, -0.06396484375, -0.0084381103515625, 0.047088623046875, 0.1026153564453125, 0.15814208984375, 0.2136688232421875, 0.269195556640625, 0.3247222900390625, 0.3802490234375, 0.4357757568359375, 0.491302490234375, 0.5468292236328125, 0.60235595703125, 0.6578826904296875, 0.713409423828125, 0.7689361572265625, 0.824462890625, 0.8799896240234375, 0.935516357421875, 0.9910430908203125, 1.04656982421875, 1.1020965576171875, 1.157623291015625, 1.2131500244140625, 1.2686767578125, 1.3242034912109375, 1.379730224609375, 1.4352569580078125, 1.49078369140625, 1.5463104248046875, 1.601837158203125, 1.6573638916015625, 1.712890625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 8.0, 14.0, 11.0, 8.0, 7.0, 18.0, 15.0, 26.0, 35.0, 43.0, 47.0, 58.0, 74.0, 84.0, 96.0, 93.0, 73.0, 68.0, 50.0, 42.0, 32.0, 17.0, 16.0, 16.0, 14.0, 11.0, 5.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0014486312866210938, -0.0014041811227798462, -0.0013597309589385986, -0.001315280795097351, -0.0012708306312561035, -0.001226380467414856, -0.0011819303035736084, -0.0011374801397323608, -0.0010930299758911133, -0.0010485798120498657, -0.0010041296482086182, -0.0009596794843673706, -0.000915229320526123, -0.0008707791566848755, -0.0008263289928436279, -0.0007818788290023804, -0.0007374286651611328, -0.0006929785013198853, -0.0006485283374786377, -0.0006040781736373901, -0.0005596280097961426, -0.000515177845954895, -0.00047072768211364746, -0.0004262775182723999, -0.00038182735443115234, -0.0003373771905899048, -0.0002929270267486572, -0.00024847686290740967, -0.0002040266990661621, -0.00015957653522491455, -0.00011512637138366699, -7.067620754241943e-05, -2.6226043701171875e-05, 1.8224120140075684e-05, 6.267428398132324e-05, 0.0001071244478225708, 0.00015157461166381836, 0.00019602477550506592, 0.00024047493934631348, 0.00028492510318756104, 0.0003293752670288086, 0.00037382543087005615, 0.0004182755947113037, 0.00046272575855255127, 0.0005071759223937988, 0.0005516260862350464, 0.0005960762500762939, 0.0006405264139175415, 0.0006849765777587891, 0.0007294267416000366, 0.0007738769054412842, 0.0008183270692825317, 0.0008627772331237793, 0.0009072273969650269, 0.0009516775608062744, 0.000996127724647522, 0.0010405778884887695, 0.001085028052330017, 0.0011294782161712646, 0.0011739283800125122, 0.0012183785438537598, 0.0012628287076950073, 0.0013072788715362549, 0.0013517290353775024, 0.00139617919921875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 11.0, 19.0, 20.0, 13.0, 21.0, 34.0, 64.0, 107.0, 170.0, 528.0, 16779.0, 1028892.0, 1203.0, 282.0, 116.0, 86.0, 44.0, 37.0, 23.0, 18.0, 18.0, 7.0, 8.0, 12.0, 8.0, 9.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0347900390625, -0.0336766242980957, -0.032563209533691406, -0.03144979476928711, -0.030336380004882812, -0.029222965240478516, -0.02810955047607422, -0.026996135711669922, -0.025882720947265625, -0.024769306182861328, -0.02365589141845703, -0.022542476654052734, -0.021429061889648438, -0.02031564712524414, -0.019202232360839844, -0.018088817596435547, -0.01697540283203125, -0.015861988067626953, -0.014748573303222656, -0.01363515853881836, -0.012521743774414062, -0.011408329010009766, -0.010294914245605469, -0.009181499481201172, -0.008068084716796875, -0.006954669952392578, -0.005841255187988281, -0.004727840423583984, -0.0036144256591796875, -0.0025010108947753906, -0.0013875961303710938, -0.0002741813659667969, 0.0008392333984375, 0.0019526481628417969, 0.0030660629272460938, 0.004179477691650391, 0.0052928924560546875, 0.006406307220458984, 0.007519721984863281, 0.008633136749267578, 0.009746551513671875, 0.010859966278076172, 0.011973381042480469, 0.013086795806884766, 0.014200210571289062, 0.01531362533569336, 0.016427040100097656, 0.017540454864501953, 0.01865386962890625, 0.019767284393310547, 0.020880699157714844, 0.02199411392211914, 0.023107528686523438, 0.024220943450927734, 0.02533435821533203, 0.026447772979736328, 0.027561187744140625, 0.028674602508544922, 0.02978801727294922, 0.030901432037353516, 0.03201484680175781, 0.03312826156616211, 0.034241676330566406, 0.0353550910949707, 0.036468505859375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 83.0, 549.0, 349.0, 29.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000771817984059453, -0.0006589174154214561, -0.0005460168467834592, -0.0004331162781454623, -0.00032021570950746536, -0.00020731514086946845, -9.441457223147154e-05, 1.8485996406525373e-05, 0.00013138656504452229, 0.0002442871336825192, 0.0003571877023205161, 0.000470088270958513, 0.0005829888395965099, 0.0006958894082345068, 0.0008087899768725038, 0.0009216905455105007, 0.0010345911141484976, 0.0011474916245788336, 0.0012603922514244914, 0.0013732928782701492, 0.0014861933887004852, 0.0015990938991308212, 0.001711994525976479, 0.0018248951528221369, 0.0019377956632524729, 0.002050696173682809, 0.0021635969169437885, 0.0022764974273741245, 0.0023893979378044605, 0.0025022984482347965, 0.0026151989586651325, 0.002728099701926112, 0.002841000445187092, 0.002953900955617428, 0.003066801466047764, 0.0031797022093087435, 0.0032926027197390795, 0.0034055032301694155, 0.003518403973430395, 0.003631304483860731, 0.003744204994291067, 0.003857105504721403, 0.003970006015151739, 0.004082906525582075, 0.004195807501673698, 0.004308708012104034, 0.00442160852253437, 0.004534509032964706, 0.004647409543395042, 0.004760310053825378, 0.004873210564255714, 0.00498611107468605, 0.005099011585116386, 0.00521191256120801, 0.005324813071638346, 0.005437713582068682, 0.005550614092499018, 0.005663514602929354, 0.00577641511335969, 0.005889315623790026, 0.006002216599881649, 0.006115117110311985, 0.006228017620742321, 0.006340918131172657, 0.006453818641602993]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 3.0, 6.0, 10.0, 4.0, 11.0, 7.0, 12.0, 11.0, 15.0, 11.0, 19.0, 27.0, 29.0, 30.0, 31.0, 36.0, 38.0, 35.0, 50.0, 35.0, 54.0, 50.0, 43.0, 41.0, 40.0, 49.0, 34.0, 37.0, 27.0, 26.0, 23.0, 27.0, 29.0, 18.0, 23.0, 13.0, 15.0, 7.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006404519081115723, -0.000621275044977665, -0.0006020981818437576, -0.0005829213187098503, -0.000563744455575943, -0.0005445675924420357, -0.0005253907293081284, -0.000506213866174221, -0.0004870370030403137, -0.0004678601399064064, -0.0004486832767724991, -0.00042950641363859177, -0.00041032955050468445, -0.00039115268737077713, -0.0003719758242368698, -0.0003527989611029625, -0.0003336220979690552, -0.00031444523483514786, -0.00029526837170124054, -0.0002760915085673332, -0.0002569146454334259, -0.00023773778229951859, -0.00021856091916561127, -0.00019938405603170395, -0.00018020719289779663, -0.0001610303297638893, -0.000141853466629982, -0.00012267660349607468, -0.00010349974036216736, -8.432287722826004e-05, -6.514601409435272e-05, -4.5969150960445404e-05, -2.6792287826538086e-05, -7.615424692630768e-06, 1.156143844127655e-05, 3.073830157518387e-05, 4.9915164709091187e-05, 6.90920278429985e-05, 8.826889097690582e-05, 0.00010744575411081314, 0.00012662261724472046, 0.00014579948037862778, 0.0001649763435125351, 0.0001841532066464424, 0.00020333006978034973, 0.00022250693291425705, 0.00024168379604816437, 0.0002608606591820717, 0.000280037522315979, 0.0002992143854498863, 0.00031839124858379364, 0.00033756811171770096, 0.0003567449748516083, 0.0003759218379855156, 0.0003950987011194229, 0.00041427556425333023, 0.00043345242738723755, 0.00045262929052114487, 0.0004718061536550522, 0.0004909830167889595, 0.0005101598799228668, 0.0005293367430567741, 0.0005485136061906815, 0.0005676904693245888, 0.0005868673324584961]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 6.0, 8.0, 7.0, 9.0, 14.0, 15.0, 14.0, 23.0, 30.0, 26.0, 29.0, 43.0, 39.0, 50.0, 44.0, 46.0, 44.0, 42.0, 41.0, 47.0, 37.0, 51.0, 34.0, 43.0, 41.0, 41.0, 32.0, 25.0, 30.0, 18.0, 12.0, 10.0, 13.0, 8.0, 13.0, 4.0, 4.0, 0.0, 2.0, 6.0], "bins": [-14.34375, -14.00152587890625, -13.6593017578125, -13.31707763671875, -12.974853515625, -12.63262939453125, -12.2904052734375, -11.94818115234375, -11.60595703125, -11.26373291015625, -10.9215087890625, -10.57928466796875, -10.237060546875, -9.89483642578125, -9.5526123046875, -9.21038818359375, -8.8681640625, -8.52593994140625, -8.1837158203125, -7.84149169921875, -7.499267578125, -7.15704345703125, -6.8148193359375, -6.47259521484375, -6.13037109375, -5.78814697265625, -5.4459228515625, -5.10369873046875, -4.761474609375, -4.41925048828125, -4.0770263671875, -3.73480224609375, -3.392578125, -3.05035400390625, -2.7081298828125, -2.36590576171875, -2.023681640625, -1.68145751953125, -1.3392333984375, -0.99700927734375, -0.65478515625, -0.31256103515625, 0.0296630859375, 0.37188720703125, 0.714111328125, 1.05633544921875, 1.3985595703125, 1.74078369140625, 2.0830078125, 2.42523193359375, 2.7674560546875, 3.10968017578125, 3.451904296875, 3.79412841796875, 4.1363525390625, 4.47857666015625, 4.82080078125, 5.16302490234375, 5.5052490234375, 5.84747314453125, 6.189697265625, 6.53192138671875, 6.8741455078125, 7.21636962890625, 7.55859375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 10.0, 11.0, 14.0, 32.0, 31.0, 36.0, 59.0, 86.0, 140.0, 202.0, 279.0, 469.0, 730.0, 1339.0, 2492.0, 6501.0, 24827.0, 195278.0, 718116.0, 75456.0, 13488.0, 4175.0, 1963.0, 1014.0, 640.0, 392.0, 251.0, 150.0, 106.0, 78.0, 59.0, 38.0, 31.0, 24.0, 9.0, 15.0, 13.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.859375, -17.3533935546875, -16.847412109375, -16.3414306640625, -15.83544921875, -15.3294677734375, -14.823486328125, -14.3175048828125, -13.8115234375, -13.3055419921875, -12.799560546875, -12.2935791015625, -11.78759765625, -11.2816162109375, -10.775634765625, -10.2696533203125, -9.763671875, -9.2576904296875, -8.751708984375, -8.2457275390625, -7.73974609375, -7.2337646484375, -6.727783203125, -6.2218017578125, -5.7158203125, -5.2098388671875, -4.703857421875, -4.1978759765625, -3.69189453125, -3.1859130859375, -2.679931640625, -2.1739501953125, -1.66796875, -1.1619873046875, -0.656005859375, -0.1500244140625, 0.35595703125, 0.8619384765625, 1.367919921875, 1.8739013671875, 2.3798828125, 2.8858642578125, 3.391845703125, 3.8978271484375, 4.40380859375, 4.9097900390625, 5.415771484375, 5.9217529296875, 6.427734375, 6.9337158203125, 7.439697265625, 7.9456787109375, 8.45166015625, 8.9576416015625, 9.463623046875, 9.9696044921875, 10.4755859375, 10.9815673828125, 11.487548828125, 11.9935302734375, 12.49951171875, 13.0054931640625, 13.511474609375, 14.0174560546875, 14.5234375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 4.0, 2.0, 8.0, 8.0, 12.0, 23.0, 13.0, 21.0, 29.0, 26.0, 34.0, 37.0, 31.0, 43.0, 42.0, 54.0, 65.0, 180.0, 1709.0, 212.0, 82.0, 58.0, 45.0, 45.0, 39.0, 41.0, 28.0, 17.0, 30.0, 20.0, 15.0, 13.0, 8.0, 9.0, 13.0, 8.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.3125, -31.25439453125, -30.1962890625, -29.13818359375, -28.080078125, -27.02197265625, -25.9638671875, -24.90576171875, -23.84765625, -22.78955078125, -21.7314453125, -20.67333984375, -19.615234375, -18.55712890625, -17.4990234375, -16.44091796875, -15.3828125, -14.32470703125, -13.2666015625, -12.20849609375, -11.150390625, -10.09228515625, -9.0341796875, -7.97607421875, -6.91796875, -5.85986328125, -4.8017578125, -3.74365234375, -2.685546875, -1.62744140625, -0.5693359375, 0.48876953125, 1.546875, 2.60498046875, 3.6630859375, 4.72119140625, 5.779296875, 6.83740234375, 7.8955078125, 8.95361328125, 10.01171875, 11.06982421875, 12.1279296875, 13.18603515625, 14.244140625, 15.30224609375, 16.3603515625, 17.41845703125, 18.4765625, 19.53466796875, 20.5927734375, 21.65087890625, 22.708984375, 23.76708984375, 24.8251953125, 25.88330078125, 26.94140625, 27.99951171875, 29.0576171875, 30.11572265625, 31.173828125, 32.23193359375, 33.2900390625, 34.34814453125, 35.40625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 10.0, 10.0, 19.0, 28.0, 23.0, 43.0, 67.0, 93.0, 174.0, 277.0, 548.0, 2565.0, 3038637.0, 100873.0, 1243.0, 439.0, 198.0, 128.0, 95.0, 80.0, 50.0, 33.0, 15.0, 11.0, 11.0, 15.0, 6.0, 10.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-135.875, -132.083984375, -128.29296875, -124.501953125, -120.7109375, -116.919921875, -113.12890625, -109.337890625, -105.546875, -101.755859375, -97.96484375, -94.173828125, -90.3828125, -86.591796875, -82.80078125, -79.009765625, -75.21875, -71.427734375, -67.63671875, -63.845703125, -60.0546875, -56.263671875, -52.47265625, -48.681640625, -44.890625, -41.099609375, -37.30859375, -33.517578125, -29.7265625, -25.935546875, -22.14453125, -18.353515625, -14.5625, -10.771484375, -6.98046875, -3.189453125, 0.6015625, 4.392578125, 8.18359375, 11.974609375, 15.765625, 19.556640625, 23.34765625, 27.138671875, 30.9296875, 34.720703125, 38.51171875, 42.302734375, 46.09375, 49.884765625, 53.67578125, 57.466796875, 61.2578125, 65.048828125, 68.83984375, 72.630859375, 76.421875, 80.212890625, 84.00390625, 87.794921875, 91.5859375, 95.376953125, 99.16796875, 102.958984375, 106.75]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 16.0, 263.0, 658.0, 77.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.21563720703125, -40.60871505737305, -33.001792907714844, -25.394868850708008, -17.787946701049805, -10.181022644042969, -2.5741004943847656, 5.0328216552734375, 12.63974380493164, 20.246665954589844, 27.853588104248047, 35.46051025390625, 43.06743621826172, 50.67435836791992, 58.281280517578125, 65.88819885253906, 73.49512481689453, 81.10205078125, 88.70896911621094, 96.3158950805664, 103.92281341552734, 111.52973937988281, 119.13665771484375, 126.74358367919922, 134.3505096435547, 141.95742797851562, 149.56436157226562, 157.17127990722656, 164.7781982421875, 172.3851318359375, 179.99205017089844, 187.59896850585938, 195.2058868408203, 202.81280517578125, 210.41973876953125, 218.0266571044922, 225.63357543945312, 233.24050903320312, 240.84742736816406, 248.454345703125, 256.061279296875, 263.668212890625, 271.2751159667969, 278.8820495605469, 286.4889831542969, 294.09588623046875, 301.70281982421875, 309.30975341796875, 316.9166564941406, 324.5235900878906, 332.1304931640625, 339.7374267578125, 347.3443603515625, 354.9512634277344, 362.5581970214844, 370.16510009765625, 377.77203369140625, 385.37896728515625, 392.9858703613281, 400.5928039550781, 408.1997375488281, 415.806640625, 423.41357421875, 431.0205078125, 438.6274108886719]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 3.0, 8.0, 8.0, 4.0, 9.0, 8.0, 22.0, 14.0, 15.0, 24.0, 25.0, 20.0, 21.0, 31.0, 39.0, 38.0, 41.0, 42.0, 39.0, 42.0, 49.0, 40.0, 39.0, 39.0, 32.0, 43.0, 51.0, 34.0, 29.0, 36.0, 17.0, 32.0, 18.0, 18.0, 14.0, 13.0, 10.0, 11.0, 2.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-102.98809814453125, -100.13245391845703, -97.27680206298828, -94.42115783691406, -91.56550598144531, -88.7098617553711, -85.85420989990234, -82.99856567382812, -80.14291381835938, -77.28726959228516, -74.4316177368164, -71.57597351074219, -68.72032165527344, -65.86467742919922, -63.00902557373047, -60.15338134765625, -57.297733306884766, -54.44208526611328, -51.5864372253418, -48.73078918457031, -45.87514114379883, -43.019493103027344, -40.163848876953125, -37.308197021484375, -34.452552795410156, -31.596904754638672, -28.741256713867188, -25.885608673095703, -23.02996063232422, -20.174312591552734, -17.318666458129883, -14.463018417358398, -11.607368469238281, -8.751720428466797, -5.896072864532471, -3.0404253005981445, -0.18477725982666016, 2.670870780944824, 5.526517868041992, 8.382165908813477, 11.237813949584961, 14.093461990356445, 16.94911003112793, 19.80475616455078, 22.660404205322266, 25.51605224609375, 28.371700286865234, 31.22734832763672, 34.0829963684082, 36.93864440917969, 39.79429244995117, 42.649940490722656, 45.50558853149414, 48.361236572265625, 51.216880798339844, 54.072532653808594, 56.92817687988281, 59.7838249206543, 62.63947296142578, 65.4951171875, 68.35076904296875, 71.20641326904297, 74.06206512451172, 76.91770935058594, 79.77336120605469]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 9.0, 7.0, 5.0, 6.0, 13.0, 12.0, 14.0, 24.0, 28.0, 17.0, 39.0, 41.0, 35.0, 45.0, 39.0, 43.0, 44.0, 49.0, 36.0, 46.0, 55.0, 41.0, 42.0, 48.0, 30.0, 37.0, 39.0, 32.0, 18.0, 27.0, 15.0, 17.0, 14.0, 6.0, 7.0, 8.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0], "bins": [-15.140625, -14.7657470703125, -14.390869140625, -14.0159912109375, -13.64111328125, -13.2662353515625, -12.891357421875, -12.5164794921875, -12.1416015625, -11.7667236328125, -11.391845703125, -11.0169677734375, -10.64208984375, -10.2672119140625, -9.892333984375, -9.5174560546875, -9.142578125, -8.7677001953125, -8.392822265625, -8.0179443359375, -7.64306640625, -7.2681884765625, -6.893310546875, -6.5184326171875, -6.1435546875, -5.7686767578125, -5.393798828125, -5.0189208984375, -4.64404296875, -4.2691650390625, -3.894287109375, -3.5194091796875, -3.14453125, -2.7696533203125, -2.394775390625, -2.0198974609375, -1.64501953125, -1.2701416015625, -0.895263671875, -0.5203857421875, -0.1455078125, 0.2293701171875, 0.604248046875, 0.9791259765625, 1.35400390625, 1.7288818359375, 2.103759765625, 2.4786376953125, 2.853515625, 3.2283935546875, 3.603271484375, 3.9781494140625, 4.35302734375, 4.7279052734375, 5.102783203125, 5.4776611328125, 5.8525390625, 6.2274169921875, 6.602294921875, 6.9771728515625, 7.35205078125, 7.7269287109375, 8.101806640625, 8.4766845703125, 8.8515625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 5.0, 5.0, 9.0, 4.0, 7.0, 6.0, 10.0, 14.0, 15.0, 20.0, 25.0, 24.0, 41.0, 43.0, 54.0, 67.0, 198.0, 615.0, 3680.0, 131710.0, 3871048.0, 181646.0, 3923.0, 606.0, 175.0, 59.0, 49.0, 31.0, 41.0, 31.0, 25.0, 20.0, 23.0, 20.0, 10.0, 11.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-56.90625, -55.46630859375, -54.0263671875, -52.58642578125, -51.146484375, -49.70654296875, -48.2666015625, -46.82666015625, -45.38671875, -43.94677734375, -42.5068359375, -41.06689453125, -39.626953125, -38.18701171875, -36.7470703125, -35.30712890625, -33.8671875, -32.42724609375, -30.9873046875, -29.54736328125, -28.107421875, -26.66748046875, -25.2275390625, -23.78759765625, -22.34765625, -20.90771484375, -19.4677734375, -18.02783203125, -16.587890625, -15.14794921875, -13.7080078125, -12.26806640625, -10.828125, -9.38818359375, -7.9482421875, -6.50830078125, -5.068359375, -3.62841796875, -2.1884765625, -0.74853515625, 0.69140625, 2.13134765625, 3.5712890625, 5.01123046875, 6.451171875, 7.89111328125, 9.3310546875, 10.77099609375, 12.2109375, 13.65087890625, 15.0908203125, 16.53076171875, 17.970703125, 19.41064453125, 20.8505859375, 22.29052734375, 23.73046875, 25.17041015625, 26.6103515625, 28.05029296875, 29.490234375, 30.93017578125, 32.3701171875, 33.81005859375, 35.25]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 7.0, 8.0, 13.0, 21.0, 16.0, 46.0, 46.0, 79.0, 125.0, 195.0, 277.0, 489.0, 693.0, 618.0, 500.0, 305.0, 240.0, 133.0, 84.0, 54.0, 46.0, 29.0, 18.0, 12.0, 7.0, 8.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.640625, -29.79052734375, -28.9404296875, -28.09033203125, -27.240234375, -26.39013671875, -25.5400390625, -24.68994140625, -23.83984375, -22.98974609375, -22.1396484375, -21.28955078125, -20.439453125, -19.58935546875, -18.7392578125, -17.88916015625, -17.0390625, -16.18896484375, -15.3388671875, -14.48876953125, -13.638671875, -12.78857421875, -11.9384765625, -11.08837890625, -10.23828125, -9.38818359375, -8.5380859375, -7.68798828125, -6.837890625, -5.98779296875, -5.1376953125, -4.28759765625, -3.4375, -2.58740234375, -1.7373046875, -0.88720703125, -0.037109375, 0.81298828125, 1.6630859375, 2.51318359375, 3.36328125, 4.21337890625, 5.0634765625, 5.91357421875, 6.763671875, 7.61376953125, 8.4638671875, 9.31396484375, 10.1640625, 11.01416015625, 11.8642578125, 12.71435546875, 13.564453125, 14.41455078125, 15.2646484375, 16.11474609375, 16.96484375, 17.81494140625, 18.6650390625, 19.51513671875, 20.365234375, 21.21533203125, 22.0654296875, 22.91552734375, 23.765625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 5.0, 8.0, 6.0, 3.0, 11.0, 12.0, 30.0, 27.0, 40.0, 34.0, 63.0, 83.0, 108.0, 139.0, 183.0, 254.0, 434.0, 924.0, 8472.0, 4005607.0, 174326.0, 1840.0, 534.0, 286.0, 221.0, 149.0, 104.0, 93.0, 68.0, 51.0, 47.0, 28.0, 25.0, 17.0, 15.0, 9.0, 4.0, 3.0, 6.0, 3.0, 4.0, 5.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.0, -86.0078125, -83.015625, -80.0234375, -77.03125, -74.0390625, -71.046875, -68.0546875, -65.0625, -62.0703125, -59.078125, -56.0859375, -53.09375, -50.1015625, -47.109375, -44.1171875, -41.125, -38.1328125, -35.140625, -32.1484375, -29.15625, -26.1640625, -23.171875, -20.1796875, -17.1875, -14.1953125, -11.203125, -8.2109375, -5.21875, -2.2265625, 0.765625, 3.7578125, 6.75, 9.7421875, 12.734375, 15.7265625, 18.71875, 21.7109375, 24.703125, 27.6953125, 30.6875, 33.6796875, 36.671875, 39.6640625, 42.65625, 45.6484375, 48.640625, 51.6328125, 54.625, 57.6171875, 60.609375, 63.6015625, 66.59375, 69.5859375, 72.578125, 75.5703125, 78.5625, 81.5546875, 84.546875, 87.5390625, 90.53125, 93.5234375, 96.515625, 99.5078125, 102.5]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 50.0, 260.0, 448.0, 207.0, 37.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.01313018798828, -102.00872039794922, -93.00431823730469, -83.99990844726562, -74.99549865722656, -65.9910888671875, -56.9866828918457, -47.982276916503906, -38.977867126464844, -29.973459243774414, -20.969051361083984, -11.964643478393555, -2.960235595703125, 6.0441741943359375, 15.048580169677734, 24.05298614501953, 33.057395935058594, 42.061805725097656, 51.06621170043945, 60.07061767578125, 69.07502746582031, 78.07943725585938, 87.08384704589844, 96.08824920654297, 105.09265899658203, 114.0970687866211, 123.10147094726562, 132.1058807373047, 141.11029052734375, 150.1147003173828, 159.11911010742188, 168.12350463867188, 177.1279296875, 186.13233947753906, 195.13674926757812, 204.1411590576172, 213.14556884765625, 222.14996337890625, 231.1543731689453, 240.15878295898438, 249.16319274902344, 258.1676025390625, 267.1719970703125, 276.1764221191406, 285.1808166503906, 294.18524169921875, 303.18963623046875, 312.19403076171875, 321.1984558105469, 330.2028503417969, 339.207275390625, 348.211669921875, 357.2160949707031, 366.2204895019531, 375.22491455078125, 384.22930908203125, 393.23370361328125, 402.23809814453125, 411.2425231933594, 420.2469177246094, 429.2513427734375, 438.2557373046875, 447.2601623535156, 456.2645568847656, 465.26898193359375]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 5.0, 5.0, 7.0, 3.0, 6.0, 12.0, 17.0, 14.0, 21.0, 20.0, 11.0, 18.0, 21.0, 24.0, 23.0, 33.0, 35.0, 39.0, 36.0, 39.0, 41.0, 46.0, 34.0, 37.0, 49.0, 37.0, 34.0, 28.0, 30.0, 35.0, 24.0, 26.0, 24.0, 29.0, 19.0, 16.0, 20.0, 9.0, 13.0, 10.0, 10.0, 5.0, 8.0, 5.0, 6.0, 5.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-54.7250862121582, -52.86930847167969, -51.013526916503906, -49.15774917602539, -47.30196762084961, -45.446189880371094, -43.59040832519531, -41.7346305847168, -39.87885284423828, -38.023075103759766, -36.167293548583984, -34.31151580810547, -32.45573425292969, -30.599956512451172, -28.744176864624023, -26.888397216796875, -25.032615661621094, -23.176836013793945, -21.321056365966797, -19.46527862548828, -17.6094970703125, -15.753718376159668, -13.897939682006836, -12.042160034179688, -10.186380386352539, -8.33060073852539, -6.4748215675354, -4.61904239654541, -2.7632627487182617, -0.9074831008911133, 0.9482955932617188, 2.804075241088867, 4.659858703613281, 6.51563835144043, 8.371417999267578, 10.22719669342041, 12.082976341247559, 13.938755989074707, 15.794534683227539, 17.650314331054688, 19.506093978881836, 21.361873626708984, 23.217653274536133, 25.07343292236328, 26.929210662841797, 28.784992218017578, 30.640769958496094, 32.496551513671875, 34.35232925415039, 36.208106994628906, 38.06388854980469, 39.9196662902832, 41.775447845458984, 43.6312255859375, 45.48700714111328, 47.3427848815918, 49.19856262207031, 51.05434036254883, 52.91012191772461, 54.765899658203125, 56.621681213378906, 58.47745895385742, 60.33323669433594, 62.18901824951172, 64.0447998046875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 6.0, 10.0, 4.0, 2.0, 12.0, 13.0, 11.0, 24.0, 19.0, 18.0, 26.0, 31.0, 28.0, 33.0, 37.0, 43.0, 28.0, 40.0, 44.0, 49.0, 53.0, 46.0, 41.0, 36.0, 51.0, 43.0, 50.0, 25.0, 31.0, 29.0, 20.0, 18.0, 11.0, 18.0, 13.0, 22.0, 4.0, 7.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.9609375, -12.6121826171875, -12.263427734375, -11.9146728515625, -11.56591796875, -11.2171630859375, -10.868408203125, -10.5196533203125, -10.1708984375, -9.8221435546875, -9.473388671875, -9.1246337890625, -8.77587890625, -8.4271240234375, -8.078369140625, -7.7296142578125, -7.380859375, -7.0321044921875, -6.683349609375, -6.3345947265625, -5.98583984375, -5.6370849609375, -5.288330078125, -4.9395751953125, -4.5908203125, -4.2420654296875, -3.893310546875, -3.5445556640625, -3.19580078125, -2.8470458984375, -2.498291015625, -2.1495361328125, -1.80078125, -1.4520263671875, -1.103271484375, -0.7545166015625, -0.40576171875, -0.0570068359375, 0.291748046875, 0.6405029296875, 0.9892578125, 1.3380126953125, 1.686767578125, 2.0355224609375, 2.38427734375, 2.7330322265625, 3.081787109375, 3.4305419921875, 3.779296875, 4.1280517578125, 4.476806640625, 4.8255615234375, 5.17431640625, 5.5230712890625, 5.871826171875, 6.2205810546875, 6.5693359375, 6.9180908203125, 7.266845703125, 7.6156005859375, 7.96435546875, 8.3131103515625, 8.661865234375, 9.0106201171875, 9.359375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 10.0, 9.0, 4.0, 7.0, 13.0, 27.0, 31.0, 43.0, 73.0, 107.0, 147.0, 178.0, 345.0, 483.0, 675.0, 1092.0, 1611.0, 2358.0, 3671.0, 5802.0, 8800.0, 13169.0, 21087.0, 33641.0, 56969.0, 103078.0, 252530.0, 279585.0, 107174.0, 59191.0, 34740.0, 21690.0, 13874.0, 9023.0, 6009.0, 3741.0, 2421.0, 1780.0, 1128.0, 735.0, 489.0, 328.0, 212.0, 154.0, 77.0, 75.0, 57.0, 41.0, 19.0, 10.0, 8.0, 7.0, 5.0, 6.0, 2.0, 6.0, 5.0, 2.0], "bins": [-2.119140625, -2.05499267578125, -1.9908447265625, -1.92669677734375, -1.862548828125, -1.79840087890625, -1.7342529296875, -1.67010498046875, -1.60595703125, -1.54180908203125, -1.4776611328125, -1.41351318359375, -1.349365234375, -1.28521728515625, -1.2210693359375, -1.15692138671875, -1.0927734375, -1.02862548828125, -0.9644775390625, -0.90032958984375, -0.836181640625, -0.77203369140625, -0.7078857421875, -0.64373779296875, -0.57958984375, -0.51544189453125, -0.4512939453125, -0.38714599609375, -0.322998046875, -0.25885009765625, -0.1947021484375, -0.13055419921875, -0.06640625, -0.00225830078125, 0.0618896484375, 0.12603759765625, 0.190185546875, 0.25433349609375, 0.3184814453125, 0.38262939453125, 0.44677734375, 0.51092529296875, 0.5750732421875, 0.63922119140625, 0.703369140625, 0.76751708984375, 0.8316650390625, 0.89581298828125, 0.9599609375, 1.02410888671875, 1.0882568359375, 1.15240478515625, 1.216552734375, 1.28070068359375, 1.3448486328125, 1.40899658203125, 1.47314453125, 1.53729248046875, 1.6014404296875, 1.66558837890625, 1.729736328125, 1.79388427734375, 1.8580322265625, 1.92218017578125, 1.986328125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 4.0, 6.0, 18.0, 11.0, 15.0, 14.0, 11.0, 10.0, 15.0, 11.0, 23.0, 31.0, 28.0, 44.0, 32.0, 34.0, 39.0, 38.0, 50.0, 1057.0, 46.0, 49.0, 41.0, 42.0, 30.0, 37.0, 35.0, 29.0, 33.0, 26.0, 29.0, 12.0, 27.0, 13.0, 13.0, 10.0, 12.0, 13.0, 10.0, 7.0, 3.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-7.05078125, -6.84893798828125, -6.6470947265625, -6.44525146484375, -6.243408203125, -6.04156494140625, -5.8397216796875, -5.63787841796875, -5.43603515625, -5.23419189453125, -5.0323486328125, -4.83050537109375, -4.628662109375, -4.42681884765625, -4.2249755859375, -4.02313232421875, -3.8212890625, -3.61944580078125, -3.4176025390625, -3.21575927734375, -3.013916015625, -2.81207275390625, -2.6102294921875, -2.40838623046875, -2.20654296875, -2.00469970703125, -1.8028564453125, -1.60101318359375, -1.399169921875, -1.19732666015625, -0.9954833984375, -0.79364013671875, -0.591796875, -0.38995361328125, -0.1881103515625, 0.01373291015625, 0.215576171875, 0.41741943359375, 0.6192626953125, 0.82110595703125, 1.02294921875, 1.22479248046875, 1.4266357421875, 1.62847900390625, 1.830322265625, 2.03216552734375, 2.2340087890625, 2.43585205078125, 2.6376953125, 2.83953857421875, 3.0413818359375, 3.24322509765625, 3.445068359375, 3.64691162109375, 3.8487548828125, 4.05059814453125, 4.25244140625, 4.45428466796875, 4.6561279296875, 4.85797119140625, 5.059814453125, 5.26165771484375, 5.4635009765625, 5.66534423828125, 5.8671875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 12.0, 8.0, 20.0, 30.0, 39.0, 54.0, 61.0, 130.0, 190.0, 292.0, 413.0, 644.0, 934.0, 1569.0, 2378.0, 3601.0, 5580.0, 8368.0, 12866.0, 20134.0, 31826.0, 52976.0, 96236.0, 233045.0, 1354923.0, 112793.0, 60211.0, 35709.0, 21939.0, 13833.0, 9075.0, 6115.0, 3962.0, 2491.0, 1635.0, 1030.0, 681.0, 423.0, 315.0, 191.0, 142.0, 83.0, 50.0, 39.0, 31.0, 23.0, 9.0, 11.0, 8.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8974609375, -1.8344573974609375, -1.771453857421875, -1.7084503173828125, -1.64544677734375, -1.5824432373046875, -1.519439697265625, -1.4564361572265625, -1.3934326171875, -1.3304290771484375, -1.267425537109375, -1.2044219970703125, -1.14141845703125, -1.0784149169921875, -1.015411376953125, -0.9524078369140625, -0.889404296875, -0.8264007568359375, -0.763397216796875, -0.7003936767578125, -0.63739013671875, -0.5743865966796875, -0.511383056640625, -0.4483795166015625, -0.3853759765625, -0.3223724365234375, -0.259368896484375, -0.1963653564453125, -0.13336181640625, -0.0703582763671875, -0.007354736328125, 0.0556488037109375, 0.11865234375, 0.1816558837890625, 0.244659423828125, 0.3076629638671875, 0.37066650390625, 0.4336700439453125, 0.496673583984375, 0.5596771240234375, 0.6226806640625, 0.6856842041015625, 0.748687744140625, 0.8116912841796875, 0.87469482421875, 0.9376983642578125, 1.000701904296875, 1.0637054443359375, 1.126708984375, 1.1897125244140625, 1.252716064453125, 1.3157196044921875, 1.37872314453125, 1.4417266845703125, 1.504730224609375, 1.5677337646484375, 1.6307373046875, 1.6937408447265625, 1.756744384765625, 1.8197479248046875, 1.88275146484375, 1.9457550048828125, 2.008758544921875, 2.0717620849609375, 2.134765625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 10.0, 8.0, 13.0, 14.0, 15.0, 24.0, 36.0, 42.0, 45.0, 54.0, 85.0, 92.0, 82.0, 96.0, 82.0, 66.0, 48.0, 43.0, 35.0, 24.0, 18.0, 17.0, 9.0, 2.0, 7.0, 5.0, 5.0, 3.0, 4.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013246536254882812, -0.0012767314910888672, -0.0012288093566894531, -0.001180887222290039, -0.001132965087890625, -0.001085042953491211, -0.0010371208190917969, -0.0009891986846923828, -0.0009412765502929688, -0.0008933544158935547, -0.0008454322814941406, -0.0007975101470947266, -0.0007495880126953125, -0.0007016658782958984, -0.0006537437438964844, -0.0006058216094970703, -0.0005578994750976562, -0.0005099773406982422, -0.0004620552062988281, -0.00041413307189941406, -0.0003662109375, -0.00031828880310058594, -0.0002703666687011719, -0.0002224445343017578, -0.00017452239990234375, -0.0001266002655029297, -7.867813110351562e-05, -3.075599670410156e-05, 1.71661376953125e-05, 6.508827209472656e-05, 0.00011301040649414062, 0.0001609325408935547, 0.00020885467529296875, 0.0002567768096923828, 0.0003046989440917969, 0.00035262107849121094, 0.000400543212890625, 0.00044846534729003906, 0.0004963874816894531, 0.0005443096160888672, 0.0005922317504882812, 0.0006401538848876953, 0.0006880760192871094, 0.0007359981536865234, 0.0007839202880859375, 0.0008318424224853516, 0.0008797645568847656, 0.0009276866912841797, 0.0009756088256835938, 0.0010235309600830078, 0.0010714530944824219, 0.001119375228881836, 0.00116729736328125, 0.001215219497680664, 0.0012631416320800781, 0.0013110637664794922, 0.0013589859008789062, 0.0014069080352783203, 0.0014548301696777344, 0.0015027523040771484, 0.0015506744384765625, 0.0015985965728759766, 0.0016465187072753906, 0.0016944408416748047, 0.0017423629760742188]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 6.0, 4.0, 3.0, 5.0, 8.0, 8.0, 14.0, 13.0, 16.0, 41.0, 54.0, 66.0, 100.0, 192.0, 483.0, 5972.0, 1038589.0, 2102.0, 389.0, 173.0, 85.0, 53.0, 45.0, 25.0, 26.0, 21.0, 18.0, 12.0, 9.0, 5.0, 7.0, 2.0, 5.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.04296875, -0.04187798500061035, -0.0407872200012207, -0.039696455001831055, -0.038605690002441406, -0.03751492500305176, -0.03642416000366211, -0.03533339500427246, -0.03424263000488281, -0.033151865005493164, -0.032061100006103516, -0.030970335006713867, -0.02987957000732422, -0.02878880500793457, -0.027698040008544922, -0.026607275009155273, -0.025516510009765625, -0.024425745010375977, -0.023334980010986328, -0.02224421501159668, -0.02115345001220703, -0.020062685012817383, -0.018971920013427734, -0.017881155014038086, -0.016790390014648438, -0.01569962501525879, -0.01460886001586914, -0.013518095016479492, -0.012427330017089844, -0.011336565017700195, -0.010245800018310547, -0.009155035018920898, -0.00806427001953125, -0.0069735050201416016, -0.005882740020751953, -0.004791975021362305, -0.0037012100219726562, -0.002610445022583008, -0.0015196800231933594, -0.00042891502380371094, 0.0006618499755859375, 0.001752614974975586, 0.0028433799743652344, 0.003934144973754883, 0.005024909973144531, 0.00611567497253418, 0.007206439971923828, 0.008297204971313477, 0.009387969970703125, 0.010478734970092773, 0.011569499969482422, 0.01266026496887207, 0.013751029968261719, 0.014841794967651367, 0.015932559967041016, 0.017023324966430664, 0.018114089965820312, 0.01920485496520996, 0.02029561996459961, 0.021386384963989258, 0.022477149963378906, 0.023567914962768555, 0.024658679962158203, 0.02574944496154785, 0.0268402099609375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 16.0, 48.0, 99.0, 229.0, 276.0, 196.0, 91.0, 39.0, 10.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002055614721029997, -0.002011307515203953, -0.001967000076547265, -0.001922692870721221, -0.0018783856648951769, -0.001834078342653811, -0.001789771020412445, -0.001745463814586401, -0.001701156608760357, -0.001656849286518991, -0.001612542080692947, -0.001568234758451581, -0.001523927552625537, -0.001479620230384171, -0.001435312908142805, -0.001391005702316761, -0.001346698380075395, -0.0013023910578340292, -0.0012580838520079851, -0.0012137765297666192, -0.0011694693239405751, -0.0011251620016992092, -0.0010808547958731651, -0.0010365474736317992, -0.0009922401513904333, -0.0009479328873567283, -0.0009036256233230233, -0.0008593183010816574, -0.0008150110952556133, -0.0007707037730142474, -0.0007263965089805424, -0.0006820892449468374, -0.0006377821555361152, -0.0005934748915024102, -0.0005491676274687052, -0.0005048603052273393, -0.00046055307029746473, -0.00041624580626375973, -0.0003719385131262243, -0.0003276312490925193, -0.0002833239850588143, -0.0002390167210251093, -0.00019470944243948907, -0.00015040216385386884, -0.00010609489982016385, -6.178763578645885e-05, -1.7480342648923397e-05, 2.68269213847816e-05, 7.11341854184866e-05, 0.0001154414567281492, 0.00015974872803781182, 0.00020405600662343204, 0.00024836327065713704, 0.00029267053469084203, 0.0003369778278283775, 0.0003812850918620825, 0.0004255923558957875, 0.0004698996199294925, 0.0005142068839631975, 0.0005585141479969025, 0.0006028214702382684, 0.0006471286760643125, 0.0006914359983056784, 0.0007357432623393834, 0.0007800505263730884]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 5.0, 7.0, 8.0, 11.0, 12.0, 16.0, 13.0, 11.0, 17.0, 16.0, 31.0, 20.0, 33.0, 35.0, 27.0, 42.0, 39.0, 48.0, 40.0, 45.0, 44.0, 42.0, 32.0, 40.0, 37.0, 45.0, 36.0, 32.0, 38.0, 20.0, 25.0, 25.0, 17.0, 24.0, 11.0, 5.0, 9.0, 10.0, 8.0, 5.0, 3.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0006409883499145508, -0.0006217369809746742, -0.0006024856120347977, -0.0005832342430949211, -0.0005639828741550446, -0.000544731505215168, -0.0005254801362752914, -0.0005062287673354149, -0.00048697739839553833, -0.0004677260294556618, -0.0004484746605157852, -0.00042922329157590866, -0.0004099719226360321, -0.00039072055369615555, -0.000371469184756279, -0.00035221781581640244, -0.0003329664468765259, -0.0003137150779366493, -0.00029446370899677277, -0.0002752123400568962, -0.00025596097111701965, -0.0002367096021771431, -0.00021745823323726654, -0.00019820686429738998, -0.00017895549535751343, -0.00015970412641763687, -0.00014045275747776031, -0.00012120138853788376, -0.0001019500195980072, -8.269865065813065e-05, -6.344728171825409e-05, -4.419591277837753e-05, -2.4944543838500977e-05, -5.69317489862442e-06, 1.3558194041252136e-05, 3.280956298112869e-05, 5.206093192100525e-05, 7.13123008608818e-05, 9.056366980075836e-05, 0.00010981503874063492, 0.00012906640768051147, 0.00014831777662038803, 0.0001675691455602646, 0.00018682051450014114, 0.0002060718834400177, 0.00022532325237989426, 0.0002445746213197708, 0.00026382599025964737, 0.0002830773591995239, 0.0003023287281394005, 0.00032158009707927704, 0.0003408314660191536, 0.00036008283495903015, 0.0003793342038989067, 0.00039858557283878326, 0.0004178369417786598, 0.0004370883107185364, 0.00045633967965841293, 0.0004755910485982895, 0.000494842417538166, 0.0005140937864780426, 0.0005333451554179192, 0.0005525965243577957, 0.0005718478932976723, 0.0005910992622375488]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 6.0, 10.0, 4.0, 2.0, 12.0, 13.0, 11.0, 24.0, 19.0, 18.0, 26.0, 31.0, 28.0, 33.0, 37.0, 43.0, 28.0, 40.0, 44.0, 49.0, 53.0, 46.0, 41.0, 36.0, 51.0, 43.0, 50.0, 25.0, 31.0, 29.0, 20.0, 18.0, 11.0, 18.0, 13.0, 22.0, 4.0, 7.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.9609375, -12.6121826171875, -12.263427734375, -11.9146728515625, -11.56591796875, -11.2171630859375, -10.868408203125, -10.5196533203125, -10.1708984375, -9.8221435546875, -9.473388671875, -9.1246337890625, -8.77587890625, -8.4271240234375, -8.078369140625, -7.7296142578125, -7.380859375, -7.0321044921875, -6.683349609375, -6.3345947265625, -5.98583984375, -5.6370849609375, -5.288330078125, -4.9395751953125, -4.5908203125, -4.2420654296875, -3.893310546875, -3.5445556640625, -3.19580078125, -2.8470458984375, -2.498291015625, -2.1495361328125, -1.80078125, -1.4520263671875, -1.103271484375, -0.7545166015625, -0.40576171875, -0.0570068359375, 0.291748046875, 0.6405029296875, 0.9892578125, 1.3380126953125, 1.686767578125, 2.0355224609375, 2.38427734375, 2.7330322265625, 3.081787109375, 3.4305419921875, 3.779296875, 4.1280517578125, 4.476806640625, 4.8255615234375, 5.17431640625, 5.5230712890625, 5.871826171875, 6.2205810546875, 6.5693359375, 6.9180908203125, 7.266845703125, 7.6156005859375, 7.96435546875, 8.3131103515625, 8.661865234375, 9.0106201171875, 9.359375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 21.0, 25.0, 41.0, 56.0, 100.0, 195.0, 297.0, 601.0, 1154.0, 2883.0, 8099.0, 30254.0, 198516.0, 670824.0, 105949.0, 19531.0, 5838.0, 2079.0, 992.0, 455.0, 243.0, 169.0, 93.0, 53.0, 20.0, 19.0, 13.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-15.234375, -14.865966796875, -14.49755859375, -14.129150390625, -13.7607421875, -13.392333984375, -13.02392578125, -12.655517578125, -12.287109375, -11.918701171875, -11.55029296875, -11.181884765625, -10.8134765625, -10.445068359375, -10.07666015625, -9.708251953125, -9.33984375, -8.971435546875, -8.60302734375, -8.234619140625, -7.8662109375, -7.497802734375, -7.12939453125, -6.760986328125, -6.392578125, -6.024169921875, -5.65576171875, -5.287353515625, -4.9189453125, -4.550537109375, -4.18212890625, -3.813720703125, -3.4453125, -3.076904296875, -2.70849609375, -2.340087890625, -1.9716796875, -1.603271484375, -1.23486328125, -0.866455078125, -0.498046875, -0.129638671875, 0.23876953125, 0.607177734375, 0.9755859375, 1.343994140625, 1.71240234375, 2.080810546875, 2.44921875, 2.817626953125, 3.18603515625, 3.554443359375, 3.9228515625, 4.291259765625, 4.65966796875, 5.028076171875, 5.396484375, 5.764892578125, 6.13330078125, 6.501708984375, 6.8701171875, 7.238525390625, 7.60693359375, 7.975341796875, 8.34375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 6.0, 3.0, 8.0, 14.0, 16.0, 24.0, 27.0, 22.0, 25.0, 49.0, 49.0, 59.0, 53.0, 82.0, 166.0, 1850.0, 153.0, 72.0, 72.0, 53.0, 38.0, 43.0, 33.0, 25.0, 26.0, 19.0, 14.0, 10.0, 6.0, 8.0, 4.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.3125, -49.00537109375, -47.6982421875, -46.39111328125, -45.083984375, -43.77685546875, -42.4697265625, -41.16259765625, -39.85546875, -38.54833984375, -37.2412109375, -35.93408203125, -34.626953125, -33.31982421875, -32.0126953125, -30.70556640625, -29.3984375, -28.09130859375, -26.7841796875, -25.47705078125, -24.169921875, -22.86279296875, -21.5556640625, -20.24853515625, -18.94140625, -17.63427734375, -16.3271484375, -15.02001953125, -13.712890625, -12.40576171875, -11.0986328125, -9.79150390625, -8.484375, -7.17724609375, -5.8701171875, -4.56298828125, -3.255859375, -1.94873046875, -0.6416015625, 0.66552734375, 1.97265625, 3.27978515625, 4.5869140625, 5.89404296875, 7.201171875, 8.50830078125, 9.8154296875, 11.12255859375, 12.4296875, 13.73681640625, 15.0439453125, 16.35107421875, 17.658203125, 18.96533203125, 20.2724609375, 21.57958984375, 22.88671875, 24.19384765625, 25.5009765625, 26.80810546875, 28.115234375, 29.42236328125, 30.7294921875, 32.03662109375, 33.34375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 4.0, 9.0, 7.0, 19.0, 19.0, 29.0, 39.0, 51.0, 75.0, 92.0, 127.0, 176.0, 259.0, 425.0, 1247.0, 110387.0, 3028519.0, 2592.0, 533.0, 298.0, 213.0, 156.0, 108.0, 83.0, 58.0, 48.0, 34.0, 30.0, 8.0, 13.0, 12.0, 8.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-83.0625, -80.2138671875, -77.365234375, -74.5166015625, -71.66796875, -68.8193359375, -65.970703125, -63.1220703125, -60.2734375, -57.4248046875, -54.576171875, -51.7275390625, -48.87890625, -46.0302734375, -43.181640625, -40.3330078125, -37.484375, -34.6357421875, -31.787109375, -28.9384765625, -26.08984375, -23.2412109375, -20.392578125, -17.5439453125, -14.6953125, -11.8466796875, -8.998046875, -6.1494140625, -3.30078125, -0.4521484375, 2.396484375, 5.2451171875, 8.09375, 10.9423828125, 13.791015625, 16.6396484375, 19.48828125, 22.3369140625, 25.185546875, 28.0341796875, 30.8828125, 33.7314453125, 36.580078125, 39.4287109375, 42.27734375, 45.1259765625, 47.974609375, 50.8232421875, 53.671875, 56.5205078125, 59.369140625, 62.2177734375, 65.06640625, 67.9150390625, 70.763671875, 73.6123046875, 76.4609375, 79.3095703125, 82.158203125, 85.0068359375, 87.85546875, 90.7041015625, 93.552734375, 96.4013671875, 99.25]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 26.0, 427.0, 512.0, 46.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-274.1693420410156, -269.0989990234375, -264.0286865234375, -258.9583435058594, -253.88800048828125, -248.8176727294922, -243.74732971191406, -238.677001953125, -233.60665893554688, -228.5363311767578, -223.4659881591797, -218.39566040039062, -213.3253173828125, -208.25498962402344, -203.1846466064453, -198.11431884765625, -193.04397583007812, -187.97364807128906, -182.90330505371094, -177.83297729492188, -172.76263427734375, -167.6923065185547, -162.62196350097656, -157.5516357421875, -152.48130798339844, -147.41098022460938, -142.34063720703125, -137.2703094482422, -132.19996643066406, -127.12963104248047, -122.05929565429688, -116.98896789550781, -111.91860961914062, -106.84827423095703, -101.77793884277344, -96.70760345458984, -91.63726806640625, -86.56693267822266, -81.49659729003906, -76.42626953125, -71.3559341430664, -66.28559875488281, -61.21526336669922, -56.144927978515625, -51.07459259033203, -46.00425720214844, -40.93392562866211, -35.863590240478516, -30.793254852294922, -25.722919464111328, -20.652584075927734, -15.582250595092773, -10.51191520690918, -5.441579818725586, -0.371246337890625, 4.699089050292969, 9.769424438476562, 14.839759826660156, 19.91009521484375, 24.98042869567871, 30.050764083862305, 35.12110137939453, 40.19143295288086, 45.26176834106445, 50.33210372924805]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 4.0, 7.0, 6.0, 8.0, 9.0, 12.0, 13.0, 15.0, 18.0, 14.0, 16.0, 23.0, 24.0, 26.0, 27.0, 21.0, 17.0, 36.0, 31.0, 35.0, 35.0, 41.0, 43.0, 40.0, 33.0, 38.0, 36.0, 36.0, 36.0, 27.0, 31.0, 30.0, 29.0, 20.0, 19.0, 19.0, 19.0, 16.0, 8.0, 9.0, 15.0, 6.0, 6.0, 12.0, 7.0, 5.0, 10.0, 3.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-76.9843521118164, -74.50233459472656, -72.02031707763672, -69.53829956054688, -67.05628204345703, -64.57426452636719, -62.09224319458008, -59.61022186279297, -57.128204345703125, -54.64618682861328, -52.16416931152344, -49.682151794433594, -47.200130462646484, -44.71811294555664, -42.2360954284668, -39.75407409667969, -37.27206039428711, -34.790042877197266, -32.30802536010742, -29.826005935668945, -27.34398651123047, -24.861968994140625, -22.37995147705078, -19.897932052612305, -17.41591453552246, -14.9338960647583, -12.45187759399414, -9.969860076904297, -7.487841606140137, -5.005823135375977, -2.523805618286133, -0.04178619384765625, 2.4402313232421875, 4.922249794006348, 7.40426778793335, 9.886285781860352, 12.368304252624512, 14.850322723388672, 17.332340240478516, 19.814359664916992, 22.296377182006836, 24.77839469909668, 27.260414123535156, 29.742431640625, 32.224449157714844, 34.70646667480469, 37.18848419189453, 39.67050552368164, 42.152523040771484, 44.63454055786133, 47.11655807495117, 49.59857940673828, 52.080596923828125, 54.56261444091797, 57.04463195800781, 59.526649475097656, 62.0086669921875, 64.49068450927734, 66.97270202636719, 69.45471954345703, 71.93673706054688, 74.41876220703125, 76.90077209472656, 79.38279724121094, 81.86481475830078]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 9.0, 3.0, 4.0, 12.0, 12.0, 11.0, 19.0, 22.0, 20.0, 21.0, 25.0, 31.0, 29.0, 40.0, 42.0, 32.0, 28.0, 36.0, 55.0, 45.0, 62.0, 30.0, 43.0, 47.0, 35.0, 43.0, 30.0, 37.0, 31.0, 26.0, 15.0, 22.0, 9.0, 24.0, 14.0, 13.0, 11.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-13.359375, -13.0052490234375, -12.651123046875, -12.2969970703125, -11.94287109375, -11.5887451171875, -11.234619140625, -10.8804931640625, -10.5263671875, -10.1722412109375, -9.818115234375, -9.4639892578125, -9.10986328125, -8.7557373046875, -8.401611328125, -8.0474853515625, -7.693359375, -7.3392333984375, -6.985107421875, -6.6309814453125, -6.27685546875, -5.9227294921875, -5.568603515625, -5.2144775390625, -4.8603515625, -4.5062255859375, -4.152099609375, -3.7979736328125, -3.44384765625, -3.0897216796875, -2.735595703125, -2.3814697265625, -2.02734375, -1.6732177734375, -1.319091796875, -0.9649658203125, -0.61083984375, -0.2567138671875, 0.097412109375, 0.4515380859375, 0.8056640625, 1.1597900390625, 1.513916015625, 1.8680419921875, 2.22216796875, 2.5762939453125, 2.930419921875, 3.2845458984375, 3.638671875, 3.9927978515625, 4.346923828125, 4.7010498046875, 5.05517578125, 5.4093017578125, 5.763427734375, 6.1175537109375, 6.4716796875, 6.8258056640625, 7.179931640625, 7.5340576171875, 7.88818359375, 8.2423095703125, 8.596435546875, 8.9505615234375, 9.3046875]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 2.0, 3.0, 6.0, 5.0, 4.0, 15.0, 19.0, 21.0, 14.0, 20.0, 30.0, 42.0, 66.0, 75.0, 108.0, 240.0, 543.0, 1830.0, 9618.0, 219868.0, 3100074.0, 833360.0, 23765.0, 2982.0, 797.0, 271.0, 140.0, 86.0, 56.0, 48.0, 29.0, 24.0, 26.0, 26.0, 13.0, 22.0, 10.0, 10.0, 4.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-33.78125, -32.860107421875, -31.93896484375, -31.017822265625, -30.0966796875, -29.175537109375, -28.25439453125, -27.333251953125, -26.412109375, -25.490966796875, -24.56982421875, -23.648681640625, -22.7275390625, -21.806396484375, -20.88525390625, -19.964111328125, -19.04296875, -18.121826171875, -17.20068359375, -16.279541015625, -15.3583984375, -14.437255859375, -13.51611328125, -12.594970703125, -11.673828125, -10.752685546875, -9.83154296875, -8.910400390625, -7.9892578125, -7.068115234375, -6.14697265625, -5.225830078125, -4.3046875, -3.383544921875, -2.46240234375, -1.541259765625, -0.6201171875, 0.301025390625, 1.22216796875, 2.143310546875, 3.064453125, 3.985595703125, 4.90673828125, 5.827880859375, 6.7490234375, 7.670166015625, 8.59130859375, 9.512451171875, 10.43359375, 11.354736328125, 12.27587890625, 13.197021484375, 14.1181640625, 15.039306640625, 15.96044921875, 16.881591796875, 17.802734375, 18.723876953125, 19.64501953125, 20.566162109375, 21.4873046875, 22.408447265625, 23.32958984375, 24.250732421875, 25.171875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 10.0, 12.0, 12.0, 34.0, 42.0, 55.0, 86.0, 127.0, 202.0, 387.0, 563.0, 781.0, 635.0, 432.0, 260.0, 148.0, 97.0, 81.0, 36.0, 29.0, 22.0, 12.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.921875, -28.035888671875, -27.14990234375, -26.263916015625, -25.3779296875, -24.491943359375, -23.60595703125, -22.719970703125, -21.833984375, -20.947998046875, -20.06201171875, -19.176025390625, -18.2900390625, -17.404052734375, -16.51806640625, -15.632080078125, -14.74609375, -13.860107421875, -12.97412109375, -12.088134765625, -11.2021484375, -10.316162109375, -9.43017578125, -8.544189453125, -7.658203125, -6.772216796875, -5.88623046875, -5.000244140625, -4.1142578125, -3.228271484375, -2.34228515625, -1.456298828125, -0.5703125, 0.315673828125, 1.20166015625, 2.087646484375, 2.9736328125, 3.859619140625, 4.74560546875, 5.631591796875, 6.517578125, 7.403564453125, 8.28955078125, 9.175537109375, 10.0615234375, 10.947509765625, 11.83349609375, 12.719482421875, 13.60546875, 14.491455078125, 15.37744140625, 16.263427734375, 17.1494140625, 18.035400390625, 18.92138671875, 19.807373046875, 20.693359375, 21.579345703125, 22.46533203125, 23.351318359375, 24.2373046875, 25.123291015625, 26.00927734375, 26.895263671875, 27.78125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 8.0, 11.0, 22.0, 29.0, 22.0, 42.0, 48.0, 64.0, 86.0, 133.0, 183.0, 227.0, 409.0, 901.0, 24042.0, 4152006.0, 13948.0, 850.0, 374.0, 227.0, 142.0, 136.0, 82.0, 68.0, 47.0, 41.0, 35.0, 26.0, 19.0, 15.0, 7.0, 7.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-103.875, -100.46484375, -97.0546875, -93.64453125, -90.234375, -86.82421875, -83.4140625, -80.00390625, -76.59375, -73.18359375, -69.7734375, -66.36328125, -62.953125, -59.54296875, -56.1328125, -52.72265625, -49.3125, -45.90234375, -42.4921875, -39.08203125, -35.671875, -32.26171875, -28.8515625, -25.44140625, -22.03125, -18.62109375, -15.2109375, -11.80078125, -8.390625, -4.98046875, -1.5703125, 1.83984375, 5.25, 8.66015625, 12.0703125, 15.48046875, 18.890625, 22.30078125, 25.7109375, 29.12109375, 32.53125, 35.94140625, 39.3515625, 42.76171875, 46.171875, 49.58203125, 52.9921875, 56.40234375, 59.8125, 63.22265625, 66.6328125, 70.04296875, 73.453125, 76.86328125, 80.2734375, 83.68359375, 87.09375, 90.50390625, 93.9140625, 97.32421875, 100.734375, 104.14453125, 107.5546875, 110.96484375, 114.375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 17.0, 92.0, 297.0, 361.0, 182.0, 50.0, 12.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-264.642578125, -258.2316589355469, -251.8207244873047, -245.40980529785156, -238.99887084960938, -232.58795166015625, -226.17703247070312, -219.76609802246094, -213.35516357421875, -206.94424438476562, -200.53330993652344, -194.1223907470703, -187.71145629882812, -181.300537109375, -174.88961791992188, -168.4786834716797, -162.06776428222656, -155.65684509277344, -149.24591064453125, -142.83499145507812, -136.42405700683594, -130.0131378173828, -123.60221099853516, -117.1912841796875, -110.78035736083984, -104.36943054199219, -97.95850372314453, -91.54757690429688, -85.13665771484375, -78.72572326660156, -72.31480407714844, -65.90387725830078, -59.49293518066406, -53.082008361816406, -46.67108154296875, -40.26015853881836, -33.8492317199707, -27.438304901123047, -21.027381896972656, -14.616455078125, -8.205528259277344, -1.794602394104004, 4.616323471069336, 11.02724838256836, 17.438175201416016, 23.849102020263672, 30.260025024414062, 36.67095184326172, 43.081878662109375, 49.49280548095703, 55.90373229980469, 62.31465530395508, 68.7255859375, 75.13650512695312, 81.54743194580078, 87.95835876464844, 94.3692855834961, 100.78021240234375, 107.1911392211914, 113.60206604003906, 120.01298522949219, 126.42391967773438, 132.8348388671875, 139.24575805664062, 145.6566925048828]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 4.0, 5.0, 5.0, 1.0, 10.0, 12.0, 15.0, 17.0, 13.0, 14.0, 13.0, 16.0, 20.0, 17.0, 27.0, 24.0, 41.0, 39.0, 37.0, 41.0, 47.0, 41.0, 36.0, 38.0, 43.0, 59.0, 40.0, 36.0, 36.0, 24.0, 27.0, 30.0, 23.0, 19.0, 19.0, 20.0, 12.0, 16.0, 11.0, 9.0, 9.0, 11.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0], "bins": [-58.656368255615234, -56.8696174621582, -55.08287048339844, -53.296119689941406, -51.509368896484375, -49.722618103027344, -47.93586730957031, -46.14912033081055, -44.362369537353516, -42.575618743896484, -40.78887176513672, -39.00212097167969, -37.215370178222656, -35.428619384765625, -33.641868591308594, -31.855121612548828, -30.068370819091797, -28.281620025634766, -26.494871139526367, -24.70812225341797, -22.921371459960938, -21.134620666503906, -19.347871780395508, -17.56112289428711, -15.774372100830078, -13.987622261047363, -12.200872421264648, -10.414122581481934, -8.627372741699219, -6.840622901916504, -5.053873062133789, -3.267123222351074, -1.4803733825683594, 0.30637645721435547, 2.0931262969970703, 3.879876136779785, 5.6666259765625, 7.453375816345215, 9.24012565612793, 11.026875495910645, 12.81362533569336, 14.600375175476074, 16.38712501525879, 18.173873901367188, 19.96062469482422, 21.74737548828125, 23.53412437438965, 25.320873260498047, 27.107624053955078, 28.89437484741211, 30.681123733520508, 32.467872619628906, 34.25462341308594, 36.04137420654297, 37.828125, 39.614871978759766, 41.4016227722168, 43.18837356567383, 44.975120544433594, 46.761871337890625, 48.548622131347656, 50.33537292480469, 52.12212371826172, 53.908870697021484, 55.695621490478516]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 5.0, 8.0, 9.0, 15.0, 17.0, 20.0, 27.0, 22.0, 28.0, 32.0, 27.0, 40.0, 42.0, 40.0, 44.0, 36.0, 47.0, 59.0, 53.0, 42.0, 55.0, 44.0, 43.0, 47.0, 33.0, 27.0, 26.0, 19.0, 24.0, 23.0, 15.0, 9.0, 6.0, 8.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.921875, -14.5399169921875, -14.157958984375, -13.7760009765625, -13.39404296875, -13.0120849609375, -12.630126953125, -12.2481689453125, -11.8662109375, -11.4842529296875, -11.102294921875, -10.7203369140625, -10.33837890625, -9.9564208984375, -9.574462890625, -9.1925048828125, -8.810546875, -8.4285888671875, -8.046630859375, -7.6646728515625, -7.28271484375, -6.9007568359375, -6.518798828125, -6.1368408203125, -5.7548828125, -5.3729248046875, -4.990966796875, -4.6090087890625, -4.22705078125, -3.8450927734375, -3.463134765625, -3.0811767578125, -2.69921875, -2.3172607421875, -1.935302734375, -1.5533447265625, -1.17138671875, -0.7894287109375, -0.407470703125, -0.0255126953125, 0.3564453125, 0.7384033203125, 1.120361328125, 1.5023193359375, 1.88427734375, 2.2662353515625, 2.648193359375, 3.0301513671875, 3.412109375, 3.7940673828125, 4.176025390625, 4.5579833984375, 4.93994140625, 5.3218994140625, 5.703857421875, 6.0858154296875, 6.4677734375, 6.8497314453125, 7.231689453125, 7.6136474609375, 7.99560546875, 8.3775634765625, 8.759521484375, 9.1414794921875, 9.5234375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 6.0, 6.0, 11.0, 17.0, 28.0, 37.0, 47.0, 78.0, 152.0, 230.0, 367.0, 626.0, 1075.0, 1800.0, 3080.0, 5224.0, 8829.0, 15067.0, 25947.0, 47996.0, 92659.0, 219345.0, 359419.0, 126062.0, 61546.0, 33188.0, 18750.0, 10889.0, 6497.0, 3865.0, 2344.0, 1295.0, 783.0, 452.0, 299.0, 196.0, 117.0, 74.0, 39.0, 34.0, 22.0, 15.0, 11.0, 6.0, 5.0, 6.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.451171875, -2.37261962890625, -2.2940673828125, -2.21551513671875, -2.136962890625, -2.05841064453125, -1.9798583984375, -1.90130615234375, -1.82275390625, -1.74420166015625, -1.6656494140625, -1.58709716796875, -1.508544921875, -1.42999267578125, -1.3514404296875, -1.27288818359375, -1.1943359375, -1.11578369140625, -1.0372314453125, -0.95867919921875, -0.880126953125, -0.80157470703125, -0.7230224609375, -0.64447021484375, -0.56591796875, -0.48736572265625, -0.4088134765625, -0.33026123046875, -0.251708984375, -0.17315673828125, -0.0946044921875, -0.01605224609375, 0.0625, 0.14105224609375, 0.2196044921875, 0.29815673828125, 0.376708984375, 0.45526123046875, 0.5338134765625, 0.61236572265625, 0.69091796875, 0.76947021484375, 0.8480224609375, 0.92657470703125, 1.005126953125, 1.08367919921875, 1.1622314453125, 1.24078369140625, 1.3193359375, 1.39788818359375, 1.4764404296875, 1.55499267578125, 1.633544921875, 1.71209716796875, 1.7906494140625, 1.86920166015625, 1.94775390625, 2.02630615234375, 2.1048583984375, 2.18341064453125, 2.261962890625, 2.34051513671875, 2.4190673828125, 2.49761962890625, 2.576171875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 8.0, 4.0, 2.0, 8.0, 8.0, 17.0, 12.0, 12.0, 18.0, 21.0, 28.0, 26.0, 35.0, 34.0, 37.0, 36.0, 41.0, 52.0, 43.0, 1070.0, 42.0, 38.0, 43.0, 46.0, 44.0, 29.0, 32.0, 31.0, 37.0, 22.0, 25.0, 23.0, 18.0, 22.0, 13.0, 16.0, 14.0, 5.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.82421875, -7.5992431640625, -7.374267578125, -7.1492919921875, -6.92431640625, -6.6993408203125, -6.474365234375, -6.2493896484375, -6.0244140625, -5.7994384765625, -5.574462890625, -5.3494873046875, -5.12451171875, -4.8995361328125, -4.674560546875, -4.4495849609375, -4.224609375, -3.9996337890625, -3.774658203125, -3.5496826171875, -3.32470703125, -3.0997314453125, -2.874755859375, -2.6497802734375, -2.4248046875, -2.1998291015625, -1.974853515625, -1.7498779296875, -1.52490234375, -1.2999267578125, -1.074951171875, -0.8499755859375, -0.625, -0.4000244140625, -0.175048828125, 0.0499267578125, 0.27490234375, 0.4998779296875, 0.724853515625, 0.9498291015625, 1.1748046875, 1.3997802734375, 1.624755859375, 1.8497314453125, 2.07470703125, 2.2996826171875, 2.524658203125, 2.7496337890625, 2.974609375, 3.1995849609375, 3.424560546875, 3.6495361328125, 3.87451171875, 4.0994873046875, 4.324462890625, 4.5494384765625, 4.7744140625, 4.9993896484375, 5.224365234375, 5.4493408203125, 5.67431640625, 5.8992919921875, 6.124267578125, 6.3492431640625, 6.57421875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 5.0, 5.0, 7.0, 13.0, 24.0, 30.0, 46.0, 85.0, 122.0, 156.0, 277.0, 418.0, 690.0, 1045.0, 1692.0, 2882.0, 4665.0, 7412.0, 11890.0, 19220.0, 31172.0, 52487.0, 96992.0, 232892.0, 1367142.0, 115264.0, 59856.0, 35290.0, 21378.0, 13049.0, 8009.0, 5019.0, 2975.0, 1908.0, 1121.0, 686.0, 399.0, 295.0, 170.0, 90.0, 87.0, 69.0, 37.0, 29.0, 13.0, 6.0, 3.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.09765625, -2.02801513671875, -1.9583740234375, -1.88873291015625, -1.819091796875, -1.74945068359375, -1.6798095703125, -1.61016845703125, -1.54052734375, -1.47088623046875, -1.4012451171875, -1.33160400390625, -1.261962890625, -1.19232177734375, -1.1226806640625, -1.05303955078125, -0.9833984375, -0.91375732421875, -0.8441162109375, -0.77447509765625, -0.704833984375, -0.63519287109375, -0.5655517578125, -0.49591064453125, -0.42626953125, -0.35662841796875, -0.2869873046875, -0.21734619140625, -0.147705078125, -0.07806396484375, -0.0084228515625, 0.06121826171875, 0.130859375, 0.20050048828125, 0.2701416015625, 0.33978271484375, 0.409423828125, 0.47906494140625, 0.5487060546875, 0.61834716796875, 0.68798828125, 0.75762939453125, 0.8272705078125, 0.89691162109375, 0.966552734375, 1.03619384765625, 1.1058349609375, 1.17547607421875, 1.2451171875, 1.31475830078125, 1.3843994140625, 1.45404052734375, 1.523681640625, 1.59332275390625, 1.6629638671875, 1.73260498046875, 1.80224609375, 1.87188720703125, 1.9415283203125, 2.01116943359375, 2.080810546875, 2.15045166015625, 2.2200927734375, 2.28973388671875, 2.359375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 7.0, 3.0, 3.0, 7.0, 6.0, 13.0, 13.0, 10.0, 13.0, 20.0, 25.0, 31.0, 45.0, 50.0, 68.0, 62.0, 70.0, 63.0, 70.0, 62.0, 42.0, 50.0, 61.0, 38.0, 30.0, 29.0, 23.0, 22.0, 15.0, 9.0, 9.0, 9.0, 8.0, 6.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012540817260742188, -0.0012154430150985718, -0.0011768043041229248, -0.0011381655931472778, -0.0010995268821716309, -0.0010608881711959839, -0.001022249460220337, -0.00098361074924469, -0.000944972038269043, -0.000906333327293396, -0.000867694616317749, -0.000829055905342102, -0.0007904171943664551, -0.0007517784833908081, -0.0007131397724151611, -0.0006745010614395142, -0.0006358623504638672, -0.0005972236394882202, -0.0005585849285125732, -0.0005199462175369263, -0.0004813075065612793, -0.0004426687955856323, -0.00040403008460998535, -0.0003653913736343384, -0.0003267526626586914, -0.00028811395168304443, -0.00024947524070739746, -0.0002108365297317505, -0.00017219781875610352, -0.00013355910778045654, -9.492039680480957e-05, -5.62816858291626e-05, -1.7642974853515625e-05, 2.0995736122131348e-05, 5.963444709777832e-05, 9.827315807342529e-05, 0.00013691186904907227, 0.00017555058002471924, 0.0002141892910003662, 0.0002528280019760132, 0.00029146671295166016, 0.00033010542392730713, 0.0003687441349029541, 0.0004073828458786011, 0.00044602155685424805, 0.000484660267829895, 0.000523298978805542, 0.000561937689781189, 0.0006005764007568359, 0.0006392151117324829, 0.0006778538227081299, 0.0007164925336837769, 0.0007551312446594238, 0.0007937699556350708, 0.0008324086666107178, 0.0008710473775863647, 0.0009096860885620117, 0.0009483247995376587, 0.0009869635105133057, 0.0010256022214889526, 0.0010642409324645996, 0.0011028796434402466, 0.0011415183544158936, 0.0011801570653915405, 0.0012187957763671875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 6.0, 5.0, 4.0, 13.0, 8.0, 12.0, 20.0, 26.0, 22.0, 41.0, 41.0, 47.0, 92.0, 158.0, 308.0, 962.0, 221296.0, 823215.0, 1297.0, 383.0, 177.0, 120.0, 69.0, 55.0, 39.0, 31.0, 32.0, 20.0, 16.0, 5.0, 9.0, 9.0, 6.0, 6.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0270538330078125, -0.0261232852935791, -0.025192737579345703, -0.024262189865112305, -0.023331642150878906, -0.022401094436645508, -0.02147054672241211, -0.02053999900817871, -0.019609451293945312, -0.018678903579711914, -0.017748355865478516, -0.016817808151245117, -0.01588726043701172, -0.01495671272277832, -0.014026165008544922, -0.013095617294311523, -0.012165069580078125, -0.011234521865844727, -0.010303974151611328, -0.00937342643737793, -0.008442878723144531, -0.007512331008911133, -0.006581783294677734, -0.005651235580444336, -0.0047206878662109375, -0.003790140151977539, -0.0028595924377441406, -0.0019290447235107422, -0.0009984970092773438, -6.794929504394531e-05, 0.0008625984191894531, 0.0017931461334228516, 0.00272369384765625, 0.0036542415618896484, 0.004584789276123047, 0.005515336990356445, 0.006445884704589844, 0.007376432418823242, 0.00830698013305664, 0.009237527847290039, 0.010168075561523438, 0.011098623275756836, 0.012029170989990234, 0.012959718704223633, 0.013890266418457031, 0.01482081413269043, 0.015751361846923828, 0.016681909561157227, 0.017612457275390625, 0.018543004989624023, 0.019473552703857422, 0.02040410041809082, 0.02133464813232422, 0.022265195846557617, 0.023195743560791016, 0.024126291275024414, 0.025056838989257812, 0.02598738670349121, 0.02691793441772461, 0.027848482131958008, 0.028779029846191406, 0.029709577560424805, 0.030640125274658203, 0.0315706729888916, 0.032501220703125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 16.0, 26.0, 35.0, 87.0, 132.0, 177.0, 188.0, 146.0, 95.0, 56.0, 22.0, 12.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004642988496925682, -0.0004353416443336755, -0.0004063844389747828, -0.00037742723361589015, -0.00034847002825699747, -0.00031951285200193524, -0.00029055564664304256, -0.0002615984412841499, -0.00023264122137334198, -0.0002036840160144493, -0.00017472681065555662, -0.00014576961984857917, -0.00011681240721372887, -8.785520913079381e-05, -5.889800377190113e-05, -2.994079841300845e-05, -9.835930541157722e-07, 2.7973610485787503e-05, 5.693081402569078e-05, 8.588801574660465e-05, 0.00011484522110549733, 0.0001438024191884324, 0.00017275962454732507, 0.00020171682990621775, 0.00023067403526511043, 0.0002596312260720879, 0.00028858843143098056, 0.00031754563678987324, 0.0003465028421487659, 0.0003754600475076586, 0.0004044172528665513, 0.00043337445822544396, 0.0004623316344805062, 0.0004912888398393989, 0.0005202460451982915, 0.0005492032505571842, 0.0005781604559160769, 0.0006071176612749696, 0.0006360748666338623, 0.0006650320719927549, 0.0006939892773516476, 0.0007229464827105403, 0.000751903688069433, 0.0007808608934283257, 0.0008098180987872183, 0.000838775304146111, 0.0008677325095050037, 0.0008966897148638964, 0.0009256468620151281, 0.0009546040673740208, 0.0009835612727329135, 0.0010125184198841453, 0.0010414756834506989, 0.0010704328306019306, 0.0010993900941684842, 0.001128347241319716, 0.0011573045048862696, 0.0011862616520375013, 0.001215218915604055, 0.0012441760627552867, 0.0012731333263218403, 0.001302090473473072, 0.0013310477370396256, 0.0013600048841908574, 0.001388962147757411]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 3.0, 7.0, 3.0, 12.0, 10.0, 9.0, 12.0, 12.0, 11.0, 19.0, 16.0, 27.0, 20.0, 22.0, 25.0, 27.0, 36.0, 38.0, 30.0, 39.0, 36.0, 34.0, 36.0, 29.0, 46.0, 45.0, 26.0, 42.0, 30.0, 35.0, 32.0, 28.0, 25.0, 30.0, 24.0, 21.0, 11.0, 14.0, 15.0, 14.0, 12.0, 5.0, 9.0, 5.0, 4.0, 3.0, 0.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.000533759593963623, -0.0005171764642000198, -0.0005005933344364166, -0.0004840102046728134, -0.0004674270749092102, -0.000450843945145607, -0.0004342608153820038, -0.0004176776856184006, -0.00040109455585479736, -0.00038451142609119415, -0.00036792829632759094, -0.00035134516656398773, -0.0003347620368003845, -0.0003181789070367813, -0.0003015957772731781, -0.0002850126475095749, -0.0002684295177459717, -0.00025184638798236847, -0.00023526325821876526, -0.00021868012845516205, -0.00020209699869155884, -0.00018551386892795563, -0.00016893073916435242, -0.0001523476094007492, -0.000135764479637146, -0.00011918134987354279, -0.00010259822010993958, -8.601509034633636e-05, -6.943196058273315e-05, -5.2848830819129944e-05, -3.6265701055526733e-05, -1.9682571291923523e-05, -3.0994415283203125e-06, 1.3483688235282898e-05, 3.006681799888611e-05, 4.664994776248932e-05, 6.323307752609253e-05, 7.981620728969574e-05, 9.639933705329895e-05, 0.00011298246681690216, 0.00012956559658050537, 0.00014614872634410858, 0.0001627318561077118, 0.000179314985871315, 0.0001958981156349182, 0.00021248124539852142, 0.00022906437516212463, 0.00024564750492572784, 0.00026223063468933105, 0.00027881376445293427, 0.0002953968942165375, 0.0003119800239801407, 0.0003285631537437439, 0.0003451462835073471, 0.0003617294132709503, 0.00037831254303455353, 0.00039489567279815674, 0.00041147880256175995, 0.00042806193232536316, 0.00044464506208896637, 0.0004612281918525696, 0.0004778113216161728, 0.000494394451379776, 0.0005109775811433792, 0.0005275607109069824]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 5.0, 8.0, 9.0, 15.0, 17.0, 20.0, 27.0, 22.0, 28.0, 32.0, 27.0, 40.0, 42.0, 40.0, 44.0, 36.0, 47.0, 59.0, 53.0, 42.0, 55.0, 44.0, 43.0, 47.0, 33.0, 27.0, 26.0, 19.0, 24.0, 23.0, 15.0, 9.0, 6.0, 8.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.921875, -14.5399169921875, -14.157958984375, -13.7760009765625, -13.39404296875, -13.0120849609375, -12.630126953125, -12.2481689453125, -11.8662109375, -11.4842529296875, -11.102294921875, -10.7203369140625, -10.33837890625, -9.9564208984375, -9.574462890625, -9.1925048828125, -8.810546875, -8.4285888671875, -8.046630859375, -7.6646728515625, -7.28271484375, -6.9007568359375, -6.518798828125, -6.1368408203125, -5.7548828125, -5.3729248046875, -4.990966796875, -4.6090087890625, -4.22705078125, -3.8450927734375, -3.463134765625, -3.0811767578125, -2.69921875, -2.3172607421875, -1.935302734375, -1.5533447265625, -1.17138671875, -0.7894287109375, -0.407470703125, -0.0255126953125, 0.3564453125, 0.7384033203125, 1.120361328125, 1.5023193359375, 1.88427734375, 2.2662353515625, 2.648193359375, 3.0301513671875, 3.412109375, 3.7940673828125, 4.176025390625, 4.5579833984375, 4.93994140625, 5.3218994140625, 5.703857421875, 6.0858154296875, 6.4677734375, 6.8497314453125, 7.231689453125, 7.6136474609375, 7.99560546875, 8.3775634765625, 8.759521484375, 9.1414794921875, 9.5234375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 6.0, 10.0, 10.0, 26.0, 23.0, 51.0, 55.0, 75.0, 117.0, 222.0, 365.0, 762.0, 1853.0, 6024.0, 25170.0, 178454.0, 720600.0, 91646.0, 16040.0, 4142.0, 1392.0, 605.0, 350.0, 194.0, 111.0, 79.0, 41.0, 47.0, 26.0, 16.0, 15.0, 5.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.5, -14.11181640625, -13.7236328125, -13.33544921875, -12.947265625, -12.55908203125, -12.1708984375, -11.78271484375, -11.39453125, -11.00634765625, -10.6181640625, -10.22998046875, -9.841796875, -9.45361328125, -9.0654296875, -8.67724609375, -8.2890625, -7.90087890625, -7.5126953125, -7.12451171875, -6.736328125, -6.34814453125, -5.9599609375, -5.57177734375, -5.18359375, -4.79541015625, -4.4072265625, -4.01904296875, -3.630859375, -3.24267578125, -2.8544921875, -2.46630859375, -2.078125, -1.68994140625, -1.3017578125, -0.91357421875, -0.525390625, -0.13720703125, 0.2509765625, 0.63916015625, 1.02734375, 1.41552734375, 1.8037109375, 2.19189453125, 2.580078125, 2.96826171875, 3.3564453125, 3.74462890625, 4.1328125, 4.52099609375, 4.9091796875, 5.29736328125, 5.685546875, 6.07373046875, 6.4619140625, 6.85009765625, 7.23828125, 7.62646484375, 8.0146484375, 8.40283203125, 8.791015625, 9.17919921875, 9.5673828125, 9.95556640625, 10.34375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 6.0, 3.0, 4.0, 4.0, 9.0, 7.0, 8.0, 10.0, 12.0, 9.0, 19.0, 17.0, 24.0, 24.0, 20.0, 32.0, 37.0, 34.0, 33.0, 38.0, 49.0, 47.0, 199.0, 1837.0, 106.0, 45.0, 53.0, 39.0, 39.0, 44.0, 26.0, 27.0, 25.0, 24.0, 30.0, 14.0, 15.0, 21.0, 12.0, 8.0, 10.0, 12.0, 7.0, 4.0, 2.0, 6.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.921875, -28.935791015625, -27.94970703125, -26.963623046875, -25.9775390625, -24.991455078125, -24.00537109375, -23.019287109375, -22.033203125, -21.047119140625, -20.06103515625, -19.074951171875, -18.0888671875, -17.102783203125, -16.11669921875, -15.130615234375, -14.14453125, -13.158447265625, -12.17236328125, -11.186279296875, -10.2001953125, -9.214111328125, -8.22802734375, -7.241943359375, -6.255859375, -5.269775390625, -4.28369140625, -3.297607421875, -2.3115234375, -1.325439453125, -0.33935546875, 0.646728515625, 1.6328125, 2.618896484375, 3.60498046875, 4.591064453125, 5.5771484375, 6.563232421875, 7.54931640625, 8.535400390625, 9.521484375, 10.507568359375, 11.49365234375, 12.479736328125, 13.4658203125, 14.451904296875, 15.43798828125, 16.424072265625, 17.41015625, 18.396240234375, 19.38232421875, 20.368408203125, 21.3544921875, 22.340576171875, 23.32666015625, 24.312744140625, 25.298828125, 26.284912109375, 27.27099609375, 28.257080078125, 29.2431640625, 30.229248046875, 31.21533203125, 32.201416015625, 33.1875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 1.0, 4.0, 7.0, 5.0, 7.0, 11.0, 13.0, 8.0, 15.0, 23.0, 22.0, 25.0, 44.0, 42.0, 69.0, 72.0, 114.0, 158.0, 195.0, 317.0, 558.0, 2431.0, 2960596.0, 177900.0, 1632.0, 451.0, 271.0, 172.0, 105.0, 109.0, 71.0, 52.0, 46.0, 41.0, 22.0, 12.0, 21.0, 14.0, 13.0, 9.0, 8.0, 5.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-73.5625, -71.255859375, -68.94921875, -66.642578125, -64.3359375, -62.029296875, -59.72265625, -57.416015625, -55.109375, -52.802734375, -50.49609375, -48.189453125, -45.8828125, -43.576171875, -41.26953125, -38.962890625, -36.65625, -34.349609375, -32.04296875, -29.736328125, -27.4296875, -25.123046875, -22.81640625, -20.509765625, -18.203125, -15.896484375, -13.58984375, -11.283203125, -8.9765625, -6.669921875, -4.36328125, -2.056640625, 0.25, 2.556640625, 4.86328125, 7.169921875, 9.4765625, 11.783203125, 14.08984375, 16.396484375, 18.703125, 21.009765625, 23.31640625, 25.623046875, 27.9296875, 30.236328125, 32.54296875, 34.849609375, 37.15625, 39.462890625, 41.76953125, 44.076171875, 46.3828125, 48.689453125, 50.99609375, 53.302734375, 55.609375, 57.916015625, 60.22265625, 62.529296875, 64.8359375, 67.142578125, 69.44921875, 71.755859375, 74.0625]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 577.0, 430.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-312.56585693359375, -306.5470275878906, -300.5282287597656, -294.5093994140625, -288.4906005859375, -282.4717712402344, -276.45294189453125, -270.43414306640625, -264.4153137207031, -258.396484375, -252.377685546875, -246.35885620117188, -240.3400421142578, -234.32122802734375, -228.30239868164062, -222.28358459472656, -216.2647705078125, -210.24595642089844, -204.22714233398438, -198.20831298828125, -192.1894989013672, -186.17068481445312, -180.15185546875, -174.13304138183594, -168.11422729492188, -162.0954132080078, -156.07659912109375, -150.05776977539062, -144.03895568847656, -138.0201416015625, -132.00131225585938, -125.98249816894531, -119.96369171142578, -113.94486999511719, -107.92605590820312, -101.90724182128906, -95.88842010498047, -89.86959838867188, -83.85078430175781, -77.83197021484375, -71.81314849853516, -65.79432678222656, -59.7755126953125, -53.75669479370117, -47.737876892089844, -41.719058990478516, -35.70024108886719, -29.68142318725586, -23.66260528564453, -17.643787384033203, -11.624969482421875, -5.606151580810547, 0.41266632080078125, 6.431484222412109, 12.450302124023438, 18.469120025634766, 24.487937927246094, 30.506755828857422, 36.52557373046875, 42.54439163208008, 48.563209533691406, 54.582027435302734, 60.60084533691406, 66.61965942382812, 72.63848114013672]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 6.0, 11.0, 2.0, 19.0, 15.0, 15.0, 26.0, 24.0, 20.0, 14.0, 24.0, 20.0, 46.0, 37.0, 39.0, 38.0, 45.0, 48.0, 57.0, 35.0, 38.0, 29.0, 43.0, 43.0, 43.0, 32.0, 27.0, 31.0, 22.0, 20.0, 27.0, 16.0, 19.0, 11.0, 10.0, 12.0, 10.0, 9.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-97.09986114501953, -94.39815521240234, -91.69644927978516, -88.99474334716797, -86.29303741455078, -83.59132385253906, -80.88961791992188, -78.18791198730469, -75.4862060546875, -72.78450012207031, -70.08279418945312, -67.38108825683594, -64.67938232421875, -61.9776725769043, -59.27596664428711, -56.574256896972656, -53.872554779052734, -51.17084884643555, -48.46914291381836, -45.767433166503906, -43.06572723388672, -40.36402130126953, -37.662315368652344, -34.960609436035156, -32.25890350341797, -29.55719757080078, -26.85548973083496, -24.153783798217773, -21.452075958251953, -18.750370025634766, -16.048664093017578, -13.346956253051758, -10.645248413085938, -7.943541526794434, -5.241835117340088, -2.540128707885742, 0.16157817840576172, 2.8632850646972656, 5.564990997314453, 8.266698837280273, 10.968404769897461, 13.670111656188965, 16.37181854248047, 19.073524475097656, 21.775230407714844, 24.476938247680664, 27.17864418029785, 29.880352020263672, 32.58205795288086, 35.28376388549805, 37.985469818115234, 40.68717956542969, 43.388885498046875, 46.09059143066406, 48.79229736328125, 51.49400329589844, 54.195709228515625, 56.89741516113281, 59.59912109375, 62.30082702636719, 65.00253295898438, 67.70423889160156, 70.40594482421875, 73.10765838623047, 75.80936431884766]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 8.0, 11.0, 10.0, 14.0, 12.0, 33.0, 27.0, 25.0, 30.0, 30.0, 33.0, 36.0, 34.0, 48.0, 42.0, 42.0, 55.0, 44.0, 64.0, 40.0, 53.0, 38.0, 40.0, 36.0, 32.0, 29.0, 29.0, 17.0, 24.0, 15.0, 14.0, 8.0, 10.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.2734375, -14.88671875, -14.5, -14.11328125, -13.7265625, -13.33984375, -12.953125, -12.56640625, -12.1796875, -11.79296875, -11.40625, -11.01953125, -10.6328125, -10.24609375, -9.859375, -9.47265625, -9.0859375, -8.69921875, -8.3125, -7.92578125, -7.5390625, -7.15234375, -6.765625, -6.37890625, -5.9921875, -5.60546875, -5.21875, -4.83203125, -4.4453125, -4.05859375, -3.671875, -3.28515625, -2.8984375, -2.51171875, -2.125, -1.73828125, -1.3515625, -0.96484375, -0.578125, -0.19140625, 0.1953125, 0.58203125, 0.96875, 1.35546875, 1.7421875, 2.12890625, 2.515625, 2.90234375, 3.2890625, 3.67578125, 4.0625, 4.44921875, 4.8359375, 5.22265625, 5.609375, 5.99609375, 6.3828125, 6.76953125, 7.15625, 7.54296875, 7.9296875, 8.31640625, 8.703125, 9.08984375, 9.4765625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 4.0, 16.0, 13.0, 15.0, 23.0, 23.0, 21.0, 50.0, 39.0, 68.0, 63.0, 78.0, 139.0, 211.0, 346.0, 654.0, 2029.0, 12411.0, 424626.0, 3289429.0, 445738.0, 14468.0, 2075.0, 642.0, 339.0, 193.0, 106.0, 84.0, 81.0, 73.0, 41.0, 55.0, 31.0, 30.0, 14.0, 14.0, 11.0, 5.0, 4.0, 2.0, 5.0, 2.0, 3.0, 3.0], "bins": [-36.28125, -35.36279296875, -34.4443359375, -33.52587890625, -32.607421875, -31.68896484375, -30.7705078125, -29.85205078125, -28.93359375, -28.01513671875, -27.0966796875, -26.17822265625, -25.259765625, -24.34130859375, -23.4228515625, -22.50439453125, -21.5859375, -20.66748046875, -19.7490234375, -18.83056640625, -17.912109375, -16.99365234375, -16.0751953125, -15.15673828125, -14.23828125, -13.31982421875, -12.4013671875, -11.48291015625, -10.564453125, -9.64599609375, -8.7275390625, -7.80908203125, -6.890625, -5.97216796875, -5.0537109375, -4.13525390625, -3.216796875, -2.29833984375, -1.3798828125, -0.46142578125, 0.45703125, 1.37548828125, 2.2939453125, 3.21240234375, 4.130859375, 5.04931640625, 5.9677734375, 6.88623046875, 7.8046875, 8.72314453125, 9.6416015625, 10.56005859375, 11.478515625, 12.39697265625, 13.3154296875, 14.23388671875, 15.15234375, 16.07080078125, 16.9892578125, 17.90771484375, 18.826171875, 19.74462890625, 20.6630859375, 21.58154296875, 22.5]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 12.0, 17.0, 20.0, 28.0, 36.0, 52.0, 80.0, 106.0, 132.0, 265.0, 373.0, 544.0, 669.0, 582.0, 393.0, 259.0, 173.0, 98.0, 71.0, 47.0, 45.0, 26.0, 10.0, 9.0, 10.0, 5.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.71875, -15.97607421875, -15.2333984375, -14.49072265625, -13.748046875, -13.00537109375, -12.2626953125, -11.52001953125, -10.77734375, -10.03466796875, -9.2919921875, -8.54931640625, -7.806640625, -7.06396484375, -6.3212890625, -5.57861328125, -4.8359375, -4.09326171875, -3.3505859375, -2.60791015625, -1.865234375, -1.12255859375, -0.3798828125, 0.36279296875, 1.10546875, 1.84814453125, 2.5908203125, 3.33349609375, 4.076171875, 4.81884765625, 5.5615234375, 6.30419921875, 7.046875, 7.78955078125, 8.5322265625, 9.27490234375, 10.017578125, 10.76025390625, 11.5029296875, 12.24560546875, 12.98828125, 13.73095703125, 14.4736328125, 15.21630859375, 15.958984375, 16.70166015625, 17.4443359375, 18.18701171875, 18.9296875, 19.67236328125, 20.4150390625, 21.15771484375, 21.900390625, 22.64306640625, 23.3857421875, 24.12841796875, 24.87109375, 25.61376953125, 26.3564453125, 27.09912109375, 27.841796875, 28.58447265625, 29.3271484375, 30.06982421875, 30.8125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 7.0, 15.0, 15.0, 24.0, 32.0, 42.0, 77.0, 86.0, 112.0, 145.0, 210.0, 313.0, 509.0, 1541.0, 2106731.0, 2081325.0, 1550.0, 461.0, 312.0, 180.0, 133.0, 135.0, 87.0, 75.0, 43.0, 36.0, 30.0, 21.0, 12.0, 11.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-157.375, -153.6279296875, -149.880859375, -146.1337890625, -142.38671875, -138.6396484375, -134.892578125, -131.1455078125, -127.3984375, -123.6513671875, -119.904296875, -116.1572265625, -112.41015625, -108.6630859375, -104.916015625, -101.1689453125, -97.421875, -93.6748046875, -89.927734375, -86.1806640625, -82.43359375, -78.6865234375, -74.939453125, -71.1923828125, -67.4453125, -63.6982421875, -59.951171875, -56.2041015625, -52.45703125, -48.7099609375, -44.962890625, -41.2158203125, -37.46875, -33.7216796875, -29.974609375, -26.2275390625, -22.48046875, -18.7333984375, -14.986328125, -11.2392578125, -7.4921875, -3.7451171875, 0.001953125, 3.7490234375, 7.49609375, 11.2431640625, 14.990234375, 18.7373046875, 22.484375, 26.2314453125, 29.978515625, 33.7255859375, 37.47265625, 41.2197265625, 44.966796875, 48.7138671875, 52.4609375, 56.2080078125, 59.955078125, 63.7021484375, 67.44921875, 71.1962890625, 74.943359375, 78.6904296875, 82.4375]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 338.0, 651.0, 26.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-705.5086059570312, -688.3802490234375, -671.2518920898438, -654.12353515625, -636.9951782226562, -619.8668212890625, -602.738525390625, -585.6101684570312, -568.4818115234375, -551.3534545898438, -534.22509765625, -517.0967407226562, -499.9684143066406, -482.8400573730469, -465.7117004394531, -448.5833435058594, -431.4549865722656, -414.3266296386719, -397.1982727050781, -380.0699462890625, -362.94158935546875, -345.813232421875, -328.68487548828125, -311.5565185546875, -294.42816162109375, -277.2998046875, -260.17144775390625, -243.04310607910156, -225.91476440429688, -208.78640747070312, -191.65805053710938, -174.52969360351562, -157.40139770507812, -140.27304077148438, -123.14469909667969, -106.01634216308594, -88.88799285888672, -71.7596435546875, -54.63128662109375, -37.50293731689453, -20.374588012695312, -3.246236801147461, 13.88211441040039, 31.010467529296875, 48.138816833496094, 65.26716613769531, 82.39552307128906, 99.52387237548828, 116.6522216796875, 133.78057861328125, 150.90892028808594, 168.0372772216797, 185.16561889648438, 202.29397583007812, 219.42233276367188, 236.55068969726562, 253.6790313720703, 270.807373046875, 287.93572998046875, 305.0640869140625, 322.19244384765625, 339.32080078125, 356.44915771484375, 373.5774841308594, 390.7058410644531]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 7.0, 5.0, 12.0, 10.0, 17.0, 9.0, 17.0, 25.0, 25.0, 26.0, 24.0, 36.0, 33.0, 37.0, 35.0, 40.0, 39.0, 45.0, 39.0, 49.0, 51.0, 32.0, 43.0, 33.0, 47.0, 28.0, 40.0, 33.0, 22.0, 25.0, 25.0, 16.0, 18.0, 7.0, 3.0, 12.0, 4.0, 3.0, 6.0, 3.0, 6.0, 5.0, 2.0, 1.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.68462371826172, -53.78672409057617, -51.88882064819336, -49.99092102050781, -48.093021392822266, -46.19512176513672, -44.297218322753906, -42.39931869506836, -40.50141906738281, -38.603519439697266, -36.70561599731445, -34.807716369628906, -32.90981674194336, -31.01191520690918, -29.114013671875, -27.216114044189453, -25.31821060180664, -23.42030906677246, -21.522409439086914, -19.624507904052734, -17.726608276367188, -15.828706741333008, -13.930805206298828, -12.032904624938965, -10.135004043579102, -8.237103462219238, -6.339202404022217, -4.441301345825195, -2.543400764465332, -0.6455001831054688, 1.252401351928711, 3.150301933288574, 5.0482025146484375, 6.946103096008301, 8.844003677368164, 10.741905212402344, 12.639805793762207, 14.53770637512207, 16.43560791015625, 18.333507537841797, 20.231409072875977, 22.129310607910156, 24.027210235595703, 25.925111770629883, 27.823013305664062, 29.72091293334961, 31.61881446838379, 33.51671600341797, 35.414615631103516, 37.31251525878906, 39.210418701171875, 41.10831832885742, 43.00621795654297, 44.90412139892578, 46.80202102661133, 48.699920654296875, 50.59782409667969, 52.495723724365234, 54.39362716674805, 56.291526794433594, 58.18942642211914, 60.08732604980469, 61.9852294921875, 63.88312911987305, 65.7810287475586]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 9.0, 13.0, 13.0, 13.0, 16.0, 16.0, 31.0, 20.0, 23.0, 31.0, 39.0, 41.0, 31.0, 38.0, 42.0, 37.0, 32.0, 45.0, 50.0, 52.0, 39.0, 44.0, 39.0, 45.0, 27.0, 32.0, 27.0, 27.0, 30.0, 10.0, 16.0, 15.0, 10.0, 4.0, 8.0, 9.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.4921875, -12.146240234375, -11.80029296875, -11.454345703125, -11.1083984375, -10.762451171875, -10.41650390625, -10.070556640625, -9.724609375, -9.378662109375, -9.03271484375, -8.686767578125, -8.3408203125, -7.994873046875, -7.64892578125, -7.302978515625, -6.95703125, -6.611083984375, -6.26513671875, -5.919189453125, -5.5732421875, -5.227294921875, -4.88134765625, -4.535400390625, -4.189453125, -3.843505859375, -3.49755859375, -3.151611328125, -2.8056640625, -2.459716796875, -2.11376953125, -1.767822265625, -1.421875, -1.075927734375, -0.72998046875, -0.384033203125, -0.0380859375, 0.307861328125, 0.65380859375, 0.999755859375, 1.345703125, 1.691650390625, 2.03759765625, 2.383544921875, 2.7294921875, 3.075439453125, 3.42138671875, 3.767333984375, 4.11328125, 4.459228515625, 4.80517578125, 5.151123046875, 5.4970703125, 5.843017578125, 6.18896484375, 6.534912109375, 6.880859375, 7.226806640625, 7.57275390625, 7.918701171875, 8.2646484375, 8.610595703125, 8.95654296875, 9.302490234375, 9.6484375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 10.0, 10.0, 16.0, 20.0, 18.0, 37.0, 87.0, 113.0, 168.0, 246.0, 363.0, 586.0, 919.0, 1582.0, 2383.0, 3963.0, 6476.0, 10569.0, 18068.0, 31209.0, 56384.0, 108146.0, 269431.0, 288666.0, 111974.0, 58285.0, 31926.0, 18613.0, 10968.0, 6584.0, 4088.0, 2444.0, 1552.0, 940.0, 611.0, 443.0, 238.0, 120.0, 99.0, 78.0, 54.0, 28.0, 13.0, 13.0, 9.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.45703125, -2.38262939453125, -2.3082275390625, -2.23382568359375, -2.159423828125, -2.08502197265625, -2.0106201171875, -1.93621826171875, -1.86181640625, -1.78741455078125, -1.7130126953125, -1.63861083984375, -1.564208984375, -1.48980712890625, -1.4154052734375, -1.34100341796875, -1.2666015625, -1.19219970703125, -1.1177978515625, -1.04339599609375, -0.968994140625, -0.89459228515625, -0.8201904296875, -0.74578857421875, -0.67138671875, -0.59698486328125, -0.5225830078125, -0.44818115234375, -0.373779296875, -0.29937744140625, -0.2249755859375, -0.15057373046875, -0.076171875, -0.00177001953125, 0.0726318359375, 0.14703369140625, 0.221435546875, 0.29583740234375, 0.3702392578125, 0.44464111328125, 0.51904296875, 0.59344482421875, 0.6678466796875, 0.74224853515625, 0.816650390625, 0.89105224609375, 0.9654541015625, 1.03985595703125, 1.1142578125, 1.18865966796875, 1.2630615234375, 1.33746337890625, 1.411865234375, 1.48626708984375, 1.5606689453125, 1.63507080078125, 1.70947265625, 1.78387451171875, 1.8582763671875, 1.93267822265625, 2.007080078125, 2.08148193359375, 2.1558837890625, 2.23028564453125, 2.3046875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 5.0, 6.0, 7.0, 7.0, 15.0, 10.0, 21.0, 15.0, 20.0, 27.0, 29.0, 31.0, 31.0, 28.0, 27.0, 36.0, 29.0, 22.0, 26.0, 32.0, 29.0, 1068.0, 29.0, 42.0, 45.0, 38.0, 32.0, 28.0, 27.0, 30.0, 29.0, 33.0, 24.0, 14.0, 20.0, 23.0, 25.0, 9.0, 9.0, 8.0, 7.0, 4.0, 5.0, 3.0, 5.0, 2.0, 1.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.6875, -5.50244140625, -5.3173828125, -5.13232421875, -4.947265625, -4.76220703125, -4.5771484375, -4.39208984375, -4.20703125, -4.02197265625, -3.8369140625, -3.65185546875, -3.466796875, -3.28173828125, -3.0966796875, -2.91162109375, -2.7265625, -2.54150390625, -2.3564453125, -2.17138671875, -1.986328125, -1.80126953125, -1.6162109375, -1.43115234375, -1.24609375, -1.06103515625, -0.8759765625, -0.69091796875, -0.505859375, -0.32080078125, -0.1357421875, 0.04931640625, 0.234375, 0.41943359375, 0.6044921875, 0.78955078125, 0.974609375, 1.15966796875, 1.3447265625, 1.52978515625, 1.71484375, 1.89990234375, 2.0849609375, 2.27001953125, 2.455078125, 2.64013671875, 2.8251953125, 3.01025390625, 3.1953125, 3.38037109375, 3.5654296875, 3.75048828125, 3.935546875, 4.12060546875, 4.3056640625, 4.49072265625, 4.67578125, 4.86083984375, 5.0458984375, 5.23095703125, 5.416015625, 5.60107421875, 5.7861328125, 5.97119140625, 6.15625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 8.0, 12.0, 26.0, 29.0, 31.0, 55.0, 63.0, 119.0, 169.0, 228.0, 348.0, 516.0, 812.0, 1187.0, 1634.0, 2567.0, 3834.0, 5782.0, 9039.0, 13497.0, 20914.0, 31506.0, 48691.0, 77271.0, 144897.0, 1360276.0, 149579.0, 79068.0, 49606.0, 32399.0, 21341.0, 14107.0, 9112.0, 6103.0, 4000.0, 2684.0, 1781.0, 1221.0, 853.0, 545.0, 398.0, 268.0, 159.0, 104.0, 92.0, 64.0, 36.0, 32.0, 17.0, 17.0, 11.0, 10.0, 4.0, 6.0, 3.0, 2.0], "bins": [-1.87890625, -1.8228607177734375, -1.766815185546875, -1.7107696533203125, -1.65472412109375, -1.5986785888671875, -1.542633056640625, -1.4865875244140625, -1.4305419921875, -1.3744964599609375, -1.318450927734375, -1.2624053955078125, -1.20635986328125, -1.1503143310546875, -1.094268798828125, -1.0382232666015625, -0.982177734375, -0.9261322021484375, -0.870086669921875, -0.8140411376953125, -0.75799560546875, -0.7019500732421875, -0.645904541015625, -0.5898590087890625, -0.5338134765625, -0.4777679443359375, -0.421722412109375, -0.3656768798828125, -0.30963134765625, -0.2535858154296875, -0.197540283203125, -0.1414947509765625, -0.08544921875, -0.0294036865234375, 0.026641845703125, 0.0826873779296875, 0.13873291015625, 0.1947784423828125, 0.250823974609375, 0.3068695068359375, 0.3629150390625, 0.4189605712890625, 0.475006103515625, 0.5310516357421875, 0.58709716796875, 0.6431427001953125, 0.699188232421875, 0.7552337646484375, 0.811279296875, 0.8673248291015625, 0.923370361328125, 0.9794158935546875, 1.03546142578125, 1.0915069580078125, 1.147552490234375, 1.2035980224609375, 1.2596435546875, 1.3156890869140625, 1.371734619140625, 1.4277801513671875, 1.48382568359375, 1.5398712158203125, 1.595916748046875, 1.6519622802734375, 1.7080078125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 8.0, 1.0, 3.0, 7.0, 7.0, 6.0, 5.0, 10.0, 22.0, 24.0, 26.0, 27.0, 23.0, 44.0, 60.0, 84.0, 93.0, 93.0, 91.0, 81.0, 70.0, 40.0, 45.0, 24.0, 19.0, 19.0, 20.0, 8.0, 13.0, 3.0, 8.0, 8.0, 5.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012559890747070312, -0.001208961009979248, -0.0011619329452514648, -0.0011149048805236816, -0.0010678768157958984, -0.0010208487510681152, -0.000973820686340332, -0.0009267926216125488, -0.0008797645568847656, -0.0008327364921569824, -0.0007857084274291992, -0.000738680362701416, -0.0006916522979736328, -0.0006446242332458496, -0.0005975961685180664, -0.0005505681037902832, -0.0005035400390625, -0.0004565119743347168, -0.0004094839096069336, -0.0003624558448791504, -0.0003154277801513672, -0.000268399715423584, -0.00022137165069580078, -0.00017434358596801758, -0.00012731552124023438, -8.028745651245117e-05, -3.325939178466797e-05, 1.3768672943115234e-05, 6.079673767089844e-05, 0.00010782480239868164, 0.00015485286712646484, 0.00020188093185424805, 0.00024890899658203125, 0.00029593706130981445, 0.00034296512603759766, 0.00038999319076538086, 0.00043702125549316406, 0.00048404932022094727, 0.0005310773849487305, 0.0005781054496765137, 0.0006251335144042969, 0.0006721615791320801, 0.0007191896438598633, 0.0007662177085876465, 0.0008132457733154297, 0.0008602738380432129, 0.0009073019027709961, 0.0009543299674987793, 0.0010013580322265625, 0.0010483860969543457, 0.001095414161682129, 0.0011424422264099121, 0.0011894702911376953, 0.0012364983558654785, 0.0012835264205932617, 0.001330554485321045, 0.0013775825500488281, 0.0014246106147766113, 0.0014716386795043945, 0.0015186667442321777, 0.001565694808959961, 0.0016127228736877441, 0.0016597509384155273, 0.0017067790031433105, 0.0017538070678710938]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 5.0, 7.0, 6.0, 8.0, 13.0, 15.0, 9.0, 21.0, 33.0, 29.0, 42.0, 73.0, 108.0, 226.0, 662.0, 15762.0, 1029120.0, 1533.0, 378.0, 158.0, 88.0, 70.0, 43.0, 35.0, 32.0, 23.0, 10.0, 7.0, 7.0, 5.0, 8.0, 5.0, 5.0, 6.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040985107421875, -0.03988528251647949, -0.038785457611083984, -0.03768563270568848, -0.03658580780029297, -0.03548598289489746, -0.03438615798950195, -0.033286333084106445, -0.03218650817871094, -0.03108668327331543, -0.029986858367919922, -0.028887033462524414, -0.027787208557128906, -0.0266873836517334, -0.02558755874633789, -0.024487733840942383, -0.023387908935546875, -0.022288084030151367, -0.02118825912475586, -0.02008843421936035, -0.018988609313964844, -0.017888784408569336, -0.016788959503173828, -0.01568913459777832, -0.014589309692382812, -0.013489484786987305, -0.012389659881591797, -0.011289834976196289, -0.010190010070800781, -0.009090185165405273, -0.007990360260009766, -0.006890535354614258, -0.00579071044921875, -0.004690885543823242, -0.0035910606384277344, -0.0024912357330322266, -0.0013914108276367188, -0.00029158592224121094, 0.0008082389831542969, 0.0019080638885498047, 0.0030078887939453125, 0.00410771369934082, 0.005207538604736328, 0.006307363510131836, 0.007407188415527344, 0.008507013320922852, 0.00960683822631836, 0.010706663131713867, 0.011806488037109375, 0.012906312942504883, 0.01400613784790039, 0.015105962753295898, 0.016205787658691406, 0.017305612564086914, 0.018405437469482422, 0.01950526237487793, 0.020605087280273438, 0.021704912185668945, 0.022804737091064453, 0.02390456199645996, 0.02500438690185547, 0.026104211807250977, 0.027204036712646484, 0.028303861618041992, 0.0294036865234375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 9.0, 18.0, 55.0, 110.0, 190.0, 238.0, 213.0, 118.0, 29.0, 18.0, 3.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001144057372584939, -0.0011051417095586658, -0.0010662261629477143, -0.001027310499921441, -0.0009883948368951678, -0.0009494792320765555, -0.0009105636272579432, -0.0008716479642316699, -0.0008327323594130576, -0.0007938167545944452, -0.000754901091568172, -0.0007159854867495596, -0.0006770698819309473, -0.000638154218904674, -0.0005992386140860617, -0.0005603230092674494, -0.0005214073462411761, -0.00048249171231873333, -0.00044357607839629054, -0.0004046604735776782, -0.0003657448396552354, -0.0003268292057327926, -0.0002879136009141803, -0.0002489979669917375, -0.0002100823330692947, -0.0001711666991468519, -0.00013225107977632433, -9.333545312983915e-05, -5.441982648335397e-05, -1.550419256091118e-05, 2.3411426809616387e-05, 6.232704618014395e-05, 0.00010124279651790857, 0.00014015843044035137, 0.00017907404981087893, 0.0002179896691814065, 0.0002569053031038493, 0.0002958209370262921, 0.0003347365418449044, 0.0003736521757673472, 0.00041256780968979, 0.0004514834436122328, 0.0004903990775346756, 0.0005293146823532879, 0.0005682302871719003, 0.0006071459501981735, 0.0006460615550167859, 0.0006849771598353982, 0.0007238928228616714, 0.0007628084276802838, 0.000801724090706557, 0.0008406396955251694, 0.0008795553585514426, 0.000918470963370055, 0.0009573865681886673, 0.0009963022312149405, 0.0010352178942412138, 0.001074133557267487, 0.0011130491038784385, 0.0011519647669047117, 0.001190880429930985, 0.0012297960929572582, 0.0012687116395682096, 0.001307627302594483, 0.0013465428492054343]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 6.0, 3.0, 7.0, 7.0, 13.0, 13.0, 14.0, 12.0, 13.0, 19.0, 16.0, 11.0, 22.0, 23.0, 33.0, 29.0, 37.0, 40.0, 41.0, 34.0, 39.0, 40.0, 45.0, 41.0, 45.0, 46.0, 49.0, 30.0, 29.0, 28.0, 24.0, 22.0, 28.0, 25.0, 15.0, 16.0, 14.0, 18.0, 11.0, 12.0, 11.0, 6.0, 5.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005917549133300781, -0.0005721943452954292, -0.0005526337772607803, -0.0005330732092261314, -0.0005135126411914825, -0.0004939520731568336, -0.00047439150512218475, -0.00045483093708753586, -0.00043527036905288696, -0.00041570980101823807, -0.00039614923298358917, -0.0003765886649489403, -0.0003570280969142914, -0.0003374675288796425, -0.0003179069608449936, -0.0002983463928103447, -0.0002787858247756958, -0.0002592252567410469, -0.000239664688706398, -0.00022010412067174911, -0.00020054355263710022, -0.00018098298460245132, -0.00016142241656780243, -0.00014186184853315353, -0.00012230128049850464, -0.00010274071246385574, -8.318014442920685e-05, -6.361957639455795e-05, -4.405900835990906e-05, -2.4498440325260162e-05, -4.937872290611267e-06, 1.4622695744037628e-05, 3.4183263778686523e-05, 5.374383181333542e-05, 7.330439984798431e-05, 9.286496788263321e-05, 0.0001124255359172821, 0.000131986103951931, 0.0001515466719865799, 0.0001711072400212288, 0.00019066780805587769, 0.00021022837609052658, 0.00022978894412517548, 0.00024934951215982437, 0.00026891008019447327, 0.00028847064822912216, 0.00030803121626377106, 0.00032759178429841995, 0.00034715235233306885, 0.00036671292036771774, 0.00038627348840236664, 0.00040583405643701553, 0.00042539462447166443, 0.0004449551925063133, 0.0004645157605409622, 0.0004840763285756111, 0.00050363689661026, 0.0005231974646449089, 0.0005427580326795578, 0.0005623186007142067, 0.0005818791687488556, 0.0006014397367835045, 0.0006210003048181534, 0.0006405608728528023, 0.0006601214408874512]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 9.0, 13.0, 13.0, 13.0, 16.0, 16.0, 31.0, 20.0, 23.0, 31.0, 39.0, 41.0, 31.0, 38.0, 42.0, 37.0, 32.0, 45.0, 50.0, 52.0, 39.0, 44.0, 39.0, 45.0, 27.0, 32.0, 27.0, 27.0, 30.0, 10.0, 16.0, 15.0, 10.0, 4.0, 8.0, 9.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.4921875, -12.146240234375, -11.80029296875, -11.454345703125, -11.1083984375, -10.762451171875, -10.41650390625, -10.070556640625, -9.724609375, -9.378662109375, -9.03271484375, -8.686767578125, -8.3408203125, -7.994873046875, -7.64892578125, -7.302978515625, -6.95703125, -6.611083984375, -6.26513671875, -5.919189453125, -5.5732421875, -5.227294921875, -4.88134765625, -4.535400390625, -4.189453125, -3.843505859375, -3.49755859375, -3.151611328125, -2.8056640625, -2.459716796875, -2.11376953125, -1.767822265625, -1.421875, -1.075927734375, -0.72998046875, -0.384033203125, -0.0380859375, 0.307861328125, 0.65380859375, 0.999755859375, 1.345703125, 1.691650390625, 2.03759765625, 2.383544921875, 2.7294921875, 3.075439453125, 3.42138671875, 3.767333984375, 4.11328125, 4.459228515625, 4.80517578125, 5.151123046875, 5.4970703125, 5.843017578125, 6.18896484375, 6.534912109375, 6.880859375, 7.226806640625, 7.57275390625, 7.918701171875, 8.2646484375, 8.610595703125, 8.95654296875, 9.302490234375, 9.6484375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 5.0, 10.0, 20.0, 6.0, 18.0, 36.0, 26.0, 63.0, 102.0, 216.0, 490.0, 1481.0, 4413.0, 16351.0, 66053.0, 385260.0, 467912.0, 79090.0, 18962.0, 5324.0, 1584.0, 582.0, 241.0, 105.0, 61.0, 42.0, 31.0, 21.0, 17.0, 11.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0], "bins": [-13.7421875, -13.42303466796875, -13.1038818359375, -12.78472900390625, -12.465576171875, -12.14642333984375, -11.8272705078125, -11.50811767578125, -11.18896484375, -10.86981201171875, -10.5506591796875, -10.23150634765625, -9.912353515625, -9.59320068359375, -9.2740478515625, -8.95489501953125, -8.6357421875, -8.31658935546875, -7.9974365234375, -7.67828369140625, -7.359130859375, -7.03997802734375, -6.7208251953125, -6.40167236328125, -6.08251953125, -5.76336669921875, -5.4442138671875, -5.12506103515625, -4.805908203125, -4.48675537109375, -4.1676025390625, -3.84844970703125, -3.529296875, -3.21014404296875, -2.8909912109375, -2.57183837890625, -2.252685546875, -1.93353271484375, -1.6143798828125, -1.29522705078125, -0.97607421875, -0.65692138671875, -0.3377685546875, -0.01861572265625, 0.300537109375, 0.61968994140625, 0.9388427734375, 1.25799560546875, 1.5771484375, 1.89630126953125, 2.2154541015625, 2.53460693359375, 2.853759765625, 3.17291259765625, 3.4920654296875, 3.81121826171875, 4.13037109375, 4.44952392578125, 4.7686767578125, 5.08782958984375, 5.406982421875, 5.72613525390625, 6.0452880859375, 6.36444091796875, 6.68359375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 10.0, 9.0, 9.0, 13.0, 26.0, 23.0, 26.0, 28.0, 38.0, 45.0, 48.0, 67.0, 60.0, 134.0, 1885.0, 137.0, 71.0, 70.0, 48.0, 40.0, 37.0, 40.0, 34.0, 35.0, 24.0, 24.0, 11.0, 20.0, 0.0, 9.0, 3.0, 4.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.90625, -42.515625, -41.125, -39.734375, -38.34375, -36.953125, -35.5625, -34.171875, -32.78125, -31.390625, -30.0, -28.609375, -27.21875, -25.828125, -24.4375, -23.046875, -21.65625, -20.265625, -18.875, -17.484375, -16.09375, -14.703125, -13.3125, -11.921875, -10.53125, -9.140625, -7.75, -6.359375, -4.96875, -3.578125, -2.1875, -0.796875, 0.59375, 1.984375, 3.375, 4.765625, 6.15625, 7.546875, 8.9375, 10.328125, 11.71875, 13.109375, 14.5, 15.890625, 17.28125, 18.671875, 20.0625, 21.453125, 22.84375, 24.234375, 25.625, 27.015625, 28.40625, 29.796875, 31.1875, 32.578125, 33.96875, 35.359375, 36.75, 38.140625, 39.53125, 40.921875, 42.3125, 43.703125, 45.09375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 5.0, 5.0, 7.0, 4.0, 19.0, 15.0, 30.0, 43.0, 53.0, 71.0, 91.0, 119.0, 187.0, 252.0, 405.0, 1277.0, 2772244.0, 368688.0, 1045.0, 350.0, 239.0, 164.0, 96.0, 82.0, 53.0, 36.0, 39.0, 20.0, 17.0, 11.0, 12.0, 7.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-118.6875, -115.19140625, -111.6953125, -108.19921875, -104.703125, -101.20703125, -97.7109375, -94.21484375, -90.71875, -87.22265625, -83.7265625, -80.23046875, -76.734375, -73.23828125, -69.7421875, -66.24609375, -62.75, -59.25390625, -55.7578125, -52.26171875, -48.765625, -45.26953125, -41.7734375, -38.27734375, -34.78125, -31.28515625, -27.7890625, -24.29296875, -20.796875, -17.30078125, -13.8046875, -10.30859375, -6.8125, -3.31640625, 0.1796875, 3.67578125, 7.171875, 10.66796875, 14.1640625, 17.66015625, 21.15625, 24.65234375, 28.1484375, 31.64453125, 35.140625, 38.63671875, 42.1328125, 45.62890625, 49.125, 52.62109375, 56.1171875, 59.61328125, 63.109375, 66.60546875, 70.1015625, 73.59765625, 77.09375, 80.58984375, 84.0859375, 87.58203125, 91.078125, 94.57421875, 98.0703125, 101.56640625, 105.0625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 940.0, 71.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-582.8887939453125, -572.5997924804688, -562.310791015625, -552.0217895507812, -541.7327880859375, -531.4437866210938, -521.15478515625, -510.8657531738281, -500.5767517089844, -490.2877502441406, -479.9987487792969, -469.7097473144531, -459.4207458496094, -449.1317138671875, -438.84271240234375, -428.5537109375, -418.26470947265625, -407.9757080078125, -397.68670654296875, -387.397705078125, -377.10870361328125, -366.8197021484375, -356.53070068359375, -346.2416687011719, -335.95269775390625, -325.6636962890625, -315.37469482421875, -305.085693359375, -294.79669189453125, -284.5076904296875, -274.21868896484375, -263.9296569824219, -253.64065551757812, -243.35165405273438, -233.06265258789062, -222.77365112304688, -212.48463439941406, -202.1956329345703, -191.90663146972656, -181.61761474609375, -171.32862854003906, -161.0396270751953, -150.75062561035156, -140.46160888671875, -130.172607421875, -119.88360595703125, -109.5946044921875, -99.30559539794922, -89.01659393310547, -78.72759246826172, -68.43858337402344, -58.14958190917969, -47.86057662963867, -37.571571350097656, -27.282569885253906, -16.993560791015625, -6.704559326171875, 3.584444999694824, 13.873449325561523, 24.162452697753906, 34.45145797729492, 44.74046325683594, 55.02946472167969, 65.31847381591797, 75.60747528076172]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 5.0, 6.0, 6.0, 7.0, 9.0, 10.0, 19.0, 17.0, 13.0, 16.0, 18.0, 22.0, 29.0, 24.0, 30.0, 47.0, 33.0, 38.0, 32.0, 37.0, 36.0, 38.0, 30.0, 48.0, 44.0, 49.0, 32.0, 35.0, 29.0, 29.0, 32.0, 31.0, 15.0, 19.0, 19.0, 22.0, 14.0, 12.0, 10.0, 5.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-96.1603775024414, -93.10614013671875, -90.0519027709961, -86.99766540527344, -83.94342041015625, -80.8891830444336, -77.83494567871094, -74.78070831298828, -71.72647094726562, -68.67223358154297, -65.61799621582031, -62.56375503540039, -59.509517669677734, -56.45527648925781, -53.401039123535156, -50.3468017578125, -47.29256057739258, -44.23832321166992, -41.18408203125, -38.129844665527344, -35.07560729980469, -32.02136993408203, -28.96712875366211, -25.912891387939453, -22.858652114868164, -19.804412841796875, -16.75017547607422, -13.69593620300293, -10.641697883605957, -7.587459564208984, -4.533220291137695, -1.478982925415039, 1.57525634765625, 4.629494667053223, 7.6837334632873535, 10.737972259521484, 13.792210578918457, 16.84644889831543, 19.90068817138672, 22.954925537109375, 26.009164810180664, 29.063404083251953, 32.11764144897461, 35.17188262939453, 38.22611999511719, 41.280357360839844, 44.3345947265625, 47.388832092285156, 50.44307327270508, 53.497310638427734, 56.551551818847656, 59.60578918457031, 62.66002655029297, 65.71426391601562, 68.76850891113281, 71.82273864746094, 74.87698364257812, 77.93122100830078, 80.98545837402344, 84.03970336914062, 87.09394073486328, 90.14817810058594, 93.2024154663086, 96.25665283203125, 99.3108901977539]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 6.0, 2.0, 4.0, 5.0, 3.0, 8.0, 9.0, 10.0, 16.0, 17.0, 9.0, 21.0, 22.0, 31.0, 19.0, 32.0, 32.0, 31.0, 39.0, 33.0, 45.0, 38.0, 33.0, 29.0, 53.0, 54.0, 50.0, 33.0, 38.0, 32.0, 32.0, 34.0, 32.0, 33.0, 20.0, 23.0, 11.0, 9.0, 17.0, 12.0, 9.0, 9.0, 2.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.5703125, -12.2254638671875, -11.880615234375, -11.5357666015625, -11.19091796875, -10.8460693359375, -10.501220703125, -10.1563720703125, -9.8115234375, -9.4666748046875, -9.121826171875, -8.7769775390625, -8.43212890625, -8.0872802734375, -7.742431640625, -7.3975830078125, -7.052734375, -6.7078857421875, -6.363037109375, -6.0181884765625, -5.67333984375, -5.3284912109375, -4.983642578125, -4.6387939453125, -4.2939453125, -3.9490966796875, -3.604248046875, -3.2593994140625, -2.91455078125, -2.5697021484375, -2.224853515625, -1.8800048828125, -1.53515625, -1.1903076171875, -0.845458984375, -0.5006103515625, -0.15576171875, 0.1890869140625, 0.533935546875, 0.8787841796875, 1.2236328125, 1.5684814453125, 1.913330078125, 2.2581787109375, 2.60302734375, 2.9478759765625, 3.292724609375, 3.6375732421875, 3.982421875, 4.3272705078125, 4.672119140625, 5.0169677734375, 5.36181640625, 5.7066650390625, 6.051513671875, 6.3963623046875, 6.7412109375, 7.0860595703125, 7.430908203125, 7.7757568359375, 8.12060546875, 8.4654541015625, 8.810302734375, 9.1551513671875, 9.5]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 7.0, 10.0, 9.0, 7.0, 14.0, 14.0, 17.0, 17.0, 19.0, 25.0, 33.0, 48.0, 44.0, 69.0, 137.0, 257.0, 619.0, 1680.0, 11074.0, 936725.0, 3170821.0, 67487.0, 3311.0, 945.0, 363.0, 151.0, 78.0, 50.0, 44.0, 40.0, 21.0, 28.0, 26.0, 25.0, 12.0, 12.0, 8.0, 5.0, 12.0, 5.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-42.03125, -40.87109375, -39.7109375, -38.55078125, -37.390625, -36.23046875, -35.0703125, -33.91015625, -32.75, -31.58984375, -30.4296875, -29.26953125, -28.109375, -26.94921875, -25.7890625, -24.62890625, -23.46875, -22.30859375, -21.1484375, -19.98828125, -18.828125, -17.66796875, -16.5078125, -15.34765625, -14.1875, -13.02734375, -11.8671875, -10.70703125, -9.546875, -8.38671875, -7.2265625, -6.06640625, -4.90625, -3.74609375, -2.5859375, -1.42578125, -0.265625, 0.89453125, 2.0546875, 3.21484375, 4.375, 5.53515625, 6.6953125, 7.85546875, 9.015625, 10.17578125, 11.3359375, 12.49609375, 13.65625, 14.81640625, 15.9765625, 17.13671875, 18.296875, 19.45703125, 20.6171875, 21.77734375, 22.9375, 24.09765625, 25.2578125, 26.41796875, 27.578125, 28.73828125, 29.8984375, 31.05859375, 32.21875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 1.0, 6.0, 7.0, 8.0, 19.0, 23.0, 47.0, 32.0, 54.0, 60.0, 110.0, 146.0, 193.0, 358.0, 491.0, 599.0, 547.0, 433.0, 267.0, 188.0, 133.0, 89.0, 70.0, 50.0, 42.0, 35.0, 17.0, 14.0, 6.0, 7.0, 3.0, 4.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.484375, -22.845703125, -22.20703125, -21.568359375, -20.9296875, -20.291015625, -19.65234375, -19.013671875, -18.375, -17.736328125, -17.09765625, -16.458984375, -15.8203125, -15.181640625, -14.54296875, -13.904296875, -13.265625, -12.626953125, -11.98828125, -11.349609375, -10.7109375, -10.072265625, -9.43359375, -8.794921875, -8.15625, -7.517578125, -6.87890625, -6.240234375, -5.6015625, -4.962890625, -4.32421875, -3.685546875, -3.046875, -2.408203125, -1.76953125, -1.130859375, -0.4921875, 0.146484375, 0.78515625, 1.423828125, 2.0625, 2.701171875, 3.33984375, 3.978515625, 4.6171875, 5.255859375, 5.89453125, 6.533203125, 7.171875, 7.810546875, 8.44921875, 9.087890625, 9.7265625, 10.365234375, 11.00390625, 11.642578125, 12.28125, 12.919921875, 13.55859375, 14.197265625, 14.8359375, 15.474609375, 16.11328125, 16.751953125, 17.390625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 10.0, 7.0, 10.0, 21.0, 36.0, 44.0, 50.0, 66.0, 110.0, 154.0, 184.0, 257.0, 428.0, 937.0, 26502.0, 4158448.0, 5124.0, 683.0, 357.0, 209.0, 167.0, 117.0, 107.0, 70.0, 48.0, 43.0, 28.0, 14.0, 12.0, 11.0, 11.0, 11.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-145.125, -141.2421875, -137.359375, -133.4765625, -129.59375, -125.7109375, -121.828125, -117.9453125, -114.0625, -110.1796875, -106.296875, -102.4140625, -98.53125, -94.6484375, -90.765625, -86.8828125, -83.0, -79.1171875, -75.234375, -71.3515625, -67.46875, -63.5859375, -59.703125, -55.8203125, -51.9375, -48.0546875, -44.171875, -40.2890625, -36.40625, -32.5234375, -28.640625, -24.7578125, -20.875, -16.9921875, -13.109375, -9.2265625, -5.34375, -1.4609375, 2.421875, 6.3046875, 10.1875, 14.0703125, 17.953125, 21.8359375, 25.71875, 29.6015625, 33.484375, 37.3671875, 41.25, 45.1328125, 49.015625, 52.8984375, 56.78125, 60.6640625, 64.546875, 68.4296875, 72.3125, 76.1953125, 80.078125, 83.9609375, 87.84375, 91.7265625, 95.609375, 99.4921875, 103.375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 56.0, 463.0, 450.0, 45.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-488.7304382324219, -478.0940856933594, -467.4577331542969, -456.8213806152344, -446.18505859375, -435.5487060546875, -424.912353515625, -414.2760009765625, -403.6396484375, -393.0032958984375, -382.366943359375, -371.7305908203125, -361.09423828125, -350.4579162597656, -339.8215637207031, -329.1852111816406, -318.5488586425781, -307.9125061035156, -297.2761535644531, -286.6398010253906, -276.00347900390625, -265.36712646484375, -254.73077392578125, -244.09442138671875, -233.45806884765625, -222.82171630859375, -212.18536376953125, -201.5490264892578, -190.9126739501953, -180.2763214111328, -169.63998413085938, -159.00363159179688, -148.3672637939453, -137.7309112548828, -127.09456634521484, -116.45822143554688, -105.82186889648438, -95.18551635742188, -84.5491714477539, -73.91282653808594, -63.27647399902344, -52.6401252746582, -42.00377655029297, -31.367427825927734, -20.7310791015625, -10.094730377197266, 0.5416183471679688, 11.177963256835938, 21.814315795898438, 32.45066452026367, 43.087013244628906, 53.72336196899414, 64.35971069335938, 74.99606323242188, 85.63240814208984, 96.26875305175781, 106.90510559082031, 117.54145812988281, 128.17779541015625, 138.81414794921875, 149.45050048828125, 160.08685302734375, 170.72320556640625, 181.3595428466797, 191.9958953857422]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 7.0, 5.0, 5.0, 12.0, 5.0, 7.0, 15.0, 12.0, 15.0, 19.0, 25.0, 29.0, 29.0, 29.0, 39.0, 35.0, 37.0, 48.0, 40.0, 45.0, 39.0, 37.0, 38.0, 49.0, 44.0, 35.0, 40.0, 36.0, 28.0, 31.0, 32.0, 26.0, 19.0, 15.0, 9.0, 8.0, 12.0, 13.0, 8.0, 8.0, 4.0, 1.0, 1.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-60.716278076171875, -58.83168029785156, -56.947086334228516, -55.0624885559082, -53.177894592285156, -51.293296813964844, -49.4087028503418, -47.524105072021484, -45.63951110839844, -43.754913330078125, -41.87031936645508, -39.985721588134766, -38.10112762451172, -36.216529846191406, -34.33193588256836, -32.44733810424805, -30.562742233276367, -28.678146362304688, -26.793550491333008, -24.908954620361328, -23.02435874938965, -21.13976287841797, -19.255165100097656, -17.37057113647461, -15.485974311828613, -13.601378440856934, -11.716782569885254, -9.832185745239258, -7.947590351104736, -6.062994003295898, -4.178398132324219, -2.293802261352539, -0.4092063903808594, 1.4753895998001099, 3.359985589981079, 5.244581699371338, 7.129177570343018, 9.013773918151855, 10.898369789123535, 12.782965660095215, 14.667561531066895, 16.55215835571289, 18.43675422668457, 20.32135009765625, 22.20594596862793, 24.09054183959961, 25.97513771057129, 27.85973358154297, 29.74432945251465, 31.628925323486328, 33.51352310180664, 35.39811706542969, 37.28271484375, 39.16730880737305, 41.05190658569336, 42.936500549316406, 44.82109832763672, 46.70569610595703, 48.59029006958008, 50.47488784790039, 52.35948181152344, 54.24407958984375, 56.1286735534668, 58.01327133178711, 59.897865295410156]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 1.0, 11.0, 8.0, 12.0, 14.0, 9.0, 16.0, 15.0, 21.0, 20.0, 32.0, 24.0, 31.0, 34.0, 37.0, 37.0, 33.0, 34.0, 39.0, 46.0, 37.0, 43.0, 52.0, 54.0, 29.0, 44.0, 32.0, 32.0, 23.0, 35.0, 20.0, 24.0, 14.0, 24.0, 14.0, 9.0, 5.0, 5.0, 9.0, 8.0, 5.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.15625, -10.8189697265625, -10.481689453125, -10.1444091796875, -9.80712890625, -9.4698486328125, -9.132568359375, -8.7952880859375, -8.4580078125, -8.1207275390625, -7.783447265625, -7.4461669921875, -7.10888671875, -6.7716064453125, -6.434326171875, -6.0970458984375, -5.759765625, -5.4224853515625, -5.085205078125, -4.7479248046875, -4.41064453125, -4.0733642578125, -3.736083984375, -3.3988037109375, -3.0615234375, -2.7242431640625, -2.386962890625, -2.0496826171875, -1.71240234375, -1.3751220703125, -1.037841796875, -0.7005615234375, -0.36328125, -0.0260009765625, 0.311279296875, 0.6485595703125, 0.98583984375, 1.3231201171875, 1.660400390625, 1.9976806640625, 2.3349609375, 2.6722412109375, 3.009521484375, 3.3468017578125, 3.68408203125, 4.0213623046875, 4.358642578125, 4.6959228515625, 5.033203125, 5.3704833984375, 5.707763671875, 6.0450439453125, 6.38232421875, 6.7196044921875, 7.056884765625, 7.3941650390625, 7.7314453125, 8.0687255859375, 8.406005859375, 8.7432861328125, 9.08056640625, 9.4178466796875, 9.755126953125, 10.0924072265625, 10.4296875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 4.0, 8.0, 13.0, 8.0, 7.0, 23.0, 44.0, 50.0, 71.0, 100.0, 168.0, 267.0, 386.0, 662.0, 1019.0, 1667.0, 2650.0, 4316.0, 6817.0, 11599.0, 19011.0, 32455.0, 56827.0, 107048.0, 266630.0, 283720.0, 111179.0, 58376.0, 33242.0, 19624.0, 11764.0, 7098.0, 4412.0, 2687.0, 1691.0, 1080.0, 633.0, 419.0, 285.0, 150.0, 118.0, 81.0, 51.0, 25.0, 28.0, 19.0, 12.0, 6.0, 2.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.423828125, -2.350433349609375, -2.27703857421875, -2.203643798828125, -2.1302490234375, -2.056854248046875, -1.98345947265625, -1.910064697265625, -1.836669921875, -1.763275146484375, -1.68988037109375, -1.616485595703125, -1.5430908203125, -1.469696044921875, -1.39630126953125, -1.322906494140625, -1.24951171875, -1.176116943359375, -1.10272216796875, -1.029327392578125, -0.9559326171875, -0.882537841796875, -0.80914306640625, -0.735748291015625, -0.662353515625, -0.588958740234375, -0.51556396484375, -0.442169189453125, -0.3687744140625, -0.295379638671875, -0.22198486328125, -0.148590087890625, -0.0751953125, -0.001800537109375, 0.07159423828125, 0.144989013671875, 0.2183837890625, 0.291778564453125, 0.36517333984375, 0.438568115234375, 0.511962890625, 0.585357666015625, 0.65875244140625, 0.732147216796875, 0.8055419921875, 0.878936767578125, 0.95233154296875, 1.025726318359375, 1.09912109375, 1.172515869140625, 1.24591064453125, 1.319305419921875, 1.3927001953125, 1.466094970703125, 1.53948974609375, 1.612884521484375, 1.686279296875, 1.759674072265625, 1.83306884765625, 1.906463623046875, 1.9798583984375, 2.053253173828125, 2.12664794921875, 2.200042724609375, 2.2734375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 6.0, 6.0, 5.0, 4.0, 10.0, 11.0, 13.0, 11.0, 16.0, 16.0, 29.0, 29.0, 30.0, 37.0, 27.0, 33.0, 33.0, 34.0, 45.0, 47.0, 1066.0, 52.0, 52.0, 56.0, 37.0, 36.0, 39.0, 32.0, 33.0, 35.0, 23.0, 27.0, 17.0, 18.0, 12.0, 10.0, 15.0, 9.0, 8.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.16015625, -6.93499755859375, -6.7098388671875, -6.48468017578125, -6.259521484375, -6.03436279296875, -5.8092041015625, -5.58404541015625, -5.35888671875, -5.13372802734375, -4.9085693359375, -4.68341064453125, -4.458251953125, -4.23309326171875, -4.0079345703125, -3.78277587890625, -3.5576171875, -3.33245849609375, -3.1072998046875, -2.88214111328125, -2.656982421875, -2.43182373046875, -2.2066650390625, -1.98150634765625, -1.75634765625, -1.53118896484375, -1.3060302734375, -1.08087158203125, -0.855712890625, -0.63055419921875, -0.4053955078125, -0.18023681640625, 0.044921875, 0.27008056640625, 0.4952392578125, 0.72039794921875, 0.945556640625, 1.17071533203125, 1.3958740234375, 1.62103271484375, 1.84619140625, 2.07135009765625, 2.2965087890625, 2.52166748046875, 2.746826171875, 2.97198486328125, 3.1971435546875, 3.42230224609375, 3.6474609375, 3.87261962890625, 4.0977783203125, 4.32293701171875, 4.548095703125, 4.77325439453125, 4.9984130859375, 5.22357177734375, 5.44873046875, 5.67388916015625, 5.8990478515625, 6.12420654296875, 6.349365234375, 6.57452392578125, 6.7996826171875, 7.02484130859375, 7.25]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 2.0, 8.0, 16.0, 10.0, 15.0, 23.0, 45.0, 70.0, 117.0, 145.0, 212.0, 330.0, 481.0, 726.0, 1129.0, 1827.0, 2997.0, 4568.0, 7390.0, 11829.0, 19234.0, 31479.0, 52726.0, 95184.0, 236532.0, 1366461.0, 112036.0, 59221.0, 35282.0, 21533.0, 13255.0, 8041.0, 5093.0, 3189.0, 2093.0, 1316.0, 848.0, 504.0, 354.0, 281.0, 146.0, 130.0, 86.0, 55.0, 32.0, 27.0, 15.0, 12.0, 11.0, 6.0, 1.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0], "bins": [-2.177734375, -2.10992431640625, -2.0421142578125, -1.97430419921875, -1.906494140625, -1.83868408203125, -1.7708740234375, -1.70306396484375, -1.63525390625, -1.56744384765625, -1.4996337890625, -1.43182373046875, -1.364013671875, -1.29620361328125, -1.2283935546875, -1.16058349609375, -1.0927734375, -1.02496337890625, -0.9571533203125, -0.88934326171875, -0.821533203125, -0.75372314453125, -0.6859130859375, -0.61810302734375, -0.55029296875, -0.48248291015625, -0.4146728515625, -0.34686279296875, -0.279052734375, -0.21124267578125, -0.1434326171875, -0.07562255859375, -0.0078125, 0.05999755859375, 0.1278076171875, 0.19561767578125, 0.263427734375, 0.33123779296875, 0.3990478515625, 0.46685791015625, 0.53466796875, 0.60247802734375, 0.6702880859375, 0.73809814453125, 0.805908203125, 0.87371826171875, 0.9415283203125, 1.00933837890625, 1.0771484375, 1.14495849609375, 1.2127685546875, 1.28057861328125, 1.348388671875, 1.41619873046875, 1.4840087890625, 1.55181884765625, 1.61962890625, 1.68743896484375, 1.7552490234375, 1.82305908203125, 1.890869140625, 1.95867919921875, 2.0264892578125, 2.09429931640625, 2.162109375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 10.0, 12.0, 11.0, 14.0, 26.0, 42.0, 45.0, 55.0, 76.0, 69.0, 98.0, 104.0, 106.0, 72.0, 59.0, 58.0, 37.0, 25.0, 19.0, 14.0, 8.0, 5.0, 5.0, 7.0, 5.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013370513916015625, -0.0012881606817245483, -0.0012392699718475342, -0.00119037926197052, -0.0011414885520935059, -0.0010925978422164917, -0.0010437071323394775, -0.0009948164224624634, -0.0009459257125854492, -0.0008970350027084351, -0.0008481442928314209, -0.0007992535829544067, -0.0007503628730773926, -0.0007014721632003784, -0.0006525814533233643, -0.0006036907434463501, -0.0005548000335693359, -0.0005059093236923218, -0.0004570186138153076, -0.00040812790393829346, -0.0003592371940612793, -0.00031034648418426514, -0.000261455774307251, -0.00021256506443023682, -0.00016367435455322266, -0.0001147836446762085, -6.589293479919434e-05, -1.7002224922180176e-05, 3.1888484954833984e-05, 8.077919483184814e-05, 0.0001296699047088623, 0.00017856061458587646, 0.00022745132446289062, 0.0002763420343399048, 0.00032523274421691895, 0.0003741234540939331, 0.00042301416397094727, 0.0004719048738479614, 0.0005207955837249756, 0.0005696862936019897, 0.0006185770034790039, 0.0006674677133560181, 0.0007163584232330322, 0.0007652491331100464, 0.0008141398429870605, 0.0008630305528640747, 0.0009119212627410889, 0.000960811972618103, 0.0010097026824951172, 0.0010585933923721313, 0.0011074841022491455, 0.0011563748121261597, 0.0012052655220031738, 0.001254156231880188, 0.0013030469417572021, 0.0013519376516342163, 0.0014008283615112305, 0.0014497190713882446, 0.0014986097812652588, 0.001547500491142273, 0.0015963912010192871, 0.0016452819108963013, 0.0016941726207733154, 0.0017430633306503296, 0.0017919540405273438]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 4.0, 6.0, 8.0, 4.0, 7.0, 19.0, 25.0, 38.0, 55.0, 113.0, 153.0, 407.0, 3032.0, 1042206.0, 1676.0, 344.0, 174.0, 89.0, 50.0, 41.0, 32.0, 18.0, 16.0, 12.0, 8.0, 5.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.045074462890625, -0.04383659362792969, -0.042598724365234375, -0.04136085510253906, -0.04012298583984375, -0.03888511657714844, -0.037647247314453125, -0.03640937805175781, -0.0351715087890625, -0.03393363952636719, -0.032695770263671875, -0.03145790100097656, -0.03022003173828125, -0.028982162475585938, -0.027744293212890625, -0.026506423950195312, -0.0252685546875, -0.024030685424804688, -0.022792816162109375, -0.021554946899414062, -0.02031707763671875, -0.019079208374023438, -0.017841339111328125, -0.016603469848632812, -0.0153656005859375, -0.014127731323242188, -0.012889862060546875, -0.011651992797851562, -0.01041412353515625, -0.009176254272460938, -0.007938385009765625, -0.0067005157470703125, -0.005462646484375, -0.0042247772216796875, -0.002986907958984375, -0.0017490386962890625, -0.00051116943359375, 0.0007266998291015625, 0.001964569091796875, 0.0032024383544921875, 0.0044403076171875, 0.0056781768798828125, 0.006916046142578125, 0.008153915405273438, 0.00939178466796875, 0.010629653930664062, 0.011867523193359375, 0.013105392456054688, 0.01434326171875, 0.015581130981445312, 0.016819000244140625, 0.018056869506835938, 0.01929473876953125, 0.020532608032226562, 0.021770477294921875, 0.023008346557617188, 0.0242462158203125, 0.025484085083007812, 0.026721954345703125, 0.027959823608398438, 0.02919769287109375, 0.030435562133789062, 0.031673431396484375, 0.03291130065917969, 0.034149169921875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 8.0, 21.0, 47.0, 143.0, 244.0, 297.0, 171.0, 61.0, 17.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020674681290984154, -0.0020226251799613237, -0.001977782230824232, -0.0019329393981024623, -0.0018880964489653707, -0.0018432536162436008, -0.0017984106671065092, -0.0017535677179694176, -0.001708724768832326, -0.0016638818196952343, -0.0016190389869734645, -0.0015741960378363729, -0.0015293530886992812, -0.0014845102559775114, -0.0014396673068404198, -0.0013948243577033281, -0.0013499815249815583, -0.0013051385758444667, -0.0012602957431226969, -0.0012154527939856052, -0.0011706098448485136, -0.001125766895711422, -0.0010809240629896522, -0.0010360811138525605, -0.0009912382811307907, -0.00094639539020136, -0.0009015524410642684, -0.0008567095501348376, -0.000811866600997746, -0.0007670237100683153, -0.0007221808191388845, -0.0006773378700017929, -0.0006324950372800231, -0.0005876521463505924, -0.0005428091972135007, -0.00049796630628407, -0.00045312338625080884, -0.00040828046621754766, -0.00036343757528811693, -0.00031859465525485575, -0.00027375173522159457, -0.0002289088151883334, -0.00018406590970698744, -0.0001392230042256415, -9.438008419238031e-05, -4.953716415911913e-05, -4.694273229688406e-06, 4.0148646803572774e-05, 8.499156683683395e-05, 0.00012983448687009513, 0.00017467739235144109, 0.00021952029783278704, 0.0002643632178660482, 0.0003092061378993094, 0.0003540490288287401, 0.0003988919488620013, 0.0004437348688952625, 0.0004885777598246932, 0.0005334207089617848, 0.0005782635998912156, 0.0006231064908206463, 0.0006679494399577379, 0.0007127923308871686, 0.0007576352218165994, 0.000802478170953691]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 5.0, 3.0, 3.0, 5.0, 9.0, 7.0, 9.0, 14.0, 22.0, 21.0, 29.0, 15.0, 24.0, 33.0, 37.0, 36.0, 39.0, 43.0, 33.0, 39.0, 44.0, 37.0, 30.0, 44.0, 44.0, 44.0, 47.0, 42.0, 40.0, 22.0, 34.0, 17.0, 30.0, 21.0, 9.0, 17.0, 13.0, 7.0, 8.0, 7.0, 12.0, 4.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005329251289367676, -0.000513705424964428, -0.0004944857209920883, -0.0004752660170197487, -0.00045604631304740906, -0.00043682660907506943, -0.0004176069051027298, -0.00039838720113039017, -0.00037916749715805054, -0.0003599477931857109, -0.0003407280892133713, -0.00032150838524103165, -0.000302288681268692, -0.0002830689772963524, -0.00026384927332401276, -0.0002446295693516731, -0.0002254098653793335, -0.00020619016140699387, -0.00018697045743465424, -0.0001677507534623146, -0.00014853104948997498, -0.00012931134551763535, -0.00011009164154529572, -9.087193757295609e-05, -7.165223360061646e-05, -5.2432529628276825e-05, -3.3212825655937195e-05, -1.3993121683597565e-05, 5.2265822887420654e-06, 2.4446286261081696e-05, 4.3665990233421326e-05, 6.288569420576096e-05, 8.210539817810059e-05, 0.00010132510215044022, 0.00012054480612277985, 0.00013976451009511948, 0.0001589842140674591, 0.00017820391803979874, 0.00019742362201213837, 0.000216643325984478, 0.00023586302995681763, 0.00025508273392915726, 0.0002743024379014969, 0.0002935221418738365, 0.00031274184584617615, 0.0003319615498185158, 0.0003511812537908554, 0.00037040095776319504, 0.00038962066173553467, 0.0004088403657078743, 0.00042806006968021393, 0.00044727977365255356, 0.0004664994776248932, 0.0004857191815972328, 0.0005049388855695724, 0.0005241585895419121, 0.0005433782935142517, 0.0005625979974865913, 0.000581817701458931, 0.0006010374054312706, 0.0006202571094036102, 0.0006394768133759499, 0.0006586965173482895, 0.0006779162213206291, 0.0006971359252929688]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 1.0, 11.0, 8.0, 12.0, 14.0, 9.0, 16.0, 15.0, 21.0, 20.0, 32.0, 24.0, 31.0, 34.0, 37.0, 37.0, 33.0, 34.0, 39.0, 46.0, 37.0, 43.0, 52.0, 54.0, 29.0, 44.0, 32.0, 32.0, 23.0, 35.0, 20.0, 24.0, 14.0, 24.0, 14.0, 9.0, 5.0, 5.0, 9.0, 8.0, 5.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.15625, -10.8189697265625, -10.481689453125, -10.1444091796875, -9.80712890625, -9.4698486328125, -9.132568359375, -8.7952880859375, -8.4580078125, -8.1207275390625, -7.783447265625, -7.4461669921875, -7.10888671875, -6.7716064453125, -6.434326171875, -6.0970458984375, -5.759765625, -5.4224853515625, -5.085205078125, -4.7479248046875, -4.41064453125, -4.0733642578125, -3.736083984375, -3.3988037109375, -3.0615234375, -2.7242431640625, -2.386962890625, -2.0496826171875, -1.71240234375, -1.3751220703125, -1.037841796875, -0.7005615234375, -0.36328125, -0.0260009765625, 0.311279296875, 0.6485595703125, 0.98583984375, 1.3231201171875, 1.660400390625, 1.9976806640625, 2.3349609375, 2.6722412109375, 3.009521484375, 3.3468017578125, 3.68408203125, 4.0213623046875, 4.358642578125, 4.6959228515625, 5.033203125, 5.3704833984375, 5.707763671875, 6.0450439453125, 6.38232421875, 6.7196044921875, 7.056884765625, 7.3941650390625, 7.7314453125, 8.0687255859375, 8.406005859375, 8.7432861328125, 9.08056640625, 9.4178466796875, 9.755126953125, 10.0924072265625, 10.4296875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 10.0, 12.0, 13.0, 22.0, 22.0, 32.0, 37.0, 57.0, 80.0, 85.0, 124.0, 162.0, 274.0, 475.0, 928.0, 2563.0, 8483.0, 33001.0, 144155.0, 597821.0, 199754.0, 43629.0, 10972.0, 3166.0, 1084.0, 510.0, 316.0, 213.0, 148.0, 96.0, 76.0, 49.0, 52.0, 38.0, 24.0, 12.0, 10.0, 17.0, 9.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.921875, -11.55615234375, -11.1904296875, -10.82470703125, -10.458984375, -10.09326171875, -9.7275390625, -9.36181640625, -8.99609375, -8.63037109375, -8.2646484375, -7.89892578125, -7.533203125, -7.16748046875, -6.8017578125, -6.43603515625, -6.0703125, -5.70458984375, -5.3388671875, -4.97314453125, -4.607421875, -4.24169921875, -3.8759765625, -3.51025390625, -3.14453125, -2.77880859375, -2.4130859375, -2.04736328125, -1.681640625, -1.31591796875, -0.9501953125, -0.58447265625, -0.21875, 0.14697265625, 0.5126953125, 0.87841796875, 1.244140625, 1.60986328125, 1.9755859375, 2.34130859375, 2.70703125, 3.07275390625, 3.4384765625, 3.80419921875, 4.169921875, 4.53564453125, 4.9013671875, 5.26708984375, 5.6328125, 5.99853515625, 6.3642578125, 6.72998046875, 7.095703125, 7.46142578125, 7.8271484375, 8.19287109375, 8.55859375, 8.92431640625, 9.2900390625, 9.65576171875, 10.021484375, 10.38720703125, 10.7529296875, 11.11865234375, 11.484375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 3.0, 7.0, 9.0, 10.0, 10.0, 10.0, 17.0, 29.0, 22.0, 16.0, 30.0, 38.0, 35.0, 49.0, 38.0, 52.0, 68.0, 110.0, 1691.0, 311.0, 77.0, 56.0, 46.0, 49.0, 29.0, 33.0, 31.0, 28.0, 11.0, 29.0, 14.0, 19.0, 11.0, 13.0, 14.0, 8.0, 11.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-38.15625, -37.09130859375, -36.0263671875, -34.96142578125, -33.896484375, -32.83154296875, -31.7666015625, -30.70166015625, -29.63671875, -28.57177734375, -27.5068359375, -26.44189453125, -25.376953125, -24.31201171875, -23.2470703125, -22.18212890625, -21.1171875, -20.05224609375, -18.9873046875, -17.92236328125, -16.857421875, -15.79248046875, -14.7275390625, -13.66259765625, -12.59765625, -11.53271484375, -10.4677734375, -9.40283203125, -8.337890625, -7.27294921875, -6.2080078125, -5.14306640625, -4.078125, -3.01318359375, -1.9482421875, -0.88330078125, 0.181640625, 1.24658203125, 2.3115234375, 3.37646484375, 4.44140625, 5.50634765625, 6.5712890625, 7.63623046875, 8.701171875, 9.76611328125, 10.8310546875, 11.89599609375, 12.9609375, 14.02587890625, 15.0908203125, 16.15576171875, 17.220703125, 18.28564453125, 19.3505859375, 20.41552734375, 21.48046875, 22.54541015625, 23.6103515625, 24.67529296875, 25.740234375, 26.80517578125, 27.8701171875, 28.93505859375, 30.0]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 11.0, 19.0, 20.0, 19.0, 27.0, 37.0, 43.0, 57.0, 87.0, 117.0, 153.0, 232.0, 336.0, 840.0, 15082.0, 3121172.0, 5616.0, 681.0, 332.0, 222.0, 131.0, 124.0, 80.0, 59.0, 55.0, 33.0, 16.0, 28.0, 16.0, 17.0, 6.0, 11.0, 6.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.3125, -67.650390625, -64.98828125, -62.326171875, -59.6640625, -57.001953125, -54.33984375, -51.677734375, -49.015625, -46.353515625, -43.69140625, -41.029296875, -38.3671875, -35.705078125, -33.04296875, -30.380859375, -27.71875, -25.056640625, -22.39453125, -19.732421875, -17.0703125, -14.408203125, -11.74609375, -9.083984375, -6.421875, -3.759765625, -1.09765625, 1.564453125, 4.2265625, 6.888671875, 9.55078125, 12.212890625, 14.875, 17.537109375, 20.19921875, 22.861328125, 25.5234375, 28.185546875, 30.84765625, 33.509765625, 36.171875, 38.833984375, 41.49609375, 44.158203125, 46.8203125, 49.482421875, 52.14453125, 54.806640625, 57.46875, 60.130859375, 62.79296875, 65.455078125, 68.1171875, 70.779296875, 73.44140625, 76.103515625, 78.765625, 81.427734375, 84.08984375, 86.751953125, 89.4140625, 92.076171875, 94.73828125, 97.400390625, 100.0625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 59.0, 280.0, 466.0, 177.0, 26.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.5234832763672, -131.73863220214844, -128.9537811279297, -126.1689224243164, -123.38407135009766, -120.5992202758789, -117.81436157226562, -115.02951049804688, -112.24465942382812, -109.45980834960938, -106.6749496459961, -103.89009857177734, -101.1052474975586, -98.32039642333984, -95.53553771972656, -92.75068664550781, -89.96583557128906, -87.18098449707031, -84.39612579345703, -81.61127471923828, -78.82642364501953, -76.04157257080078, -73.2567138671875, -70.47186279296875, -67.68700408935547, -64.90215301513672, -62.1172981262207, -59.33244323730469, -56.54759216308594, -53.76273727416992, -50.977882385253906, -48.193031311035156, -45.408180236816406, -42.62332534790039, -39.83847427368164, -37.053619384765625, -34.268768310546875, -31.48391342163086, -28.699060440063477, -25.914207458496094, -23.12935447692871, -20.344501495361328, -17.559648513793945, -14.774794578552246, -11.989941596984863, -9.20508861541748, -6.420234680175781, -3.6353816986083984, -0.8505287170410156, 1.9343245029449463, 4.719177722930908, 7.504031181335449, 10.288884162902832, 13.073737144470215, 15.858591079711914, 18.643444061279297, 21.42829704284668, 24.213150024414062, 26.998003005981445, 29.782855987548828, 32.567710876464844, 35.352561950683594, 38.13741683959961, 40.922271728515625, 43.707122802734375]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 5.0, 9.0, 8.0, 6.0, 12.0, 16.0, 19.0, 26.0, 18.0, 18.0, 20.0, 32.0, 27.0, 44.0, 30.0, 41.0, 40.0, 39.0, 36.0, 47.0, 43.0, 37.0, 39.0, 50.0, 37.0, 37.0, 30.0, 30.0, 28.0, 19.0, 24.0, 17.0, 16.0, 10.0, 18.0, 9.0, 8.0, 11.0, 4.0, 8.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-88.08821105957031, -85.36933135986328, -82.65045166015625, -79.93157196044922, -77.21269226074219, -74.49382019042969, -71.77494049072266, -69.05606079101562, -66.3371810913086, -63.61830139160156, -60.89942169189453, -58.180545806884766, -55.461666107177734, -52.7427864074707, -50.02391052246094, -47.305030822753906, -44.586151123046875, -41.867271423339844, -39.14839172363281, -36.42951583862305, -33.710636138916016, -30.991756439208984, -28.272878646850586, -25.554000854492188, -22.835121154785156, -20.116241455078125, -17.397363662719727, -14.678484916687012, -11.959606170654297, -9.240727424621582, -6.521848678588867, -3.8029708862304688, -1.0840911865234375, 1.6347875595092773, 4.353666305541992, 7.072545051574707, 9.791423797607422, 12.510302543640137, 15.229181289672852, 17.94805908203125, 20.66693878173828, 23.385818481445312, 26.10469627380371, 28.82357406616211, 31.54245376586914, 34.26133346557617, 36.98020935058594, 39.69908905029297, 42.41796875, 45.13684844970703, 47.85572814941406, 50.57460403442383, 53.29348373413086, 56.01236343383789, 58.731239318847656, 61.45011901855469, 64.16899871826172, 66.88787841796875, 69.60675811767578, 72.32563781738281, 75.04450988769531, 77.76338958740234, 80.48226928710938, 83.2011489868164, 85.92002868652344]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 6.0, 8.0, 11.0, 13.0, 10.0, 13.0, 20.0, 14.0, 17.0, 30.0, 30.0, 27.0, 31.0, 30.0, 40.0, 32.0, 34.0, 49.0, 37.0, 43.0, 36.0, 48.0, 38.0, 33.0, 31.0, 35.0, 44.0, 26.0, 28.0, 38.0, 20.0, 19.0, 18.0, 20.0, 10.0, 8.0, 11.0, 5.0, 7.0, 7.0, 3.0, 9.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.3125, -10.9759521484375, -10.639404296875, -10.3028564453125, -9.96630859375, -9.6297607421875, -9.293212890625, -8.9566650390625, -8.6201171875, -8.2835693359375, -7.947021484375, -7.6104736328125, -7.27392578125, -6.9373779296875, -6.600830078125, -6.2642822265625, -5.927734375, -5.5911865234375, -5.254638671875, -4.9180908203125, -4.58154296875, -4.2449951171875, -3.908447265625, -3.5718994140625, -3.2353515625, -2.8988037109375, -2.562255859375, -2.2257080078125, -1.88916015625, -1.5526123046875, -1.216064453125, -0.8795166015625, -0.54296875, -0.2064208984375, 0.130126953125, 0.4666748046875, 0.80322265625, 1.1397705078125, 1.476318359375, 1.8128662109375, 2.1494140625, 2.4859619140625, 2.822509765625, 3.1590576171875, 3.49560546875, 3.8321533203125, 4.168701171875, 4.5052490234375, 4.841796875, 5.1783447265625, 5.514892578125, 5.8514404296875, 6.18798828125, 6.5245361328125, 6.861083984375, 7.1976318359375, 7.5341796875, 7.8707275390625, 8.207275390625, 8.5438232421875, 8.88037109375, 9.2169189453125, 9.553466796875, 9.8900146484375, 10.2265625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 4.0, 5.0, 10.0, 8.0, 5.0, 13.0, 16.0, 24.0, 27.0, 34.0, 40.0, 50.0, 67.0, 88.0, 118.0, 171.0, 291.0, 503.0, 1469.0, 8192.0, 379326.0, 3599756.0, 195555.0, 5899.0, 1218.0, 483.0, 246.0, 162.0, 93.0, 99.0, 64.0, 65.0, 40.0, 32.0, 13.0, 23.0, 15.0, 12.0, 7.0, 10.0, 5.0, 4.0, 4.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.90625, -35.80224609375, -34.6982421875, -33.59423828125, -32.490234375, -31.38623046875, -30.2822265625, -29.17822265625, -28.07421875, -26.97021484375, -25.8662109375, -24.76220703125, -23.658203125, -22.55419921875, -21.4501953125, -20.34619140625, -19.2421875, -18.13818359375, -17.0341796875, -15.93017578125, -14.826171875, -13.72216796875, -12.6181640625, -11.51416015625, -10.41015625, -9.30615234375, -8.2021484375, -7.09814453125, -5.994140625, -4.89013671875, -3.7861328125, -2.68212890625, -1.578125, -0.47412109375, 0.6298828125, 1.73388671875, 2.837890625, 3.94189453125, 5.0458984375, 6.14990234375, 7.25390625, 8.35791015625, 9.4619140625, 10.56591796875, 11.669921875, 12.77392578125, 13.8779296875, 14.98193359375, 16.0859375, 17.18994140625, 18.2939453125, 19.39794921875, 20.501953125, 21.60595703125, 22.7099609375, 23.81396484375, 24.91796875, 26.02197265625, 27.1259765625, 28.22998046875, 29.333984375, 30.43798828125, 31.5419921875, 32.64599609375, 33.75]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 5.0, 10.0, 24.0, 31.0, 70.0, 157.0, 326.0, 684.0, 1181.0, 857.0, 366.0, 175.0, 88.0, 53.0, 28.0, 13.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.625, -60.331787109375, -59.03857421875, -57.745361328125, -56.4521484375, -55.158935546875, -53.86572265625, -52.572509765625, -51.279296875, -49.986083984375, -48.69287109375, -47.399658203125, -46.1064453125, -44.813232421875, -43.52001953125, -42.226806640625, -40.93359375, -39.640380859375, -38.34716796875, -37.053955078125, -35.7607421875, -34.467529296875, -33.17431640625, -31.881103515625, -30.587890625, -29.294677734375, -28.00146484375, -26.708251953125, -25.4150390625, -24.121826171875, -22.82861328125, -21.535400390625, -20.2421875, -18.948974609375, -17.65576171875, -16.362548828125, -15.0693359375, -13.776123046875, -12.48291015625, -11.189697265625, -9.896484375, -8.603271484375, -7.31005859375, -6.016845703125, -4.7236328125, -3.430419921875, -2.13720703125, -0.843994140625, 0.44921875, 1.742431640625, 3.03564453125, 4.328857421875, 5.6220703125, 6.915283203125, 8.20849609375, 9.501708984375, 10.794921875, 12.088134765625, 13.38134765625, 14.674560546875, 15.9677734375, 17.260986328125, 18.55419921875, 19.847412109375, 21.140625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 9.0, 18.0, 23.0, 71.0, 115.0, 168.0, 261.0, 605.0, 5006.0, 4185254.0, 1621.0, 494.0, 279.0, 155.0, 93.0, 50.0, 33.0, 15.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.1875, -115.6611328125, -108.134765625, -100.6083984375, -93.08203125, -85.5556640625, -78.029296875, -70.5029296875, -62.9765625, -55.4501953125, -47.923828125, -40.3974609375, -32.87109375, -25.3447265625, -17.818359375, -10.2919921875, -2.765625, 4.7607421875, 12.287109375, 19.8134765625, 27.33984375, 34.8662109375, 42.392578125, 49.9189453125, 57.4453125, 64.9716796875, 72.498046875, 80.0244140625, 87.55078125, 95.0771484375, 102.603515625, 110.1298828125, 117.65625, 125.1826171875, 132.708984375, 140.2353515625, 147.76171875, 155.2880859375, 162.814453125, 170.3408203125, 177.8671875, 185.3935546875, 192.919921875, 200.4462890625, 207.97265625, 215.4990234375, 223.025390625, 230.5517578125, 238.078125, 245.6044921875, 253.130859375, 260.6572265625, 268.18359375, 275.7099609375, 283.236328125, 290.7626953125, 298.2890625, 305.8154296875, 313.341796875, 320.8681640625, 328.39453125, 335.9208984375, 343.447265625, 350.9736328125, 358.5]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 10.0, 22.0, 33.0, 63.0, 114.0, 162.0, 170.0, 161.0, 130.0, 69.0, 39.0, 21.0, 8.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-105.78638458251953, -103.0548324584961, -100.32328033447266, -97.59172821044922, -94.86017608642578, -92.12862396240234, -89.3970718383789, -86.66551971435547, -83.93396759033203, -81.2024154663086, -78.47086334228516, -75.73931121826172, -73.00775909423828, -70.27620697021484, -67.5446548461914, -64.81310272216797, -62.08155059814453, -59.349998474121094, -56.618446350097656, -53.88689422607422, -51.15534210205078, -48.423789978027344, -45.692237854003906, -42.96068572998047, -40.22913360595703, -37.497581481933594, -34.766029357910156, -32.03447723388672, -29.30292510986328, -26.571372985839844, -23.839820861816406, -21.10826873779297, -18.37671661376953, -15.645164489746094, -12.913612365722656, -10.182060241699219, -7.450508117675781, -4.718955993652344, -1.9874038696289062, 0.7441482543945312, 3.4757003784179688, 6.207252502441406, 8.938804626464844, 11.670356750488281, 14.401908874511719, 17.133460998535156, 19.865013122558594, 22.59656524658203, 25.32811737060547, 28.059669494628906, 30.791221618652344, 33.52277374267578, 36.25432586669922, 38.985877990722656, 41.717430114746094, 44.44898223876953, 47.18053436279297, 49.912086486816406, 52.643638610839844, 55.37519073486328, 58.10674285888672, 60.838294982910156, 63.569847106933594, 66.30139923095703, 69.03295135498047]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 4.0, 10.0, 3.0, 7.0, 8.0, 11.0, 20.0, 19.0, 18.0, 17.0, 23.0, 28.0, 36.0, 29.0, 37.0, 39.0, 26.0, 38.0, 40.0, 42.0, 40.0, 36.0, 35.0, 37.0, 43.0, 35.0, 39.0, 26.0, 37.0, 32.0, 26.0, 19.0, 23.0, 14.0, 21.0, 14.0, 15.0, 10.0, 7.0, 6.0, 9.0, 2.0, 2.0, 7.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.13151550292969, -53.29866409301758, -51.4658088684082, -49.632957458496094, -47.80010223388672, -45.96725082397461, -44.1343994140625, -42.301544189453125, -40.46868896484375, -38.63583755493164, -36.802982330322266, -34.970130920410156, -33.13727569580078, -31.304424285888672, -29.47157096862793, -27.638717651367188, -25.805866241455078, -23.973012924194336, -22.140159606933594, -20.307308197021484, -18.47445297241211, -16.6416015625, -14.808748245239258, -12.975894927978516, -11.143041610717773, -9.310188293457031, -7.477335453033447, -5.644482612609863, -3.811629295349121, -1.978775978088379, -0.14592361450195312, 1.686929702758789, 3.5197792053222656, 5.352632522583008, 7.185485363006592, 9.018338203430176, 10.851191520690918, 12.68404483795166, 14.516897201538086, 16.349750518798828, 18.18260383605957, 20.015457153320312, 21.848310470581055, 23.681163787841797, 25.514015197753906, 27.34687042236328, 29.17972183227539, 31.012575149536133, 32.845428466796875, 34.678279876708984, 36.51113510131836, 38.34398651123047, 40.176841735839844, 42.00969314575195, 43.84254455566406, 45.67539978027344, 47.50825500488281, 49.34110641479492, 51.1739616394043, 53.006813049316406, 54.83966827392578, 56.67251968383789, 58.50537109375, 60.338226318359375, 62.171077728271484]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 4.0, 1.0, 2.0, 4.0, 10.0, 8.0, 11.0, 15.0, 16.0, 19.0, 17.0, 26.0, 23.0, 21.0, 27.0, 33.0, 31.0, 39.0, 38.0, 52.0, 43.0, 48.0, 45.0, 49.0, 39.0, 35.0, 34.0, 32.0, 32.0, 33.0, 32.0, 30.0, 24.0, 26.0, 14.0, 13.0, 13.0, 19.0, 13.0, 7.0, 6.0, 5.0, 5.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.7265625, -11.384765625, -11.04296875, -10.701171875, -10.359375, -10.017578125, -9.67578125, -9.333984375, -8.9921875, -8.650390625, -8.30859375, -7.966796875, -7.625, -7.283203125, -6.94140625, -6.599609375, -6.2578125, -5.916015625, -5.57421875, -5.232421875, -4.890625, -4.548828125, -4.20703125, -3.865234375, -3.5234375, -3.181640625, -2.83984375, -2.498046875, -2.15625, -1.814453125, -1.47265625, -1.130859375, -0.7890625, -0.447265625, -0.10546875, 0.236328125, 0.578125, 0.919921875, 1.26171875, 1.603515625, 1.9453125, 2.287109375, 2.62890625, 2.970703125, 3.3125, 3.654296875, 3.99609375, 4.337890625, 4.6796875, 5.021484375, 5.36328125, 5.705078125, 6.046875, 6.388671875, 6.73046875, 7.072265625, 7.4140625, 7.755859375, 8.09765625, 8.439453125, 8.78125, 9.123046875, 9.46484375, 9.806640625, 10.1484375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 7.0, 4.0, 11.0, 15.0, 33.0, 35.0, 53.0, 71.0, 118.0, 137.0, 292.0, 351.0, 544.0, 863.0, 1167.0, 1862.0, 2862.0, 4274.0, 6603.0, 10524.0, 16338.0, 25713.0, 41219.0, 68990.0, 125888.0, 311599.0, 193206.0, 92015.0, 53531.0, 32524.0, 20528.0, 12970.0, 8436.0, 5357.0, 3585.0, 2247.0, 1468.0, 1069.0, 634.0, 454.0, 290.0, 208.0, 139.0, 103.0, 67.0, 52.0, 29.0, 30.0, 15.0, 6.0, 9.0, 7.0, 2.0, 5.0, 1.0, 1.0, 1.0], "bins": [-2.158203125, -2.092315673828125, -2.02642822265625, -1.960540771484375, -1.8946533203125, -1.828765869140625, -1.76287841796875, -1.696990966796875, -1.631103515625, -1.565216064453125, -1.49932861328125, -1.433441162109375, -1.3675537109375, -1.301666259765625, -1.23577880859375, -1.169891357421875, -1.10400390625, -1.038116455078125, -0.97222900390625, -0.906341552734375, -0.8404541015625, -0.774566650390625, -0.70867919921875, -0.642791748046875, -0.576904296875, -0.511016845703125, -0.44512939453125, -0.379241943359375, -0.3133544921875, -0.247467041015625, -0.18157958984375, -0.115692138671875, -0.0498046875, 0.016082763671875, 0.08197021484375, 0.147857666015625, 0.2137451171875, 0.279632568359375, 0.34552001953125, 0.411407470703125, 0.477294921875, 0.543182373046875, 0.60906982421875, 0.674957275390625, 0.7408447265625, 0.806732177734375, 0.87261962890625, 0.938507080078125, 1.00439453125, 1.070281982421875, 1.13616943359375, 1.202056884765625, 1.2679443359375, 1.333831787109375, 1.39971923828125, 1.465606689453125, 1.531494140625, 1.597381591796875, 1.66326904296875, 1.729156494140625, 1.7950439453125, 1.860931396484375, 1.92681884765625, 1.992706298828125, 2.05859375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 5.0, 5.0, 6.0, 3.0, 11.0, 12.0, 14.0, 10.0, 16.0, 26.0, 18.0, 25.0, 32.0, 27.0, 40.0, 37.0, 51.0, 51.0, 49.0, 50.0, 1059.0, 42.0, 40.0, 32.0, 41.0, 35.0, 31.0, 37.0, 41.0, 27.0, 24.0, 20.0, 18.0, 16.0, 15.0, 14.0, 10.0, 8.0, 8.0, 7.0, 1.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.71484375, -6.49041748046875, -6.2659912109375, -6.04156494140625, -5.817138671875, -5.59271240234375, -5.3682861328125, -5.14385986328125, -4.91943359375, -4.69500732421875, -4.4705810546875, -4.24615478515625, -4.021728515625, -3.79730224609375, -3.5728759765625, -3.34844970703125, -3.1240234375, -2.89959716796875, -2.6751708984375, -2.45074462890625, -2.226318359375, -2.00189208984375, -1.7774658203125, -1.55303955078125, -1.32861328125, -1.10418701171875, -0.8797607421875, -0.65533447265625, -0.430908203125, -0.20648193359375, 0.0179443359375, 0.24237060546875, 0.466796875, 0.69122314453125, 0.9156494140625, 1.14007568359375, 1.364501953125, 1.58892822265625, 1.8133544921875, 2.03778076171875, 2.26220703125, 2.48663330078125, 2.7110595703125, 2.93548583984375, 3.159912109375, 3.38433837890625, 3.6087646484375, 3.83319091796875, 4.0576171875, 4.28204345703125, 4.5064697265625, 4.73089599609375, 4.955322265625, 5.17974853515625, 5.4041748046875, 5.62860107421875, 5.85302734375, 6.07745361328125, 6.3018798828125, 6.52630615234375, 6.750732421875, 6.97515869140625, 7.1995849609375, 7.42401123046875, 7.6484375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 8.0, 17.0, 22.0, 32.0, 57.0, 67.0, 94.0, 144.0, 234.0, 356.0, 571.0, 867.0, 1378.0, 2187.0, 3287.0, 5285.0, 8260.0, 12947.0, 20671.0, 34262.0, 58619.0, 110895.0, 1336706.0, 253414.0, 104041.0, 55950.0, 32510.0, 19817.0, 12380.0, 7818.0, 5070.0, 3215.0, 2060.0, 1441.0, 859.0, 552.0, 348.0, 226.0, 155.0, 88.0, 65.0, 50.0, 40.0, 32.0, 17.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.3125, -2.244384765625, -2.17626953125, -2.108154296875, -2.0400390625, -1.971923828125, -1.90380859375, -1.835693359375, -1.767578125, -1.699462890625, -1.63134765625, -1.563232421875, -1.4951171875, -1.427001953125, -1.35888671875, -1.290771484375, -1.22265625, -1.154541015625, -1.08642578125, -1.018310546875, -0.9501953125, -0.882080078125, -0.81396484375, -0.745849609375, -0.677734375, -0.609619140625, -0.54150390625, -0.473388671875, -0.4052734375, -0.337158203125, -0.26904296875, -0.200927734375, -0.1328125, -0.064697265625, 0.00341796875, 0.071533203125, 0.1396484375, 0.207763671875, 0.27587890625, 0.343994140625, 0.412109375, 0.480224609375, 0.54833984375, 0.616455078125, 0.6845703125, 0.752685546875, 0.82080078125, 0.888916015625, 0.95703125, 1.025146484375, 1.09326171875, 1.161376953125, 1.2294921875, 1.297607421875, 1.36572265625, 1.433837890625, 1.501953125, 1.570068359375, 1.63818359375, 1.706298828125, 1.7744140625, 1.842529296875, 1.91064453125, 1.978759765625, 2.046875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 8.0, 6.0, 5.0, 10.0, 2.0, 8.0, 2.0, 5.0, 9.0, 10.0, 16.0, 10.0, 30.0, 25.0, 34.0, 34.0, 31.0, 40.0, 61.0, 57.0, 63.0, 85.0, 72.0, 53.0, 55.0, 45.0, 34.0, 43.0, 25.0, 23.0, 23.0, 12.0, 14.0, 8.0, 7.0, 5.0, 8.0, 2.0, 10.0, 3.0, 5.0, 3.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0009737014770507812, -0.0009406507015228271, -0.000907599925994873, -0.0008745491504669189, -0.0008414983749389648, -0.0008084475994110107, -0.0007753968238830566, -0.0007423460483551025, -0.0007092952728271484, -0.0006762444972991943, -0.0006431937217712402, -0.0006101429462432861, -0.000577092170715332, -0.0005440413951873779, -0.0005109906196594238, -0.0004779398441314697, -0.0004448890686035156, -0.0004118382930755615, -0.0003787875175476074, -0.0003457367420196533, -0.0003126859664916992, -0.0002796351909637451, -0.000246584415435791, -0.00021353363990783691, -0.0001804828643798828, -0.0001474320888519287, -0.00011438131332397461, -8.133053779602051e-05, -4.8279762268066406e-05, -1.5228986740112305e-05, 1.7821788787841797e-05, 5.08725643157959e-05, 8.392333984375e-05, 0.0001169741153717041, 0.0001500248908996582, 0.0001830756664276123, 0.0002161264419555664, 0.0002491772174835205, 0.0002822279930114746, 0.0003152787685394287, 0.0003483295440673828, 0.0003813803195953369, 0.000414431095123291, 0.0004474818706512451, 0.0004805326461791992, 0.0005135834217071533, 0.0005466341972351074, 0.0005796849727630615, 0.0006127357482910156, 0.0006457865238189697, 0.0006788372993469238, 0.0007118880748748779, 0.000744938850402832, 0.0007779896259307861, 0.0008110404014587402, 0.0008440911769866943, 0.0008771419525146484, 0.0009101927280426025, 0.0009432435035705566, 0.0009762942790985107, 0.0010093450546264648, 0.001042395830154419, 0.001075446605682373, 0.0011084973812103271, 0.0011415481567382812]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 3.0, 4.0, 2.0, 5.0, 4.0, 14.0, 12.0, 11.0, 24.0, 19.0, 39.0, 59.0, 80.0, 137.0, 205.0, 459.0, 1725.0, 1024660.0, 19561.0, 751.0, 277.0, 143.0, 104.0, 63.0, 46.0, 42.0, 20.0, 18.0, 9.0, 13.0, 10.0, 10.0, 6.0, 4.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.03326416015625, -0.03230595588684082, -0.03134775161743164, -0.03038954734802246, -0.02943134307861328, -0.0284731388092041, -0.027514934539794922, -0.026556730270385742, -0.025598526000976562, -0.024640321731567383, -0.023682117462158203, -0.022723913192749023, -0.021765708923339844, -0.020807504653930664, -0.019849300384521484, -0.018891096115112305, -0.017932891845703125, -0.016974687576293945, -0.016016483306884766, -0.015058279037475586, -0.014100074768066406, -0.013141870498657227, -0.012183666229248047, -0.011225461959838867, -0.010267257690429688, -0.009309053421020508, -0.008350849151611328, -0.0073926448822021484, -0.006434440612792969, -0.005476236343383789, -0.004518032073974609, -0.0035598278045654297, -0.00260162353515625, -0.0016434192657470703, -0.0006852149963378906, 0.00027298927307128906, 0.0012311935424804688, 0.0021893978118896484, 0.003147602081298828, 0.004105806350708008, 0.0050640106201171875, 0.006022214889526367, 0.006980419158935547, 0.007938623428344727, 0.008896827697753906, 0.009855031967163086, 0.010813236236572266, 0.011771440505981445, 0.012729644775390625, 0.013687849044799805, 0.014646053314208984, 0.015604257583618164, 0.016562461853027344, 0.017520666122436523, 0.018478870391845703, 0.019437074661254883, 0.020395278930664062, 0.021353483200073242, 0.022311687469482422, 0.0232698917388916, 0.02422809600830078, 0.02518630027770996, 0.02614450454711914, 0.02710270881652832, 0.0280609130859375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 45.0, 173.0, 428.0, 283.0, 64.0, 10.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014867241261526942, -0.001414787257090211, -0.0013428505044430494, -0.0012709136353805661, -0.0011989767663180828, -0.0011270400136709213, -0.001055103144608438, -0.0009831662755459547, -0.0009112295228987932, -0.0008392927120439708, -0.0007673559011891484, -0.0006954190321266651, -0.0006234822212718427, -0.0005515454104170203, -0.00047960857045836747, -0.0004076717304997146, -0.0003357349196448922, -0.0002637981087900698, -0.00019186126883141696, -0.00011992444342467934, -4.798761801794171e-05, 2.3949192836880684e-05, 9.588603279553354e-05, 0.0001678228727541864, 0.0002397596836090088, 0.0003116964944638312, 0.00038363333442248404, 0.0004555701743811369, 0.0005275069852359593, 0.0005994437960907817, 0.000671380665153265, 0.0007433174760080874, 0.000815254170447588, 0.0008871909813024104, 0.0009591277921572328, 0.001031064661219716, 0.0011030014138668776, 0.0011749382829293609, 0.0012468751519918442, 0.0013188119046390057, 0.001390748773701489, 0.0014626856427639723, 0.0015346223954111338, 0.001606559264473617, 0.0016784961335361004, 0.0017504328861832619, 0.0018223697552457452, 0.0018943066243082285, 0.00196624337695539, 0.0020381801296025515, 0.0021101171150803566, 0.002182053867727518, 0.0022539906203746796, 0.002325927373021841, 0.002397864358499646, 0.0024698011111468077, 0.002541738096624613, 0.0026136748492717743, 0.0026856118347495794, 0.002757548587396741, 0.0028294853400439024, 0.0029014223255217075, 0.002973359078168869, 0.0030452958308160305, 0.003117232583463192]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 0.0, 2.0, 4.0, 8.0, 6.0, 12.0, 13.0, 12.0, 9.0, 21.0, 20.0, 18.0, 27.0, 16.0, 32.0, 40.0, 35.0, 42.0, 41.0, 27.0, 31.0, 32.0, 36.0, 50.0, 44.0, 32.0, 40.0, 40.0, 47.0, 35.0, 23.0, 28.0, 32.0, 22.0, 21.0, 19.0, 15.0, 14.0, 18.0, 6.0, 10.0, 4.0, 5.0, 5.0, 3.0, 7.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0005573034286499023, -0.000540412962436676, -0.0005235224962234497, -0.0005066320300102234, -0.0004897415637969971, -0.00047285109758377075, -0.00045596063137054443, -0.0004390701651573181, -0.0004221796989440918, -0.0004052892327308655, -0.00038839876651763916, -0.00037150830030441284, -0.0003546178340911865, -0.0003377273678779602, -0.0003208369016647339, -0.00030394643545150757, -0.00028705596923828125, -0.00027016550302505493, -0.0002532750368118286, -0.0002363845705986023, -0.00021949410438537598, -0.00020260363817214966, -0.00018571317195892334, -0.00016882270574569702, -0.0001519322395324707, -0.00013504177331924438, -0.00011815130710601807, -0.00010126084089279175, -8.437037467956543e-05, -6.747990846633911e-05, -5.058944225311279e-05, -3.3698976039886475e-05, -1.6808509826660156e-05, 8.195638656616211e-08, 1.697242259979248e-05, 3.38628888130188e-05, 5.075335502624512e-05, 6.764382123947144e-05, 8.453428745269775e-05, 0.00010142475366592407, 0.00011831521987915039, 0.0001352056860923767, 0.00015209615230560303, 0.00016898661851882935, 0.00018587708473205566, 0.00020276755094528198, 0.0002196580171585083, 0.00023654848337173462, 0.00025343894958496094, 0.00027032941579818726, 0.0002872198820114136, 0.0003041103482246399, 0.0003210008144378662, 0.00033789128065109253, 0.00035478174686431885, 0.00037167221307754517, 0.0003885626792907715, 0.0004054531455039978, 0.0004223436117172241, 0.00043923407793045044, 0.00045612454414367676, 0.0004730150103569031, 0.0004899054765701294, 0.0005067959427833557, 0.000523686408996582]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 4.0, 1.0, 2.0, 4.0, 10.0, 8.0, 11.0, 15.0, 16.0, 19.0, 17.0, 26.0, 23.0, 21.0, 27.0, 33.0, 31.0, 39.0, 38.0, 52.0, 43.0, 48.0, 45.0, 49.0, 39.0, 35.0, 34.0, 32.0, 32.0, 33.0, 32.0, 30.0, 24.0, 26.0, 14.0, 13.0, 13.0, 19.0, 13.0, 7.0, 6.0, 5.0, 5.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.7265625, -11.384765625, -11.04296875, -10.701171875, -10.359375, -10.017578125, -9.67578125, -9.333984375, -8.9921875, -8.650390625, -8.30859375, -7.966796875, -7.625, -7.283203125, -6.94140625, -6.599609375, -6.2578125, -5.916015625, -5.57421875, -5.232421875, -4.890625, -4.548828125, -4.20703125, -3.865234375, -3.5234375, -3.181640625, -2.83984375, -2.498046875, -2.15625, -1.814453125, -1.47265625, -1.130859375, -0.7890625, -0.447265625, -0.10546875, 0.236328125, 0.578125, 0.919921875, 1.26171875, 1.603515625, 1.9453125, 2.287109375, 2.62890625, 2.970703125, 3.3125, 3.654296875, 3.99609375, 4.337890625, 4.6796875, 5.021484375, 5.36328125, 5.705078125, 6.046875, 6.388671875, 6.73046875, 7.072265625, 7.4140625, 7.755859375, 8.09765625, 8.439453125, 8.78125, 9.123046875, 9.46484375, 9.806640625, 10.1484375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 9.0, 5.0, 2.0, 3.0, 5.0, 12.0, 10.0, 10.0, 38.0, 17.0, 32.0, 42.0, 59.0, 83.0, 98.0, 130.0, 213.0, 319.0, 539.0, 905.0, 2307.0, 11214.0, 139013.0, 816944.0, 65737.0, 6900.0, 1688.0, 759.0, 455.0, 282.0, 198.0, 123.0, 105.0, 69.0, 62.0, 31.0, 27.0, 34.0, 24.0, 19.0, 8.0, 8.0, 8.0, 5.0, 7.0, 0.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.625, -20.995849609375, -20.36669921875, -19.737548828125, -19.1083984375, -18.479248046875, -17.85009765625, -17.220947265625, -16.591796875, -15.962646484375, -15.33349609375, -14.704345703125, -14.0751953125, -13.446044921875, -12.81689453125, -12.187744140625, -11.55859375, -10.929443359375, -10.30029296875, -9.671142578125, -9.0419921875, -8.412841796875, -7.78369140625, -7.154541015625, -6.525390625, -5.896240234375, -5.26708984375, -4.637939453125, -4.0087890625, -3.379638671875, -2.75048828125, -2.121337890625, -1.4921875, -0.863037109375, -0.23388671875, 0.395263671875, 1.0244140625, 1.653564453125, 2.28271484375, 2.911865234375, 3.541015625, 4.170166015625, 4.79931640625, 5.428466796875, 6.0576171875, 6.686767578125, 7.31591796875, 7.945068359375, 8.57421875, 9.203369140625, 9.83251953125, 10.461669921875, 11.0908203125, 11.719970703125, 12.34912109375, 12.978271484375, 13.607421875, 14.236572265625, 14.86572265625, 15.494873046875, 16.1240234375, 16.753173828125, 17.38232421875, 18.011474609375, 18.640625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 1.0, 6.0, 7.0, 11.0, 13.0, 24.0, 31.0, 39.0, 29.0, 46.0, 57.0, 60.0, 96.0, 287.0, 1821.0, 100.0, 79.0, 64.0, 65.0, 55.0, 40.0, 35.0, 24.0, 13.0, 17.0, 8.0, 5.0, 5.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.0, -53.3896484375, -51.779296875, -50.1689453125, -48.55859375, -46.9482421875, -45.337890625, -43.7275390625, -42.1171875, -40.5068359375, -38.896484375, -37.2861328125, -35.67578125, -34.0654296875, -32.455078125, -30.8447265625, -29.234375, -27.6240234375, -26.013671875, -24.4033203125, -22.79296875, -21.1826171875, -19.572265625, -17.9619140625, -16.3515625, -14.7412109375, -13.130859375, -11.5205078125, -9.91015625, -8.2998046875, -6.689453125, -5.0791015625, -3.46875, -1.8583984375, -0.248046875, 1.3623046875, 2.97265625, 4.5830078125, 6.193359375, 7.8037109375, 9.4140625, 11.0244140625, 12.634765625, 14.2451171875, 15.85546875, 17.4658203125, 19.076171875, 20.6865234375, 22.296875, 23.9072265625, 25.517578125, 27.1279296875, 28.73828125, 30.3486328125, 31.958984375, 33.5693359375, 35.1796875, 36.7900390625, 38.400390625, 40.0107421875, 41.62109375, 43.2314453125, 44.841796875, 46.4521484375, 48.0625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 6.0, 6.0, 16.0, 18.0, 26.0, 41.0, 44.0, 72.0, 97.0, 150.0, 358.0, 1225.0, 3121940.0, 20514.0, 562.0, 241.0, 125.0, 68.0, 40.0, 37.0, 33.0, 23.0, 18.0, 13.0, 6.0, 7.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-143.875, -139.046875, -134.21875, -129.390625, -124.5625, -119.734375, -114.90625, -110.078125, -105.25, -100.421875, -95.59375, -90.765625, -85.9375, -81.109375, -76.28125, -71.453125, -66.625, -61.796875, -56.96875, -52.140625, -47.3125, -42.484375, -37.65625, -32.828125, -28.0, -23.171875, -18.34375, -13.515625, -8.6875, -3.859375, 0.96875, 5.796875, 10.625, 15.453125, 20.28125, 25.109375, 29.9375, 34.765625, 39.59375, 44.421875, 49.25, 54.078125, 58.90625, 63.734375, 68.5625, 73.390625, 78.21875, 83.046875, 87.875, 92.703125, 97.53125, 102.359375, 107.1875, 112.015625, 116.84375, 121.671875, 126.5, 131.328125, 136.15625, 140.984375, 145.8125, 150.640625, 155.46875, 160.296875, 165.125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 11.0, 27.0, 71.0, 142.0, 175.0, 227.0, 162.0, 114.0, 52.0, 24.0, 6.0, 1.0, 1.0], "bins": [-73.5364990234375, -72.2325210571289, -70.92853546142578, -69.62455749511719, -68.3205795288086, -67.01659393310547, -65.71261596679688, -64.40863800048828, -63.104652404785156, -61.8006706237793, -60.4966926574707, -59.192710876464844, -57.888729095458984, -56.584747314453125, -55.28076934814453, -53.97678756713867, -52.67280960083008, -51.36882781982422, -50.064849853515625, -48.760868072509766, -47.456886291503906, -46.15290832519531, -44.84892654418945, -43.544944763183594, -42.240966796875, -40.93698501586914, -39.63300704956055, -38.32902526855469, -37.02504348754883, -35.72106170654297, -34.417083740234375, -33.113101959228516, -31.80912208557129, -30.505142211914062, -29.201160430908203, -27.897180557250977, -26.59320068359375, -25.28921890258789, -23.985239028930664, -22.681259155273438, -21.377277374267578, -20.07329750061035, -18.769315719604492, -17.465335845947266, -16.161354064941406, -14.85737419128418, -13.553394317626953, -12.24941349029541, -10.945432662963867, -9.641451835632324, -8.337471008300781, -7.033491134643555, -5.729510307312012, -4.425529479980469, -3.121549129486084, -1.8175687789916992, -0.5135879516601562, 0.7903926372528076, 2.0943732261657715, 3.3983538150787354, 4.702334403991699, 6.006315231323242, 7.310295581817627, 8.614275932312012, 9.918256759643555]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 4.0, 3.0, 2.0, 5.0, 15.0, 10.0, 13.0, 13.0, 13.0, 14.0, 24.0, 32.0, 36.0, 30.0, 37.0, 32.0, 40.0, 42.0, 41.0, 34.0, 37.0, 52.0, 36.0, 45.0, 35.0, 38.0, 34.0, 33.0, 41.0, 21.0, 27.0, 26.0, 21.0, 28.0, 13.0, 12.0, 13.0, 13.0, 9.0, 7.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0], "bins": [-139.5255584716797, -135.69566345214844, -131.86575317382812, -128.03585815429688, -124.2059555053711, -120.37605285644531, -116.54615783691406, -112.71625518798828, -108.8863525390625, -105.05644989013672, -101.22655487060547, -97.39665222167969, -93.5667495727539, -89.73684692382812, -85.90695190429688, -82.0770492553711, -78.24714660644531, -74.41724395751953, -70.58734893798828, -66.7574462890625, -62.92754364013672, -59.0976448059082, -55.26774597167969, -51.437843322753906, -47.607948303222656, -43.77804946899414, -39.94814682006836, -36.118247985839844, -32.28834533691406, -28.458446502685547, -24.6285457611084, -20.79864501953125, -16.96874237060547, -13.13884162902832, -9.308940887451172, -5.47904109954834, -1.6491403579711914, 2.1807594299316406, 6.010660171508789, 9.840560913085938, 13.670461654663086, 17.500362396240234, 21.330263137817383, 25.16016387939453, 28.990062713623047, 32.81996154785156, 36.649864196777344, 40.479766845703125, 44.30966567993164, 48.139564514160156, 51.96946716308594, 55.79936599731445, 59.629268646240234, 63.45916748046875, 67.28907012939453, 71.11897277832031, 74.94886779785156, 78.77877044677734, 82.6086654663086, 86.43856811523438, 90.26847076416016, 94.09837341308594, 97.92826843261719, 101.75817108154297, 105.58807373046875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 1.0, 9.0, 8.0, 12.0, 13.0, 10.0, 9.0, 19.0, 27.0, 20.0, 18.0, 34.0, 26.0, 32.0, 30.0, 44.0, 33.0, 41.0, 44.0, 36.0, 58.0, 47.0, 37.0, 34.0, 29.0, 33.0, 36.0, 31.0, 36.0, 32.0, 26.0, 17.0, 13.0, 14.0, 20.0, 13.0, 10.0, 8.0, 11.0, 8.0, 5.0, 3.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.7890625, -11.4364013671875, -11.083740234375, -10.7310791015625, -10.37841796875, -10.0257568359375, -9.673095703125, -9.3204345703125, -8.9677734375, -8.6151123046875, -8.262451171875, -7.9097900390625, -7.55712890625, -7.2044677734375, -6.851806640625, -6.4991455078125, -6.146484375, -5.7938232421875, -5.441162109375, -5.0885009765625, -4.73583984375, -4.3831787109375, -4.030517578125, -3.6778564453125, -3.3251953125, -2.9725341796875, -2.619873046875, -2.2672119140625, -1.91455078125, -1.5618896484375, -1.209228515625, -0.8565673828125, -0.50390625, -0.1512451171875, 0.201416015625, 0.5540771484375, 0.90673828125, 1.2593994140625, 1.612060546875, 1.9647216796875, 2.3173828125, 2.6700439453125, 3.022705078125, 3.3753662109375, 3.72802734375, 4.0806884765625, 4.433349609375, 4.7860107421875, 5.138671875, 5.4913330078125, 5.843994140625, 6.1966552734375, 6.54931640625, 6.9019775390625, 7.254638671875, 7.6072998046875, 7.9599609375, 8.3126220703125, 8.665283203125, 9.0179443359375, 9.37060546875, 9.7232666015625, 10.075927734375, 10.4285888671875, 10.78125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 9.0, 9.0, 5.0, 13.0, 16.0, 17.0, 24.0, 27.0, 46.0, 55.0, 71.0, 114.0, 143.0, 218.0, 301.0, 557.0, 1016.0, 2241.0, 5392.0, 17074.0, 80368.0, 419722.0, 1346241.0, 1578917.0, 586520.0, 118140.0, 24449.0, 6953.0, 2555.0, 1231.0, 686.0, 328.0, 218.0, 158.0, 115.0, 78.0, 62.0, 52.0, 41.0, 24.0, 11.0, 21.0, 12.0, 5.0, 8.0, 4.0, 6.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 4.0], "bins": [-13.7734375, -13.3575439453125, -12.941650390625, -12.5257568359375, -12.10986328125, -11.6939697265625, -11.278076171875, -10.8621826171875, -10.4462890625, -10.0303955078125, -9.614501953125, -9.1986083984375, -8.78271484375, -8.3668212890625, -7.950927734375, -7.5350341796875, -7.119140625, -6.7032470703125, -6.287353515625, -5.8714599609375, -5.45556640625, -5.0396728515625, -4.623779296875, -4.2078857421875, -3.7919921875, -3.3760986328125, -2.960205078125, -2.5443115234375, -2.12841796875, -1.7125244140625, -1.296630859375, -0.8807373046875, -0.46484375, -0.0489501953125, 0.366943359375, 0.7828369140625, 1.19873046875, 1.6146240234375, 2.030517578125, 2.4464111328125, 2.8623046875, 3.2781982421875, 3.694091796875, 4.1099853515625, 4.52587890625, 4.9417724609375, 5.357666015625, 5.7735595703125, 6.189453125, 6.6053466796875, 7.021240234375, 7.4371337890625, 7.85302734375, 8.2689208984375, 8.684814453125, 9.1007080078125, 9.5166015625, 9.9324951171875, 10.348388671875, 10.7642822265625, 11.18017578125, 11.5960693359375, 12.011962890625, 12.4278564453125, 12.84375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 0.0, 4.0, 5.0, 19.0, 17.0, 36.0, 66.0, 125.0, 165.0, 287.0, 496.0, 855.0, 757.0, 497.0, 302.0, 168.0, 125.0, 69.0, 32.0, 24.0, 15.0, 10.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.0, -16.875, -15.75, -14.625, -13.5, -12.375, -11.25, -10.125, -9.0, -7.875, -6.75, -5.625, -4.5, -3.375, -2.25, -1.125, 0.0, 1.125, 2.25, 3.375, 4.5, 5.625, 6.75, 7.875, 9.0, 10.125, 11.25, 12.375, 13.5, 14.625, 15.75, 16.875, 18.0, 19.125, 20.25, 21.375, 22.5, 23.625, 24.75, 25.875, 27.0, 28.125, 29.25, 30.375, 31.5, 32.625, 33.75, 34.875, 36.0, 37.125, 38.25, 39.375, 40.5, 41.625, 42.75, 43.875, 45.0, 46.125, 47.25, 48.375, 49.5, 50.625, 51.75, 52.875, 54.0]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 14.0, 22.0, 25.0, 38.0, 51.0, 91.0, 153.0, 149.0, 217.0, 303.0, 509.0, 1248.0, 37144.0, 4146563.0, 5472.0, 889.0, 446.0, 273.0, 188.0, 129.0, 120.0, 81.0, 55.0, 41.0, 24.0, 18.0, 4.0, 10.0, 6.0, 2.0, 3.0], "bins": [-192.75, -188.58984375, -184.4296875, -180.26953125, -176.109375, -171.94921875, -167.7890625, -163.62890625, -159.46875, -155.30859375, -151.1484375, -146.98828125, -142.828125, -138.66796875, -134.5078125, -130.34765625, -126.1875, -122.02734375, -117.8671875, -113.70703125, -109.546875, -105.38671875, -101.2265625, -97.06640625, -92.90625, -88.74609375, -84.5859375, -80.42578125, -76.265625, -72.10546875, -67.9453125, -63.78515625, -59.625, -55.46484375, -51.3046875, -47.14453125, -42.984375, -38.82421875, -34.6640625, -30.50390625, -26.34375, -22.18359375, -18.0234375, -13.86328125, -9.703125, -5.54296875, -1.3828125, 2.77734375, 6.9375, 11.09765625, 15.2578125, 19.41796875, 23.578125, 27.73828125, 31.8984375, 36.05859375, 40.21875, 44.37890625, 48.5390625, 52.69921875, 56.859375, 61.01953125, 65.1796875, 69.33984375, 73.5]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 919.0, 94.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-629.6895141601562, -600.6205444335938, -571.5516357421875, -542.482666015625, -513.4137573242188, -484.34478759765625, -455.2758483886719, -426.2069091796875, -397.1379699707031, -368.06903076171875, -339.0000915527344, -309.93115234375, -280.8621826171875, -251.7932586669922, -222.72430419921875, -193.65536499023438, -164.58642578125, -135.51748657226562, -106.44853973388672, -77.37959289550781, -48.31065368652344, -19.241714477539062, 9.827239990234375, 38.89617919921875, 67.96511840820312, 97.0340576171875, 126.1030044555664, 155.1719512939453, 184.2408905029297, 213.30982971191406, 242.3787841796875, 271.4477233886719, 300.5166015625, 329.5855407714844, 358.65447998046875, 387.72344970703125, 416.7923583984375, 445.861328125, 474.9302673339844, 503.99920654296875, 533.068115234375, 562.1370849609375, 591.2059936523438, 620.2749633789062, 649.3438720703125, 678.412841796875, 707.4818115234375, 736.5507202148438, 765.6196899414062, 794.6886596679688, 823.757568359375, 852.8265380859375, 881.8954467773438, 910.9644165039062, 940.0333251953125, 969.102294921875, 998.1712646484375, 1027.240234375, 1056.3092041015625, 1085.3780517578125, 1114.447021484375, 1143.5159912109375, 1172.5849609375, 1201.65380859375, 1230.7227783203125]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 3.0, 7.0, 5.0, 6.0, 13.0, 14.0, 13.0, 23.0, 19.0, 29.0, 22.0, 25.0, 40.0, 41.0, 35.0, 51.0, 51.0, 47.0, 48.0, 51.0, 42.0, 33.0, 52.0, 41.0, 44.0, 35.0, 35.0, 23.0, 26.0, 23.0, 21.0, 11.0, 15.0, 15.0, 8.0, 6.0, 4.0, 3.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-80.765380859375, -78.41329193115234, -76.06121063232422, -73.70912170410156, -71.35704040527344, -69.00495147705078, -66.65286254882812, -64.30078125, -61.948692321777344, -59.59660720825195, -57.24452209472656, -54.892433166503906, -52.540348052978516, -50.188262939453125, -47.83617401123047, -45.48408889770508, -43.13200378417969, -40.7799186706543, -38.427833557128906, -36.07574462890625, -33.72365951538086, -31.37157440185547, -29.019487380981445, -26.667400360107422, -24.31531524658203, -21.96323013305664, -19.611143112182617, -17.259056091308594, -14.906970977783203, -12.554884910583496, -10.202798843383789, -7.850711822509766, -5.498634338378906, -3.146548271179199, -0.7944622039794922, 1.5576238632202148, 3.909709930419922, 6.261795997619629, 8.613882064819336, 10.96596908569336, 13.31805419921875, 15.670140266418457, 18.022226333618164, 20.374313354492188, 22.726398468017578, 25.07848358154297, 27.430570602416992, 29.782657623291016, 32.134742736816406, 34.4868278503418, 36.83891296386719, 39.191001892089844, 41.543087005615234, 43.895172119140625, 46.24726104736328, 48.59934616088867, 50.95143127441406, 53.30351638793945, 55.655601501464844, 58.0076904296875, 60.35977554321289, 62.71186065673828, 65.06394958496094, 67.41603088378906, 69.76811981201172]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 0.0, 2.0, 4.0, 7.0, 17.0, 14.0, 10.0, 14.0, 15.0, 18.0, 23.0, 22.0, 28.0, 26.0, 38.0, 38.0, 25.0, 31.0, 40.0, 45.0, 36.0, 43.0, 35.0, 49.0, 36.0, 42.0, 31.0, 40.0, 11.0, 37.0, 38.0, 29.0, 25.0, 14.0, 15.0, 14.0, 19.0, 8.0, 9.0, 9.0, 13.0, 5.0, 4.0, 5.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-11.3125, -10.970458984375, -10.62841796875, -10.286376953125, -9.9443359375, -9.602294921875, -9.26025390625, -8.918212890625, -8.576171875, -8.234130859375, -7.89208984375, -7.550048828125, -7.2080078125, -6.865966796875, -6.52392578125, -6.181884765625, -5.83984375, -5.497802734375, -5.15576171875, -4.813720703125, -4.4716796875, -4.129638671875, -3.78759765625, -3.445556640625, -3.103515625, -2.761474609375, -2.41943359375, -2.077392578125, -1.7353515625, -1.393310546875, -1.05126953125, -0.709228515625, -0.3671875, -0.025146484375, 0.31689453125, 0.658935546875, 1.0009765625, 1.343017578125, 1.68505859375, 2.027099609375, 2.369140625, 2.711181640625, 3.05322265625, 3.395263671875, 3.7373046875, 4.079345703125, 4.42138671875, 4.763427734375, 5.10546875, 5.447509765625, 5.78955078125, 6.131591796875, 6.4736328125, 6.815673828125, 7.15771484375, 7.499755859375, 7.841796875, 8.183837890625, 8.52587890625, 8.867919921875, 9.2099609375, 9.552001953125, 9.89404296875, 10.236083984375, 10.578125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 4.0, 8.0, 8.0, 19.0, 25.0, 54.0, 69.0, 78.0, 101.0, 164.0, 279.0, 317.0, 404.0, 641.0, 960.0, 1288.0, 1845.0, 2593.0, 3776.0, 5178.0, 7642.0, 11025.0, 16213.0, 24786.0, 37541.0, 58603.0, 100827.0, 236228.0, 254693.0, 104379.0, 61047.0, 38455.0, 25122.0, 16952.0, 11239.0, 7674.0, 5385.0, 3675.0, 2723.0, 1896.0, 1328.0, 1010.0, 672.0, 503.0, 350.0, 260.0, 160.0, 105.0, 78.0, 66.0, 39.0, 27.0, 16.0, 9.0, 8.0, 6.0, 3.0, 3.0, 4.0, 0.0, 2.0], "bins": [-1.939453125, -1.876953125, -1.814453125, -1.751953125, -1.689453125, -1.626953125, -1.564453125, -1.501953125, -1.439453125, -1.376953125, -1.314453125, -1.251953125, -1.189453125, -1.126953125, -1.064453125, -1.001953125, -0.939453125, -0.876953125, -0.814453125, -0.751953125, -0.689453125, -0.626953125, -0.564453125, -0.501953125, -0.439453125, -0.376953125, -0.314453125, -0.251953125, -0.189453125, -0.126953125, -0.064453125, -0.001953125, 0.060546875, 0.123046875, 0.185546875, 0.248046875, 0.310546875, 0.373046875, 0.435546875, 0.498046875, 0.560546875, 0.623046875, 0.685546875, 0.748046875, 0.810546875, 0.873046875, 0.935546875, 0.998046875, 1.060546875, 1.123046875, 1.185546875, 1.248046875, 1.310546875, 1.373046875, 1.435546875, 1.498046875, 1.560546875, 1.623046875, 1.685546875, 1.748046875, 1.810546875, 1.873046875, 1.935546875, 1.998046875, 2.060546875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 2.0, 5.0, 9.0, 10.0, 6.0, 21.0, 25.0, 19.0, 22.0, 23.0, 28.0, 34.0, 33.0, 41.0, 36.0, 36.0, 48.0, 52.0, 1076.0, 46.0, 35.0, 42.0, 34.0, 42.0, 29.0, 45.0, 25.0, 31.0, 22.0, 26.0, 20.0, 23.0, 22.0, 13.0, 12.0, 8.0, 2.0, 8.0, 0.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.8828125, -8.62664794921875, -8.3704833984375, -8.11431884765625, -7.858154296875, -7.60198974609375, -7.3458251953125, -7.08966064453125, -6.83349609375, -6.57733154296875, -6.3211669921875, -6.06500244140625, -5.808837890625, -5.55267333984375, -5.2965087890625, -5.04034423828125, -4.7841796875, -4.52801513671875, -4.2718505859375, -4.01568603515625, -3.759521484375, -3.50335693359375, -3.2471923828125, -2.99102783203125, -2.73486328125, -2.47869873046875, -2.2225341796875, -1.96636962890625, -1.710205078125, -1.45404052734375, -1.1978759765625, -0.94171142578125, -0.685546875, -0.42938232421875, -0.1732177734375, 0.08294677734375, 0.339111328125, 0.59527587890625, 0.8514404296875, 1.10760498046875, 1.36376953125, 1.61993408203125, 1.8760986328125, 2.13226318359375, 2.388427734375, 2.64459228515625, 2.9007568359375, 3.15692138671875, 3.4130859375, 3.66925048828125, 3.9254150390625, 4.18157958984375, 4.437744140625, 4.69390869140625, 4.9500732421875, 5.20623779296875, 5.46240234375, 5.71856689453125, 5.9747314453125, 6.23089599609375, 6.487060546875, 6.74322509765625, 6.9993896484375, 7.25555419921875, 7.51171875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 6.0, 9.0, 16.0, 15.0, 29.0, 54.0, 52.0, 87.0, 142.0, 184.0, 337.0, 499.0, 818.0, 1104.0, 1850.0, 2882.0, 4843.0, 7793.0, 12762.0, 20211.0, 33655.0, 56386.0, 103280.0, 1213296.0, 391581.0, 102822.0, 56142.0, 33417.0, 20209.0, 12471.0, 7601.0, 4641.0, 2830.0, 1786.0, 1123.0, 749.0, 486.0, 336.0, 206.0, 125.0, 89.0, 68.0, 51.0, 28.0, 17.0, 11.0, 11.0, 11.0, 5.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.369140625, -2.2901611328125, -2.211181640625, -2.1322021484375, -2.05322265625, -1.9742431640625, -1.895263671875, -1.8162841796875, -1.7373046875, -1.6583251953125, -1.579345703125, -1.5003662109375, -1.42138671875, -1.3424072265625, -1.263427734375, -1.1844482421875, -1.10546875, -1.0264892578125, -0.947509765625, -0.8685302734375, -0.78955078125, -0.7105712890625, -0.631591796875, -0.5526123046875, -0.4736328125, -0.3946533203125, -0.315673828125, -0.2366943359375, -0.15771484375, -0.0787353515625, 0.000244140625, 0.0792236328125, 0.158203125, 0.2371826171875, 0.316162109375, 0.3951416015625, 0.47412109375, 0.5531005859375, 0.632080078125, 0.7110595703125, 0.7900390625, 0.8690185546875, 0.947998046875, 1.0269775390625, 1.10595703125, 1.1849365234375, 1.263916015625, 1.3428955078125, 1.421875, 1.5008544921875, 1.579833984375, 1.6588134765625, 1.73779296875, 1.8167724609375, 1.895751953125, 1.9747314453125, 2.0537109375, 2.1326904296875, 2.211669921875, 2.2906494140625, 2.36962890625, 2.4486083984375, 2.527587890625, 2.6065673828125, 2.685546875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 7.0, 10.0, 16.0, 18.0, 24.0, 21.0, 44.0, 46.0, 46.0, 50.0, 63.0, 78.0, 85.0, 72.0, 76.0, 75.0, 62.0, 49.0, 34.0, 29.0, 23.0, 15.0, 12.0, 9.0, 11.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013637542724609375, -0.0013212859630584717, -0.0012788176536560059, -0.00123634934425354, -0.0011938810348510742, -0.0011514127254486084, -0.0011089444160461426, -0.0010664761066436768, -0.001024007797241211, -0.0009815394878387451, -0.0009390711784362793, -0.0008966028690338135, -0.0008541345596313477, -0.0008116662502288818, -0.000769197940826416, -0.0007267296314239502, -0.0006842613220214844, -0.0006417930126190186, -0.0005993247032165527, -0.0005568563938140869, -0.0005143880844116211, -0.0004719197750091553, -0.00042945146560668945, -0.00038698315620422363, -0.0003445148468017578, -0.000302046537399292, -0.00025957822799682617, -0.00021710991859436035, -0.00017464160919189453, -0.0001321732997894287, -8.970499038696289e-05, -4.723668098449707e-05, -4.76837158203125e-06, 3.769993782043457e-05, 8.016824722290039e-05, 0.0001226365566253662, 0.00016510486602783203, 0.00020757317543029785, 0.00025004148483276367, 0.0002925097942352295, 0.0003349781036376953, 0.00037744641304016113, 0.00041991472244262695, 0.0004623830318450928, 0.0005048513412475586, 0.0005473196506500244, 0.0005897879600524902, 0.0006322562694549561, 0.0006747245788574219, 0.0007171928882598877, 0.0007596611976623535, 0.0008021295070648193, 0.0008445978164672852, 0.000887066125869751, 0.0009295344352722168, 0.0009720027446746826, 0.0010144710540771484, 0.0010569393634796143, 0.00109940767288208, 0.001141875982284546, 0.0011843442916870117, 0.0012268126010894775, 0.0012692809104919434, 0.0013117492198944092, 0.001354217529296875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 5.0, 6.0, 12.0, 10.0, 11.0, 22.0, 20.0, 37.0, 29.0, 66.0, 70.0, 124.0, 186.0, 409.0, 2424.0, 1033775.0, 9945.0, 597.0, 266.0, 139.0, 90.0, 73.0, 59.0, 42.0, 23.0, 20.0, 25.0, 19.0, 18.0, 6.0, 7.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.031280517578125, -0.030402660369873047, -0.029524803161621094, -0.02864694595336914, -0.027769088745117188, -0.026891231536865234, -0.02601337432861328, -0.025135517120361328, -0.024257659912109375, -0.023379802703857422, -0.02250194549560547, -0.021624088287353516, -0.020746231079101562, -0.01986837387084961, -0.018990516662597656, -0.018112659454345703, -0.01723480224609375, -0.016356945037841797, -0.015479087829589844, -0.01460123062133789, -0.013723373413085938, -0.012845516204833984, -0.011967658996582031, -0.011089801788330078, -0.010211944580078125, -0.009334087371826172, -0.008456230163574219, -0.007578372955322266, -0.0067005157470703125, -0.005822658538818359, -0.004944801330566406, -0.004066944122314453, -0.0031890869140625, -0.002311229705810547, -0.0014333724975585938, -0.0005555152893066406, 0.0003223419189453125, 0.0012001991271972656, 0.0020780563354492188, 0.002955913543701172, 0.003833770751953125, 0.004711627960205078, 0.005589485168457031, 0.006467342376708984, 0.0073451995849609375, 0.00822305679321289, 0.009100914001464844, 0.009978771209716797, 0.01085662841796875, 0.011734485626220703, 0.012612342834472656, 0.01349020004272461, 0.014368057250976562, 0.015245914459228516, 0.01612377166748047, 0.017001628875732422, 0.017879486083984375, 0.018757343292236328, 0.01963520050048828, 0.020513057708740234, 0.021390914916992188, 0.02226877212524414, 0.023146629333496094, 0.024024486541748047, 0.02490234375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 16.0, 293.0, 606.0, 93.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002163088647648692, -0.0020445517729967833, -0.0019260148983448744, -0.0018074781401082873, -0.0016889412654563785, -0.0015704043908044696, -0.0014518676325678825, -0.0013333307579159737, -0.0012147938832640648, -0.001096257008612156, -0.000977720133960247, -0.00085918337572366, -0.0007406465010717511, -0.0006221096264198422, -0.0005035728099755943, -0.0003850359935313463, -0.00026649911887943745, -0.00014796227333135903, -2.942542778328061e-05, 8.91114177647978e-05, 0.00020764826331287622, 0.0003261851379647851, 0.00044472195440903306, 0.000563258770853281, 0.0006817956455051899, 0.0008003325201570988, 0.0009188693366013467, 0.0010374061530455947, 0.0011559430276975036, 0.0012744799023494124, 0.0013930166605859995, 0.0015115535352379084, 0.0016300901770591736, 0.0017486270517110825, 0.0018671639263629913, 0.0019857008010149, 0.002104237675666809, 0.002222774550318718, 0.002341311192139983, 0.002459848066791892, 0.002578384941443801, 0.00269692181609571, 0.0028154586907476187, 0.0029339955653995275, 0.0030525322072207928, 0.0031710690818727016, 0.0032896059565246105, 0.0034081428311765194, 0.0035266797058284283, 0.003645216580480337, 0.003763753455132246, 0.003882290329784155, 0.004000827204436064, 0.004119364079087973, 0.0042379009537398815, 0.004356437362730503, 0.004474974237382412, 0.004593511112034321, 0.00471204798668623, 0.004830584861338139, 0.0049491217359900475, 0.005067658610641956, 0.005186195485293865, 0.005304732359945774, 0.005423269234597683]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 3.0, 5.0, 5.0, 8.0, 5.0, 10.0, 13.0, 14.0, 17.0, 11.0, 23.0, 22.0, 23.0, 21.0, 23.0, 30.0, 31.0, 53.0, 35.0, 32.0, 41.0, 44.0, 43.0, 23.0, 37.0, 41.0, 41.0, 48.0, 31.0, 31.0, 29.0, 20.0, 20.0, 27.0, 21.0, 11.0, 18.0, 13.0, 8.0, 18.0, 13.0, 9.0, 4.0, 4.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0005220770835876465, -0.0005059316754341125, -0.0004897862672805786, -0.0004736408591270447, -0.00045749545097351074, -0.0004413500428199768, -0.00042520463466644287, -0.00040905922651290894, -0.000392913818359375, -0.00037676841020584106, -0.00036062300205230713, -0.0003444775938987732, -0.00032833218574523926, -0.0003121867775917053, -0.0002960413694381714, -0.00027989596128463745, -0.0002637505531311035, -0.0002476051449775696, -0.00023145973682403564, -0.0002153143286705017, -0.00019916892051696777, -0.00018302351236343384, -0.0001668781042098999, -0.00015073269605636597, -0.00013458728790283203, -0.0001184418797492981, -0.00010229647159576416, -8.615106344223022e-05, -7.000565528869629e-05, -5.3860247135162354e-05, -3.771483898162842e-05, -2.1569430828094482e-05, -5.424022674560547e-06, 1.0721385478973389e-05, 2.6866793632507324e-05, 4.301220178604126e-05, 5.9157609939575195e-05, 7.530301809310913e-05, 9.144842624664307e-05, 0.000107593834400177, 0.00012373924255371094, 0.00013988465070724487, 0.0001560300588607788, 0.00017217546701431274, 0.00018832087516784668, 0.00020446628332138062, 0.00022061169147491455, 0.00023675709962844849, 0.0002529025077819824, 0.00026904791593551636, 0.0002851933240890503, 0.00030133873224258423, 0.00031748414039611816, 0.0003336295485496521, 0.00034977495670318604, 0.00036592036485671997, 0.0003820657730102539, 0.00039821118116378784, 0.0004143565893173218, 0.0004305019974708557, 0.00044664740562438965, 0.0004627928137779236, 0.0004789382219314575, 0.0004950836300849915, 0.0005112290382385254]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 0.0, 2.0, 4.0, 7.0, 17.0, 14.0, 10.0, 14.0, 15.0, 18.0, 23.0, 22.0, 28.0, 26.0, 38.0, 38.0, 25.0, 31.0, 40.0, 45.0, 36.0, 43.0, 35.0, 49.0, 36.0, 42.0, 31.0, 40.0, 11.0, 37.0, 38.0, 29.0, 25.0, 14.0, 15.0, 14.0, 19.0, 8.0, 9.0, 9.0, 13.0, 5.0, 4.0, 5.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-11.3125, -10.970458984375, -10.62841796875, -10.286376953125, -9.9443359375, -9.602294921875, -9.26025390625, -8.918212890625, -8.576171875, -8.234130859375, -7.89208984375, -7.550048828125, -7.2080078125, -6.865966796875, -6.52392578125, -6.181884765625, -5.83984375, -5.497802734375, -5.15576171875, -4.813720703125, -4.4716796875, -4.129638671875, -3.78759765625, -3.445556640625, -3.103515625, -2.761474609375, -2.41943359375, -2.077392578125, -1.7353515625, -1.393310546875, -1.05126953125, -0.709228515625, -0.3671875, -0.025146484375, 0.31689453125, 0.658935546875, 1.0009765625, 1.343017578125, 1.68505859375, 2.027099609375, 2.369140625, 2.711181640625, 3.05322265625, 3.395263671875, 3.7373046875, 4.079345703125, 4.42138671875, 4.763427734375, 5.10546875, 5.447509765625, 5.78955078125, 6.131591796875, 6.4736328125, 6.815673828125, 7.15771484375, 7.499755859375, 7.841796875, 8.183837890625, 8.52587890625, 8.867919921875, 9.2099609375, 9.552001953125, 9.89404296875, 10.236083984375, 10.578125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 1.0, 6.0, 5.0, 6.0, 11.0, 8.0, 13.0, 24.0, 29.0, 40.0, 53.0, 66.0, 109.0, 177.0, 315.0, 556.0, 1079.0, 2375.0, 5026.0, 12157.0, 30827.0, 87100.0, 270066.0, 406933.0, 148277.0, 50240.0, 18710.0, 7692.0, 3352.0, 1516.0, 727.0, 385.0, 222.0, 130.0, 88.0, 62.0, 39.0, 28.0, 23.0, 21.0, 18.0, 14.0, 9.0, 8.0, 9.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.375, -10.0628662109375, -9.750732421875, -9.4385986328125, -9.12646484375, -8.8143310546875, -8.502197265625, -8.1900634765625, -7.8779296875, -7.5657958984375, -7.253662109375, -6.9415283203125, -6.62939453125, -6.3172607421875, -6.005126953125, -5.6929931640625, -5.380859375, -5.0687255859375, -4.756591796875, -4.4444580078125, -4.13232421875, -3.8201904296875, -3.508056640625, -3.1959228515625, -2.8837890625, -2.5716552734375, -2.259521484375, -1.9473876953125, -1.63525390625, -1.3231201171875, -1.010986328125, -0.6988525390625, -0.38671875, -0.0745849609375, 0.237548828125, 0.5496826171875, 0.86181640625, 1.1739501953125, 1.486083984375, 1.7982177734375, 2.1103515625, 2.4224853515625, 2.734619140625, 3.0467529296875, 3.35888671875, 3.6710205078125, 3.983154296875, 4.2952880859375, 4.607421875, 4.9195556640625, 5.231689453125, 5.5438232421875, 5.85595703125, 6.1680908203125, 6.480224609375, 6.7923583984375, 7.1044921875, 7.4166259765625, 7.728759765625, 8.0408935546875, 8.35302734375, 8.6651611328125, 8.977294921875, 9.2894287109375, 9.6015625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 2.0, 6.0, 5.0, 10.0, 16.0, 8.0, 8.0, 21.0, 21.0, 23.0, 32.0, 28.0, 47.0, 45.0, 69.0, 58.0, 95.0, 1677.0, 426.0, 68.0, 61.0, 55.0, 44.0, 31.0, 28.0, 28.0, 25.0, 25.0, 14.0, 16.0, 16.0, 13.0, 11.0, 3.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.59375, -52.09912109375, -50.6044921875, -49.10986328125, -47.615234375, -46.12060546875, -44.6259765625, -43.13134765625, -41.63671875, -40.14208984375, -38.6474609375, -37.15283203125, -35.658203125, -34.16357421875, -32.6689453125, -31.17431640625, -29.6796875, -28.18505859375, -26.6904296875, -25.19580078125, -23.701171875, -22.20654296875, -20.7119140625, -19.21728515625, -17.72265625, -16.22802734375, -14.7333984375, -13.23876953125, -11.744140625, -10.24951171875, -8.7548828125, -7.26025390625, -5.765625, -4.27099609375, -2.7763671875, -1.28173828125, 0.212890625, 1.70751953125, 3.2021484375, 4.69677734375, 6.19140625, 7.68603515625, 9.1806640625, 10.67529296875, 12.169921875, 13.66455078125, 15.1591796875, 16.65380859375, 18.1484375, 19.64306640625, 21.1376953125, 22.63232421875, 24.126953125, 25.62158203125, 27.1162109375, 28.61083984375, 30.10546875, 31.60009765625, 33.0947265625, 34.58935546875, 36.083984375, 37.57861328125, 39.0732421875, 40.56787109375, 42.0625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 6.0, 8.0, 16.0, 21.0, 15.0, 23.0, 38.0, 41.0, 79.0, 98.0, 91.0, 126.0, 242.0, 415.0, 1156.0, 59207.0, 3076920.0, 5456.0, 728.0, 296.0, 189.0, 138.0, 108.0, 74.0, 54.0, 33.0, 32.0, 21.0, 12.0, 16.0, 13.0, 5.0, 9.0, 4.0, 8.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.625, -66.2001953125, -63.775390625, -61.3505859375, -58.92578125, -56.5009765625, -54.076171875, -51.6513671875, -49.2265625, -46.8017578125, -44.376953125, -41.9521484375, -39.52734375, -37.1025390625, -34.677734375, -32.2529296875, -29.828125, -27.4033203125, -24.978515625, -22.5537109375, -20.12890625, -17.7041015625, -15.279296875, -12.8544921875, -10.4296875, -8.0048828125, -5.580078125, -3.1552734375, -0.73046875, 1.6943359375, 4.119140625, 6.5439453125, 8.96875, 11.3935546875, 13.818359375, 16.2431640625, 18.66796875, 21.0927734375, 23.517578125, 25.9423828125, 28.3671875, 30.7919921875, 33.216796875, 35.6416015625, 38.06640625, 40.4912109375, 42.916015625, 45.3408203125, 47.765625, 50.1904296875, 52.615234375, 55.0400390625, 57.46484375, 59.8896484375, 62.314453125, 64.7392578125, 67.1640625, 69.5888671875, 72.013671875, 74.4384765625, 76.86328125, 79.2880859375, 81.712890625, 84.1376953125, 86.5625]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 238.0, 773.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-577.455078125, -567.178466796875, -556.9019165039062, -546.6253662109375, -536.3487548828125, -526.0721435546875, -515.7955932617188, -505.5190124511719, -495.242431640625, -484.9658508300781, -474.68927001953125, -464.4126892089844, -454.1361083984375, -443.8595275878906, -433.58294677734375, -423.3063659667969, -413.02978515625, -402.7532043457031, -392.47662353515625, -382.2000427246094, -371.9234619140625, -361.6468811035156, -351.37030029296875, -341.0937194824219, -330.817138671875, -320.5405578613281, -310.26397705078125, -299.9873962402344, -289.7108154296875, -279.4342346191406, -269.15765380859375, -258.8810729980469, -248.6044921875, -238.32791137695312, -228.05133056640625, -217.77474975585938, -207.4981689453125, -197.22158813476562, -186.94500732421875, -176.66842651367188, -166.391845703125, -156.11526489257812, -145.83868408203125, -135.56210327148438, -125.2855224609375, -115.00894165039062, -104.73236083984375, -94.45578002929688, -84.17919158935547, -73.9026107788086, -63.62602996826172, -53.349449157714844, -43.07286834716797, -32.796287536621094, -22.51970672607422, -12.243125915527344, -1.9665451049804688, 8.310035705566406, 18.58661651611328, 28.863197326660156, 39.13977813720703, 49.416358947753906, 59.69293975830078, 69.96952056884766, 80.24610137939453]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 6.0, 2.0, 6.0, 4.0, 8.0, 17.0, 16.0, 9.0, 26.0, 28.0, 17.0, 34.0, 35.0, 35.0, 37.0, 48.0, 35.0, 46.0, 50.0, 55.0, 56.0, 52.0, 38.0, 45.0, 44.0, 19.0, 34.0, 34.0, 38.0, 24.0, 27.0, 15.0, 14.0, 11.0, 7.0, 6.0, 11.0, 4.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.9784698486328, -130.09603881835938, -126.21360778808594, -122.3311767578125, -118.44874572753906, -114.56631469726562, -110.68389129638672, -106.80146026611328, -102.91902923583984, -99.0365982055664, -95.15416717529297, -91.27173614501953, -87.38931274414062, -83.50688171386719, -79.62445068359375, -75.74201965332031, -71.85958862304688, -67.97715759277344, -64.0947265625, -60.21229934692383, -56.32986831665039, -52.44743728637695, -48.56501007080078, -44.682579040527344, -40.800148010253906, -36.91771697998047, -33.03528594970703, -29.15285873413086, -25.270427703857422, -21.387996673583984, -17.50556755065918, -13.623138427734375, -9.740715026855469, -5.858284950256348, -1.9758548736572266, 1.9065752029418945, 5.789005279541016, 9.671436309814453, 13.553865432739258, 17.436294555664062, 21.3187255859375, 25.201156616210938, 29.083585739135742, 32.96601486206055, 36.848445892333984, 40.73087692260742, 44.613304138183594, 48.49573516845703, 52.37816619873047, 56.260597229003906, 60.143028259277344, 64.02545928955078, 67.90788269042969, 71.79031372070312, 75.67274475097656, 79.55517578125, 83.43760681152344, 87.32003784179688, 91.20246887207031, 95.08489990234375, 98.96733093261719, 102.84976196289062, 106.73218536376953, 110.61461639404297, 114.4970474243164]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 1.0, 5.0, 12.0, 5.0, 7.0, 20.0, 16.0, 18.0, 24.0, 19.0, 21.0, 32.0, 29.0, 37.0, 33.0, 32.0, 35.0, 45.0, 46.0, 40.0, 47.0, 35.0, 42.0, 41.0, 41.0, 40.0, 32.0, 24.0, 28.0, 35.0, 21.0, 13.0, 21.0, 17.0, 18.0, 16.0, 7.0, 5.0, 10.0, 9.0, 4.0, 5.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-12.0, -11.6309814453125, -11.261962890625, -10.8929443359375, -10.52392578125, -10.1549072265625, -9.785888671875, -9.4168701171875, -9.0478515625, -8.6788330078125, -8.309814453125, -7.9407958984375, -7.57177734375, -7.2027587890625, -6.833740234375, -6.4647216796875, -6.095703125, -5.7266845703125, -5.357666015625, -4.9886474609375, -4.61962890625, -4.2506103515625, -3.881591796875, -3.5125732421875, -3.1435546875, -2.7745361328125, -2.405517578125, -2.0364990234375, -1.66748046875, -1.2984619140625, -0.929443359375, -0.5604248046875, -0.19140625, 0.1776123046875, 0.546630859375, 0.9156494140625, 1.28466796875, 1.6536865234375, 2.022705078125, 2.3917236328125, 2.7607421875, 3.1297607421875, 3.498779296875, 3.8677978515625, 4.23681640625, 4.6058349609375, 4.974853515625, 5.3438720703125, 5.712890625, 6.0819091796875, 6.450927734375, 6.8199462890625, 7.18896484375, 7.5579833984375, 7.927001953125, 8.2960205078125, 8.6650390625, 9.0340576171875, 9.403076171875, 9.7720947265625, 10.14111328125, 10.5101318359375, 10.879150390625, 11.2481689453125, 11.6171875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 7.0, 6.0, 11.0, 17.0, 13.0, 10.0, 16.0, 28.0, 33.0, 37.0, 50.0, 57.0, 66.0, 121.0, 168.0, 381.0, 1312.0, 14974.0, 1863339.0, 2292811.0, 18259.0, 1486.0, 432.0, 150.0, 95.0, 87.0, 49.0, 49.0, 29.0, 36.0, 26.0, 23.0, 14.0, 15.0, 21.0, 2.0, 11.0, 6.0, 9.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-48.46875, -47.04443359375, -45.6201171875, -44.19580078125, -42.771484375, -41.34716796875, -39.9228515625, -38.49853515625, -37.07421875, -35.64990234375, -34.2255859375, -32.80126953125, -31.376953125, -29.95263671875, -28.5283203125, -27.10400390625, -25.6796875, -24.25537109375, -22.8310546875, -21.40673828125, -19.982421875, -18.55810546875, -17.1337890625, -15.70947265625, -14.28515625, -12.86083984375, -11.4365234375, -10.01220703125, -8.587890625, -7.16357421875, -5.7392578125, -4.31494140625, -2.890625, -1.46630859375, -0.0419921875, 1.38232421875, 2.806640625, 4.23095703125, 5.6552734375, 7.07958984375, 8.50390625, 9.92822265625, 11.3525390625, 12.77685546875, 14.201171875, 15.62548828125, 17.0498046875, 18.47412109375, 19.8984375, 21.32275390625, 22.7470703125, 24.17138671875, 25.595703125, 27.02001953125, 28.4443359375, 29.86865234375, 31.29296875, 32.71728515625, 34.1416015625, 35.56591796875, 36.990234375, 38.41455078125, 39.8388671875, 41.26318359375, 42.6875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 14.0, 11.0, 16.0, 19.0, 31.0, 29.0, 40.0, 44.0, 62.0, 75.0, 111.0, 124.0, 182.0, 212.0, 318.0, 388.0, 458.0, 436.0, 359.0, 252.0, 183.0, 170.0, 98.0, 97.0, 75.0, 55.0, 42.0, 32.0, 27.0, 24.0, 18.0, 15.0, 7.0, 12.0, 5.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-16.046875, -15.54052734375, -15.0341796875, -14.52783203125, -14.021484375, -13.51513671875, -13.0087890625, -12.50244140625, -11.99609375, -11.48974609375, -10.9833984375, -10.47705078125, -9.970703125, -9.46435546875, -8.9580078125, -8.45166015625, -7.9453125, -7.43896484375, -6.9326171875, -6.42626953125, -5.919921875, -5.41357421875, -4.9072265625, -4.40087890625, -3.89453125, -3.38818359375, -2.8818359375, -2.37548828125, -1.869140625, -1.36279296875, -0.8564453125, -0.35009765625, 0.15625, 0.66259765625, 1.1689453125, 1.67529296875, 2.181640625, 2.68798828125, 3.1943359375, 3.70068359375, 4.20703125, 4.71337890625, 5.2197265625, 5.72607421875, 6.232421875, 6.73876953125, 7.2451171875, 7.75146484375, 8.2578125, 8.76416015625, 9.2705078125, 9.77685546875, 10.283203125, 10.78955078125, 11.2958984375, 11.80224609375, 12.30859375, 12.81494140625, 13.3212890625, 13.82763671875, 14.333984375, 14.84033203125, 15.3466796875, 15.85302734375, 16.359375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 4.0, 9.0, 12.0, 13.0, 11.0, 17.0, 15.0, 32.0, 25.0, 50.0, 72.0, 65.0, 93.0, 88.0, 153.0, 221.0, 278.0, 477.0, 1382.0, 100097.0, 4078125.0, 10900.0, 732.0, 349.0, 218.0, 161.0, 132.0, 117.0, 104.0, 73.0, 52.0, 40.0, 37.0, 23.0, 21.0, 18.0, 18.0, 11.0, 7.0, 4.0, 10.0, 3.0, 2.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.0, -95.734375, -92.46875, -89.203125, -85.9375, -82.671875, -79.40625, -76.140625, -72.875, -69.609375, -66.34375, -63.078125, -59.8125, -56.546875, -53.28125, -50.015625, -46.75, -43.484375, -40.21875, -36.953125, -33.6875, -30.421875, -27.15625, -23.890625, -20.625, -17.359375, -14.09375, -10.828125, -7.5625, -4.296875, -1.03125, 2.234375, 5.5, 8.765625, 12.03125, 15.296875, 18.5625, 21.828125, 25.09375, 28.359375, 31.625, 34.890625, 38.15625, 41.421875, 44.6875, 47.953125, 51.21875, 54.484375, 57.75, 61.015625, 64.28125, 67.546875, 70.8125, 74.078125, 77.34375, 80.609375, 83.875, 87.140625, 90.40625, 93.671875, 96.9375, 100.203125, 103.46875, 106.734375, 110.0]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 13.0, 765.0, 236.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-816.59521484375, -797.9414672851562, -779.2877197265625, -760.6339721679688, -741.980224609375, -723.3264770507812, -704.6727294921875, -686.0189819335938, -667.365234375, -648.7114868164062, -630.0577392578125, -611.4039916992188, -592.750244140625, -574.0964965820312, -555.4427490234375, -536.7890014648438, -518.13525390625, -499.48150634765625, -480.8277587890625, -462.17401123046875, -443.520263671875, -424.86651611328125, -406.2127685546875, -387.55902099609375, -368.9052734375, -350.25152587890625, -331.5977783203125, -312.94403076171875, -294.290283203125, -275.63653564453125, -256.9827880859375, -238.32904052734375, -219.67523193359375, -201.021484375, -182.36773681640625, -163.7139892578125, -145.06024169921875, -126.406494140625, -107.75274658203125, -89.0989990234375, -70.44525146484375, -51.79150390625, -33.13775634765625, -14.4840087890625, 4.16973876953125, 22.823486328125, 41.47723388671875, 60.1309814453125, 78.78472900390625, 97.4384765625, 116.09222412109375, 134.7459716796875, 153.39971923828125, 172.053466796875, 190.70721435546875, 209.3609619140625, 228.01470947265625, 246.66845703125, 265.32220458984375, 283.9759521484375, 302.62969970703125, 321.283447265625, 339.93719482421875, 358.5909423828125, 377.24468994140625]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 7.0, 2.0, 2.0, 8.0, 6.0, 15.0, 15.0, 15.0, 17.0, 19.0, 24.0, 18.0, 22.0, 35.0, 29.0, 33.0, 27.0, 30.0, 42.0, 33.0, 45.0, 40.0, 41.0, 28.0, 50.0, 39.0, 38.0, 41.0, 34.0, 30.0, 26.0, 23.0, 30.0, 17.0, 24.0, 27.0, 14.0, 13.0, 7.0, 5.0, 10.0, 6.0, 4.0, 3.0, 5.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-61.996986389160156, -59.94422149658203, -57.89146041870117, -55.83869552612305, -53.78593444824219, -51.73316955566406, -49.68040466308594, -47.62763977050781, -45.57487869262695, -43.52211380004883, -41.46935272216797, -39.416587829589844, -37.36382293701172, -35.31106185913086, -33.258296966552734, -31.205533981323242, -29.15277099609375, -27.100008010864258, -25.047245025634766, -22.99448013305664, -20.94171714782715, -18.888954162597656, -16.83618927001953, -14.783426284790039, -12.730663299560547, -10.677900314331055, -8.625136375427246, -6.572372913360596, -4.519609451293945, -2.466846466064453, -0.41408252716064453, 1.638681411743164, 3.6914443969726562, 5.744207859039307, 7.796971321105957, 9.849735260009766, 11.902498245239258, 13.95526123046875, 16.008026123046875, 18.060789108276367, 20.11355209350586, 22.16631507873535, 24.219078063964844, 26.27184295654297, 28.32460594177246, 30.377368927001953, 32.43013381958008, 34.48289489746094, 36.53565979003906, 38.58842468261719, 40.64118576049805, 42.69395065307617, 44.74671173095703, 46.799476623535156, 48.85224151611328, 50.905006408691406, 52.957767486572266, 55.01053237915039, 57.06329345703125, 59.116058349609375, 61.1688232421875, 63.22158432006836, 65.27434539794922, 67.32711029052734, 69.37987518310547]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 7.0, 7.0, 12.0, 7.0, 11.0, 16.0, 16.0, 11.0, 20.0, 22.0, 23.0, 18.0, 37.0, 35.0, 35.0, 38.0, 40.0, 32.0, 37.0, 49.0, 37.0, 49.0, 36.0, 38.0, 31.0, 34.0, 33.0, 35.0, 26.0, 28.0, 25.0, 19.0, 27.0, 17.0, 14.0, 20.0, 9.0, 11.0, 9.0, 9.0, 5.0, 4.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.6484375, -11.29248046875, -10.9365234375, -10.58056640625, -10.224609375, -9.86865234375, -9.5126953125, -9.15673828125, -8.80078125, -8.44482421875, -8.0888671875, -7.73291015625, -7.376953125, -7.02099609375, -6.6650390625, -6.30908203125, -5.953125, -5.59716796875, -5.2412109375, -4.88525390625, -4.529296875, -4.17333984375, -3.8173828125, -3.46142578125, -3.10546875, -2.74951171875, -2.3935546875, -2.03759765625, -1.681640625, -1.32568359375, -0.9697265625, -0.61376953125, -0.2578125, 0.09814453125, 0.4541015625, 0.81005859375, 1.166015625, 1.52197265625, 1.8779296875, 2.23388671875, 2.58984375, 2.94580078125, 3.3017578125, 3.65771484375, 4.013671875, 4.36962890625, 4.7255859375, 5.08154296875, 5.4375, 5.79345703125, 6.1494140625, 6.50537109375, 6.861328125, 7.21728515625, 7.5732421875, 7.92919921875, 8.28515625, 8.64111328125, 8.9970703125, 9.35302734375, 9.708984375, 10.06494140625, 10.4208984375, 10.77685546875, 11.1328125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 7.0, 7.0, 5.0, 7.0, 12.0, 28.0, 37.0, 71.0, 64.0, 120.0, 175.0, 270.0, 405.0, 629.0, 954.0, 1473.0, 2278.0, 3495.0, 5524.0, 8903.0, 14192.0, 23367.0, 39098.0, 68347.0, 127959.0, 345019.0, 188257.0, 90010.0, 50286.0, 29638.0, 17837.0, 11012.0, 6829.0, 4314.0, 2778.0, 1785.0, 1169.0, 739.0, 491.0, 329.0, 230.0, 124.0, 101.0, 63.0, 46.0, 30.0, 17.0, 13.0, 11.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.62890625, -2.548583984375, -2.46826171875, -2.387939453125, -2.3076171875, -2.227294921875, -2.14697265625, -2.066650390625, -1.986328125, -1.906005859375, -1.82568359375, -1.745361328125, -1.6650390625, -1.584716796875, -1.50439453125, -1.424072265625, -1.34375, -1.263427734375, -1.18310546875, -1.102783203125, -1.0224609375, -0.942138671875, -0.86181640625, -0.781494140625, -0.701171875, -0.620849609375, -0.54052734375, -0.460205078125, -0.3798828125, -0.299560546875, -0.21923828125, -0.138916015625, -0.05859375, 0.021728515625, 0.10205078125, 0.182373046875, 0.2626953125, 0.343017578125, 0.42333984375, 0.503662109375, 0.583984375, 0.664306640625, 0.74462890625, 0.824951171875, 0.9052734375, 0.985595703125, 1.06591796875, 1.146240234375, 1.2265625, 1.306884765625, 1.38720703125, 1.467529296875, 1.5478515625, 1.628173828125, 1.70849609375, 1.788818359375, 1.869140625, 1.949462890625, 2.02978515625, 2.110107421875, 2.1904296875, 2.270751953125, 2.35107421875, 2.431396484375, 2.51171875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 4.0, 3.0, 8.0, 2.0, 4.0, 6.0, 11.0, 6.0, 10.0, 13.0, 14.0, 8.0, 16.0, 18.0, 27.0, 21.0, 30.0, 30.0, 30.0, 44.0, 39.0, 33.0, 31.0, 44.0, 32.0, 1058.0, 48.0, 33.0, 44.0, 32.0, 23.0, 23.0, 33.0, 33.0, 27.0, 23.0, 30.0, 12.0, 23.0, 20.0, 15.0, 20.0, 7.0, 10.0, 4.0, 4.0, 5.0, 3.0, 6.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-6.76953125, -6.56085205078125, -6.3521728515625, -6.14349365234375, -5.934814453125, -5.72613525390625, -5.5174560546875, -5.30877685546875, -5.10009765625, -4.89141845703125, -4.6827392578125, -4.47406005859375, -4.265380859375, -4.05670166015625, -3.8480224609375, -3.63934326171875, -3.4306640625, -3.22198486328125, -3.0133056640625, -2.80462646484375, -2.595947265625, -2.38726806640625, -2.1785888671875, -1.96990966796875, -1.76123046875, -1.55255126953125, -1.3438720703125, -1.13519287109375, -0.926513671875, -0.71783447265625, -0.5091552734375, -0.30047607421875, -0.091796875, 0.11688232421875, 0.3255615234375, 0.53424072265625, 0.742919921875, 0.95159912109375, 1.1602783203125, 1.36895751953125, 1.57763671875, 1.78631591796875, 1.9949951171875, 2.20367431640625, 2.412353515625, 2.62103271484375, 2.8297119140625, 3.03839111328125, 3.2470703125, 3.45574951171875, 3.6644287109375, 3.87310791015625, 4.081787109375, 4.29046630859375, 4.4991455078125, 4.70782470703125, 4.91650390625, 5.12518310546875, 5.3338623046875, 5.54254150390625, 5.751220703125, 5.95989990234375, 6.1685791015625, 6.37725830078125, 6.5859375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 10.0, 10.0, 7.0, 26.0, 32.0, 29.0, 46.0, 71.0, 91.0, 127.0, 194.0, 313.0, 457.0, 701.0, 907.0, 1398.0, 1940.0, 2844.0, 4216.0, 6351.0, 9311.0, 13652.0, 20728.0, 31632.0, 49666.0, 83351.0, 165927.0, 1366199.0, 134773.0, 72377.0, 44523.0, 28494.0, 18453.0, 12332.0, 7995.0, 5619.0, 3825.0, 2628.0, 1813.0, 1270.0, 865.0, 606.0, 391.0, 297.0, 200.0, 123.0, 92.0, 59.0, 43.0, 35.0, 36.0, 18.0, 12.0, 11.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.9736328125, -1.9107208251953125, -1.847808837890625, -1.7848968505859375, -1.72198486328125, -1.6590728759765625, -1.596160888671875, -1.5332489013671875, -1.4703369140625, -1.4074249267578125, -1.344512939453125, -1.2816009521484375, -1.21868896484375, -1.1557769775390625, -1.092864990234375, -1.0299530029296875, -0.967041015625, -0.9041290283203125, -0.841217041015625, -0.7783050537109375, -0.71539306640625, -0.6524810791015625, -0.589569091796875, -0.5266571044921875, -0.4637451171875, -0.4008331298828125, -0.337921142578125, -0.2750091552734375, -0.21209716796875, -0.1491851806640625, -0.086273193359375, -0.0233612060546875, 0.03955078125, 0.1024627685546875, 0.165374755859375, 0.2282867431640625, 0.29119873046875, 0.3541107177734375, 0.417022705078125, 0.4799346923828125, 0.5428466796875, 0.6057586669921875, 0.668670654296875, 0.7315826416015625, 0.79449462890625, 0.8574066162109375, 0.920318603515625, 0.9832305908203125, 1.046142578125, 1.1090545654296875, 1.171966552734375, 1.2348785400390625, 1.29779052734375, 1.3607025146484375, 1.423614501953125, 1.4865264892578125, 1.5494384765625, 1.6123504638671875, 1.675262451171875, 1.7381744384765625, 1.80108642578125, 1.8639984130859375, 1.926910400390625, 1.9898223876953125, 2.052734375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 5.0, 6.0, 13.0, 11.0, 17.0, 25.0, 24.0, 42.0, 44.0, 54.0, 82.0, 78.0, 88.0, 95.0, 71.0, 56.0, 65.0, 50.0, 39.0, 24.0, 29.0, 12.0, 10.0, 14.0, 4.0, 9.0, 9.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015087127685546875, -0.0014614611864089966, -0.0014142096042633057, -0.0013669580221176147, -0.0013197064399719238, -0.001272454857826233, -0.001225203275680542, -0.001177951693534851, -0.0011307001113891602, -0.0010834485292434692, -0.0010361969470977783, -0.0009889453649520874, -0.0009416937828063965, -0.0008944422006607056, -0.0008471906185150146, -0.0007999390363693237, -0.0007526874542236328, -0.0007054358720779419, -0.000658184289932251, -0.0006109327077865601, -0.0005636811256408691, -0.0005164295434951782, -0.0004691779613494873, -0.0004219263792037964, -0.00037467479705810547, -0.00032742321491241455, -0.00028017163276672363, -0.00023292005062103271, -0.0001856684684753418, -0.00013841688632965088, -9.116530418395996e-05, -4.391372203826904e-05, 3.337860107421875e-06, 5.058944225311279e-05, 9.784102439880371e-05, 0.00014509260654449463, 0.00019234418869018555, 0.00023959577083587646, 0.0002868473529815674, 0.0003340989351272583, 0.0003813505172729492, 0.00042860209941864014, 0.00047585368156433105, 0.000523105263710022, 0.0005703568458557129, 0.0006176084280014038, 0.0006648600101470947, 0.0007121115922927856, 0.0007593631744384766, 0.0008066147565841675, 0.0008538663387298584, 0.0009011179208755493, 0.0009483695030212402, 0.0009956210851669312, 0.001042872667312622, 0.001090124249458313, 0.001137375831604004, 0.0011846274137496948, 0.0012318789958953857, 0.0012791305780410767, 0.0013263821601867676, 0.0013736337423324585, 0.0014208853244781494, 0.0014681369066238403, 0.0015153884887695312]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 6.0, 6.0, 13.0, 8.0, 13.0, 18.0, 19.0, 34.0, 47.0, 46.0, 68.0, 109.0, 157.0, 364.0, 1057.0, 886079.0, 158896.0, 828.0, 301.0, 122.0, 100.0, 75.0, 43.0, 33.0, 26.0, 12.0, 19.0, 16.0, 10.0, 8.0, 3.0, 6.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.03411865234375, -0.033082008361816406, -0.03204536437988281, -0.03100872039794922, -0.029972076416015625, -0.02893543243408203, -0.027898788452148438, -0.026862144470214844, -0.02582550048828125, -0.024788856506347656, -0.023752212524414062, -0.02271556854248047, -0.021678924560546875, -0.02064228057861328, -0.019605636596679688, -0.018568992614746094, -0.0175323486328125, -0.016495704650878906, -0.015459060668945312, -0.014422416687011719, -0.013385772705078125, -0.012349128723144531, -0.011312484741210938, -0.010275840759277344, -0.00923919677734375, -0.008202552795410156, -0.0071659088134765625, -0.006129264831542969, -0.005092620849609375, -0.004055976867675781, -0.0030193328857421875, -0.0019826889038085938, -0.000946044921875, 9.059906005859375e-05, 0.0011272430419921875, 0.0021638870239257812, 0.003200531005859375, 0.004237174987792969, 0.0052738189697265625, 0.006310462951660156, 0.00734710693359375, 0.008383750915527344, 0.009420394897460938, 0.010457038879394531, 0.011493682861328125, 0.012530326843261719, 0.013566970825195312, 0.014603614807128906, 0.0156402587890625, 0.016676902770996094, 0.017713546752929688, 0.01875019073486328, 0.019786834716796875, 0.02082347869873047, 0.021860122680664062, 0.022896766662597656, 0.02393341064453125, 0.024970054626464844, 0.026006698608398438, 0.02704334259033203, 0.028079986572265625, 0.02911663055419922, 0.030153274536132812, 0.031189918518066406, 0.0322265625]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 14.0, 50.0, 139.0, 267.0, 268.0, 173.0, 70.0, 20.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007206786540336907, -0.0006731952307745814, -0.0006257118075154722, -0.0005782283842563629, -0.0005307449027895927, -0.00048326150863431394, -0.0004357780562713742, -0.00038829463301226497, -0.0003408112097531557, -0.00029332778649404645, -0.0002458443632349372, -0.00019836091087199748, -0.00015087748761288822, -0.00010339406435377896, -5.591061199083924e-05, -8.427188731729984e-06, 3.9056234527379274e-05, 8.653966506244615e-05, 0.00013402309559751302, 0.0001815065334085375, 0.00022898995666764677, 0.000276473379926756, 0.00032395683228969574, 0.000371440255548805, 0.00041892367880791426, 0.0004664071020670235, 0.0005138905253261328, 0.000561374006792903, 0.0006088573718443513, 0.0006563408533111215, 0.0007038242765702307, 0.00075130769982934, 0.0007987911812961102, 0.0008462746045552194, 0.0008937580278143287, 0.0009412415092810988, 0.0009887248743325472, 0.0010362083557993174, 0.0010836918372660875, 0.0011311752023175359, 0.0011786585673689842, 0.0012261420488357544, 0.0012736254138872027, 0.001321108895353973, 0.0013685922604054213, 0.0014160757418721914, 0.0014635592233389616, 0.00151104258839041, 0.0015585260698571801, 0.0016060095513239503, 0.0016534929163753986, 0.0017009763978421688, 0.0017484597628936172, 0.0017959432443603873, 0.0018434266094118357, 0.0018909100908786058, 0.001938393572345376, 0.001985877053812146, 0.0020333605352789164, 0.002080843783915043, 0.002128327265381813, 0.0021758107468485832, 0.0022232942283153534, 0.0022707777097821236, 0.00231826095841825]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 3.0, 8.0, 5.0, 10.0, 10.0, 8.0, 14.0, 13.0, 12.0, 27.0, 19.0, 23.0, 21.0, 27.0, 34.0, 38.0, 38.0, 42.0, 32.0, 56.0, 39.0, 38.0, 40.0, 42.0, 36.0, 37.0, 37.0, 33.0, 39.0, 28.0, 22.0, 29.0, 15.0, 25.0, 24.0, 13.0, 14.0, 18.0, 6.0, 4.0, 4.0, 6.0, 4.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.000668942928314209, -0.0006496105343103409, -0.0006302781403064728, -0.0006109457463026047, -0.0005916133522987366, -0.0005722809582948685, -0.0005529485642910004, -0.0005336161702871323, -0.0005142837762832642, -0.0004949513822793961, -0.00047561898827552795, -0.00045628659427165985, -0.00043695420026779175, -0.00041762180626392365, -0.00039828941226005554, -0.00037895701825618744, -0.00035962462425231934, -0.00034029223024845123, -0.00032095983624458313, -0.000301627442240715, -0.0002822950482368469, -0.0002629626542329788, -0.00024363026022911072, -0.00022429786622524261, -0.0002049654722213745, -0.0001856330782175064, -0.0001663006842136383, -0.0001469682902097702, -0.0001276358962059021, -0.000108303502202034, -8.89711081981659e-05, -6.963871419429779e-05, -5.030632019042969e-05, -3.0973926186561584e-05, -1.1641532182693481e-05, 7.690861821174622e-06, 2.7023255825042725e-05, 4.635564982891083e-05, 6.568804383277893e-05, 8.502043783664703e-05, 0.00010435283184051514, 0.00012368522584438324, 0.00014301761984825134, 0.00016235001385211945, 0.00018168240785598755, 0.00020101480185985565, 0.00022034719586372375, 0.00023967958986759186, 0.00025901198387145996, 0.00027834437787532806, 0.00029767677187919617, 0.00031700916588306427, 0.0003363415598869324, 0.0003556739538908005, 0.0003750063478946686, 0.0003943387418985367, 0.0004136711359024048, 0.0004330035299062729, 0.000452335923910141, 0.0004716683179140091, 0.0004910007119178772, 0.0005103331059217453, 0.0005296654999256134, 0.0005489978939294815, 0.0005683302879333496]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 7.0, 7.0, 12.0, 7.0, 11.0, 16.0, 16.0, 11.0, 20.0, 22.0, 23.0, 18.0, 37.0, 35.0, 35.0, 38.0, 40.0, 32.0, 37.0, 49.0, 37.0, 49.0, 36.0, 38.0, 31.0, 34.0, 33.0, 35.0, 26.0, 28.0, 25.0, 19.0, 27.0, 17.0, 14.0, 20.0, 9.0, 11.0, 9.0, 9.0, 5.0, 4.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.6484375, -11.29248046875, -10.9365234375, -10.58056640625, -10.224609375, -9.86865234375, -9.5126953125, -9.15673828125, -8.80078125, -8.44482421875, -8.0888671875, -7.73291015625, -7.376953125, -7.02099609375, -6.6650390625, -6.30908203125, -5.953125, -5.59716796875, -5.2412109375, -4.88525390625, -4.529296875, -4.17333984375, -3.8173828125, -3.46142578125, -3.10546875, -2.74951171875, -2.3935546875, -2.03759765625, -1.681640625, -1.32568359375, -0.9697265625, -0.61376953125, -0.2578125, 0.09814453125, 0.4541015625, 0.81005859375, 1.166015625, 1.52197265625, 1.8779296875, 2.23388671875, 2.58984375, 2.94580078125, 3.3017578125, 3.65771484375, 4.013671875, 4.36962890625, 4.7255859375, 5.08154296875, 5.4375, 5.79345703125, 6.1494140625, 6.50537109375, 6.861328125, 7.21728515625, 7.5732421875, 7.92919921875, 8.28515625, 8.64111328125, 8.9970703125, 9.35302734375, 9.708984375, 10.06494140625, 10.4208984375, 10.77685546875, 11.1328125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 7.0, 7.0, 12.0, 8.0, 11.0, 24.0, 23.0, 17.0, 26.0, 39.0, 54.0, 74.0, 117.0, 164.0, 225.0, 315.0, 590.0, 1494.0, 7526.0, 58859.0, 665810.0, 281025.0, 25754.0, 3883.0, 1045.0, 428.0, 294.0, 192.0, 132.0, 94.0, 73.0, 46.0, 43.0, 31.0, 17.0, 28.0, 10.0, 12.0, 8.0, 13.0, 6.0, 4.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.765625, -22.07177734375, -21.3779296875, -20.68408203125, -19.990234375, -19.29638671875, -18.6025390625, -17.90869140625, -17.21484375, -16.52099609375, -15.8271484375, -15.13330078125, -14.439453125, -13.74560546875, -13.0517578125, -12.35791015625, -11.6640625, -10.97021484375, -10.2763671875, -9.58251953125, -8.888671875, -8.19482421875, -7.5009765625, -6.80712890625, -6.11328125, -5.41943359375, -4.7255859375, -4.03173828125, -3.337890625, -2.64404296875, -1.9501953125, -1.25634765625, -0.5625, 0.13134765625, 0.8251953125, 1.51904296875, 2.212890625, 2.90673828125, 3.6005859375, 4.29443359375, 4.98828125, 5.68212890625, 6.3759765625, 7.06982421875, 7.763671875, 8.45751953125, 9.1513671875, 9.84521484375, 10.5390625, 11.23291015625, 11.9267578125, 12.62060546875, 13.314453125, 14.00830078125, 14.7021484375, 15.39599609375, 16.08984375, 16.78369140625, 17.4775390625, 18.17138671875, 18.865234375, 19.55908203125, 20.2529296875, 20.94677734375, 21.640625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 3.0, 7.0, 8.0, 12.0, 10.0, 12.0, 19.0, 20.0, 28.0, 39.0, 35.0, 45.0, 61.0, 69.0, 73.0, 122.0, 1723.0, 280.0, 96.0, 67.0, 64.0, 41.0, 41.0, 32.0, 34.0, 20.0, 20.0, 18.0, 16.0, 13.0, 3.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.625, -43.01806640625, -41.4111328125, -39.80419921875, -38.197265625, -36.59033203125, -34.9833984375, -33.37646484375, -31.76953125, -30.16259765625, -28.5556640625, -26.94873046875, -25.341796875, -23.73486328125, -22.1279296875, -20.52099609375, -18.9140625, -17.30712890625, -15.7001953125, -14.09326171875, -12.486328125, -10.87939453125, -9.2724609375, -7.66552734375, -6.05859375, -4.45166015625, -2.8447265625, -1.23779296875, 0.369140625, 1.97607421875, 3.5830078125, 5.18994140625, 6.796875, 8.40380859375, 10.0107421875, 11.61767578125, 13.224609375, 14.83154296875, 16.4384765625, 18.04541015625, 19.65234375, 21.25927734375, 22.8662109375, 24.47314453125, 26.080078125, 27.68701171875, 29.2939453125, 30.90087890625, 32.5078125, 34.11474609375, 35.7216796875, 37.32861328125, 38.935546875, 40.54248046875, 42.1494140625, 43.75634765625, 45.36328125, 46.97021484375, 48.5771484375, 50.18408203125, 51.791015625, 53.39794921875, 55.0048828125, 56.61181640625, 58.21875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 8.0, 6.0, 11.0, 16.0, 17.0, 17.0, 36.0, 34.0, 69.0, 63.0, 125.0, 162.0, 415.0, 1181.0, 49074.0, 3089976.0, 3199.0, 554.0, 235.0, 153.0, 98.0, 61.0, 54.0, 27.0, 25.0, 17.0, 12.0, 15.0, 12.0, 10.0, 9.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-134.625, -130.9091796875, -127.193359375, -123.4775390625, -119.76171875, -116.0458984375, -112.330078125, -108.6142578125, -104.8984375, -101.1826171875, -97.466796875, -93.7509765625, -90.03515625, -86.3193359375, -82.603515625, -78.8876953125, -75.171875, -71.4560546875, -67.740234375, -64.0244140625, -60.30859375, -56.5927734375, -52.876953125, -49.1611328125, -45.4453125, -41.7294921875, -38.013671875, -34.2978515625, -30.58203125, -26.8662109375, -23.150390625, -19.4345703125, -15.71875, -12.0029296875, -8.287109375, -4.5712890625, -0.85546875, 2.8603515625, 6.576171875, 10.2919921875, 14.0078125, 17.7236328125, 21.439453125, 25.1552734375, 28.87109375, 32.5869140625, 36.302734375, 40.0185546875, 43.734375, 47.4501953125, 51.166015625, 54.8818359375, 58.59765625, 62.3134765625, 66.029296875, 69.7451171875, 73.4609375, 77.1767578125, 80.892578125, 84.6083984375, 88.32421875, 92.0400390625, 95.755859375, 99.4716796875, 103.1875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 16.0, 102.0, 503.0, 342.0, 49.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.08769607543945, -37.3053092956543, -32.52292251586914, -27.740535736083984, -22.958148956298828, -18.175762176513672, -13.393375396728516, -8.61098861694336, -3.828601837158203, 0.9537849426269531, 5.736171722412109, 10.518558502197266, 15.300945281982422, 20.083332061767578, 24.865718841552734, 29.64810562133789, 34.43049240112305, 39.2128791809082, 43.99526596069336, 48.777652740478516, 53.56003952026367, 58.34242630004883, 63.124813079833984, 67.90719604492188, 72.68959045410156, 77.47197723388672, 82.25436401367188, 87.03675079345703, 91.81913757324219, 96.60152435302734, 101.3839111328125, 106.16629791259766, 110.94866943359375, 115.7310562133789, 120.51344299316406, 125.29582977294922, 130.07821655273438, 134.860595703125, 139.6429901123047, 144.42538452148438, 149.207763671875, 153.99014282226562, 158.7725372314453, 163.554931640625, 168.33731079101562, 173.11968994140625, 177.90208435058594, 182.68447875976562, 187.46685791015625, 192.24923706054688, 197.03163146972656, 201.81402587890625, 206.59640502929688, 211.3787841796875, 216.1611785888672, 220.94357299804688, 225.7259521484375, 230.50833129882812, 235.2907257080078, 240.0731201171875, 244.85549926757812, 249.63787841796875, 254.42027282714844, 259.2026672363281, 263.98504638671875]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 7.0, 3.0, 7.0, 3.0, 8.0, 7.0, 11.0, 12.0, 15.0, 21.0, 17.0, 19.0, 23.0, 28.0, 29.0, 33.0, 47.0, 35.0, 37.0, 32.0, 37.0, 34.0, 28.0, 51.0, 36.0, 37.0, 36.0, 45.0, 33.0, 33.0, 35.0, 23.0, 21.0, 23.0, 22.0, 15.0, 18.0, 15.0, 6.0, 7.0, 13.0, 4.0, 8.0, 6.0, 6.0, 3.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-101.98184204101562, -98.71770477294922, -95.45356750488281, -92.1894302368164, -88.92529296875, -85.6611557006836, -82.39701843261719, -79.13288116455078, -75.86874389648438, -72.60460662841797, -69.34046936035156, -66.07633209228516, -62.81219482421875, -59.548057556152344, -56.28392028808594, -53.01978302001953, -49.75564193725586, -46.49150466918945, -43.22736740112305, -39.96323013305664, -36.699092864990234, -33.43495178222656, -30.17081642150879, -26.906679153442383, -23.642541885375977, -20.37840461730957, -17.114267349243164, -13.850129127502441, -10.585991859436035, -7.3218536376953125, -4.057716369628906, -0.7935791015625, 2.4705581665039062, 5.7346954345703125, 8.998832702636719, 12.262970924377441, 15.527108192443848, 18.79124641418457, 22.055383682250977, 25.319520950317383, 28.58365821838379, 31.847795486450195, 35.111934661865234, 38.37607192993164, 41.64020919799805, 44.90434646606445, 48.16848373413086, 51.432621002197266, 54.69675827026367, 57.96089553833008, 61.225032806396484, 64.48917388916016, 67.75331115722656, 71.01744842529297, 74.28158569335938, 77.54572296142578, 80.80986022949219, 84.0739974975586, 87.338134765625, 90.6022720336914, 93.86640930175781, 97.13054656982422, 100.39468383789062, 103.65882110595703, 106.92295837402344]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 6.0, 5.0, 6.0, 8.0, 9.0, 11.0, 22.0, 19.0, 17.0, 23.0, 19.0, 29.0, 33.0, 28.0, 44.0, 43.0, 39.0, 47.0, 50.0, 38.0, 41.0, 31.0, 39.0, 40.0, 41.0, 48.0, 30.0, 25.0, 27.0, 29.0, 22.0, 29.0, 20.0, 13.0, 18.0, 16.0, 8.0, 7.0, 5.0, 6.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.765625, -11.3648681640625, -10.964111328125, -10.5633544921875, -10.16259765625, -9.7618408203125, -9.361083984375, -8.9603271484375, -8.5595703125, -8.1588134765625, -7.758056640625, -7.3572998046875, -6.95654296875, -6.5557861328125, -6.155029296875, -5.7542724609375, -5.353515625, -4.9527587890625, -4.552001953125, -4.1512451171875, -3.75048828125, -3.3497314453125, -2.948974609375, -2.5482177734375, -2.1474609375, -1.7467041015625, -1.345947265625, -0.9451904296875, -0.54443359375, -0.1436767578125, 0.257080078125, 0.6578369140625, 1.05859375, 1.4593505859375, 1.860107421875, 2.2608642578125, 2.66162109375, 3.0623779296875, 3.463134765625, 3.8638916015625, 4.2646484375, 4.6654052734375, 5.066162109375, 5.4669189453125, 5.86767578125, 6.2684326171875, 6.669189453125, 7.0699462890625, 7.470703125, 7.8714599609375, 8.272216796875, 8.6729736328125, 9.07373046875, 9.4744873046875, 9.875244140625, 10.2760009765625, 10.6767578125, 11.0775146484375, 11.478271484375, 11.8790283203125, 12.27978515625, 12.6805419921875, 13.081298828125, 13.4820556640625, 13.8828125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 3.0, 6.0, 4.0, 9.0, 11.0, 12.0, 10.0, 9.0, 19.0, 21.0, 24.0, 49.0, 42.0, 65.0, 107.0, 162.0, 237.0, 627.0, 2287.0, 20660.0, 1454666.0, 2665415.0, 44948.0, 3231.0, 750.0, 320.0, 160.0, 107.0, 72.0, 54.0, 43.0, 23.0, 30.0, 26.0, 17.0, 17.0, 8.0, 6.0, 7.0, 5.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.125, -38.87548828125, -37.6259765625, -36.37646484375, -35.126953125, -33.87744140625, -32.6279296875, -31.37841796875, -30.12890625, -28.87939453125, -27.6298828125, -26.38037109375, -25.130859375, -23.88134765625, -22.6318359375, -21.38232421875, -20.1328125, -18.88330078125, -17.6337890625, -16.38427734375, -15.134765625, -13.88525390625, -12.6357421875, -11.38623046875, -10.13671875, -8.88720703125, -7.6376953125, -6.38818359375, -5.138671875, -3.88916015625, -2.6396484375, -1.39013671875, -0.140625, 1.10888671875, 2.3583984375, 3.60791015625, 4.857421875, 6.10693359375, 7.3564453125, 8.60595703125, 9.85546875, 11.10498046875, 12.3544921875, 13.60400390625, 14.853515625, 16.10302734375, 17.3525390625, 18.60205078125, 19.8515625, 21.10107421875, 22.3505859375, 23.60009765625, 24.849609375, 26.09912109375, 27.3486328125, 28.59814453125, 29.84765625, 31.09716796875, 32.3466796875, 33.59619140625, 34.845703125, 36.09521484375, 37.3447265625, 38.59423828125, 39.84375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 4.0, 18.0, 23.0, 44.0, 58.0, 98.0, 177.0, 272.0, 426.0, 695.0, 800.0, 561.0, 330.0, 217.0, 135.0, 84.0, 52.0, 21.0, 19.0, 13.0, 6.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-41.9375, -40.989013671875, -40.04052734375, -39.092041015625, -38.1435546875, -37.195068359375, -36.24658203125, -35.298095703125, -34.349609375, -33.401123046875, -32.45263671875, -31.504150390625, -30.5556640625, -29.607177734375, -28.65869140625, -27.710205078125, -26.76171875, -25.813232421875, -24.86474609375, -23.916259765625, -22.9677734375, -22.019287109375, -21.07080078125, -20.122314453125, -19.173828125, -18.225341796875, -17.27685546875, -16.328369140625, -15.3798828125, -14.431396484375, -13.48291015625, -12.534423828125, -11.5859375, -10.637451171875, -9.68896484375, -8.740478515625, -7.7919921875, -6.843505859375, -5.89501953125, -4.946533203125, -3.998046875, -3.049560546875, -2.10107421875, -1.152587890625, -0.2041015625, 0.744384765625, 1.69287109375, 2.641357421875, 3.58984375, 4.538330078125, 5.48681640625, 6.435302734375, 7.3837890625, 8.332275390625, 9.28076171875, 10.229248046875, 11.177734375, 12.126220703125, 13.07470703125, 14.023193359375, 14.9716796875, 15.920166015625, 16.86865234375, 17.817138671875, 18.765625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 11.0, 12.0, 19.0, 20.0, 36.0, 38.0, 29.0, 45.0, 88.0, 81.0, 124.0, 186.0, 307.0, 559.0, 1460.0, 24900.0, 4115203.0, 48004.0, 1609.0, 497.0, 308.0, 168.0, 144.0, 85.0, 76.0, 75.0, 42.0, 36.0, 21.0, 22.0, 16.0, 13.0, 5.0, 10.0, 5.0, 4.0, 3.0, 5.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.75, -91.6494140625, -88.548828125, -85.4482421875, -82.34765625, -79.2470703125, -76.146484375, -73.0458984375, -69.9453125, -66.8447265625, -63.744140625, -60.6435546875, -57.54296875, -54.4423828125, -51.341796875, -48.2412109375, -45.140625, -42.0400390625, -38.939453125, -35.8388671875, -32.73828125, -29.6376953125, -26.537109375, -23.4365234375, -20.3359375, -17.2353515625, -14.134765625, -11.0341796875, -7.93359375, -4.8330078125, -1.732421875, 1.3681640625, 4.46875, 7.5693359375, 10.669921875, 13.7705078125, 16.87109375, 19.9716796875, 23.072265625, 26.1728515625, 29.2734375, 32.3740234375, 35.474609375, 38.5751953125, 41.67578125, 44.7763671875, 47.876953125, 50.9775390625, 54.078125, 57.1787109375, 60.279296875, 63.3798828125, 66.48046875, 69.5810546875, 72.681640625, 75.7822265625, 78.8828125, 81.9833984375, 85.083984375, 88.1845703125, 91.28515625, 94.3857421875, 97.486328125, 100.5869140625, 103.6875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 125.0, 738.0, 147.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-667.907470703125, -655.1900024414062, -642.4725952148438, -629.755126953125, -617.0377197265625, -604.3202514648438, -591.602783203125, -578.8853759765625, -566.1679077148438, -553.450439453125, -540.7330322265625, -528.0155639648438, -515.2981567382812, -502.5806884765625, -489.8632507324219, -477.14581298828125, -464.4283752441406, -451.7109375, -438.9934997558594, -426.27606201171875, -413.55859375, -400.8411560058594, -388.12371826171875, -375.4062805175781, -362.6888427734375, -349.9714050292969, -337.25396728515625, -324.5364990234375, -311.8190612792969, -299.10162353515625, -286.3841857910156, -273.666748046875, -260.94927978515625, -248.23184204101562, -235.51438903808594, -222.7969512939453, -210.07949829101562, -197.362060546875, -184.64462280273438, -171.92718505859375, -159.209716796875, -146.49227905273438, -133.7748260498047, -121.05738830566406, -108.3399429321289, -95.62249755859375, -82.90505981445312, -70.18761444091797, -57.47016906738281, -44.752723693847656, -32.035282135009766, -19.317840576171875, -6.600395202636719, 6.1170501708984375, 18.834487915039062, 31.55193328857422, 44.269378662109375, 56.98682403564453, 69.70426940917969, 82.42170715332031, 95.13915252685547, 107.85659790039062, 120.57403564453125, 133.29147338867188, 146.00892639160156]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 6.0, 7.0, 7.0, 5.0, 14.0, 6.0, 5.0, 10.0, 12.0, 23.0, 21.0, 24.0, 28.0, 30.0, 37.0, 34.0, 37.0, 31.0, 49.0, 47.0, 54.0, 59.0, 53.0, 49.0, 44.0, 37.0, 37.0, 45.0, 36.0, 25.0, 18.0, 18.0, 21.0, 20.0, 11.0, 12.0, 7.0, 7.0, 8.0, 6.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.1439208984375, -62.992645263671875, -60.841373443603516, -58.690101623535156, -56.53882598876953, -54.387550354003906, -52.23627853393555, -50.08500671386719, -47.93373107910156, -45.78245544433594, -43.63118362426758, -41.47991180419922, -39.328636169433594, -37.17736053466797, -35.02608871459961, -32.87481689453125, -30.723541259765625, -28.572267532348633, -26.42099380493164, -24.26972007751465, -22.118446350097656, -19.967172622680664, -17.815898895263672, -15.66462516784668, -13.513351440429688, -11.362077713012695, -9.210803985595703, -7.059530258178711, -4.908256530761719, -2.7569828033447266, -0.6057090759277344, 1.5455646514892578, 3.6968460083007812, 5.848119735717773, 7.999393463134766, 10.150667190551758, 12.30194091796875, 14.453214645385742, 16.604488372802734, 18.755762100219727, 20.90703582763672, 23.05830955505371, 25.209583282470703, 27.360857009887695, 29.512130737304688, 31.66340446472168, 33.81467819213867, 35.96595001220703, 38.117225646972656, 40.26850128173828, 42.41977310180664, 44.571044921875, 46.722320556640625, 48.87359619140625, 51.02486801147461, 53.17613983154297, 55.327415466308594, 57.47869110107422, 59.62996292114258, 61.78123474121094, 63.93251037597656, 66.08378601074219, 68.23506164550781, 70.3863296508789, 72.53760528564453]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 5.0, 2.0, 1.0, 5.0, 11.0, 6.0, 10.0, 10.0, 16.0, 22.0, 27.0, 23.0, 25.0, 18.0, 35.0, 36.0, 30.0, 34.0, 35.0, 43.0, 45.0, 40.0, 29.0, 38.0, 49.0, 42.0, 35.0, 39.0, 37.0, 35.0, 27.0, 26.0, 30.0, 17.0, 25.0, 19.0, 25.0, 8.0, 13.0, 7.0, 8.0, 4.0, 2.0, 4.0, 8.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.171875, -9.7777099609375, -9.383544921875, -8.9893798828125, -8.59521484375, -8.2010498046875, -7.806884765625, -7.4127197265625, -7.0185546875, -6.6243896484375, -6.230224609375, -5.8360595703125, -5.44189453125, -5.0477294921875, -4.653564453125, -4.2593994140625, -3.865234375, -3.4710693359375, -3.076904296875, -2.6827392578125, -2.28857421875, -1.8944091796875, -1.500244140625, -1.1060791015625, -0.7119140625, -0.3177490234375, 0.076416015625, 0.4705810546875, 0.86474609375, 1.2589111328125, 1.653076171875, 2.0472412109375, 2.44140625, 2.8355712890625, 3.229736328125, 3.6239013671875, 4.01806640625, 4.4122314453125, 4.806396484375, 5.2005615234375, 5.5947265625, 5.9888916015625, 6.383056640625, 6.7772216796875, 7.17138671875, 7.5655517578125, 7.959716796875, 8.3538818359375, 8.748046875, 9.1422119140625, 9.536376953125, 9.9305419921875, 10.32470703125, 10.7188720703125, 11.113037109375, 11.5072021484375, 11.9013671875, 12.2955322265625, 12.689697265625, 13.0838623046875, 13.47802734375, 13.8721923828125, 14.266357421875, 14.6605224609375, 15.0546875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 5.0, 2.0, 5.0, 6.0, 3.0, 6.0, 21.0, 43.0, 54.0, 93.0, 134.0, 231.0, 330.0, 488.0, 683.0, 1058.0, 1715.0, 2632.0, 4011.0, 6103.0, 9436.0, 14734.0, 23056.0, 36756.0, 60831.0, 109294.0, 257957.0, 250728.0, 107502.0, 60219.0, 36220.0, 22913.0, 14595.0, 9185.0, 6081.0, 4038.0, 2571.0, 1627.0, 1080.0, 741.0, 477.0, 304.0, 229.0, 118.0, 96.0, 54.0, 48.0, 22.0, 11.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.330078125, -2.2548828125, -2.1796875, -2.1044921875, -2.029296875, -1.9541015625, -1.87890625, -1.8037109375, -1.728515625, -1.6533203125, -1.578125, -1.5029296875, -1.427734375, -1.3525390625, -1.27734375, -1.2021484375, -1.126953125, -1.0517578125, -0.9765625, -0.9013671875, -0.826171875, -0.7509765625, -0.67578125, -0.6005859375, -0.525390625, -0.4501953125, -0.375, -0.2998046875, -0.224609375, -0.1494140625, -0.07421875, 0.0009765625, 0.076171875, 0.1513671875, 0.2265625, 0.3017578125, 0.376953125, 0.4521484375, 0.52734375, 0.6025390625, 0.677734375, 0.7529296875, 0.828125, 0.9033203125, 0.978515625, 1.0537109375, 1.12890625, 1.2041015625, 1.279296875, 1.3544921875, 1.4296875, 1.5048828125, 1.580078125, 1.6552734375, 1.73046875, 1.8056640625, 1.880859375, 1.9560546875, 2.03125, 2.1064453125, 2.181640625, 2.2568359375, 2.33203125, 2.4072265625, 2.482421875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 1.0, 2.0, 7.0, 9.0, 7.0, 9.0, 15.0, 9.0, 16.0, 21.0, 19.0, 22.0, 25.0, 22.0, 35.0, 44.0, 36.0, 33.0, 48.0, 48.0, 47.0, 1056.0, 44.0, 41.0, 46.0, 44.0, 25.0, 44.0, 34.0, 27.0, 24.0, 21.0, 20.0, 16.0, 21.0, 9.0, 16.0, 19.0, 10.0, 7.0, 7.0, 2.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.359375, -8.1033935546875, -7.847412109375, -7.5914306640625, -7.33544921875, -7.0794677734375, -6.823486328125, -6.5675048828125, -6.3115234375, -6.0555419921875, -5.799560546875, -5.5435791015625, -5.28759765625, -5.0316162109375, -4.775634765625, -4.5196533203125, -4.263671875, -4.0076904296875, -3.751708984375, -3.4957275390625, -3.23974609375, -2.9837646484375, -2.727783203125, -2.4718017578125, -2.2158203125, -1.9598388671875, -1.703857421875, -1.4478759765625, -1.19189453125, -0.9359130859375, -0.679931640625, -0.4239501953125, -0.16796875, 0.0880126953125, 0.343994140625, 0.5999755859375, 0.85595703125, 1.1119384765625, 1.367919921875, 1.6239013671875, 1.8798828125, 2.1358642578125, 2.391845703125, 2.6478271484375, 2.90380859375, 3.1597900390625, 3.415771484375, 3.6717529296875, 3.927734375, 4.1837158203125, 4.439697265625, 4.6956787109375, 4.95166015625, 5.2076416015625, 5.463623046875, 5.7196044921875, 5.9755859375, 6.2315673828125, 6.487548828125, 6.7435302734375, 6.99951171875, 7.2554931640625, 7.511474609375, 7.7674560546875, 8.0234375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 8.0, 9.0, 9.0, 21.0, 28.0, 41.0, 53.0, 66.0, 101.0, 189.0, 271.0, 402.0, 581.0, 812.0, 1309.0, 1915.0, 2945.0, 4511.0, 6827.0, 10535.0, 15868.0, 24817.0, 40615.0, 69651.0, 138108.0, 1392971.0, 175968.0, 81839.0, 46402.0, 28395.0, 17961.0, 11589.0, 7656.0, 4929.0, 3298.0, 2139.0, 1430.0, 919.0, 663.0, 432.0, 264.0, 190.0, 132.0, 71.0, 57.0, 41.0, 32.0, 22.0, 20.0, 10.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.439453125, -2.362335205078125, -2.28521728515625, -2.208099365234375, -2.1309814453125, -2.053863525390625, -1.97674560546875, -1.899627685546875, -1.822509765625, -1.745391845703125, -1.66827392578125, -1.591156005859375, -1.5140380859375, -1.436920166015625, -1.35980224609375, -1.282684326171875, -1.20556640625, -1.128448486328125, -1.05133056640625, -0.974212646484375, -0.8970947265625, -0.819976806640625, -0.74285888671875, -0.665740966796875, -0.588623046875, -0.511505126953125, -0.43438720703125, -0.357269287109375, -0.2801513671875, -0.203033447265625, -0.12591552734375, -0.048797607421875, 0.0283203125, 0.105438232421875, 0.18255615234375, 0.259674072265625, 0.3367919921875, 0.413909912109375, 0.49102783203125, 0.568145751953125, 0.645263671875, 0.722381591796875, 0.79949951171875, 0.876617431640625, 0.9537353515625, 1.030853271484375, 1.10797119140625, 1.185089111328125, 1.26220703125, 1.339324951171875, 1.41644287109375, 1.493560791015625, 1.5706787109375, 1.647796630859375, 1.72491455078125, 1.802032470703125, 1.879150390625, 1.956268310546875, 2.03338623046875, 2.110504150390625, 2.1876220703125, 2.264739990234375, 2.34185791015625, 2.418975830078125, 2.49609375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 1.0, 7.0, 8.0, 6.0, 9.0, 8.0, 9.0, 14.0, 20.0, 19.0, 30.0, 49.0, 53.0, 65.0, 82.0, 96.0, 102.0, 86.0, 81.0, 58.0, 46.0, 30.0, 28.0, 20.0, 27.0, 10.0, 9.0, 4.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0016241073608398438, -0.0015690773725509644, -0.001514047384262085, -0.0014590173959732056, -0.0014039874076843262, -0.0013489574193954468, -0.0012939274311065674, -0.001238897442817688, -0.0011838674545288086, -0.0011288374662399292, -0.0010738074779510498, -0.0010187774896621704, -0.000963747501373291, -0.0009087175130844116, -0.0008536875247955322, -0.0007986575365066528, -0.0007436275482177734, -0.000688597559928894, -0.0006335675716400146, -0.0005785375833511353, -0.0005235075950622559, -0.00046847760677337646, -0.00041344761848449707, -0.0003584176301956177, -0.0003033876419067383, -0.0002483576536178589, -0.0001933276653289795, -0.0001382976770401001, -8.32676887512207e-05, -2.823770046234131e-05, 2.6792287826538086e-05, 8.182227611541748e-05, 0.00013685226440429688, 0.00019188225269317627, 0.00024691224098205566, 0.00030194222927093506, 0.00035697221755981445, 0.00041200220584869385, 0.00046703219413757324, 0.0005220621824264526, 0.000577092170715332, 0.0006321221590042114, 0.0006871521472930908, 0.0007421821355819702, 0.0007972121238708496, 0.000852242112159729, 0.0009072721004486084, 0.0009623020887374878, 0.0010173320770263672, 0.0010723620653152466, 0.001127392053604126, 0.0011824220418930054, 0.0012374520301818848, 0.0012924820184707642, 0.0013475120067596436, 0.001402541995048523, 0.0014575719833374023, 0.0015126019716262817, 0.0015676319599151611, 0.0016226619482040405, 0.00167769193649292, 0.0017327219247817993, 0.0017877519130706787, 0.001842781901359558, 0.0018978118896484375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 2.0, 3.0, 2.0, 5.0, 0.0, 6.0, 7.0, 8.0, 10.0, 17.0, 21.0, 20.0, 32.0, 52.0, 65.0, 121.0, 190.0, 436.0, 2117.0, 1040988.0, 3244.0, 543.0, 234.0, 135.0, 77.0, 53.0, 39.0, 38.0, 19.0, 15.0, 14.0, 3.0, 12.0, 10.0, 8.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.04144287109375, -0.0402073860168457, -0.038971900939941406, -0.03773641586303711, -0.03650093078613281, -0.035265445709228516, -0.03402996063232422, -0.03279447555541992, -0.031558990478515625, -0.030323505401611328, -0.02908802032470703, -0.027852535247802734, -0.026617050170898438, -0.02538156509399414, -0.024146080017089844, -0.022910594940185547, -0.02167510986328125, -0.020439624786376953, -0.019204139709472656, -0.01796865463256836, -0.016733169555664062, -0.015497684478759766, -0.014262199401855469, -0.013026714324951172, -0.011791229248046875, -0.010555744171142578, -0.009320259094238281, -0.008084774017333984, -0.0068492889404296875, -0.005613803863525391, -0.004378318786621094, -0.003142833709716797, -0.0019073486328125, -0.0006718635559082031, 0.0005636215209960938, 0.0017991065979003906, 0.0030345916748046875, 0.004270076751708984, 0.005505561828613281, 0.006741046905517578, 0.007976531982421875, 0.009212017059326172, 0.010447502136230469, 0.011682987213134766, 0.012918472290039062, 0.01415395736694336, 0.015389442443847656, 0.016624927520751953, 0.01786041259765625, 0.019095897674560547, 0.020331382751464844, 0.02156686782836914, 0.022802352905273438, 0.024037837982177734, 0.02527332305908203, 0.026508808135986328, 0.027744293212890625, 0.028979778289794922, 0.03021526336669922, 0.031450748443603516, 0.03268623352050781, 0.03392171859741211, 0.035157203674316406, 0.0363926887512207, 0.037628173828125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 42.0, 277.0, 516.0, 149.0, 19.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002594602294266224, -0.0024960734881460667, -0.0023975444491952658, -0.0022990156430751085, -0.0022004868369549513, -0.0021019577980041504, -0.002003428991883993, -0.001904900185763836, -0.0018063713796436787, -0.0017078424571081996, -0.0016093136509880424, -0.0015107847284525633, -0.001412255922332406, -0.001313726999796927, -0.001215198077261448, -0.0011166692711412907, -0.0010181403486058116, -0.0009196114842779934, -0.0008210826199501753, -0.0007225536974146962, -0.000624024891294539, -0.0005254959687590599, -0.00042696710443124175, -0.0003284382401034236, -0.00022990937577560544, -0.00013138051144778728, -3.28516325680539e-05, 6.567724631167948e-05, 0.00016420611063949764, 0.00026273500407114625, 0.0003612638683989644, 0.00045979273272678256, 0.0005583215970546007, 0.0006568504613824189, 0.000755379325710237, 0.0008539082482457161, 0.0009524370543658733, 0.0010509659769013524, 0.0011494948994368315, 0.0012480237055569887, 0.001346552511677146, 0.001445081434212625, 0.0015436102403327823, 0.0016421391628682613, 0.0017406679689884186, 0.0018391968915238976, 0.0019377258140593767, 0.002036254620179534, 0.002134783659130335, 0.002233312465250492, 0.002331841504201293, 0.0024303703103214502, 0.0025288991164416075, 0.0026274281553924084, 0.0027259569615125656, 0.002824485767632723, 0.00292301457375288, 0.0030215433798730373, 0.0031200724188238382, 0.0032186012249439955, 0.0033171300310641527, 0.0034156590700149536, 0.003514187876135111, 0.003612716682255268, 0.0037112454883754253]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 2.0, 3.0, 2.0, 4.0, 5.0, 4.0, 11.0, 7.0, 11.0, 17.0, 19.0, 11.0, 21.0, 34.0, 22.0, 22.0, 22.0, 33.0, 33.0, 33.0, 43.0, 41.0, 37.0, 33.0, 28.0, 46.0, 44.0, 33.0, 44.0, 36.0, 29.0, 33.0, 29.0, 18.0, 26.0, 22.0, 25.0, 20.0, 23.0, 21.0, 10.0, 5.0, 11.0, 8.0, 5.0, 0.0, 5.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0007055401802062988, -0.0006841942667961121, -0.0006628483533859253, -0.0006415024399757385, -0.0006201565265655518, -0.000598810613155365, -0.0005774646997451782, -0.0005561187863349915, -0.0005347728729248047, -0.0005134269595146179, -0.0004920810461044312, -0.0004707351326942444, -0.0004493892192840576, -0.00042804330587387085, -0.0004066973924636841, -0.0003853514790534973, -0.00036400556564331055, -0.0003426596522331238, -0.000321313738822937, -0.00029996782541275024, -0.0002786219120025635, -0.0002572759985923767, -0.00023593008518218994, -0.00021458417177200317, -0.0001932382583618164, -0.00017189234495162964, -0.00015054643154144287, -0.0001292005181312561, -0.00010785460472106934, -8.650869131088257e-05, -6.51627779006958e-05, -4.381686449050903e-05, -2.2470951080322266e-05, -1.125037670135498e-06, 2.022087574005127e-05, 4.156678915023804e-05, 6.29127025604248e-05, 8.425861597061157e-05, 0.00010560452938079834, 0.0001269504427909851, 0.00014829635620117188, 0.00016964226961135864, 0.0001909881830215454, 0.00021233409643173218, 0.00023368000984191895, 0.0002550259232521057, 0.0002763718366622925, 0.00029771775007247925, 0.000319063663482666, 0.0003404095768928528, 0.00036175549030303955, 0.0003831014037132263, 0.0004044473171234131, 0.00042579323053359985, 0.0004471391439437866, 0.0004684850573539734, 0.0004898309707641602, 0.0005111768841743469, 0.0005325227975845337, 0.0005538687109947205, 0.0005752146244049072, 0.000596560537815094, 0.0006179064512252808, 0.0006392523646354675, 0.0006605982780456543]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 5.0, 2.0, 1.0, 5.0, 11.0, 6.0, 10.0, 10.0, 16.0, 22.0, 27.0, 23.0, 25.0, 18.0, 35.0, 36.0, 30.0, 34.0, 35.0, 43.0, 45.0, 40.0, 29.0, 38.0, 49.0, 42.0, 35.0, 39.0, 37.0, 35.0, 27.0, 26.0, 30.0, 18.0, 24.0, 19.0, 25.0, 8.0, 13.0, 7.0, 8.0, 4.0, 2.0, 4.0, 8.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.171875, -9.7777099609375, -9.383544921875, -8.9893798828125, -8.59521484375, -8.2010498046875, -7.806884765625, -7.4127197265625, -7.0185546875, -6.6243896484375, -6.230224609375, -5.8360595703125, -5.44189453125, -5.0477294921875, -4.653564453125, -4.2593994140625, -3.865234375, -3.4710693359375, -3.076904296875, -2.6827392578125, -2.28857421875, -1.8944091796875, -1.500244140625, -1.1060791015625, -0.7119140625, -0.3177490234375, 0.076416015625, 0.4705810546875, 0.86474609375, 1.2589111328125, 1.653076171875, 2.0472412109375, 2.44140625, 2.8355712890625, 3.229736328125, 3.6239013671875, 4.01806640625, 4.4122314453125, 4.806396484375, 5.2005615234375, 5.5947265625, 5.9888916015625, 6.383056640625, 6.7772216796875, 7.17138671875, 7.5655517578125, 7.959716796875, 8.3538818359375, 8.748046875, 9.1422119140625, 9.536376953125, 9.9305419921875, 10.32470703125, 10.7188720703125, 11.113037109375, 11.5072021484375, 11.9013671875, 12.2955322265625, 12.689697265625, 13.0838623046875, 13.47802734375, 13.8721923828125, 14.266357421875, 14.6605224609375, 15.0546875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 8.0, 2.0, 7.0, 8.0, 13.0, 18.0, 22.0, 21.0, 34.0, 38.0, 71.0, 79.0, 100.0, 125.0, 162.0, 265.0, 378.0, 449.0, 611.0, 884.0, 2042.0, 13498.0, 346526.0, 657180.0, 20027.0, 2447.0, 984.0, 674.0, 468.0, 394.0, 256.0, 188.0, 149.0, 94.0, 85.0, 73.0, 44.0, 32.0, 21.0, 20.0, 12.0, 11.0, 10.0, 7.0, 10.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.765625, -24.777587890625, -23.78955078125, -22.801513671875, -21.8134765625, -20.825439453125, -19.83740234375, -18.849365234375, -17.861328125, -16.873291015625, -15.88525390625, -14.897216796875, -13.9091796875, -12.921142578125, -11.93310546875, -10.945068359375, -9.95703125, -8.968994140625, -7.98095703125, -6.992919921875, -6.0048828125, -5.016845703125, -4.02880859375, -3.040771484375, -2.052734375, -1.064697265625, -0.07666015625, 0.911376953125, 1.8994140625, 2.887451171875, 3.87548828125, 4.863525390625, 5.8515625, 6.839599609375, 7.82763671875, 8.815673828125, 9.8037109375, 10.791748046875, 11.77978515625, 12.767822265625, 13.755859375, 14.743896484375, 15.73193359375, 16.719970703125, 17.7080078125, 18.696044921875, 19.68408203125, 20.672119140625, 21.66015625, 22.648193359375, 23.63623046875, 24.624267578125, 25.6123046875, 26.600341796875, 27.58837890625, 28.576416015625, 29.564453125, 30.552490234375, 31.54052734375, 32.528564453125, 33.5166015625, 34.504638671875, 35.49267578125, 36.480712890625, 37.46875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 5.0, 7.0, 7.0, 6.0, 10.0, 10.0, 11.0, 25.0, 24.0, 26.0, 47.0, 34.0, 35.0, 58.0, 60.0, 81.0, 206.0, 1843.0, 125.0, 73.0, 70.0, 45.0, 46.0, 41.0, 31.0, 27.0, 25.0, 16.0, 19.0, 10.0, 9.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.46875, -47.93798828125, -46.4072265625, -44.87646484375, -43.345703125, -41.81494140625, -40.2841796875, -38.75341796875, -37.22265625, -35.69189453125, -34.1611328125, -32.63037109375, -31.099609375, -29.56884765625, -28.0380859375, -26.50732421875, -24.9765625, -23.44580078125, -21.9150390625, -20.38427734375, -18.853515625, -17.32275390625, -15.7919921875, -14.26123046875, -12.73046875, -11.19970703125, -9.6689453125, -8.13818359375, -6.607421875, -5.07666015625, -3.5458984375, -2.01513671875, -0.484375, 1.04638671875, 2.5771484375, 4.10791015625, 5.638671875, 7.16943359375, 8.7001953125, 10.23095703125, 11.76171875, 13.29248046875, 14.8232421875, 16.35400390625, 17.884765625, 19.41552734375, 20.9462890625, 22.47705078125, 24.0078125, 25.53857421875, 27.0693359375, 28.60009765625, 30.130859375, 31.66162109375, 33.1923828125, 34.72314453125, 36.25390625, 37.78466796875, 39.3154296875, 40.84619140625, 42.376953125, 43.90771484375, 45.4384765625, 46.96923828125, 48.5]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 12.0, 14.0, 18.0, 20.0, 35.0, 35.0, 41.0, 62.0, 83.0, 150.0, 362.0, 1357.0, 3099360.0, 42771.0, 704.0, 239.0, 117.0, 66.0, 48.0, 50.0, 27.0, 31.0, 20.0, 17.0, 11.0, 9.0, 7.0, 7.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.75, -133.421875, -129.09375, -124.765625, -120.4375, -116.109375, -111.78125, -107.453125, -103.125, -98.796875, -94.46875, -90.140625, -85.8125, -81.484375, -77.15625, -72.828125, -68.5, -64.171875, -59.84375, -55.515625, -51.1875, -46.859375, -42.53125, -38.203125, -33.875, -29.546875, -25.21875, -20.890625, -16.5625, -12.234375, -7.90625, -3.578125, 0.75, 5.078125, 9.40625, 13.734375, 18.0625, 22.390625, 26.71875, 31.046875, 35.375, 39.703125, 44.03125, 48.359375, 52.6875, 57.015625, 61.34375, 65.671875, 70.0, 74.328125, 78.65625, 82.984375, 87.3125, 91.640625, 95.96875, 100.296875, 104.625, 108.953125, 113.28125, 117.609375, 121.9375, 126.265625, 130.59375, 134.921875, 139.25]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 271.0, 651.0, 89.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.67513275146484, -101.88948059082031, -97.10383605957031, -92.31818389892578, -87.53253173828125, -82.74687957763672, -77.96122741699219, -73.17558288574219, -68.38993072509766, -63.604278564453125, -58.81863021850586, -54.032981872558594, -49.24732971191406, -44.46167755126953, -39.676029205322266, -34.890380859375, -30.10472869873047, -25.31907844543457, -20.533428192138672, -15.747777938842773, -10.962127685546875, -6.176477432250977, -1.3908271789550781, 3.3948211669921875, 8.180473327636719, 12.966123580932617, 17.751773834228516, 22.537424087524414, 27.323074340820312, 32.108726501464844, 36.89437484741211, 41.680023193359375, 46.465667724609375, 51.251319885253906, 56.03696823120117, 60.82261657714844, 65.60826873779297, 70.3939208984375, 75.1795654296875, 79.96521759033203, 84.75086975097656, 89.5365219116211, 94.32217407226562, 99.10781860351562, 103.89347076416016, 108.67912292480469, 113.46476745605469, 118.25041961669922, 123.03607177734375, 127.82172393798828, 132.6073760986328, 137.3930206298828, 142.17868041992188, 146.96432495117188, 151.74996948242188, 156.53561401367188, 161.32127380371094, 166.10691833496094, 170.892578125, 175.67822265625, 180.4638671875, 185.24952697753906, 190.03517150878906, 194.82083129882812, 199.60647583007812]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 5.0, 2.0, 5.0, 9.0, 6.0, 8.0, 15.0, 15.0, 17.0, 19.0, 23.0, 20.0, 21.0, 19.0, 32.0, 30.0, 30.0, 29.0, 39.0, 38.0, 36.0, 37.0, 41.0, 47.0, 35.0, 32.0, 43.0, 27.0, 40.0, 24.0, 34.0, 28.0, 28.0, 26.0, 17.0, 23.0, 14.0, 15.0, 13.0, 8.0, 3.0, 16.0, 6.0, 3.0, 6.0, 3.0, 3.0, 2.0, 5.0, 3.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-85.07910919189453, -82.22688293457031, -79.37466430664062, -76.52244567871094, -73.67021942138672, -70.8179931640625, -67.96577453613281, -65.11355590820312, -62.261329650878906, -59.40910720825195, -56.556884765625, -53.70466232299805, -50.852439880371094, -48.00021743774414, -45.14799499511719, -42.295772552490234, -39.44355010986328, -36.59132766723633, -33.739105224609375, -30.886882781982422, -28.03466033935547, -25.182437896728516, -22.330215454101562, -19.47799301147461, -16.625770568847656, -13.773548126220703, -10.92132568359375, -8.069103240966797, -5.216880798339844, -2.3646583557128906, 0.4875640869140625, 3.3397865295410156, 6.192008972167969, 9.044231414794922, 11.896453857421875, 14.748676300048828, 17.60089874267578, 20.453121185302734, 23.305343627929688, 26.15756607055664, 29.009788513183594, 31.862010955810547, 34.7142333984375, 37.56645584106445, 40.418678283691406, 43.27090072631836, 46.12312316894531, 48.975345611572266, 51.82756805419922, 54.67979049682617, 57.532012939453125, 60.38423538208008, 63.23645782470703, 66.08868408203125, 68.94090270996094, 71.79312133789062, 74.64534759521484, 77.49757385253906, 80.34979248046875, 83.20201110839844, 86.05423736572266, 88.90646362304688, 91.75868225097656, 94.61090087890625, 97.46312713623047]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 0.0, 4.0, 3.0, 3.0, 9.0, 9.0, 14.0, 13.0, 15.0, 20.0, 19.0, 25.0, 25.0, 22.0, 37.0, 39.0, 31.0, 44.0, 34.0, 36.0, 34.0, 38.0, 39.0, 52.0, 36.0, 50.0, 28.0, 39.0, 31.0, 32.0, 31.0, 35.0, 23.0, 20.0, 23.0, 18.0, 14.0, 14.0, 10.0, 10.0, 8.0, 5.0, 1.0, 8.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.734375, -10.330322265625, -9.92626953125, -9.522216796875, -9.1181640625, -8.714111328125, -8.31005859375, -7.906005859375, -7.501953125, -7.097900390625, -6.69384765625, -6.289794921875, -5.8857421875, -5.481689453125, -5.07763671875, -4.673583984375, -4.26953125, -3.865478515625, -3.46142578125, -3.057373046875, -2.6533203125, -2.249267578125, -1.84521484375, -1.441162109375, -1.037109375, -0.633056640625, -0.22900390625, 0.175048828125, 0.5791015625, 0.983154296875, 1.38720703125, 1.791259765625, 2.1953125, 2.599365234375, 3.00341796875, 3.407470703125, 3.8115234375, 4.215576171875, 4.61962890625, 5.023681640625, 5.427734375, 5.831787109375, 6.23583984375, 6.639892578125, 7.0439453125, 7.447998046875, 7.85205078125, 8.256103515625, 8.66015625, 9.064208984375, 9.46826171875, 9.872314453125, 10.2763671875, 10.680419921875, 11.08447265625, 11.488525390625, 11.892578125, 12.296630859375, 12.70068359375, 13.104736328125, 13.5087890625, 13.912841796875, 14.31689453125, 14.720947265625, 15.125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 1.0, 6.0, 7.0, 9.0, 13.0, 22.0, 21.0, 37.0, 31.0, 47.0, 43.0, 77.0, 87.0, 132.0, 129.0, 222.0, 322.0, 446.0, 763.0, 1634.0, 4907.0, 31119.0, 779987.0, 2978562.0, 371039.0, 17360.0, 3684.0, 1404.0, 656.0, 430.0, 256.0, 169.0, 148.0, 123.0, 75.0, 75.0, 49.0, 48.0, 32.0, 32.0, 19.0, 14.0, 11.0, 8.0, 10.0, 3.0, 9.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.140625, -25.2509765625, -24.361328125, -23.4716796875, -22.58203125, -21.6923828125, -20.802734375, -19.9130859375, -19.0234375, -18.1337890625, -17.244140625, -16.3544921875, -15.46484375, -14.5751953125, -13.685546875, -12.7958984375, -11.90625, -11.0166015625, -10.126953125, -9.2373046875, -8.34765625, -7.4580078125, -6.568359375, -5.6787109375, -4.7890625, -3.8994140625, -3.009765625, -2.1201171875, -1.23046875, -0.3408203125, 0.548828125, 1.4384765625, 2.328125, 3.2177734375, 4.107421875, 4.9970703125, 5.88671875, 6.7763671875, 7.666015625, 8.5556640625, 9.4453125, 10.3349609375, 11.224609375, 12.1142578125, 13.00390625, 13.8935546875, 14.783203125, 15.6728515625, 16.5625, 17.4521484375, 18.341796875, 19.2314453125, 20.12109375, 21.0107421875, 21.900390625, 22.7900390625, 23.6796875, 24.5693359375, 25.458984375, 26.3486328125, 27.23828125, 28.1279296875, 29.017578125, 29.9072265625, 30.796875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 8.0, 7.0, 12.0, 19.0, 49.0, 61.0, 112.0, 170.0, 332.0, 625.0, 881.0, 752.0, 470.0, 247.0, 134.0, 79.0, 43.0, 32.0, 14.0, 15.0, 9.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.328125, -30.341796875, -29.35546875, -28.369140625, -27.3828125, -26.396484375, -25.41015625, -24.423828125, -23.4375, -22.451171875, -21.46484375, -20.478515625, -19.4921875, -18.505859375, -17.51953125, -16.533203125, -15.546875, -14.560546875, -13.57421875, -12.587890625, -11.6015625, -10.615234375, -9.62890625, -8.642578125, -7.65625, -6.669921875, -5.68359375, -4.697265625, -3.7109375, -2.724609375, -1.73828125, -0.751953125, 0.234375, 1.220703125, 2.20703125, 3.193359375, 4.1796875, 5.166015625, 6.15234375, 7.138671875, 8.125, 9.111328125, 10.09765625, 11.083984375, 12.0703125, 13.056640625, 14.04296875, 15.029296875, 16.015625, 17.001953125, 17.98828125, 18.974609375, 19.9609375, 20.947265625, 21.93359375, 22.919921875, 23.90625, 24.892578125, 25.87890625, 26.865234375, 27.8515625, 28.837890625, 29.82421875, 30.810546875, 31.796875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 6.0, 14.0, 21.0, 21.0, 33.0, 45.0, 71.0, 93.0, 161.0, 236.0, 454.0, 1319.0, 10852.0, 4028516.0, 148210.0, 2575.0, 688.0, 311.0, 195.0, 127.0, 91.0, 56.0, 44.0, 40.0, 26.0, 22.0, 12.0, 5.0, 10.0, 7.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.8125, -88.6181640625, -85.423828125, -82.2294921875, -79.03515625, -75.8408203125, -72.646484375, -69.4521484375, -66.2578125, -63.0634765625, -59.869140625, -56.6748046875, -53.48046875, -50.2861328125, -47.091796875, -43.8974609375, -40.703125, -37.5087890625, -34.314453125, -31.1201171875, -27.92578125, -24.7314453125, -21.537109375, -18.3427734375, -15.1484375, -11.9541015625, -8.759765625, -5.5654296875, -2.37109375, 0.8232421875, 4.017578125, 7.2119140625, 10.40625, 13.6005859375, 16.794921875, 19.9892578125, 23.18359375, 26.3779296875, 29.572265625, 32.7666015625, 35.9609375, 39.1552734375, 42.349609375, 45.5439453125, 48.73828125, 51.9326171875, 55.126953125, 58.3212890625, 61.515625, 64.7099609375, 67.904296875, 71.0986328125, 74.29296875, 77.4873046875, 80.681640625, 83.8759765625, 87.0703125, 90.2646484375, 93.458984375, 96.6533203125, 99.84765625, 103.0419921875, 106.236328125, 109.4306640625, 112.625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 261.0, 729.0, 22.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1005.7844848632812, -987.8919067382812, -969.9993896484375, -952.1068115234375, -934.2142944335938, -916.3217163085938, -898.42919921875, -880.53662109375, -862.6441040039062, -844.7515258789062, -826.8590087890625, -808.9664306640625, -791.0739135742188, -773.1813354492188, -755.288818359375, -737.396240234375, -719.503662109375, -701.611083984375, -683.7185668945312, -665.8259887695312, -647.9334716796875, -630.0408935546875, -612.1483764648438, -594.2557983398438, -576.36328125, -558.470703125, -540.5781860351562, -522.6856079101562, -504.7930908203125, -486.9005432128906, -469.00799560546875, -451.11541748046875, -433.222900390625, -415.3303527832031, -397.43780517578125, -379.5452575683594, -361.6527099609375, -343.7601623535156, -325.86761474609375, -307.97503662109375, -290.08251953125, -272.1899719238281, -254.29742431640625, -236.40487670898438, -218.5123291015625, -200.61978149414062, -182.7272186279297, -164.8346710205078, -146.94212341308594, -129.04957580566406, -111.15702819824219, -93.26447296142578, -75.3719253540039, -57.47937774658203, -39.586822509765625, -21.69427490234375, -3.801727294921875, 14.090822219848633, 31.98337173461914, 49.87592315673828, 67.76847076416016, 85.66101837158203, 103.55357360839844, 121.44612121582031, 139.3386688232422]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 7.0, 8.0, 9.0, 9.0, 14.0, 12.0, 8.0, 16.0, 23.0, 22.0, 24.0, 26.0, 24.0, 34.0, 33.0, 31.0, 30.0, 26.0, 32.0, 39.0, 46.0, 50.0, 42.0, 38.0, 44.0, 35.0, 34.0, 30.0, 24.0, 32.0, 33.0, 36.0, 24.0, 27.0, 10.0, 10.0, 7.0, 7.0, 7.0, 10.0, 5.0, 8.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-52.92021942138672, -51.162864685058594, -49.40550994873047, -47.648155212402344, -45.89080047607422, -44.133445739746094, -42.37609100341797, -40.618736267089844, -38.86138153076172, -37.104026794433594, -35.34667205810547, -33.589317321777344, -31.83196258544922, -30.074607849121094, -28.3172550201416, -26.559900283813477, -24.802547454833984, -23.04519271850586, -21.287837982177734, -19.53048324584961, -17.773128509521484, -16.01577377319336, -14.258420944213867, -12.501066207885742, -10.743711471557617, -8.986356735229492, -7.229002475738525, -5.471648216247559, -3.7142934799194336, -1.9569387435913086, -0.1995849609375, 1.557769775390625, 3.31512451171875, 5.072479248046875, 6.829833507537842, 8.587187767028809, 10.344542503356934, 12.101897239685059, 13.859251022338867, 15.616605758666992, 17.373960494995117, 19.131315231323242, 20.888669967651367, 22.64602279663086, 24.403377532958984, 26.16073226928711, 27.918087005615234, 29.67544174194336, 31.432796478271484, 33.19015121459961, 34.947505950927734, 36.70486068725586, 38.462215423583984, 40.21957015991211, 41.97692108154297, 43.734275817871094, 45.49163055419922, 47.248985290527344, 49.00634002685547, 50.763694763183594, 52.52104949951172, 54.278404235839844, 56.03575897216797, 57.793113708496094, 59.55046844482422]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 10.0, 7.0, 9.0, 10.0, 9.0, 17.0, 12.0, 16.0, 20.0, 18.0, 25.0, 26.0, 32.0, 38.0, 36.0, 39.0, 35.0, 45.0, 41.0, 48.0, 38.0, 38.0, 42.0, 34.0, 35.0, 43.0, 20.0, 39.0, 38.0, 30.0, 29.0, 23.0, 11.0, 23.0, 12.0, 12.0, 11.0, 5.0, 12.0, 6.0, 5.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.984375, -12.58544921875, -12.1865234375, -11.78759765625, -11.388671875, -10.98974609375, -10.5908203125, -10.19189453125, -9.79296875, -9.39404296875, -8.9951171875, -8.59619140625, -8.197265625, -7.79833984375, -7.3994140625, -7.00048828125, -6.6015625, -6.20263671875, -5.8037109375, -5.40478515625, -5.005859375, -4.60693359375, -4.2080078125, -3.80908203125, -3.41015625, -3.01123046875, -2.6123046875, -2.21337890625, -1.814453125, -1.41552734375, -1.0166015625, -0.61767578125, -0.21875, 0.18017578125, 0.5791015625, 0.97802734375, 1.376953125, 1.77587890625, 2.1748046875, 2.57373046875, 2.97265625, 3.37158203125, 3.7705078125, 4.16943359375, 4.568359375, 4.96728515625, 5.3662109375, 5.76513671875, 6.1640625, 6.56298828125, 6.9619140625, 7.36083984375, 7.759765625, 8.15869140625, 8.5576171875, 8.95654296875, 9.35546875, 9.75439453125, 10.1533203125, 10.55224609375, 10.951171875, 11.35009765625, 11.7490234375, 12.14794921875, 12.546875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 9.0, 7.0, 12.0, 27.0, 42.0, 76.0, 91.0, 129.0, 227.0, 309.0, 483.0, 751.0, 1168.0, 1826.0, 2838.0, 4373.0, 6671.0, 10304.0, 16442.0, 26572.0, 42677.0, 72549.0, 139915.0, 338662.0, 170837.0, 83165.0, 48303.0, 29452.0, 18116.0, 11519.0, 7389.0, 4790.0, 3135.0, 2035.0, 1275.0, 830.0, 532.0, 325.0, 226.0, 182.0, 100.0, 73.0, 39.0, 34.0, 15.0, 6.0, 5.0, 4.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.48828125, -2.409576416015625, -2.33087158203125, -2.252166748046875, -2.1734619140625, -2.094757080078125, -2.01605224609375, -1.937347412109375, -1.858642578125, -1.779937744140625, -1.70123291015625, -1.622528076171875, -1.5438232421875, -1.465118408203125, -1.38641357421875, -1.307708740234375, -1.22900390625, -1.150299072265625, -1.07159423828125, -0.992889404296875, -0.9141845703125, -0.835479736328125, -0.75677490234375, -0.678070068359375, -0.599365234375, -0.520660400390625, -0.44195556640625, -0.363250732421875, -0.2845458984375, -0.205841064453125, -0.12713623046875, -0.048431396484375, 0.0302734375, 0.108978271484375, 0.18768310546875, 0.266387939453125, 0.3450927734375, 0.423797607421875, 0.50250244140625, 0.581207275390625, 0.659912109375, 0.738616943359375, 0.81732177734375, 0.896026611328125, 0.9747314453125, 1.053436279296875, 1.13214111328125, 1.210845947265625, 1.28955078125, 1.368255615234375, 1.44696044921875, 1.525665283203125, 1.6043701171875, 1.683074951171875, 1.76177978515625, 1.840484619140625, 1.919189453125, 1.997894287109375, 2.07659912109375, 2.155303955078125, 2.2340087890625, 2.312713623046875, 2.39141845703125, 2.470123291015625, 2.548828125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 4.0, 8.0, 5.0, 12.0, 11.0, 18.0, 21.0, 23.0, 19.0, 32.0, 36.0, 33.0, 30.0, 45.0, 31.0, 45.0, 46.0, 39.0, 1052.0, 51.0, 29.0, 34.0, 42.0, 39.0, 46.0, 33.0, 29.0, 31.0, 31.0, 19.0, 18.0, 21.0, 24.0, 22.0, 10.0, 8.0, 7.0, 6.0, 5.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1953125, -7.9306640625, -7.666015625, -7.4013671875, -7.13671875, -6.8720703125, -6.607421875, -6.3427734375, -6.078125, -5.8134765625, -5.548828125, -5.2841796875, -5.01953125, -4.7548828125, -4.490234375, -4.2255859375, -3.9609375, -3.6962890625, -3.431640625, -3.1669921875, -2.90234375, -2.6376953125, -2.373046875, -2.1083984375, -1.84375, -1.5791015625, -1.314453125, -1.0498046875, -0.78515625, -0.5205078125, -0.255859375, 0.0087890625, 0.2734375, 0.5380859375, 0.802734375, 1.0673828125, 1.33203125, 1.5966796875, 1.861328125, 2.1259765625, 2.390625, 2.6552734375, 2.919921875, 3.1845703125, 3.44921875, 3.7138671875, 3.978515625, 4.2431640625, 4.5078125, 4.7724609375, 5.037109375, 5.3017578125, 5.56640625, 5.8310546875, 6.095703125, 6.3603515625, 6.625, 6.8896484375, 7.154296875, 7.4189453125, 7.68359375, 7.9482421875, 8.212890625, 8.4775390625, 8.7421875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 8.0, 6.0, 23.0, 21.0, 34.0, 48.0, 87.0, 105.0, 164.0, 239.0, 371.0, 618.0, 843.0, 1324.0, 2153.0, 3404.0, 5530.0, 8746.0, 13695.0, 22179.0, 36101.0, 60632.0, 110214.0, 1315875.0, 254130.0, 108095.0, 58819.0, 35406.0, 22000.0, 13650.0, 8447.0, 5158.0, 3250.0, 1995.0, 1251.0, 869.0, 554.0, 347.0, 255.0, 155.0, 103.0, 61.0, 56.0, 38.0, 20.0, 13.0, 16.0, 7.0, 1.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-2.62890625, -2.5491943359375, -2.469482421875, -2.3897705078125, -2.31005859375, -2.2303466796875, -2.150634765625, -2.0709228515625, -1.9912109375, -1.9114990234375, -1.831787109375, -1.7520751953125, -1.67236328125, -1.5926513671875, -1.512939453125, -1.4332275390625, -1.353515625, -1.2738037109375, -1.194091796875, -1.1143798828125, -1.03466796875, -0.9549560546875, -0.875244140625, -0.7955322265625, -0.7158203125, -0.6361083984375, -0.556396484375, -0.4766845703125, -0.39697265625, -0.3172607421875, -0.237548828125, -0.1578369140625, -0.078125, 0.0015869140625, 0.081298828125, 0.1610107421875, 0.24072265625, 0.3204345703125, 0.400146484375, 0.4798583984375, 0.5595703125, 0.6392822265625, 0.718994140625, 0.7987060546875, 0.87841796875, 0.9581298828125, 1.037841796875, 1.1175537109375, 1.197265625, 1.2769775390625, 1.356689453125, 1.4364013671875, 1.51611328125, 1.5958251953125, 1.675537109375, 1.7552490234375, 1.8349609375, 1.9146728515625, 1.994384765625, 2.0740966796875, 2.15380859375, 2.2335205078125, 2.313232421875, 2.3929443359375, 2.47265625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 3.0, 4.0, 6.0, 9.0, 6.0, 7.0, 8.0, 7.0, 8.0, 16.0, 18.0, 20.0, 24.0, 30.0, 26.0, 29.0, 51.0, 43.0, 56.0, 73.0, 57.0, 55.0, 58.0, 61.0, 48.0, 35.0, 40.0, 22.0, 21.0, 20.0, 21.0, 20.0, 22.0, 14.0, 8.0, 11.0, 12.0, 9.0, 0.0, 9.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008940696716308594, -0.0008653402328491211, -0.0008366107940673828, -0.0008078813552856445, -0.0007791519165039062, -0.000750422477722168, -0.0007216930389404297, -0.0006929636001586914, -0.0006642341613769531, -0.0006355047225952148, -0.0006067752838134766, -0.0005780458450317383, -0.00054931640625, -0.0005205869674682617, -0.0004918575286865234, -0.00046312808990478516, -0.0004343986511230469, -0.0004056692123413086, -0.0003769397735595703, -0.00034821033477783203, -0.00031948089599609375, -0.00029075145721435547, -0.0002620220184326172, -0.0002332925796508789, -0.00020456314086914062, -0.00017583370208740234, -0.00014710426330566406, -0.00011837482452392578, -8.96453857421875e-05, -6.091594696044922e-05, -3.218650817871094e-05, -3.4570693969726562e-06, 2.5272369384765625e-05, 5.4001808166503906e-05, 8.273124694824219e-05, 0.00011146068572998047, 0.00014019012451171875, 0.00016891956329345703, 0.0001976490020751953, 0.0002263784408569336, 0.0002551078796386719, 0.00028383731842041016, 0.00031256675720214844, 0.0003412961959838867, 0.000370025634765625, 0.0003987550735473633, 0.00042748451232910156, 0.00045621395111083984, 0.0004849433898925781, 0.0005136728286743164, 0.0005424022674560547, 0.000571131706237793, 0.0005998611450195312, 0.0006285905838012695, 0.0006573200225830078, 0.0006860494613647461, 0.0007147789001464844, 0.0007435083389282227, 0.0007722377777099609, 0.0008009672164916992, 0.0008296966552734375, 0.0008584260940551758, 0.0008871555328369141, 0.0009158849716186523, 0.0009446144104003906]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 9.0, 18.0, 11.0, 14.0, 15.0, 19.0, 20.0, 36.0, 41.0, 54.0, 73.0, 129.0, 153.0, 312.0, 679.0, 10232.0, 1028770.0, 6427.0, 631.0, 273.0, 187.0, 125.0, 75.0, 58.0, 31.0, 26.0, 27.0, 14.0, 11.0, 21.0, 12.0, 10.0, 6.0, 4.0, 9.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0229644775390625, -0.02221059799194336, -0.02145671844482422, -0.020702838897705078, -0.019948959350585938, -0.019195079803466797, -0.018441200256347656, -0.017687320709228516, -0.016933441162109375, -0.016179561614990234, -0.015425682067871094, -0.014671802520751953, -0.013917922973632812, -0.013164043426513672, -0.012410163879394531, -0.01165628433227539, -0.01090240478515625, -0.01014852523803711, -0.009394645690917969, -0.008640766143798828, -0.007886886596679688, -0.007133007049560547, -0.006379127502441406, -0.005625247955322266, -0.004871368408203125, -0.004117488861083984, -0.0033636093139648438, -0.002609729766845703, -0.0018558502197265625, -0.0011019706726074219, -0.00034809112548828125, 0.0004057884216308594, 0.00115966796875, 0.0019135475158691406, 0.0026674270629882812, 0.003421306610107422, 0.0041751861572265625, 0.004929065704345703, 0.005682945251464844, 0.006436824798583984, 0.007190704345703125, 0.007944583892822266, 0.008698463439941406, 0.009452342987060547, 0.010206222534179688, 0.010960102081298828, 0.011713981628417969, 0.01246786117553711, 0.01322174072265625, 0.01397562026977539, 0.014729499816894531, 0.015483379364013672, 0.016237258911132812, 0.016991138458251953, 0.017745018005371094, 0.018498897552490234, 0.019252777099609375, 0.020006656646728516, 0.020760536193847656, 0.021514415740966797, 0.022268295288085938, 0.023022174835205078, 0.02377605438232422, 0.02452993392944336, 0.0252838134765625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 159.0, 767.0, 80.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00251849670894444, -0.002354952972382307, -0.0021914090029895306, -0.0020278652664273977, -0.001864321529865265, -0.001700777793303132, -0.0015372339403256774, -0.0013736900873482227, -0.00121014635078609, -0.001046602614223957, -0.0008830587612465024, -0.0007195149664767087, -0.0005559711717069149, -0.00039242737693712115, -0.0002288835821673274, -6.533972918987274e-05, 9.82040073722601e-05, 0.00026174780214205384, 0.0004252915969118476, 0.0005888353916816413, 0.0007523791864514351, 0.0009159229812212288, 0.0010794667759910226, 0.0012430106289684772, 0.00140655436553061, 0.001570098102092743, 0.0017336419550701976, 0.0018971858080476522, 0.002060729544609785, 0.002224273281171918, 0.0023878170177340508, 0.0025513609871268272, 0.0027149049565196037, 0.0028784486930817366, 0.0030419924296438694, 0.003205536399036646, 0.0033690801355987787, 0.0035326238721609116, 0.003696167841553688, 0.003859711578115821, 0.004023255314677954, 0.00418679928407073, 0.004350342787802219, 0.004513886757194996, 0.004677430726587772, 0.0048409742303192616, 0.005004518199712038, 0.005168061703443527, 0.005331605672836304, 0.00549514964222908, 0.005658693145960569, 0.005822237115353346, 0.005985780619084835, 0.0061493245884776115, 0.006312868557870388, 0.0064764125272631645, 0.006639956030994654, 0.00680350000038743, 0.006967043504118919, 0.007130587473511696, 0.007294131442904472, 0.0074576749466359615, 0.007621218916028738, 0.007784762419760227, 0.007948306389153004]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 5.0, 7.0, 5.0, 3.0, 5.0, 7.0, 20.0, 15.0, 12.0, 16.0, 27.0, 23.0, 24.0, 20.0, 27.0, 21.0, 39.0, 29.0, 40.0, 33.0, 42.0, 42.0, 43.0, 53.0, 39.0, 41.0, 30.0, 31.0, 32.0, 34.0, 38.0, 30.0, 27.0, 19.0, 21.0, 24.0, 8.0, 11.0, 15.0, 14.0, 7.0, 4.0, 6.0, 4.0, 0.0, 1.0, 4.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.000576317310333252, -0.0005602911114692688, -0.0005442649126052856, -0.0005282387137413025, -0.0005122125148773193, -0.0004961863160133362, -0.00048016011714935303, -0.0004641339182853699, -0.0004481077194213867, -0.00043208152055740356, -0.0004160553216934204, -0.00040002912282943726, -0.0003840029239654541, -0.00036797672510147095, -0.0003519505262374878, -0.00033592432737350464, -0.0003198981285095215, -0.00030387192964553833, -0.0002878457307815552, -0.000271819531917572, -0.00025579333305358887, -0.0002397671341896057, -0.00022374093532562256, -0.0002077147364616394, -0.00019168853759765625, -0.0001756623387336731, -0.00015963613986968994, -0.0001436099410057068, -0.00012758374214172363, -0.00011155754327774048, -9.553134441375732e-05, -7.950514554977417e-05, -6.347894668579102e-05, -4.745274782180786e-05, -3.142654895782471e-05, -1.5400350093841553e-05, 6.258487701416016e-07, 1.6652047634124756e-05, 3.267824649810791e-05, 4.8704445362091064e-05, 6.473064422607422e-05, 8.075684309005737e-05, 9.678304195404053e-05, 0.00011280924081802368, 0.00012883543968200684, 0.00014486163854599, 0.00016088783740997314, 0.0001769140362739563, 0.00019294023513793945, 0.0002089664340019226, 0.00022499263286590576, 0.00024101883172988892, 0.00025704503059387207, 0.0002730712294578552, 0.0002890974283218384, 0.00030512362718582153, 0.0003211498260498047, 0.00033717602491378784, 0.000353202223777771, 0.00036922842264175415, 0.0003852546215057373, 0.00040128082036972046, 0.0004173070192337036, 0.00043333321809768677, 0.0004493594169616699]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 10.0, 7.0, 9.0, 10.0, 9.0, 17.0, 12.0, 16.0, 20.0, 18.0, 25.0, 26.0, 32.0, 38.0, 36.0, 39.0, 35.0, 45.0, 41.0, 48.0, 38.0, 38.0, 42.0, 34.0, 35.0, 43.0, 20.0, 39.0, 38.0, 30.0, 29.0, 23.0, 11.0, 23.0, 12.0, 12.0, 11.0, 5.0, 12.0, 6.0, 5.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.984375, -12.58544921875, -12.1865234375, -11.78759765625, -11.388671875, -10.98974609375, -10.5908203125, -10.19189453125, -9.79296875, -9.39404296875, -8.9951171875, -8.59619140625, -8.197265625, -7.79833984375, -7.3994140625, -7.00048828125, -6.6015625, -6.20263671875, -5.8037109375, -5.40478515625, -5.005859375, -4.60693359375, -4.2080078125, -3.80908203125, -3.41015625, -3.01123046875, -2.6123046875, -2.21337890625, -1.814453125, -1.41552734375, -1.0166015625, -0.61767578125, -0.21875, 0.18017578125, 0.5791015625, 0.97802734375, 1.376953125, 1.77587890625, 2.1748046875, 2.57373046875, 2.97265625, 3.37158203125, 3.7705078125, 4.16943359375, 4.568359375, 4.96728515625, 5.3662109375, 5.76513671875, 6.1640625, 6.56298828125, 6.9619140625, 7.36083984375, 7.759765625, 8.15869140625, 8.5576171875, 8.95654296875, 9.35546875, 9.75439453125, 10.1533203125, 10.55224609375, 10.951171875, 11.35009765625, 11.7490234375, 12.14794921875, 12.546875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 12.0, 11.0, 16.0, 12.0, 30.0, 34.0, 37.0, 61.0, 69.0, 88.0, 103.0, 179.0, 265.0, 392.0, 735.0, 1573.0, 3930.0, 11128.0, 37735.0, 170652.0, 580925.0, 181653.0, 39478.0, 11630.0, 4050.0, 1615.0, 761.0, 439.0, 294.0, 165.0, 121.0, 86.0, 65.0, 52.0, 36.0, 35.0, 25.0, 15.0, 19.0, 11.0, 8.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.65625, -16.14404296875, -15.6318359375, -15.11962890625, -14.607421875, -14.09521484375, -13.5830078125, -13.07080078125, -12.55859375, -12.04638671875, -11.5341796875, -11.02197265625, -10.509765625, -9.99755859375, -9.4853515625, -8.97314453125, -8.4609375, -7.94873046875, -7.4365234375, -6.92431640625, -6.412109375, -5.89990234375, -5.3876953125, -4.87548828125, -4.36328125, -3.85107421875, -3.3388671875, -2.82666015625, -2.314453125, -1.80224609375, -1.2900390625, -0.77783203125, -0.265625, 0.24658203125, 0.7587890625, 1.27099609375, 1.783203125, 2.29541015625, 2.8076171875, 3.31982421875, 3.83203125, 4.34423828125, 4.8564453125, 5.36865234375, 5.880859375, 6.39306640625, 6.9052734375, 7.41748046875, 7.9296875, 8.44189453125, 8.9541015625, 9.46630859375, 9.978515625, 10.49072265625, 11.0029296875, 11.51513671875, 12.02734375, 12.53955078125, 13.0517578125, 13.56396484375, 14.076171875, 14.58837890625, 15.1005859375, 15.61279296875, 16.125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 8.0, 15.0, 10.0, 11.0, 24.0, 28.0, 17.0, 20.0, 21.0, 40.0, 43.0, 56.0, 57.0, 76.0, 106.0, 365.0, 1525.0, 136.0, 88.0, 63.0, 52.0, 38.0, 36.0, 39.0, 28.0, 22.0, 22.0, 19.0, 21.0, 15.0, 12.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.8125, -31.599609375, -30.38671875, -29.173828125, -27.9609375, -26.748046875, -25.53515625, -24.322265625, -23.109375, -21.896484375, -20.68359375, -19.470703125, -18.2578125, -17.044921875, -15.83203125, -14.619140625, -13.40625, -12.193359375, -10.98046875, -9.767578125, -8.5546875, -7.341796875, -6.12890625, -4.916015625, -3.703125, -2.490234375, -1.27734375, -0.064453125, 1.1484375, 2.361328125, 3.57421875, 4.787109375, 6.0, 7.212890625, 8.42578125, 9.638671875, 10.8515625, 12.064453125, 13.27734375, 14.490234375, 15.703125, 16.916015625, 18.12890625, 19.341796875, 20.5546875, 21.767578125, 22.98046875, 24.193359375, 25.40625, 26.619140625, 27.83203125, 29.044921875, 30.2578125, 31.470703125, 32.68359375, 33.896484375, 35.109375, 36.322265625, 37.53515625, 38.748046875, 39.9609375, 41.173828125, 42.38671875, 43.599609375, 44.8125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 5.0, 10.0, 9.0, 16.0, 16.0, 26.0, 43.0, 55.0, 62.0, 76.0, 121.0, 171.0, 238.0, 395.0, 906.0, 5953.0, 626308.0, 2498915.0, 10065.0, 1056.0, 429.0, 230.0, 165.0, 109.0, 87.0, 62.0, 50.0, 35.0, 21.0, 20.0, 19.0, 13.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.21875, -49.51611328125, -47.8134765625, -46.11083984375, -44.408203125, -42.70556640625, -41.0029296875, -39.30029296875, -37.59765625, -35.89501953125, -34.1923828125, -32.48974609375, -30.787109375, -29.08447265625, -27.3818359375, -25.67919921875, -23.9765625, -22.27392578125, -20.5712890625, -18.86865234375, -17.166015625, -15.46337890625, -13.7607421875, -12.05810546875, -10.35546875, -8.65283203125, -6.9501953125, -5.24755859375, -3.544921875, -1.84228515625, -0.1396484375, 1.56298828125, 3.265625, 4.96826171875, 6.6708984375, 8.37353515625, 10.076171875, 11.77880859375, 13.4814453125, 15.18408203125, 16.88671875, 18.58935546875, 20.2919921875, 21.99462890625, 23.697265625, 25.39990234375, 27.1025390625, 28.80517578125, 30.5078125, 32.21044921875, 33.9130859375, 35.61572265625, 37.318359375, 39.02099609375, 40.7236328125, 42.42626953125, 44.12890625, 45.83154296875, 47.5341796875, 49.23681640625, 50.939453125, 52.64208984375, 54.3447265625, 56.04736328125, 57.75]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 58.0, 440.0, 438.0, 67.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.07611083984375, -163.00210571289062, -158.9281005859375, -154.8540802001953, -150.7800750732422, -146.70606994628906, -142.63206481933594, -138.55804443359375, -134.48403930664062, -130.4100341796875, -126.33602142333984, -122.26201629638672, -118.18800354003906, -114.11399841308594, -110.03999328613281, -105.96598052978516, -101.89197540283203, -97.8179702758789, -93.74395751953125, -89.66995239257812, -85.59593963623047, -81.52193450927734, -77.44792175292969, -73.37391662597656, -69.29991149902344, -65.22590637207031, -61.151893615722656, -57.07788848876953, -53.003875732421875, -48.92987060546875, -44.85586166381836, -40.78185272216797, -36.70783233642578, -32.63382339477539, -28.559814453125, -24.485807418823242, -20.41179847717285, -16.33778953552246, -12.263782501220703, -8.189773559570312, -4.115764617919922, -0.04175615310668945, 4.032252311706543, 8.106260299682617, 12.180269241333008, 16.2542781829834, 20.328285217285156, 24.402294158935547, 28.476303100585938, 32.55031204223633, 36.62432098388672, 40.698326110839844, 44.7723388671875, 48.846343994140625, 52.920352935791016, 56.994361877441406, 61.0683708190918, 65.14237976074219, 69.21638488769531, 73.29039764404297, 77.3644027709961, 81.43841552734375, 85.51242065429688, 89.58642578125, 93.66043853759766]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 10.0, 8.0, 16.0, 8.0, 20.0, 16.0, 21.0, 24.0, 19.0, 31.0, 22.0, 19.0, 41.0, 47.0, 37.0, 35.0, 35.0, 38.0, 45.0, 38.0, 45.0, 35.0, 31.0, 35.0, 33.0, 32.0, 26.0, 33.0, 19.0, 25.0, 18.0, 17.0, 15.0, 16.0, 11.0, 20.0, 16.0, 9.0, 8.0, 6.0, 6.0, 6.0, 4.0, 3.0, 3.0, 4.0], "bins": [-85.65505981445312, -83.41960144042969, -81.18414306640625, -78.94868469238281, -76.7132339477539, -74.47777557373047, -72.24231719970703, -70.0068588256836, -67.77140045166016, -65.53594207763672, -63.30048751831055, -61.06502914428711, -58.82957077026367, -56.5941162109375, -54.35865783691406, -52.123199462890625, -49.88774490356445, -47.652286529541016, -45.416831970214844, -43.181373596191406, -40.94591522216797, -38.71045684814453, -36.47500228881836, -34.23954391479492, -32.00408935546875, -29.768632888793945, -27.533174514770508, -25.297718048095703, -23.062259674072266, -20.82680320739746, -18.591346740722656, -16.35588836669922, -14.120433807373047, -11.884976387023926, -9.649518966674805, -7.4140625, -5.178605079650879, -2.943147659301758, -0.7076911926269531, 1.527766227722168, 3.763223648071289, 5.99868106842041, 8.234138488769531, 10.469594955444336, 12.705052375793457, 14.940509796142578, 17.175966262817383, 19.411422729492188, 21.646881103515625, 23.88233757019043, 26.117795944213867, 28.353252410888672, 30.58871078491211, 32.82416534423828, 35.05962371826172, 37.295082092285156, 39.530540466308594, 41.76599884033203, 44.0014533996582, 46.23691177368164, 48.47237014770508, 50.70782470703125, 52.94328308105469, 55.178741455078125, 57.4141960144043]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 4.0, 8.0, 5.0, 14.0, 8.0, 10.0, 8.0, 19.0, 19.0, 16.0, 24.0, 24.0, 29.0, 28.0, 36.0, 40.0, 37.0, 35.0, 39.0, 39.0, 49.0, 35.0, 35.0, 38.0, 37.0, 47.0, 26.0, 29.0, 36.0, 32.0, 25.0, 21.0, 20.0, 17.0, 19.0, 27.0, 10.0, 9.0, 10.0, 11.0, 11.0, 3.0, 7.0, 3.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8203125, -11.433837890625, -11.04736328125, -10.660888671875, -10.2744140625, -9.887939453125, -9.50146484375, -9.114990234375, -8.728515625, -8.342041015625, -7.95556640625, -7.569091796875, -7.1826171875, -6.796142578125, -6.40966796875, -6.023193359375, -5.63671875, -5.250244140625, -4.86376953125, -4.477294921875, -4.0908203125, -3.704345703125, -3.31787109375, -2.931396484375, -2.544921875, -2.158447265625, -1.77197265625, -1.385498046875, -0.9990234375, -0.612548828125, -0.22607421875, 0.160400390625, 0.546875, 0.933349609375, 1.31982421875, 1.706298828125, 2.0927734375, 2.479248046875, 2.86572265625, 3.252197265625, 3.638671875, 4.025146484375, 4.41162109375, 4.798095703125, 5.1845703125, 5.571044921875, 5.95751953125, 6.343994140625, 6.73046875, 7.116943359375, 7.50341796875, 7.889892578125, 8.2763671875, 8.662841796875, 9.04931640625, 9.435791015625, 9.822265625, 10.208740234375, 10.59521484375, 10.981689453125, 11.3681640625, 11.754638671875, 12.14111328125, 12.527587890625, 12.9140625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 7.0, 5.0, 10.0, 9.0, 12.0, 10.0, 12.0, 9.0, 14.0, 18.0, 26.0, 24.0, 24.0, 29.0, 32.0, 53.0, 95.0, 123.0, 287.0, 685.0, 3163.0, 38401.0, 2055788.0, 2052705.0, 37960.0, 3187.0, 765.0, 283.0, 122.0, 105.0, 62.0, 42.0, 24.0, 32.0, 20.0, 19.0, 20.0, 14.0, 16.0, 9.0, 13.0, 6.0, 9.0, 10.0, 8.0, 1.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0], "bins": [-39.25, -38.060546875, -36.87109375, -35.681640625, -34.4921875, -33.302734375, -32.11328125, -30.923828125, -29.734375, -28.544921875, -27.35546875, -26.166015625, -24.9765625, -23.787109375, -22.59765625, -21.408203125, -20.21875, -19.029296875, -17.83984375, -16.650390625, -15.4609375, -14.271484375, -13.08203125, -11.892578125, -10.703125, -9.513671875, -8.32421875, -7.134765625, -5.9453125, -4.755859375, -3.56640625, -2.376953125, -1.1875, 0.001953125, 1.19140625, 2.380859375, 3.5703125, 4.759765625, 5.94921875, 7.138671875, 8.328125, 9.517578125, 10.70703125, 11.896484375, 13.0859375, 14.275390625, 15.46484375, 16.654296875, 17.84375, 19.033203125, 20.22265625, 21.412109375, 22.6015625, 23.791015625, 24.98046875, 26.169921875, 27.359375, 28.548828125, 29.73828125, 30.927734375, 32.1171875, 33.306640625, 34.49609375, 35.685546875, 36.875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 9.0, 12.0, 15.0, 11.0, 27.0, 55.0, 47.0, 57.0, 92.0, 162.0, 278.0, 365.0, 493.0, 558.0, 553.0, 436.0, 280.0, 181.0, 117.0, 84.0, 56.0, 42.0, 36.0, 16.0, 17.0, 19.0, 16.0, 12.0, 4.0, 4.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.78125, -16.252197265625, -15.72314453125, -15.194091796875, -14.6650390625, -14.135986328125, -13.60693359375, -13.077880859375, -12.548828125, -12.019775390625, -11.49072265625, -10.961669921875, -10.4326171875, -9.903564453125, -9.37451171875, -8.845458984375, -8.31640625, -7.787353515625, -7.25830078125, -6.729248046875, -6.2001953125, -5.671142578125, -5.14208984375, -4.613037109375, -4.083984375, -3.554931640625, -3.02587890625, -2.496826171875, -1.9677734375, -1.438720703125, -0.90966796875, -0.380615234375, 0.1484375, 0.677490234375, 1.20654296875, 1.735595703125, 2.2646484375, 2.793701171875, 3.32275390625, 3.851806640625, 4.380859375, 4.909912109375, 5.43896484375, 5.968017578125, 6.4970703125, 7.026123046875, 7.55517578125, 8.084228515625, 8.61328125, 9.142333984375, 9.67138671875, 10.200439453125, 10.7294921875, 11.258544921875, 11.78759765625, 12.316650390625, 12.845703125, 13.374755859375, 13.90380859375, 14.432861328125, 14.9619140625, 15.490966796875, 16.02001953125, 16.549072265625, 17.078125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 6.0, 11.0, 10.0, 17.0, 16.0, 36.0, 37.0, 79.0, 140.0, 216.0, 580.0, 2057.0, 29225.0, 3606772.0, 543098.0, 9882.0, 1251.0, 375.0, 176.0, 93.0, 61.0, 35.0, 35.0, 20.0, 10.0, 8.0, 13.0, 9.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-66.8125, -64.947265625, -63.08203125, -61.216796875, -59.3515625, -57.486328125, -55.62109375, -53.755859375, -51.890625, -50.025390625, -48.16015625, -46.294921875, -44.4296875, -42.564453125, -40.69921875, -38.833984375, -36.96875, -35.103515625, -33.23828125, -31.373046875, -29.5078125, -27.642578125, -25.77734375, -23.912109375, -22.046875, -20.181640625, -18.31640625, -16.451171875, -14.5859375, -12.720703125, -10.85546875, -8.990234375, -7.125, -5.259765625, -3.39453125, -1.529296875, 0.3359375, 2.201171875, 4.06640625, 5.931640625, 7.796875, 9.662109375, 11.52734375, 13.392578125, 15.2578125, 17.123046875, 18.98828125, 20.853515625, 22.71875, 24.583984375, 26.44921875, 28.314453125, 30.1796875, 32.044921875, 33.91015625, 35.775390625, 37.640625, 39.505859375, 41.37109375, 43.236328125, 45.1015625, 46.966796875, 48.83203125, 50.697265625, 52.5625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 141.0, 668.0, 194.0, 10.0, 0.0, 0.0, 1.0], "bins": [-630.7893676757812, -620.00732421875, -609.2252197265625, -598.4431762695312, -587.6611328125, -576.8790893554688, -566.0969848632812, -555.31494140625, -544.5328979492188, -533.7508544921875, -522.96875, -512.1867065429688, -501.4046630859375, -490.6225891113281, -479.84051513671875, -469.0584716796875, -458.2763977050781, -447.49432373046875, -436.7122802734375, -425.9302062988281, -415.1481628417969, -404.3660888671875, -393.58404541015625, -382.8019714355469, -372.0198974609375, -361.2378234863281, -350.4557800292969, -339.6737060546875, -328.89166259765625, -318.1095886230469, -307.3275146484375, -296.54547119140625, -285.763427734375, -274.9813537597656, -264.1993103027344, -253.417236328125, -242.63519287109375, -231.85311889648438, -221.07106018066406, -210.28900146484375, -199.5069580078125, -188.7248992919922, -177.94284057617188, -167.1607666015625, -156.37872314453125, -145.59664916992188, -134.81459045410156, -124.03253173828125, -113.25047302246094, -102.46841430664062, -91.68635559082031, -80.90428924560547, -70.12223052978516, -59.340171813964844, -48.55810546875, -37.77604675292969, -26.99398422241211, -16.211923599243164, -5.429862976074219, 5.352199554443359, 16.134258270263672, 26.916316986083984, 37.69838333129883, 48.48044204711914, 59.26250076293945]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 4.0, 4.0, 9.0, 6.0, 5.0, 25.0, 12.0, 18.0, 14.0, 22.0, 20.0, 22.0, 27.0, 32.0, 36.0, 26.0, 39.0, 34.0, 45.0, 45.0, 41.0, 28.0, 44.0, 34.0, 31.0, 39.0, 42.0, 33.0, 33.0, 31.0, 29.0, 24.0, 29.0, 14.0, 20.0, 13.0, 15.0, 12.0, 18.0, 5.0, 4.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-52.5272102355957, -50.97853469848633, -49.42985916137695, -47.88118362426758, -46.3325080871582, -44.78383255004883, -43.23515701293945, -41.68648147583008, -40.1378059387207, -38.58913040161133, -37.04045486450195, -35.49177932739258, -33.9431037902832, -32.39442825317383, -30.845752716064453, -29.297077178955078, -27.748401641845703, -26.199726104736328, -24.651050567626953, -23.102375030517578, -21.553699493408203, -20.005023956298828, -18.456348419189453, -16.907672882080078, -15.358997344970703, -13.810321807861328, -12.261646270751953, -10.712970733642578, -9.164295196533203, -7.615619659423828, -6.066944122314453, -4.518268585205078, -2.969593048095703, -1.4209175109863281, 0.12775802612304688, 1.6764335632324219, 3.225109100341797, 4.773784637451172, 6.322460174560547, 7.871135711669922, 9.419811248779297, 10.968486785888672, 12.517162322998047, 14.065837860107422, 15.614513397216797, 17.163188934326172, 18.711864471435547, 20.260540008544922, 21.809215545654297, 23.357891082763672, 24.906566619873047, 26.455242156982422, 28.003917694091797, 29.552593231201172, 31.101268768310547, 32.64994430541992, 34.1986198425293, 35.74729537963867, 37.29597091674805, 38.84464645385742, 40.3933219909668, 41.94199752807617, 43.49067306518555, 45.03934860229492, 46.5880241394043]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 8.0, 7.0, 13.0, 9.0, 11.0, 16.0, 13.0, 12.0, 25.0, 23.0, 16.0, 35.0, 26.0, 25.0, 37.0, 39.0, 28.0, 38.0, 35.0, 40.0, 40.0, 38.0, 33.0, 38.0, 47.0, 37.0, 33.0, 31.0, 23.0, 25.0, 24.0, 25.0, 19.0, 17.0, 16.0, 19.0, 13.0, 11.0, 15.0, 17.0, 5.0, 3.0, 8.0, 6.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.6953125, -11.3194580078125, -10.943603515625, -10.5677490234375, -10.19189453125, -9.8160400390625, -9.440185546875, -9.0643310546875, -8.6884765625, -8.3126220703125, -7.936767578125, -7.5609130859375, -7.18505859375, -6.8092041015625, -6.433349609375, -6.0574951171875, -5.681640625, -5.3057861328125, -4.929931640625, -4.5540771484375, -4.17822265625, -3.8023681640625, -3.426513671875, -3.0506591796875, -2.6748046875, -2.2989501953125, -1.923095703125, -1.5472412109375, -1.17138671875, -0.7955322265625, -0.419677734375, -0.0438232421875, 0.33203125, 0.7078857421875, 1.083740234375, 1.4595947265625, 1.83544921875, 2.2113037109375, 2.587158203125, 2.9630126953125, 3.3388671875, 3.7147216796875, 4.090576171875, 4.4664306640625, 4.84228515625, 5.2181396484375, 5.593994140625, 5.9698486328125, 6.345703125, 6.7215576171875, 7.097412109375, 7.4732666015625, 7.84912109375, 8.2249755859375, 8.600830078125, 8.9766845703125, 9.3525390625, 9.7283935546875, 10.104248046875, 10.4801025390625, 10.85595703125, 11.2318115234375, 11.607666015625, 11.9835205078125, 12.359375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 9.0, 9.0, 13.0, 16.0, 35.0, 41.0, 64.0, 90.0, 146.0, 199.0, 278.0, 459.0, 649.0, 940.0, 1456.0, 1996.0, 2924.0, 4207.0, 6195.0, 9092.0, 13000.0, 19051.0, 28719.0, 44578.0, 73205.0, 139180.0, 321608.0, 158518.0, 79679.0, 47152.0, 30108.0, 20501.0, 13797.0, 9522.0, 6638.0, 4602.0, 3134.0, 2156.0, 1449.0, 1000.0, 704.0, 459.0, 298.0, 246.0, 164.0, 82.0, 66.0, 49.0, 34.0, 16.0, 10.0, 7.0, 9.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-2.17578125, -2.10687255859375, -2.0379638671875, -1.96905517578125, -1.900146484375, -1.83123779296875, -1.7623291015625, -1.69342041015625, -1.62451171875, -1.55560302734375, -1.4866943359375, -1.41778564453125, -1.348876953125, -1.27996826171875, -1.2110595703125, -1.14215087890625, -1.0732421875, -1.00433349609375, -0.9354248046875, -0.86651611328125, -0.797607421875, -0.72869873046875, -0.6597900390625, -0.59088134765625, -0.52197265625, -0.45306396484375, -0.3841552734375, -0.31524658203125, -0.246337890625, -0.17742919921875, -0.1085205078125, -0.03961181640625, 0.029296875, 0.09820556640625, 0.1671142578125, 0.23602294921875, 0.304931640625, 0.37384033203125, 0.4427490234375, 0.51165771484375, 0.58056640625, 0.64947509765625, 0.7183837890625, 0.78729248046875, 0.856201171875, 0.92510986328125, 0.9940185546875, 1.06292724609375, 1.1318359375, 1.20074462890625, 1.2696533203125, 1.33856201171875, 1.407470703125, 1.47637939453125, 1.5452880859375, 1.61419677734375, 1.68310546875, 1.75201416015625, 1.8209228515625, 1.88983154296875, 1.958740234375, 2.02764892578125, 2.0965576171875, 2.16546630859375, 2.234375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 5.0, 0.0, 1.0, 2.0, 5.0, 8.0, 7.0, 2.0, 1.0, 7.0, 11.0, 15.0, 17.0, 17.0, 19.0, 13.0, 20.0, 18.0, 18.0, 16.0, 20.0, 32.0, 32.0, 36.0, 44.0, 19.0, 46.0, 35.0, 47.0, 1057.0, 37.0, 39.0, 32.0, 35.0, 24.0, 30.0, 34.0, 26.0, 19.0, 35.0, 21.0, 29.0, 13.0, 12.0, 20.0, 14.0, 10.0, 6.0, 13.0, 5.0, 1.0, 2.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.9140625, -6.68603515625, -6.4580078125, -6.22998046875, -6.001953125, -5.77392578125, -5.5458984375, -5.31787109375, -5.08984375, -4.86181640625, -4.6337890625, -4.40576171875, -4.177734375, -3.94970703125, -3.7216796875, -3.49365234375, -3.265625, -3.03759765625, -2.8095703125, -2.58154296875, -2.353515625, -2.12548828125, -1.8974609375, -1.66943359375, -1.44140625, -1.21337890625, -0.9853515625, -0.75732421875, -0.529296875, -0.30126953125, -0.0732421875, 0.15478515625, 0.3828125, 0.61083984375, 0.8388671875, 1.06689453125, 1.294921875, 1.52294921875, 1.7509765625, 1.97900390625, 2.20703125, 2.43505859375, 2.6630859375, 2.89111328125, 3.119140625, 3.34716796875, 3.5751953125, 3.80322265625, 4.03125, 4.25927734375, 4.4873046875, 4.71533203125, 4.943359375, 5.17138671875, 5.3994140625, 5.62744140625, 5.85546875, 6.08349609375, 6.3115234375, 6.53955078125, 6.767578125, 6.99560546875, 7.2236328125, 7.45166015625, 7.6796875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 6.0, 1.0, 6.0, 11.0, 11.0, 17.0, 19.0, 33.0, 62.0, 58.0, 77.0, 119.0, 228.0, 303.0, 409.0, 677.0, 894.0, 1301.0, 2010.0, 2915.0, 4396.0, 6627.0, 9666.0, 14236.0, 21046.0, 31121.0, 47735.0, 79779.0, 154003.0, 1367792.0, 139782.0, 74128.0, 46009.0, 29680.0, 19620.0, 13367.0, 9292.0, 6292.0, 4327.0, 2780.0, 2034.0, 1332.0, 920.0, 631.0, 440.0, 295.0, 225.0, 110.0, 72.0, 81.0, 60.0, 29.0, 19.0, 20.0, 16.0, 13.0, 3.0, 5.0, 4.0, 2.0], "bins": [-2.291015625, -2.222503662109375, -2.15399169921875, -2.085479736328125, -2.0169677734375, -1.948455810546875, -1.87994384765625, -1.811431884765625, -1.742919921875, -1.674407958984375, -1.60589599609375, -1.537384033203125, -1.4688720703125, -1.400360107421875, -1.33184814453125, -1.263336181640625, -1.19482421875, -1.126312255859375, -1.05780029296875, -0.989288330078125, -0.9207763671875, -0.852264404296875, -0.78375244140625, -0.715240478515625, -0.646728515625, -0.578216552734375, -0.50970458984375, -0.441192626953125, -0.3726806640625, -0.304168701171875, -0.23565673828125, -0.167144775390625, -0.0986328125, -0.030120849609375, 0.03839111328125, 0.106903076171875, 0.1754150390625, 0.243927001953125, 0.31243896484375, 0.380950927734375, 0.449462890625, 0.517974853515625, 0.58648681640625, 0.654998779296875, 0.7235107421875, 0.792022705078125, 0.86053466796875, 0.929046630859375, 0.99755859375, 1.066070556640625, 1.13458251953125, 1.203094482421875, 1.2716064453125, 1.340118408203125, 1.40863037109375, 1.477142333984375, 1.545654296875, 1.614166259765625, 1.68267822265625, 1.751190185546875, 1.8197021484375, 1.888214111328125, 1.95672607421875, 2.025238037109375, 2.09375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 1.0, 2.0, 2.0, 5.0, 4.0, 10.0, 6.0, 9.0, 8.0, 9.0, 19.0, 24.0, 22.0, 20.0, 28.0, 28.0, 47.0, 46.0, 42.0, 61.0, 80.0, 75.0, 74.0, 48.0, 58.0, 48.0, 45.0, 31.0, 25.0, 21.0, 20.0, 15.0, 18.0, 11.0, 8.0, 4.0, 10.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0013227462768554688, -0.001277923583984375, -0.0012331008911132812, -0.0011882781982421875, -0.0011434555053710938, -0.0010986328125, -0.0010538101196289062, -0.0010089874267578125, -0.0009641647338867188, -0.000919342041015625, -0.0008745193481445312, -0.0008296966552734375, -0.0007848739624023438, -0.00074005126953125, -0.0006952285766601562, -0.0006504058837890625, -0.0006055831909179688, -0.000560760498046875, -0.0005159378051757812, -0.0004711151123046875, -0.00042629241943359375, -0.0003814697265625, -0.00033664703369140625, -0.0002918243408203125, -0.00024700164794921875, -0.000202178955078125, -0.00015735626220703125, -0.0001125335693359375, -6.771087646484375e-05, -2.288818359375e-05, 2.193450927734375e-05, 6.67572021484375e-05, 0.00011157989501953125, 0.000156402587890625, 0.00020122528076171875, 0.0002460479736328125, 0.00029087066650390625, 0.000335693359375, 0.00038051605224609375, 0.0004253387451171875, 0.00047016143798828125, 0.000514984130859375, 0.0005598068237304688, 0.0006046295166015625, 0.0006494522094726562, 0.00069427490234375, 0.0007390975952148438, 0.0007839202880859375, 0.0008287429809570312, 0.000873565673828125, 0.0009183883666992188, 0.0009632110595703125, 0.0010080337524414062, 0.0010528564453125, 0.0010976791381835938, 0.0011425018310546875, 0.0011873245239257812, 0.001232147216796875, 0.0012769699096679688, 0.0013217926025390625, 0.0013666152954101562, 0.00141143798828125, 0.0014562606811523438, 0.0015010833740234375, 0.0015459060668945312]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 6.0, 5.0, 7.0, 9.0, 8.0, 13.0, 12.0, 22.0, 22.0, 17.0, 44.0, 55.0, 53.0, 101.0, 136.0, 196.0, 349.0, 816.0, 36485.0, 1006810.0, 1947.0, 528.0, 294.0, 129.0, 99.0, 82.0, 61.0, 44.0, 34.0, 38.0, 29.0, 14.0, 16.0, 16.0, 10.0, 9.0, 7.0, 9.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0], "bins": [-0.033050537109375, -0.032138824462890625, -0.03122711181640625, -0.030315399169921875, -0.0294036865234375, -0.028491973876953125, -0.02758026123046875, -0.026668548583984375, -0.0257568359375, -0.024845123291015625, -0.02393341064453125, -0.023021697998046875, -0.0221099853515625, -0.021198272705078125, -0.02028656005859375, -0.019374847412109375, -0.018463134765625, -0.017551422119140625, -0.01663970947265625, -0.015727996826171875, -0.0148162841796875, -0.013904571533203125, -0.01299285888671875, -0.012081146240234375, -0.01116943359375, -0.010257720947265625, -0.00934600830078125, -0.008434295654296875, -0.0075225830078125, -0.006610870361328125, -0.00569915771484375, -0.004787445068359375, -0.003875732421875, -0.002964019775390625, -0.00205230712890625, -0.001140594482421875, -0.0002288818359375, 0.000682830810546875, 0.00159454345703125, 0.002506256103515625, 0.00341796875, 0.004329681396484375, 0.00524139404296875, 0.006153106689453125, 0.0070648193359375, 0.007976531982421875, 0.00888824462890625, 0.009799957275390625, 0.010711669921875, 0.011623382568359375, 0.01253509521484375, 0.013446807861328125, 0.0143585205078125, 0.015270233154296875, 0.01618194580078125, 0.017093658447265625, 0.01800537109375, 0.018917083740234375, 0.01982879638671875, 0.020740509033203125, 0.0216522216796875, 0.022563934326171875, 0.02347564697265625, 0.024387359619140625, 0.025299072265625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 49.0, 474.0, 419.0, 60.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004267726559191942, -0.00415235897526145, -0.004036991391330957, -0.003921623807400465, -0.0038062562234699726, -0.00369088863953948, -0.0035755212884396315, -0.003460153704509139, -0.0033447861205786467, -0.0032294185366481543, -0.003114050952717662, -0.0029986833687871695, -0.0028833160176873207, -0.0027679484337568283, -0.002652580849826336, -0.0025372132658958435, -0.002421845681965351, -0.0023064780980348587, -0.0021911105141043663, -0.002075742930173874, -0.0019603753462433815, -0.001845007878728211, -0.0017296404112130404, -0.001614272827282548, -0.0014989052433520555, -0.0013835376594215631, -0.0012681700754910707, -0.0011528026079759002, -0.0010374350240454078, -0.0009220674401149154, -0.0008066999143920839, -0.0006913323886692524, -0.00057596480473876, -0.00046059724991209805, -0.0003452296950854361, -0.00022986214025877416, -0.00011449458543211222, 8.729984983801842e-07, 0.00011624052422121167, 0.00023160804994404316, 0.00034697563387453556, 0.0004623431887011975, 0.0005777107435278594, 0.0006930782692506909, 0.0008084458531811833, 0.0009238134371116757, 0.0010391809046268463, 0.0011545484885573387, 0.0012699160724878311, 0.0013852836564183235, 0.001500651240348816, 0.0016160187078639865, 0.001731386291794479, 0.0018467538757249713, 0.001962121343240142, 0.0020774889271706343, 0.0021928565111011267, 0.002308224095031619, 0.0024235916789621115, 0.002538959262892604, 0.0026543266139924526, 0.002769694197922945, 0.0028850617818534374, 0.00300042936578393, 0.0031157969497144222]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 3.0, 5.0, 12.0, 7.0, 7.0, 11.0, 13.0, 16.0, 13.0, 18.0, 22.0, 19.0, 20.0, 28.0, 20.0, 35.0, 34.0, 25.0, 36.0, 37.0, 29.0, 36.0, 29.0, 31.0, 36.0, 45.0, 36.0, 33.0, 34.0, 33.0, 33.0, 30.0, 23.0, 29.0, 23.0, 25.0, 24.0, 12.0, 13.0, 10.0, 10.0, 9.0, 8.0, 4.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0], "bins": [-0.000674903392791748, -0.0006539048627018929, -0.0006329063326120377, -0.0006119078025221825, -0.0005909092724323273, -0.0005699107423424721, -0.0005489122122526169, -0.0005279136821627617, -0.0005069151520729065, -0.0004859166219830513, -0.0004649180918931961, -0.0004439195618033409, -0.0004229210317134857, -0.0004019225016236305, -0.00038092397153377533, -0.00035992544144392014, -0.00033892691135406494, -0.00031792838126420975, -0.00029692985117435455, -0.00027593132108449936, -0.00025493279099464417, -0.00023393426090478897, -0.00021293573081493378, -0.00019193720072507858, -0.0001709386706352234, -0.0001499401405453682, -0.000128941610455513, -0.0001079430803656578, -8.694455027580261e-05, -6.594602018594742e-05, -4.4947490096092224e-05, -2.394896000623703e-05, -2.950429916381836e-06, 1.8048100173473358e-05, 3.904663026332855e-05, 6.0045160353183746e-05, 8.104369044303894e-05, 0.00010204222053289413, 0.00012304075062274933, 0.00014403928071260452, 0.00016503781080245972, 0.0001860363408923149, 0.0002070348709821701, 0.0002280334010720253, 0.0002490319311618805, 0.0002700304612517357, 0.0002910289913415909, 0.0003120275214314461, 0.00033302605152130127, 0.00035402458161115646, 0.00037502311170101166, 0.00039602164179086685, 0.00041702017188072205, 0.00043801870197057724, 0.00045901723206043243, 0.00048001576215028763, 0.0005010142922401428, 0.000522012822329998, 0.0005430113524198532, 0.0005640098825097084, 0.0005850084125995636, 0.0006060069426894188, 0.000627005472779274, 0.0006480040028691292, 0.0006690025329589844]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 8.0, 7.0, 13.0, 9.0, 11.0, 16.0, 13.0, 12.0, 25.0, 23.0, 16.0, 35.0, 26.0, 25.0, 37.0, 39.0, 28.0, 38.0, 35.0, 40.0, 40.0, 38.0, 33.0, 38.0, 47.0, 37.0, 33.0, 31.0, 23.0, 25.0, 24.0, 25.0, 19.0, 17.0, 16.0, 19.0, 13.0, 11.0, 15.0, 17.0, 5.0, 3.0, 8.0, 6.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.6953125, -11.3194580078125, -10.943603515625, -10.5677490234375, -10.19189453125, -9.8160400390625, -9.440185546875, -9.0643310546875, -8.6884765625, -8.3126220703125, -7.936767578125, -7.5609130859375, -7.18505859375, -6.8092041015625, -6.433349609375, -6.0574951171875, -5.681640625, -5.3057861328125, -4.929931640625, -4.5540771484375, -4.17822265625, -3.8023681640625, -3.426513671875, -3.0506591796875, -2.6748046875, -2.2989501953125, -1.923095703125, -1.5472412109375, -1.17138671875, -0.7955322265625, -0.419677734375, -0.0438232421875, 0.33203125, 0.7078857421875, 1.083740234375, 1.4595947265625, 1.83544921875, 2.2113037109375, 2.587158203125, 2.9630126953125, 3.3388671875, 3.7147216796875, 4.090576171875, 4.4664306640625, 4.84228515625, 5.2181396484375, 5.593994140625, 5.9698486328125, 6.345703125, 6.7215576171875, 7.097412109375, 7.4732666015625, 7.84912109375, 8.2249755859375, 8.600830078125, 8.9766845703125, 9.3525390625, 9.7283935546875, 10.104248046875, 10.4801025390625, 10.85595703125, 11.2318115234375, 11.607666015625, 11.9835205078125, 12.359375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 8.0, 9.0, 12.0, 16.0, 21.0, 34.0, 35.0, 68.0, 84.0, 95.0, 143.0, 149.0, 250.0, 322.0, 426.0, 669.0, 1001.0, 1949.0, 3897.0, 8741.0, 23006.0, 74724.0, 289277.0, 452425.0, 129059.0, 37299.0, 12913.0, 5349.0, 2549.0, 1384.0, 780.0, 485.0, 341.0, 267.0, 181.0, 155.0, 114.0, 76.0, 67.0, 48.0, 40.0, 19.0, 26.0, 11.0, 13.0, 10.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.96875, -12.55322265625, -12.1376953125, -11.72216796875, -11.306640625, -10.89111328125, -10.4755859375, -10.06005859375, -9.64453125, -9.22900390625, -8.8134765625, -8.39794921875, -7.982421875, -7.56689453125, -7.1513671875, -6.73583984375, -6.3203125, -5.90478515625, -5.4892578125, -5.07373046875, -4.658203125, -4.24267578125, -3.8271484375, -3.41162109375, -2.99609375, -2.58056640625, -2.1650390625, -1.74951171875, -1.333984375, -0.91845703125, -0.5029296875, -0.08740234375, 0.328125, 0.74365234375, 1.1591796875, 1.57470703125, 1.990234375, 2.40576171875, 2.8212890625, 3.23681640625, 3.65234375, 4.06787109375, 4.4833984375, 4.89892578125, 5.314453125, 5.72998046875, 6.1455078125, 6.56103515625, 6.9765625, 7.39208984375, 7.8076171875, 8.22314453125, 8.638671875, 9.05419921875, 9.4697265625, 9.88525390625, 10.30078125, 10.71630859375, 11.1318359375, 11.54736328125, 11.962890625, 12.37841796875, 12.7939453125, 13.20947265625, 13.625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 12.0, 16.0, 9.0, 17.0, 12.0, 19.0, 25.0, 17.0, 35.0, 34.0, 48.0, 50.0, 61.0, 102.0, 188.0, 1554.0, 284.0, 110.0, 71.0, 41.0, 41.0, 41.0, 38.0, 25.0, 27.0, 27.0, 27.0, 23.0, 11.0, 16.0, 9.0, 8.0, 5.0, 4.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0], "bins": [-36.15625, -35.08349609375, -34.0107421875, -32.93798828125, -31.865234375, -30.79248046875, -29.7197265625, -28.64697265625, -27.57421875, -26.50146484375, -25.4287109375, -24.35595703125, -23.283203125, -22.21044921875, -21.1376953125, -20.06494140625, -18.9921875, -17.91943359375, -16.8466796875, -15.77392578125, -14.701171875, -13.62841796875, -12.5556640625, -11.48291015625, -10.41015625, -9.33740234375, -8.2646484375, -7.19189453125, -6.119140625, -5.04638671875, -3.9736328125, -2.90087890625, -1.828125, -0.75537109375, 0.3173828125, 1.39013671875, 2.462890625, 3.53564453125, 4.6083984375, 5.68115234375, 6.75390625, 7.82666015625, 8.8994140625, 9.97216796875, 11.044921875, 12.11767578125, 13.1904296875, 14.26318359375, 15.3359375, 16.40869140625, 17.4814453125, 18.55419921875, 19.626953125, 20.69970703125, 21.7724609375, 22.84521484375, 23.91796875, 24.99072265625, 26.0634765625, 27.13623046875, 28.208984375, 29.28173828125, 30.3544921875, 31.42724609375, 32.5]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 3.0, 2.0, 3.0, 6.0, 5.0, 11.0, 14.0, 8.0, 19.0, 15.0, 21.0, 35.0, 38.0, 65.0, 70.0, 70.0, 124.0, 168.0, 251.0, 343.0, 732.0, 2991.0, 68261.0, 3010023.0, 57685.0, 2875.0, 677.0, 332.0, 220.0, 174.0, 116.0, 72.0, 56.0, 39.0, 53.0, 31.0, 27.0, 17.0, 9.0, 14.0, 14.0, 9.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-54.125, -52.55517578125, -50.9853515625, -49.41552734375, -47.845703125, -46.27587890625, -44.7060546875, -43.13623046875, -41.56640625, -39.99658203125, -38.4267578125, -36.85693359375, -35.287109375, -33.71728515625, -32.1474609375, -30.57763671875, -29.0078125, -27.43798828125, -25.8681640625, -24.29833984375, -22.728515625, -21.15869140625, -19.5888671875, -18.01904296875, -16.44921875, -14.87939453125, -13.3095703125, -11.73974609375, -10.169921875, -8.60009765625, -7.0302734375, -5.46044921875, -3.890625, -2.32080078125, -0.7509765625, 0.81884765625, 2.388671875, 3.95849609375, 5.5283203125, 7.09814453125, 8.66796875, 10.23779296875, 11.8076171875, 13.37744140625, 14.947265625, 16.51708984375, 18.0869140625, 19.65673828125, 21.2265625, 22.79638671875, 24.3662109375, 25.93603515625, 27.505859375, 29.07568359375, 30.6455078125, 32.21533203125, 33.78515625, 35.35498046875, 36.9248046875, 38.49462890625, 40.064453125, 41.63427734375, 43.2041015625, 44.77392578125, 46.34375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 594.0, 422.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-301.8596496582031, -289.7641906738281, -277.668701171875, -265.5732421875, -253.47776794433594, -241.38229370117188, -229.28683471679688, -217.1913604736328, -205.09588623046875, -193.0004119873047, -180.90493774414062, -168.80947875976562, -156.71400451660156, -144.6185302734375, -132.5230712890625, -120.42759704589844, -108.33212280273438, -96.23664855957031, -84.14118194580078, -72.04571533203125, -59.95024108886719, -47.85477066040039, -35.759300231933594, -23.663833618164062, -11.568359375, 0.5271110534667969, 12.622581481933594, 24.71805191040039, 36.81352233886719, 48.908992767333984, 61.00446319580078, 73.09992980957031, 85.1954345703125, 97.29090881347656, 109.3863754272461, 121.48184204101562, 133.5773162841797, 145.67279052734375, 157.76824951171875, 169.8637237548828, 181.95919799804688, 194.05467224121094, 206.150146484375, 218.24560546875, 230.34107971191406, 242.43655395507812, 254.53201293945312, 266.62750244140625, 278.72296142578125, 290.81842041015625, 302.9139099121094, 315.0093688964844, 327.1048583984375, 339.2003173828125, 351.2957763671875, 363.3912353515625, 375.4867248535156, 387.5821838378906, 399.67767333984375, 411.77313232421875, 423.86859130859375, 435.9640808105469, 448.0595397949219, 460.155029296875, 472.25048828125]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 10.0, 7.0, 8.0, 13.0, 15.0, 21.0, 23.0, 25.0, 23.0, 33.0, 27.0, 40.0, 41.0, 39.0, 47.0, 54.0, 43.0, 43.0, 43.0, 43.0, 38.0, 56.0, 36.0, 35.0, 46.0, 35.0, 27.0, 26.0, 18.0, 12.0, 15.0, 12.0, 3.0, 11.0, 7.0, 11.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-81.05384826660156, -78.62247467041016, -76.19110107421875, -73.75971984863281, -71.3283462524414, -68.89697265625, -66.4655990600586, -64.03422546386719, -61.60285186767578, -59.171478271484375, -56.7401008605957, -54.3087272644043, -51.87735366821289, -49.44597625732422, -47.01460266113281, -44.583229064941406, -42.151851654052734, -39.72047805786133, -37.289100646972656, -34.85772705078125, -32.426353454589844, -29.994977951049805, -27.563602447509766, -25.13222885131836, -22.70085334777832, -20.26947784423828, -17.838104248046875, -15.406728744506836, -12.975354194641113, -10.54397964477539, -8.112604141235352, -5.681230545043945, -3.2498550415039062, -0.8184802532196045, 1.6128945350646973, 4.044269561767578, 6.475644111633301, 8.907018661499023, 11.338394165039062, 13.769767761230469, 16.201143264770508, 18.632518768310547, 21.063892364501953, 23.495267868041992, 25.92664337158203, 28.358016967773438, 30.789392471313477, 33.22076416015625, 35.65214157104492, 38.08351516723633, 40.514892578125, 42.946266174316406, 45.37763977050781, 47.80901336669922, 50.24039077758789, 52.6717643737793, 55.10314178466797, 57.534515380859375, 59.96589279174805, 62.39726638793945, 64.82864379882812, 67.26001739501953, 69.69139099121094, 72.12276458740234, 74.55413818359375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 6.0, 6.0, 7.0, 13.0, 5.0, 16.0, 17.0, 17.0, 16.0, 20.0, 19.0, 18.0, 29.0, 29.0, 30.0, 41.0, 37.0, 31.0, 24.0, 40.0, 40.0, 36.0, 43.0, 44.0, 35.0, 26.0, 44.0, 35.0, 28.0, 22.0, 31.0, 22.0, 19.0, 18.0, 21.0, 17.0, 15.0, 11.0, 15.0, 13.0, 11.0, 11.0, 7.0, 5.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.2890625, -11.913818359375, -11.53857421875, -11.163330078125, -10.7880859375, -10.412841796875, -10.03759765625, -9.662353515625, -9.287109375, -8.911865234375, -8.53662109375, -8.161376953125, -7.7861328125, -7.410888671875, -7.03564453125, -6.660400390625, -6.28515625, -5.909912109375, -5.53466796875, -5.159423828125, -4.7841796875, -4.408935546875, -4.03369140625, -3.658447265625, -3.283203125, -2.907958984375, -2.53271484375, -2.157470703125, -1.7822265625, -1.406982421875, -1.03173828125, -0.656494140625, -0.28125, 0.093994140625, 0.46923828125, 0.844482421875, 1.2197265625, 1.594970703125, 1.97021484375, 2.345458984375, 2.720703125, 3.095947265625, 3.47119140625, 3.846435546875, 4.2216796875, 4.596923828125, 4.97216796875, 5.347412109375, 5.72265625, 6.097900390625, 6.47314453125, 6.848388671875, 7.2236328125, 7.598876953125, 7.97412109375, 8.349365234375, 8.724609375, 9.099853515625, 9.47509765625, 9.850341796875, 10.2255859375, 10.600830078125, 10.97607421875, 11.351318359375, 11.7265625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 7.0, 5.0, 4.0, 14.0, 8.0, 12.0, 9.0, 19.0, 16.0, 21.0, 31.0, 42.0, 39.0, 52.0, 56.0, 83.0, 122.0, 152.0, 189.0, 260.0, 300.0, 372.0, 913.0, 4173360.0, 15851.0, 588.0, 413.0, 277.0, 262.0, 178.0, 149.0, 104.0, 82.0, 54.0, 40.0, 40.0, 31.0, 31.0, 16.0, 15.0, 13.0, 12.0, 9.0, 12.0, 5.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0], "bins": [-345.5, -335.28515625, -325.0703125, -314.85546875, -304.640625, -294.42578125, -284.2109375, -273.99609375, -263.78125, -253.56640625, -243.3515625, -233.13671875, -222.921875, -212.70703125, -202.4921875, -192.27734375, -182.0625, -171.84765625, -161.6328125, -151.41796875, -141.203125, -130.98828125, -120.7734375, -110.55859375, -100.34375, -90.12890625, -79.9140625, -69.69921875, -59.484375, -49.26953125, -39.0546875, -28.83984375, -18.625, -8.41015625, 1.8046875, 12.01953125, 22.234375, 32.44921875, 42.6640625, 52.87890625, 63.09375, 73.30859375, 83.5234375, 93.73828125, 103.953125, 114.16796875, 124.3828125, 134.59765625, 144.8125, 155.02734375, 165.2421875, 175.45703125, 185.671875, 195.88671875, 206.1015625, 216.31640625, 226.53125, 236.74609375, 246.9609375, 257.17578125, 267.390625, 277.60546875, 287.8203125, 298.03515625, 308.25]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 7.0, 3.0, 7.0, 17.0, 18.0, 21.0, 20.0, 50.0, 41.0, 62.0, 96.0, 118.0, 163.0, 253.0, 407.0, 579.0, 632.0, 514.0, 333.0, 222.0, 129.0, 84.0, 67.0, 50.0, 33.0, 38.0, 32.0, 24.0, 11.0, 7.0, 7.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.859375, -18.23583984375, -17.6123046875, -16.98876953125, -16.365234375, -15.74169921875, -15.1181640625, -14.49462890625, -13.87109375, -13.24755859375, -12.6240234375, -12.00048828125, -11.376953125, -10.75341796875, -10.1298828125, -9.50634765625, -8.8828125, -8.25927734375, -7.6357421875, -7.01220703125, -6.388671875, -5.76513671875, -5.1416015625, -4.51806640625, -3.89453125, -3.27099609375, -2.6474609375, -2.02392578125, -1.400390625, -0.77685546875, -0.1533203125, 0.47021484375, 1.09375, 1.71728515625, 2.3408203125, 2.96435546875, 3.587890625, 4.21142578125, 4.8349609375, 5.45849609375, 6.08203125, 6.70556640625, 7.3291015625, 7.95263671875, 8.576171875, 9.19970703125, 9.8232421875, 10.44677734375, 11.0703125, 11.69384765625, 12.3173828125, 12.94091796875, 13.564453125, 14.18798828125, 14.8115234375, 15.43505859375, 16.05859375, 16.68212890625, 17.3056640625, 17.92919921875, 18.552734375, 19.17626953125, 19.7998046875, 20.42333984375, 21.046875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 4.0, 7.0, 11.0, 13.0, 11.0, 18.0, 16.0, 33.0, 33.0, 43.0, 44.0, 53.0, 73.0, 138.0, 483.0, 1669488.0, 2522745.0, 488.0, 152.0, 78.0, 62.0, 53.0, 48.0, 40.0, 27.0, 25.0, 26.0, 16.0, 12.0, 7.0, 10.0, 3.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-257.25, -250.298828125, -243.34765625, -236.396484375, -229.4453125, -222.494140625, -215.54296875, -208.591796875, -201.640625, -194.689453125, -187.73828125, -180.787109375, -173.8359375, -166.884765625, -159.93359375, -152.982421875, -146.03125, -139.080078125, -132.12890625, -125.177734375, -118.2265625, -111.275390625, -104.32421875, -97.373046875, -90.421875, -83.470703125, -76.51953125, -69.568359375, -62.6171875, -55.666015625, -48.71484375, -41.763671875, -34.8125, -27.861328125, -20.91015625, -13.958984375, -7.0078125, -0.056640625, 6.89453125, 13.845703125, 20.796875, 27.748046875, 34.69921875, 41.650390625, 48.6015625, 55.552734375, 62.50390625, 69.455078125, 76.40625, 83.357421875, 90.30859375, 97.259765625, 104.2109375, 111.162109375, 118.11328125, 125.064453125, 132.015625, 138.966796875, 145.91796875, 152.869140625, 159.8203125, 166.771484375, 173.72265625, 180.673828125, 187.625]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 32.0, 292.0, 537.0, 140.0, 12.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-294.3432312011719, -286.2338562011719, -278.12445068359375, -270.01507568359375, -261.90570068359375, -253.7963104248047, -245.68692016601562, -237.57754516601562, -229.46817016601562, -221.35877990722656, -213.24940490722656, -205.1400146484375, -197.0306396484375, -188.92124938964844, -180.81185913085938, -172.70248413085938, -164.5930938720703, -156.48370361328125, -148.37432861328125, -140.2649383544922, -132.1555633544922, -124.04617309570312, -115.9367904663086, -107.82740783691406, -99.71802520751953, -91.608642578125, -83.49925994873047, -75.38987731933594, -67.28048706054688, -59.17110824584961, -51.06172180175781, -42.95233917236328, -34.84294128417969, -26.733558654785156, -18.624174118041992, -10.514789581298828, -2.405406951904297, 5.703975677490234, 13.813362121582031, 21.922744750976562, 30.032127380371094, 38.141510009765625, 46.250892639160156, 54.36027908325195, 62.469661712646484, 70.57904052734375, 78.68843078613281, 86.79781341552734, 94.90719604492188, 103.0165786743164, 111.12596130371094, 119.2353515625, 127.3447265625, 135.45411682128906, 143.56350708007812, 151.67288208007812, 159.78225708007812, 167.8916473388672, 176.0010223388672, 184.11041259765625, 192.21978759765625, 200.3291778564453, 208.43856811523438, 216.54794311523438, 224.65733337402344]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 5.0, 6.0, 7.0, 18.0, 17.0, 19.0, 25.0, 29.0, 30.0, 26.0, 31.0, 34.0, 42.0, 39.0, 35.0, 45.0, 40.0, 51.0, 45.0, 47.0, 33.0, 46.0, 41.0, 32.0, 37.0, 35.0, 16.0, 22.0, 15.0, 19.0, 21.0, 14.0, 12.0, 18.0, 12.0, 3.0, 7.0, 5.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.878536224365234, -61.82505798339844, -59.771575927734375, -57.71809387207031, -55.664615631103516, -53.61113739013672, -51.557655334472656, -49.504173278808594, -47.4506950378418, -45.397216796875, -43.34373474121094, -41.290252685546875, -39.23677444458008, -37.18329620361328, -35.12981414794922, -33.076332092285156, -31.02285385131836, -28.96937370300293, -26.9158935546875, -24.86241340637207, -22.80893325805664, -20.75545310974121, -18.70197296142578, -16.64849281311035, -14.595012664794922, -12.541532516479492, -10.488052368164062, -8.434572219848633, -6.381092071533203, -4.327611923217773, -2.2741317749023438, -0.22065162658691406, 1.8328323364257812, 3.886312484741211, 5.939792633056641, 7.99327278137207, 10.0467529296875, 12.10023307800293, 14.15371322631836, 16.20719337463379, 18.26067352294922, 20.31415367126465, 22.367633819580078, 24.421113967895508, 26.474594116210938, 28.528074264526367, 30.581554412841797, 32.635032653808594, 34.688514709472656, 36.74199676513672, 38.795475006103516, 40.84895324707031, 42.902435302734375, 44.95591735839844, 47.009395599365234, 49.06287384033203, 51.116355895996094, 53.169837951660156, 55.22331619262695, 57.27679443359375, 59.33027648925781, 61.383758544921875, 63.43723678588867, 65.49071502685547, 67.54419708251953]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 6.0, 7.0, 13.0, 17.0, 16.0, 21.0, 26.0, 28.0, 27.0, 29.0, 30.0, 38.0, 38.0, 35.0, 31.0, 38.0, 42.0, 50.0, 49.0, 45.0, 48.0, 34.0, 39.0, 28.0, 29.0, 26.0, 31.0, 34.0, 26.0, 13.0, 18.0, 16.0, 16.0, 8.0, 8.0, 5.0, 8.0, 5.0, 4.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.4609375, -13.0391845703125, -12.617431640625, -12.1956787109375, -11.77392578125, -11.3521728515625, -10.930419921875, -10.5086669921875, -10.0869140625, -9.6651611328125, -9.243408203125, -8.8216552734375, -8.39990234375, -7.9781494140625, -7.556396484375, -7.1346435546875, -6.712890625, -6.2911376953125, -5.869384765625, -5.4476318359375, -5.02587890625, -4.6041259765625, -4.182373046875, -3.7606201171875, -3.3388671875, -2.9171142578125, -2.495361328125, -2.0736083984375, -1.65185546875, -1.2301025390625, -0.808349609375, -0.3865966796875, 0.03515625, 0.4569091796875, 0.878662109375, 1.3004150390625, 1.72216796875, 2.1439208984375, 2.565673828125, 2.9874267578125, 3.4091796875, 3.8309326171875, 4.252685546875, 4.6744384765625, 5.09619140625, 5.5179443359375, 5.939697265625, 6.3614501953125, 6.783203125, 7.2049560546875, 7.626708984375, 8.0484619140625, 8.47021484375, 8.8919677734375, 9.313720703125, 9.7354736328125, 10.1572265625, 10.5789794921875, 11.000732421875, 11.4224853515625, 11.84423828125, 12.2659912109375, 12.687744140625, 13.1094970703125, 13.53125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 19.0, 16.0, 28.0, 41.0, 52.0, 72.0, 112.0, 185.0, 297.0, 478.0, 714.0, 1068.0, 1795.0, 2819.0, 4597.0, 7303.0, 12090.0, 19563.0, 33786.0, 58588.0, 112933.0, 336270.0, 233337.0, 95506.0, 51418.0, 29475.0, 17690.0, 10607.0, 6587.0, 4107.0, 2546.0, 1595.0, 984.0, 703.0, 424.0, 274.0, 168.0, 94.0, 60.0, 49.0, 31.0, 29.0, 12.0, 15.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.962890625, -2.869964599609375, -2.77703857421875, -2.684112548828125, -2.5911865234375, -2.498260498046875, -2.40533447265625, -2.312408447265625, -2.219482421875, -2.126556396484375, -2.03363037109375, -1.940704345703125, -1.8477783203125, -1.754852294921875, -1.66192626953125, -1.569000244140625, -1.47607421875, -1.383148193359375, -1.29022216796875, -1.197296142578125, -1.1043701171875, -1.011444091796875, -0.91851806640625, -0.825592041015625, -0.732666015625, -0.639739990234375, -0.54681396484375, -0.453887939453125, -0.3609619140625, -0.268035888671875, -0.17510986328125, -0.082183837890625, 0.0107421875, 0.103668212890625, 0.19659423828125, 0.289520263671875, 0.3824462890625, 0.475372314453125, 0.56829833984375, 0.661224365234375, 0.754150390625, 0.847076416015625, 0.94000244140625, 1.032928466796875, 1.1258544921875, 1.218780517578125, 1.31170654296875, 1.404632568359375, 1.49755859375, 1.590484619140625, 1.68341064453125, 1.776336669921875, 1.8692626953125, 1.962188720703125, 2.05511474609375, 2.148040771484375, 2.240966796875, 2.333892822265625, 2.42681884765625, 2.519744873046875, 2.6126708984375, 2.705596923828125, 2.79852294921875, 2.891448974609375, 2.984375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 5.0, 8.0, 8.0, 11.0, 8.0, 17.0, 13.0, 17.0, 26.0, 26.0, 23.0, 28.0, 35.0, 29.0, 28.0, 30.0, 50.0, 42.0, 41.0, 54.0, 1065.0, 37.0, 44.0, 35.0, 29.0, 35.0, 36.0, 36.0, 22.0, 23.0, 26.0, 21.0, 26.0, 22.0, 12.0, 11.0, 13.0, 4.0, 5.0, 8.0, 6.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.3671875, -8.1060791015625, -7.844970703125, -7.5838623046875, -7.32275390625, -7.0616455078125, -6.800537109375, -6.5394287109375, -6.2783203125, -6.0172119140625, -5.756103515625, -5.4949951171875, -5.23388671875, -4.9727783203125, -4.711669921875, -4.4505615234375, -4.189453125, -3.9283447265625, -3.667236328125, -3.4061279296875, -3.14501953125, -2.8839111328125, -2.622802734375, -2.3616943359375, -2.1005859375, -1.8394775390625, -1.578369140625, -1.3172607421875, -1.05615234375, -0.7950439453125, -0.533935546875, -0.2728271484375, -0.01171875, 0.2493896484375, 0.510498046875, 0.7716064453125, 1.03271484375, 1.2938232421875, 1.554931640625, 1.8160400390625, 2.0771484375, 2.3382568359375, 2.599365234375, 2.8604736328125, 3.12158203125, 3.3826904296875, 3.643798828125, 3.9049072265625, 4.166015625, 4.4271240234375, 4.688232421875, 4.9493408203125, 5.21044921875, 5.4715576171875, 5.732666015625, 5.9937744140625, 6.2548828125, 6.5159912109375, 6.777099609375, 7.0382080078125, 7.29931640625, 7.5604248046875, 7.821533203125, 8.0826416015625, 8.34375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 13.0, 17.0, 20.0, 20.0, 41.0, 55.0, 69.0, 117.0, 176.0, 231.0, 372.0, 551.0, 792.0, 1246.0, 1818.0, 2777.0, 4244.0, 6544.0, 10389.0, 16038.0, 24988.0, 40006.0, 65387.0, 123352.0, 1379817.0, 191602.0, 88135.0, 50459.0, 31502.0, 20035.0, 12860.0, 8249.0, 5224.0, 3349.0, 2263.0, 1413.0, 953.0, 634.0, 454.0, 288.0, 195.0, 149.0, 80.0, 72.0, 39.0, 24.0, 16.0, 16.0, 17.0, 5.0, 6.0, 4.0, 7.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.494140625, -2.41558837890625, -2.3370361328125, -2.25848388671875, -2.179931640625, -2.10137939453125, -2.0228271484375, -1.94427490234375, -1.86572265625, -1.78717041015625, -1.7086181640625, -1.63006591796875, -1.551513671875, -1.47296142578125, -1.3944091796875, -1.31585693359375, -1.2373046875, -1.15875244140625, -1.0802001953125, -1.00164794921875, -0.923095703125, -0.84454345703125, -0.7659912109375, -0.68743896484375, -0.60888671875, -0.53033447265625, -0.4517822265625, -0.37322998046875, -0.294677734375, -0.21612548828125, -0.1375732421875, -0.05902099609375, 0.01953125, 0.09808349609375, 0.1766357421875, 0.25518798828125, 0.333740234375, 0.41229248046875, 0.4908447265625, 0.56939697265625, 0.64794921875, 0.72650146484375, 0.8050537109375, 0.88360595703125, 0.962158203125, 1.04071044921875, 1.1192626953125, 1.19781494140625, 1.2763671875, 1.35491943359375, 1.4334716796875, 1.51202392578125, 1.590576171875, 1.66912841796875, 1.7476806640625, 1.82623291015625, 1.90478515625, 1.98333740234375, 2.0618896484375, 2.14044189453125, 2.218994140625, 2.29754638671875, 2.3760986328125, 2.45465087890625, 2.533203125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 7.0, 5.0, 4.0, 5.0, 8.0, 12.0, 10.0, 9.0, 5.0, 11.0, 21.0, 12.0, 26.0, 28.0, 27.0, 40.0, 54.0, 53.0, 65.0, 55.0, 54.0, 66.0, 60.0, 36.0, 52.0, 41.0, 43.0, 29.0, 22.0, 21.0, 25.0, 17.0, 18.0, 14.0, 6.0, 5.0, 4.0, 11.0, 6.0, 5.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0], "bins": [-0.0014677047729492188, -0.0014258027076721191, -0.0013839006423950195, -0.00134199857711792, -0.0013000965118408203, -0.0012581944465637207, -0.001216292381286621, -0.0011743903160095215, -0.0011324882507324219, -0.0010905861854553223, -0.0010486841201782227, -0.001006782054901123, -0.0009648799896240234, -0.0009229779243469238, -0.0008810758590698242, -0.0008391737937927246, -0.000797271728515625, -0.0007553696632385254, -0.0007134675979614258, -0.0006715655326843262, -0.0006296634674072266, -0.000587761402130127, -0.0005458593368530273, -0.0005039572715759277, -0.0004620552062988281, -0.0004201531410217285, -0.0003782510757446289, -0.0003363490104675293, -0.0002944469451904297, -0.0002525448799133301, -0.00021064281463623047, -0.00016874074935913086, -0.00012683868408203125, -8.493661880493164e-05, -4.303455352783203e-05, -1.1324882507324219e-06, 4.076957702636719e-05, 8.26716423034668e-05, 0.0001245737075805664, 0.00016647577285766602, 0.00020837783813476562, 0.00025027990341186523, 0.00029218196868896484, 0.00033408403396606445, 0.00037598609924316406, 0.00041788816452026367, 0.0004597902297973633, 0.0005016922950744629, 0.0005435943603515625, 0.0005854964256286621, 0.0006273984909057617, 0.0006693005561828613, 0.0007112026214599609, 0.0007531046867370605, 0.0007950067520141602, 0.0008369088172912598, 0.0008788108825683594, 0.000920712947845459, 0.0009626150131225586, 0.0010045170783996582, 0.0010464191436767578, 0.0010883212089538574, 0.001130223274230957, 0.0011721253395080566, 0.0012140274047851562]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 6.0, 3.0, 6.0, 3.0, 4.0, 9.0, 10.0, 7.0, 11.0, 15.0, 19.0, 15.0, 27.0, 35.0, 48.0, 64.0, 68.0, 90.0, 115.0, 167.0, 235.0, 395.0, 564.0, 1151.0, 96227.0, 944431.0, 2537.0, 726.0, 456.0, 282.0, 190.0, 140.0, 122.0, 73.0, 53.0, 46.0, 39.0, 31.0, 24.0, 20.0, 20.0, 19.0, 15.0, 9.0, 6.0, 6.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.0233917236328125, -0.02266526222229004, -0.021938800811767578, -0.021212339401245117, -0.020485877990722656, -0.019759416580200195, -0.019032955169677734, -0.018306493759155273, -0.017580032348632812, -0.01685357093811035, -0.01612710952758789, -0.01540064811706543, -0.014674186706542969, -0.013947725296020508, -0.013221263885498047, -0.012494802474975586, -0.011768341064453125, -0.011041879653930664, -0.010315418243408203, -0.009588956832885742, -0.008862495422363281, -0.00813603401184082, -0.007409572601318359, -0.0066831111907958984, -0.0059566497802734375, -0.0052301883697509766, -0.004503726959228516, -0.0037772655487060547, -0.0030508041381835938, -0.002324342727661133, -0.0015978813171386719, -0.0008714199066162109, -0.00014495849609375, 0.0005815029144287109, 0.0013079643249511719, 0.002034425735473633, 0.0027608871459960938, 0.0034873485565185547, 0.004213809967041016, 0.0049402713775634766, 0.0056667327880859375, 0.0063931941986083984, 0.007119655609130859, 0.00784611701965332, 0.008572578430175781, 0.009299039840698242, 0.010025501251220703, 0.010751962661743164, 0.011478424072265625, 0.012204885482788086, 0.012931346893310547, 0.013657808303833008, 0.014384269714355469, 0.01511073112487793, 0.01583719253540039, 0.01656365394592285, 0.017290115356445312, 0.018016576766967773, 0.018743038177490234, 0.019469499588012695, 0.020195960998535156, 0.020922422409057617, 0.021648883819580078, 0.02237534523010254, 0.023101806640625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 56.0, 345.0, 465.0, 117.0, 20.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001998190302401781, -0.0018990898970514536, -0.0017999893752858043, -0.0017008889699354768, -0.0016017884481698275, -0.0015026880428195, -0.0014035876374691725, -0.0013044871157035232, -0.0012053865939378738, -0.0011062861885875463, -0.001007185666821897, -0.0009080852614715695, -0.0008089847397059202, -0.0007098843343555927, -0.0006107838707976043, -0.0005116834072396159, -0.0004125830018892884, -0.0003134825383313, -0.00021438208932522684, -0.00011528164031915367, -1.618117676116526e-05, 8.291925769299269e-05, 0.0001820197212509811, 0.0002811201848089695, 0.0003802206483669579, 0.0004793211119249463, 0.0005784215754829347, 0.0006775220390409231, 0.0007766224443912506, 0.000875722907949239, 0.0009748233715072274, 0.0010739238932728767, 0.0011730242986232042, 0.0012721247039735317, 0.001371225225739181, 0.0014703256310895085, 0.0015694261528551579, 0.0016685265582054853, 0.0017676269635558128, 0.0018667274853214622, 0.0019658280070871115, 0.002064928412437439, 0.0021640288177877665, 0.0022631294559687376, 0.002362229861319065, 0.0024613302666693926, 0.00256043067201972, 0.0026595313102006912, 0.002758631482720375, 0.0028577318880707026, 0.00295683229342103, 0.003055932931602001, 0.0031550333369523287, 0.003254133742302656, 0.0033532341476529837, 0.003452334553003311, 0.0035514351911842823, 0.00365053559653461, 0.0037496360018849373, 0.0038487366400659084, 0.003947836812585592, 0.004046937450766563, 0.0041460380889475346, 0.004245138261467218, 0.0043442388996481895]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 10.0, 2.0, 6.0, 10.0, 12.0, 10.0, 22.0, 15.0, 10.0, 19.0, 17.0, 28.0, 34.0, 34.0, 31.0, 24.0, 33.0, 19.0, 39.0, 31.0, 34.0, 32.0, 36.0, 31.0, 27.0, 43.0, 39.0, 29.0, 35.0, 25.0, 29.0, 28.0, 30.0, 33.0, 23.0, 15.0, 13.0, 17.0, 8.0, 6.0, 11.0, 6.0, 9.0, 5.0, 7.0, 7.0, 3.0, 4.0, 7.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0006529688835144043, -0.0006329845637083054, -0.0006130002439022064, -0.0005930159240961075, -0.0005730316042900085, -0.0005530472844839096, -0.0005330629646778107, -0.0005130786448717117, -0.0004930943250656128, -0.00047311000525951385, -0.0004531256854534149, -0.000433141365647316, -0.00041315704584121704, -0.0003931727260351181, -0.00037318840622901917, -0.0003532040864229202, -0.0003332197666168213, -0.00031323544681072235, -0.0002932511270046234, -0.0002732668071985245, -0.00025328248739242554, -0.0002332981675863266, -0.00021331384778022766, -0.00019332952797412872, -0.00017334520816802979, -0.00015336088836193085, -0.0001333765685558319, -0.00011339224874973297, -9.340792894363403e-05, -7.34236091375351e-05, -5.343928933143616e-05, -3.345496952533722e-05, -1.3470649719238281e-05, 6.513670086860657e-06, 2.6497989892959595e-05, 4.648230969905853e-05, 6.646662950515747e-05, 8.645094931125641e-05, 0.00010643526911735535, 0.00012641958892345428, 0.00014640390872955322, 0.00016638822853565216, 0.0001863725483417511, 0.00020635686814785004, 0.00022634118795394897, 0.0002463255077600479, 0.00026630982756614685, 0.0002862941473722458, 0.0003062784671783447, 0.00032626278698444366, 0.0003462471067905426, 0.00036623142659664154, 0.0003862157464027405, 0.0004062000662088394, 0.00042618438601493835, 0.0004461687058210373, 0.00046615302562713623, 0.00048613734543323517, 0.0005061216652393341, 0.000526105985045433, 0.000546090304851532, 0.0005660746246576309, 0.0005860589444637299, 0.0006060432642698288, 0.0006260275840759277]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 6.0, 7.0, 13.0, 17.0, 16.0, 21.0, 26.0, 28.0, 27.0, 29.0, 30.0, 38.0, 38.0, 35.0, 31.0, 38.0, 42.0, 50.0, 49.0, 45.0, 48.0, 34.0, 39.0, 28.0, 29.0, 26.0, 31.0, 34.0, 26.0, 13.0, 18.0, 16.0, 16.0, 8.0, 8.0, 5.0, 8.0, 5.0, 4.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.4609375, -13.0391845703125, -12.617431640625, -12.1956787109375, -11.77392578125, -11.3521728515625, -10.930419921875, -10.5086669921875, -10.0869140625, -9.6651611328125, -9.243408203125, -8.8216552734375, -8.39990234375, -7.9781494140625, -7.556396484375, -7.1346435546875, -6.712890625, -6.2911376953125, -5.869384765625, -5.4476318359375, -5.02587890625, -4.6041259765625, -4.182373046875, -3.7606201171875, -3.3388671875, -2.9171142578125, -2.495361328125, -2.0736083984375, -1.65185546875, -1.2301025390625, -0.808349609375, -0.3865966796875, 0.03515625, 0.4569091796875, 0.878662109375, 1.3004150390625, 1.72216796875, 2.1439208984375, 2.565673828125, 2.9874267578125, 3.4091796875, 3.8309326171875, 4.252685546875, 4.6744384765625, 5.09619140625, 5.5179443359375, 5.939697265625, 6.3614501953125, 6.783203125, 7.2049560546875, 7.626708984375, 8.0484619140625, 8.47021484375, 8.8919677734375, 9.313720703125, 9.7354736328125, 10.1572265625, 10.5789794921875, 11.000732421875, 11.4224853515625, 11.84423828125, 12.2659912109375, 12.687744140625, 13.1094970703125, 13.53125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 7.0, 8.0, 12.0, 18.0, 29.0, 37.0, 61.0, 80.0, 107.0, 127.0, 187.0, 232.0, 347.0, 436.0, 516.0, 681.0, 896.0, 1230.0, 1804.0, 3614.0, 12813.0, 79449.0, 509099.0, 367149.0, 51140.0, 9089.0, 3097.0, 1607.0, 1082.0, 852.0, 682.0, 505.0, 399.0, 308.0, 222.0, 164.0, 127.0, 84.0, 71.0, 60.0, 27.0, 36.0, 23.0, 14.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.390625, -19.751220703125, -19.11181640625, -18.472412109375, -17.8330078125, -17.193603515625, -16.55419921875, -15.914794921875, -15.275390625, -14.635986328125, -13.99658203125, -13.357177734375, -12.7177734375, -12.078369140625, -11.43896484375, -10.799560546875, -10.16015625, -9.520751953125, -8.88134765625, -8.241943359375, -7.6025390625, -6.963134765625, -6.32373046875, -5.684326171875, -5.044921875, -4.405517578125, -3.76611328125, -3.126708984375, -2.4873046875, -1.847900390625, -1.20849609375, -0.569091796875, 0.0703125, 0.709716796875, 1.34912109375, 1.988525390625, 2.6279296875, 3.267333984375, 3.90673828125, 4.546142578125, 5.185546875, 5.824951171875, 6.46435546875, 7.103759765625, 7.7431640625, 8.382568359375, 9.02197265625, 9.661376953125, 10.30078125, 10.940185546875, 11.57958984375, 12.218994140625, 12.8583984375, 13.497802734375, 14.13720703125, 14.776611328125, 15.416015625, 16.055419921875, 16.69482421875, 17.334228515625, 17.9736328125, 18.613037109375, 19.25244140625, 19.891845703125, 20.53125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 9.0, 6.0, 8.0, 9.0, 12.0, 23.0, 30.0, 40.0, 36.0, 56.0, 62.0, 61.0, 84.0, 289.0, 1798.0, 126.0, 75.0, 68.0, 62.0, 47.0, 27.0, 34.0, 22.0, 17.0, 10.0, 13.0, 9.0, 6.0, 3.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.53125, -49.93359375, -48.3359375, -46.73828125, -45.140625, -43.54296875, -41.9453125, -40.34765625, -38.75, -37.15234375, -35.5546875, -33.95703125, -32.359375, -30.76171875, -29.1640625, -27.56640625, -25.96875, -24.37109375, -22.7734375, -21.17578125, -19.578125, -17.98046875, -16.3828125, -14.78515625, -13.1875, -11.58984375, -9.9921875, -8.39453125, -6.796875, -5.19921875, -3.6015625, -2.00390625, -0.40625, 1.19140625, 2.7890625, 4.38671875, 5.984375, 7.58203125, 9.1796875, 10.77734375, 12.375, 13.97265625, 15.5703125, 17.16796875, 18.765625, 20.36328125, 21.9609375, 23.55859375, 25.15625, 26.75390625, 28.3515625, 29.94921875, 31.546875, 33.14453125, 34.7421875, 36.33984375, 37.9375, 39.53515625, 41.1328125, 42.73046875, 44.328125, 45.92578125, 47.5234375, 49.12109375, 50.71875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 4.0, 10.0, 12.0, 11.0, 20.0, 15.0, 32.0, 32.0, 50.0, 82.0, 152.0, 229.0, 514.0, 1711.0, 3092134.0, 48682.0, 1053.0, 366.0, 217.0, 119.0, 84.0, 54.0, 33.0, 25.0, 14.0, 15.0, 13.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.375, -134.99609375, -130.6171875, -126.23828125, -121.859375, -117.48046875, -113.1015625, -108.72265625, -104.34375, -99.96484375, -95.5859375, -91.20703125, -86.828125, -82.44921875, -78.0703125, -73.69140625, -69.3125, -64.93359375, -60.5546875, -56.17578125, -51.796875, -47.41796875, -43.0390625, -38.66015625, -34.28125, -29.90234375, -25.5234375, -21.14453125, -16.765625, -12.38671875, -8.0078125, -3.62890625, 0.75, 5.12890625, 9.5078125, 13.88671875, 18.265625, 22.64453125, 27.0234375, 31.40234375, 35.78125, 40.16015625, 44.5390625, 48.91796875, 53.296875, 57.67578125, 62.0546875, 66.43359375, 70.8125, 75.19140625, 79.5703125, 83.94921875, 88.328125, 92.70703125, 97.0859375, 101.46484375, 105.84375, 110.22265625, 114.6015625, 118.98046875, 123.359375, 127.73828125, 132.1171875, 136.49609375, 140.875]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 8.0, 87.0, 678.0, 225.0, 18.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.0487823486328, -147.89520263671875, -140.7416229248047, -133.58804321289062, -126.43445587158203, -119.28087615966797, -112.12728881835938, -104.97370910644531, -97.82012939453125, -90.66654968261719, -83.51296997070312, -76.35938262939453, -69.20580291748047, -62.052223205566406, -54.89863967895508, -47.74505615234375, -40.59147644042969, -33.437896728515625, -26.284313201904297, -19.1307315826416, -11.977149963378906, -4.823570251464844, 2.3300132751464844, 9.483596801757812, 16.637176513671875, 23.79075813293457, 30.944339752197266, 38.097923278808594, 45.251502990722656, 52.40508270263672, 59.55866622924805, 66.71224975585938, 73.8658447265625, 81.01942443847656, 88.17300415039062, 95.32659149169922, 102.48017120361328, 109.63375091552734, 116.78733825683594, 123.94091796875, 131.09449768066406, 138.24807739257812, 145.4016571044922, 152.55523681640625, 159.70883178710938, 166.86239624023438, 174.0159912109375, 181.16957092285156, 188.32315063476562, 195.4767303466797, 202.63031005859375, 209.7838897705078, 216.93746948242188, 224.091064453125, 231.24464416503906, 238.39822387695312, 245.5518035888672, 252.70538330078125, 259.8589782714844, 267.0125427246094, 274.1661376953125, 281.3197021484375, 288.4732971191406, 295.62689208984375, 302.78045654296875]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 4.0, 3.0, 4.0, 5.0, 7.0, 8.0, 4.0, 8.0, 16.0, 20.0, 17.0, 19.0, 21.0, 28.0, 42.0, 40.0, 33.0, 41.0, 53.0, 56.0, 70.0, 57.0, 58.0, 47.0, 50.0, 37.0, 31.0, 40.0, 44.0, 23.0, 18.0, 18.0, 21.0, 12.0, 8.0, 11.0, 10.0, 7.0, 7.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.5247802734375, -89.72315216064453, -85.9215316772461, -82.11990356445312, -78.31828308105469, -74.51665496826172, -70.71502685546875, -66.91340637207031, -63.111778259277344, -59.31015396118164, -55.50852966308594, -51.70690155029297, -47.905277252197266, -44.10365295410156, -40.30202865600586, -36.500404357910156, -32.69878005981445, -28.89715576171875, -25.095529556274414, -21.29390525817871, -17.492279052734375, -13.690654754638672, -9.889030456542969, -6.087404251098633, -2.2857799530029297, 1.5158450603485107, 5.317470073699951, 9.119094848632812, 12.920720100402832, 16.72234535217285, 20.523969650268555, 24.32559585571289, 28.127220153808594, 31.928844451904297, 35.73046875, 39.53209686279297, 43.33372116088867, 47.135345458984375, 50.93696975708008, 54.73859405517578, 58.54022216796875, 62.34184646606445, 66.14347076416016, 69.94509887695312, 73.74671936035156, 77.54834747314453, 81.3499755859375, 85.15159606933594, 88.95321655273438, 92.75484466552734, 96.55646514892578, 100.35809326171875, 104.15971374511719, 107.96134185791016, 111.76296997070312, 115.56459045410156, 119.36621856689453, 123.1678466796875, 126.96946716308594, 130.77108764648438, 134.57272338867188, 138.3743438720703, 142.17596435546875, 145.97760009765625, 149.7792205810547]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 5.0, 4.0, 5.0, 9.0, 11.0, 12.0, 14.0, 13.0, 26.0, 17.0, 27.0, 35.0, 27.0, 30.0, 27.0, 34.0, 40.0, 31.0, 35.0, 45.0, 32.0, 51.0, 40.0, 34.0, 38.0, 45.0, 27.0, 28.0, 33.0, 31.0, 26.0, 25.0, 27.0, 23.0, 17.0, 16.0, 14.0, 6.0, 6.0, 6.0, 8.0, 3.0, 5.0, 4.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6640625, -13.2530517578125, -12.842041015625, -12.4310302734375, -12.02001953125, -11.6090087890625, -11.197998046875, -10.7869873046875, -10.3759765625, -9.9649658203125, -9.553955078125, -9.1429443359375, -8.73193359375, -8.3209228515625, -7.909912109375, -7.4989013671875, -7.087890625, -6.6768798828125, -6.265869140625, -5.8548583984375, -5.44384765625, -5.0328369140625, -4.621826171875, -4.2108154296875, -3.7998046875, -3.3887939453125, -2.977783203125, -2.5667724609375, -2.15576171875, -1.7447509765625, -1.333740234375, -0.9227294921875, -0.51171875, -0.1007080078125, 0.310302734375, 0.7213134765625, 1.13232421875, 1.5433349609375, 1.954345703125, 2.3653564453125, 2.7763671875, 3.1873779296875, 3.598388671875, 4.0093994140625, 4.42041015625, 4.8314208984375, 5.242431640625, 5.6534423828125, 6.064453125, 6.4754638671875, 6.886474609375, 7.2974853515625, 7.70849609375, 8.1195068359375, 8.530517578125, 8.9415283203125, 9.3525390625, 9.7635498046875, 10.174560546875, 10.5855712890625, 10.99658203125, 11.4075927734375, 11.818603515625, 12.2296142578125, 12.640625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 8.0, 6.0, 11.0, 11.0, 18.0, 18.0, 14.0, 29.0, 33.0, 30.0, 48.0, 61.0, 78.0, 93.0, 107.0, 129.0, 143.0, 248.0, 449.0, 1141.0, 4030.0, 29149.0, 1191278.0, 2856364.0, 100072.0, 7146.0, 1715.0, 657.0, 288.0, 211.0, 126.0, 115.0, 95.0, 67.0, 54.0, 48.0, 36.0, 32.0, 25.0, 23.0, 11.0, 13.0, 18.0, 13.0, 5.0, 5.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-40.59375, -39.33251953125, -38.0712890625, -36.81005859375, -35.548828125, -34.28759765625, -33.0263671875, -31.76513671875, -30.50390625, -29.24267578125, -27.9814453125, -26.72021484375, -25.458984375, -24.19775390625, -22.9365234375, -21.67529296875, -20.4140625, -19.15283203125, -17.8916015625, -16.63037109375, -15.369140625, -14.10791015625, -12.8466796875, -11.58544921875, -10.32421875, -9.06298828125, -7.8017578125, -6.54052734375, -5.279296875, -4.01806640625, -2.7568359375, -1.49560546875, -0.234375, 1.02685546875, 2.2880859375, 3.54931640625, 4.810546875, 6.07177734375, 7.3330078125, 8.59423828125, 9.85546875, 11.11669921875, 12.3779296875, 13.63916015625, 14.900390625, 16.16162109375, 17.4228515625, 18.68408203125, 19.9453125, 21.20654296875, 22.4677734375, 23.72900390625, 24.990234375, 26.25146484375, 27.5126953125, 28.77392578125, 30.03515625, 31.29638671875, 32.5576171875, 33.81884765625, 35.080078125, 36.34130859375, 37.6025390625, 38.86376953125, 40.125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 6.0, 14.0, 24.0, 24.0, 50.0, 120.0, 192.0, 336.0, 700.0, 1182.0, 683.0, 299.0, 211.0, 105.0, 51.0, 38.0, 15.0, 13.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.3125, -61.856689453125, -60.40087890625, -58.945068359375, -57.4892578125, -56.033447265625, -54.57763671875, -53.121826171875, -51.666015625, -50.210205078125, -48.75439453125, -47.298583984375, -45.8427734375, -44.386962890625, -42.93115234375, -41.475341796875, -40.01953125, -38.563720703125, -37.10791015625, -35.652099609375, -34.1962890625, -32.740478515625, -31.28466796875, -29.828857421875, -28.373046875, -26.917236328125, -25.46142578125, -24.005615234375, -22.5498046875, -21.093994140625, -19.63818359375, -18.182373046875, -16.7265625, -15.270751953125, -13.81494140625, -12.359130859375, -10.9033203125, -9.447509765625, -7.99169921875, -6.535888671875, -5.080078125, -3.624267578125, -2.16845703125, -0.712646484375, 0.7431640625, 2.198974609375, 3.65478515625, 5.110595703125, 6.56640625, 8.022216796875, 9.47802734375, 10.933837890625, 12.3896484375, 13.845458984375, 15.30126953125, 16.757080078125, 18.212890625, 19.668701171875, 21.12451171875, 22.580322265625, 24.0361328125, 25.491943359375, 26.94775390625, 28.403564453125, 29.859375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 5.0, 7.0, 10.0, 24.0, 32.0, 46.0, 85.0, 158.0, 367.0, 863.0, 4157.0, 1642452.0, 2539963.0, 4474.0, 918.0, 310.0, 155.0, 97.0, 64.0, 34.0, 15.0, 17.0, 14.0, 6.0, 2.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.375, -104.021484375, -100.66796875, -97.314453125, -93.9609375, -90.607421875, -87.25390625, -83.900390625, -80.546875, -77.193359375, -73.83984375, -70.486328125, -67.1328125, -63.779296875, -60.42578125, -57.072265625, -53.71875, -50.365234375, -47.01171875, -43.658203125, -40.3046875, -36.951171875, -33.59765625, -30.244140625, -26.890625, -23.537109375, -20.18359375, -16.830078125, -13.4765625, -10.123046875, -6.76953125, -3.416015625, -0.0625, 3.291015625, 6.64453125, 9.998046875, 13.3515625, 16.705078125, 20.05859375, 23.412109375, 26.765625, 30.119140625, 33.47265625, 36.826171875, 40.1796875, 43.533203125, 46.88671875, 50.240234375, 53.59375, 56.947265625, 60.30078125, 63.654296875, 67.0078125, 70.361328125, 73.71484375, 77.068359375, 80.421875, 83.775390625, 87.12890625, 90.482421875, 93.8359375, 97.189453125, 100.54296875, 103.896484375, 107.25]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 12.0, 863.0, 139.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-204.4566650390625, -177.9335174560547, -151.41038513183594, -124.88723754882812, -98.36409759521484, -71.84095764160156, -45.31781005859375, -18.794677734375, 7.7284698486328125, 34.251609802246094, 60.77475357055664, 87.29789733886719, 113.82103729248047, 140.34417724609375, 166.86732482910156, 193.3904571533203, 219.91360473632812, 246.43675231933594, 272.95989990234375, 299.4830322265625, 326.00616455078125, 352.529296875, 379.0524597167969, 405.5755920410156, 432.0987548828125, 458.62188720703125, 485.1450500488281, 511.6681823730469, 538.1913452148438, 564.7144775390625, 591.2376098632812, 617.7607421875, 644.2838745117188, 670.8070068359375, 697.3301391601562, 723.853271484375, 750.37646484375, 776.8995971679688, 803.4227294921875, 829.9458618164062, 856.468994140625, 882.9921264648438, 909.5152587890625, 936.0384521484375, 962.5615844726562, 989.084716796875, 1015.6078491210938, 1042.1309814453125, 1068.6541748046875, 1095.1773681640625, 1121.700439453125, 1148.2236328125, 1174.7467041015625, 1201.2698974609375, 1227.79296875, 1254.316162109375, 1280.8392333984375, 1307.3624267578125, 1333.885498046875, 1360.40869140625, 1386.9317626953125, 1413.4549560546875, 1439.97802734375, 1466.501220703125, 1493.0244140625]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 1.0, 4.0, 11.0, 8.0, 8.0, 7.0, 14.0, 11.0, 15.0, 24.0, 29.0, 30.0, 31.0, 30.0, 35.0, 35.0, 42.0, 45.0, 43.0, 35.0, 46.0, 34.0, 43.0, 34.0, 38.0, 35.0, 37.0, 32.0, 32.0, 35.0, 29.0, 22.0, 24.0, 17.0, 18.0, 11.0, 10.0, 8.0, 5.0, 10.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-84.82231140136719, -82.17188262939453, -79.5214614868164, -76.87103271484375, -74.2206039428711, -71.57017517089844, -68.91975402832031, -66.26932525634766, -63.618900299072266, -60.968475341796875, -58.31804656982422, -55.66762161254883, -53.01719665527344, -50.36676788330078, -47.71634292602539, -45.06591796875, -42.415489196777344, -39.76506423950195, -37.1146354675293, -34.464210510253906, -31.813783645629883, -29.16335678100586, -26.51293182373047, -23.862504959106445, -21.212078094482422, -18.5616512298584, -15.911225318908691, -13.260799407958984, -10.610372543334961, -7.9599456787109375, -5.3095197677612305, -2.6590938568115234, -0.0086669921875, 2.6417593955993652, 5.2921857833862305, 7.942612171173096, 10.593038558959961, 13.243465423583984, 15.893891334533691, 18.5443172454834, 21.194744110107422, 23.845170974731445, 26.49559783935547, 29.14602279663086, 31.796449661254883, 34.446876525878906, 37.0973014831543, 39.74772644042969, 42.398155212402344, 45.048580169677734, 47.69900894165039, 50.34943389892578, 52.99986267089844, 55.65028762817383, 58.30071258544922, 60.951141357421875, 63.601566314697266, 66.25199127197266, 68.90242004394531, 71.55284881591797, 74.2032699584961, 76.85369873046875, 79.5041275024414, 82.15454864501953, 84.80497741699219]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 5.0, 7.0, 11.0, 16.0, 14.0, 10.0, 20.0, 25.0, 33.0, 23.0, 24.0, 33.0, 25.0, 32.0, 35.0, 37.0, 72.0, 41.0, 43.0, 49.0, 43.0, 40.0, 38.0, 40.0, 38.0, 35.0, 34.0, 34.0, 18.0, 15.0, 18.0, 17.0, 9.0, 14.0, 7.0, 13.0, 6.0, 6.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.34375, -11.965087890625, -11.58642578125, -11.207763671875, -10.8291015625, -10.450439453125, -10.07177734375, -9.693115234375, -9.314453125, -8.935791015625, -8.55712890625, -8.178466796875, -7.7998046875, -7.421142578125, -7.04248046875, -6.663818359375, -6.28515625, -5.906494140625, -5.52783203125, -5.149169921875, -4.7705078125, -4.391845703125, -4.01318359375, -3.634521484375, -3.255859375, -2.877197265625, -2.49853515625, -2.119873046875, -1.7412109375, -1.362548828125, -0.98388671875, -0.605224609375, -0.2265625, 0.152099609375, 0.53076171875, 0.909423828125, 1.2880859375, 1.666748046875, 2.04541015625, 2.424072265625, 2.802734375, 3.181396484375, 3.56005859375, 3.938720703125, 4.3173828125, 4.696044921875, 5.07470703125, 5.453369140625, 5.83203125, 6.210693359375, 6.58935546875, 6.968017578125, 7.3466796875, 7.725341796875, 8.10400390625, 8.482666015625, 8.861328125, 9.239990234375, 9.61865234375, 9.997314453125, 10.3759765625, 10.754638671875, 11.13330078125, 11.511962890625, 11.890625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 11.0, 9.0, 15.0, 23.0, 25.0, 46.0, 70.0, 109.0, 121.0, 212.0, 334.0, 465.0, 637.0, 1000.0, 1535.0, 2172.0, 3256.0, 5005.0, 7647.0, 11525.0, 17651.0, 27400.0, 42393.0, 69644.0, 135442.0, 331393.0, 170693.0, 82145.0, 48672.0, 30882.0, 19987.0, 12667.0, 8475.0, 5623.0, 3669.0, 2452.0, 1686.0, 1135.0, 757.0, 498.0, 351.0, 237.0, 162.0, 110.0, 84.0, 41.0, 30.0, 24.0, 20.0, 10.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-2.24609375, -2.177276611328125, -2.10845947265625, -2.039642333984375, -1.9708251953125, -1.902008056640625, -1.83319091796875, -1.764373779296875, -1.695556640625, -1.626739501953125, -1.55792236328125, -1.489105224609375, -1.4202880859375, -1.351470947265625, -1.28265380859375, -1.213836669921875, -1.14501953125, -1.076202392578125, -1.00738525390625, -0.938568115234375, -0.8697509765625, -0.800933837890625, -0.73211669921875, -0.663299560546875, -0.594482421875, -0.525665283203125, -0.45684814453125, -0.388031005859375, -0.3192138671875, -0.250396728515625, -0.18157958984375, -0.112762451171875, -0.0439453125, 0.024871826171875, 0.09368896484375, 0.162506103515625, 0.2313232421875, 0.300140380859375, 0.36895751953125, 0.437774658203125, 0.506591796875, 0.575408935546875, 0.64422607421875, 0.713043212890625, 0.7818603515625, 0.850677490234375, 0.91949462890625, 0.988311767578125, 1.05712890625, 1.125946044921875, 1.19476318359375, 1.263580322265625, 1.3323974609375, 1.401214599609375, 1.47003173828125, 1.538848876953125, 1.607666015625, 1.676483154296875, 1.74530029296875, 1.814117431640625, 1.8829345703125, 1.951751708984375, 2.02056884765625, 2.089385986328125, 2.158203125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 6.0, 6.0, 8.0, 6.0, 8.0, 15.0, 14.0, 21.0, 21.0, 16.0, 28.0, 31.0, 18.0, 45.0, 27.0, 27.0, 33.0, 38.0, 31.0, 41.0, 1064.0, 45.0, 51.0, 41.0, 43.0, 34.0, 28.0, 25.0, 27.0, 33.0, 26.0, 25.0, 27.0, 15.0, 15.0, 15.0, 13.0, 8.0, 11.0, 6.0, 7.0, 4.0, 4.0, 6.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.1171875, -6.893310546875, -6.66943359375, -6.445556640625, -6.2216796875, -5.997802734375, -5.77392578125, -5.550048828125, -5.326171875, -5.102294921875, -4.87841796875, -4.654541015625, -4.4306640625, -4.206787109375, -3.98291015625, -3.759033203125, -3.53515625, -3.311279296875, -3.08740234375, -2.863525390625, -2.6396484375, -2.415771484375, -2.19189453125, -1.968017578125, -1.744140625, -1.520263671875, -1.29638671875, -1.072509765625, -0.8486328125, -0.624755859375, -0.40087890625, -0.177001953125, 0.046875, 0.270751953125, 0.49462890625, 0.718505859375, 0.9423828125, 1.166259765625, 1.39013671875, 1.614013671875, 1.837890625, 2.061767578125, 2.28564453125, 2.509521484375, 2.7333984375, 2.957275390625, 3.18115234375, 3.405029296875, 3.62890625, 3.852783203125, 4.07666015625, 4.300537109375, 4.5244140625, 4.748291015625, 4.97216796875, 5.196044921875, 5.419921875, 5.643798828125, 5.86767578125, 6.091552734375, 6.3154296875, 6.539306640625, 6.76318359375, 6.987060546875, 7.2109375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 9.0, 8.0, 12.0, 27.0, 31.0, 39.0, 59.0, 81.0, 115.0, 177.0, 274.0, 404.0, 568.0, 839.0, 1294.0, 1860.0, 2737.0, 4190.0, 6131.0, 9343.0, 14398.0, 22216.0, 34182.0, 53880.0, 93927.0, 217621.0, 1349603.0, 111080.0, 61696.0, 38367.0, 24707.0, 16098.0, 10467.0, 6910.0, 4611.0, 2966.0, 2086.0, 1352.0, 915.0, 598.0, 400.0, 282.0, 178.0, 116.0, 94.0, 52.0, 36.0, 29.0, 30.0, 16.0, 7.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.166015625, -2.098602294921875, -2.03118896484375, -1.963775634765625, -1.8963623046875, -1.828948974609375, -1.76153564453125, -1.694122314453125, -1.626708984375, -1.559295654296875, -1.49188232421875, -1.424468994140625, -1.3570556640625, -1.289642333984375, -1.22222900390625, -1.154815673828125, -1.08740234375, -1.019989013671875, -0.95257568359375, -0.885162353515625, -0.8177490234375, -0.750335693359375, -0.68292236328125, -0.615509033203125, -0.548095703125, -0.480682373046875, -0.41326904296875, -0.345855712890625, -0.2784423828125, -0.211029052734375, -0.14361572265625, -0.076202392578125, -0.0087890625, 0.058624267578125, 0.12603759765625, 0.193450927734375, 0.2608642578125, 0.328277587890625, 0.39569091796875, 0.463104248046875, 0.530517578125, 0.597930908203125, 0.66534423828125, 0.732757568359375, 0.8001708984375, 0.867584228515625, 0.93499755859375, 1.002410888671875, 1.06982421875, 1.137237548828125, 1.20465087890625, 1.272064208984375, 1.3394775390625, 1.406890869140625, 1.47430419921875, 1.541717529296875, 1.609130859375, 1.676544189453125, 1.74395751953125, 1.811370849609375, 1.8787841796875, 1.946197509765625, 2.01361083984375, 2.081024169921875, 2.1484375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 6.0, 6.0, 8.0, 8.0, 19.0, 24.0, 29.0, 38.0, 70.0, 97.0, 109.0, 122.0, 123.0, 104.0, 75.0, 61.0, 36.0, 23.0, 8.0, 9.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0020465850830078125, -0.00198577344417572, -0.001924961805343628, -0.0018641501665115356, -0.0018033385276794434, -0.001742526888847351, -0.0016817152500152588, -0.0016209036111831665, -0.0015600919723510742, -0.001499280333518982, -0.0014384686946868896, -0.0013776570558547974, -0.001316845417022705, -0.0012560337781906128, -0.0011952221393585205, -0.0011344105005264282, -0.001073598861694336, -0.0010127872228622437, -0.0009519755840301514, -0.0008911639451980591, -0.0008303523063659668, -0.0007695406675338745, -0.0007087290287017822, -0.0006479173898696899, -0.0005871057510375977, -0.0005262941122055054, -0.0004654824733734131, -0.0004046708345413208, -0.0003438591957092285, -0.00028304755687713623, -0.00022223591804504395, -0.00016142427921295166, -0.00010061264038085938, -3.980100154876709e-05, 2.1010637283325195e-05, 8.182227611541748e-05, 0.00014263391494750977, 0.00020344555377960205, 0.00026425719261169434, 0.0003250688314437866, 0.0003858804702758789, 0.0004466921091079712, 0.0005075037479400635, 0.0005683153867721558, 0.000629127025604248, 0.0006899386644363403, 0.0007507503032684326, 0.0008115619421005249, 0.0008723735809326172, 0.0009331852197647095, 0.0009939968585968018, 0.001054808497428894, 0.0011156201362609863, 0.0011764317750930786, 0.001237243413925171, 0.0012980550527572632, 0.0013588666915893555, 0.0014196783304214478, 0.00148048996925354, 0.0015413016080856323, 0.0016021132469177246, 0.001662924885749817, 0.0017237365245819092, 0.0017845481634140015, 0.0018453598022460938]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 14.0, 8.0, 17.0, 19.0, 30.0, 46.0, 85.0, 158.0, 232.0, 382.0, 934.0, 36550.0, 1007330.0, 1378.0, 549.0, 306.0, 181.0, 96.0, 72.0, 41.0, 30.0, 17.0, 15.0, 13.0, 8.0, 11.0, 6.0, 5.0, 6.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03118896484375, -0.030155658721923828, -0.029122352600097656, -0.028089046478271484, -0.027055740356445312, -0.02602243423461914, -0.02498912811279297, -0.023955821990966797, -0.022922515869140625, -0.021889209747314453, -0.02085590362548828, -0.01982259750366211, -0.018789291381835938, -0.017755985260009766, -0.016722679138183594, -0.015689373016357422, -0.01465606689453125, -0.013622760772705078, -0.012589454650878906, -0.011556148529052734, -0.010522842407226562, -0.00948953628540039, -0.008456230163574219, -0.007422924041748047, -0.006389617919921875, -0.005356311798095703, -0.004323005676269531, -0.0032896995544433594, -0.0022563934326171875, -0.0012230873107910156, -0.00018978118896484375, 0.0008435249328613281, 0.0018768310546875, 0.002910137176513672, 0.003943443298339844, 0.004976749420166016, 0.0060100555419921875, 0.007043361663818359, 0.008076667785644531, 0.009109973907470703, 0.010143280029296875, 0.011176586151123047, 0.012209892272949219, 0.01324319839477539, 0.014276504516601562, 0.015309810638427734, 0.016343116760253906, 0.017376422882080078, 0.01840972900390625, 0.019443035125732422, 0.020476341247558594, 0.021509647369384766, 0.022542953491210938, 0.02357625961303711, 0.02460956573486328, 0.025642871856689453, 0.026676177978515625, 0.027709484100341797, 0.02874279022216797, 0.02977609634399414, 0.030809402465820312, 0.031842708587646484, 0.032876014709472656, 0.03390932083129883, 0.034942626953125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 128.0, 801.0, 84.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015713725006207824, -0.0014209036016836762, -0.0012704345863312483, -0.0011199656873941422, -0.0009694967302493751, -0.0008190277731046081, -0.0006685588741675019, -0.000518089858815074, -0.00036762095987796783, -0.00021715201728511602, -6.66830746922642e-05, 8.378585334867239e-05, 0.00023425481049343944, 0.0003847237676382065, 0.0005351926665753126, 0.0006856616819277406, 0.0008361305808648467, 0.0009865994798019528, 0.0011370684951543808, 0.001287537394091487, 0.001438006293028593, 0.001588475308381021, 0.0017389442073181272, 0.0018894132226705551, 0.0020398821216076612, 0.0021903510205447674, 0.0023408199194818735, 0.0024912888184189796, 0.0026417579501867294, 0.0027922268491238356, 0.0029426957480609417, 0.0030931648798286915, 0.0032436340115964413, 0.0033941029105335474, 0.0035445718094706535, 0.0036950409412384033, 0.0038455098401755095, 0.003995978739112616, 0.004146447405219078, 0.004296916536986828, 0.004447385668754578, 0.004597854800522327, 0.00474832346662879, 0.00489879259839654, 0.005049261264503002, 0.005199730396270752, 0.005350199528038502, 0.005500668194144964, 0.005651136860251427, 0.0058016059920191765, 0.005952074658125639, 0.006102543789893389, 0.006253012455999851, 0.006403481587767601, 0.006553950719535351, 0.006704419385641813, 0.006854888517409563, 0.007005357649177313, 0.007155826315283775, 0.007306295447051525, 0.007456764113157988, 0.007607233244925737, 0.0077577019110322, 0.00790817104279995, 0.0080586401745677]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 8.0, 5.0, 4.0, 6.0, 2.0, 8.0, 5.0, 6.0, 15.0, 13.0, 19.0, 15.0, 27.0, 36.0, 32.0, 28.0, 38.0, 36.0, 45.0, 36.0, 44.0, 38.0, 55.0, 49.0, 40.0, 28.0, 35.0, 38.0, 33.0, 49.0, 35.0, 20.0, 32.0, 31.0, 25.0, 20.0, 10.0, 11.0, 8.0, 8.0, 7.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.0007399916648864746, -0.0007201842963695526, -0.0007003769278526306, -0.0006805695593357086, -0.0006607621908187866, -0.0006409548223018646, -0.0006211474537849426, -0.0006013400852680206, -0.0005815327167510986, -0.0005617253482341766, -0.0005419179797172546, -0.0005221106112003326, -0.0005023032426834106, -0.00048249587416648865, -0.00046268850564956665, -0.00044288113713264465, -0.00042307376861572266, -0.00040326640009880066, -0.00038345903158187866, -0.00036365166306495667, -0.00034384429454803467, -0.00032403692603111267, -0.0003042295575141907, -0.0002844221889972687, -0.0002646148204803467, -0.0002448074519634247, -0.00022500008344650269, -0.0002051927149295807, -0.0001853853464126587, -0.0001655779778957367, -0.0001457706093788147, -0.0001259632408618927, -0.0001061558723449707, -8.63485038280487e-05, -6.654113531112671e-05, -4.673376679420471e-05, -2.6926398277282715e-05, -7.119029760360718e-06, 1.268833875656128e-05, 3.2495707273483276e-05, 5.2303075790405273e-05, 7.211044430732727e-05, 9.191781282424927e-05, 0.00011172518134117126, 0.00013153254985809326, 0.00015133991837501526, 0.00017114728689193726, 0.00019095465540885925, 0.00021076202392578125, 0.00023056939244270325, 0.00025037676095962524, 0.00027018412947654724, 0.00028999149799346924, 0.00030979886651039124, 0.00032960623502731323, 0.00034941360354423523, 0.0003692209720611572, 0.0003890283405780792, 0.0004088357090950012, 0.0004286430776119232, 0.0004484504461288452, 0.0004682578146457672, 0.0004880651831626892, 0.0005078725516796112, 0.0005276799201965332]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 5.0, 7.0, 11.0, 16.0, 14.0, 10.0, 20.0, 25.0, 33.0, 23.0, 24.0, 33.0, 25.0, 32.0, 35.0, 37.0, 72.0, 41.0, 43.0, 49.0, 43.0, 40.0, 38.0, 40.0, 38.0, 35.0, 34.0, 34.0, 18.0, 15.0, 18.0, 17.0, 9.0, 14.0, 7.0, 13.0, 6.0, 6.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.34375, -11.965087890625, -11.58642578125, -11.207763671875, -10.8291015625, -10.450439453125, -10.07177734375, -9.693115234375, -9.314453125, -8.935791015625, -8.55712890625, -8.178466796875, -7.7998046875, -7.421142578125, -7.04248046875, -6.663818359375, -6.28515625, -5.906494140625, -5.52783203125, -5.149169921875, -4.7705078125, -4.391845703125, -4.01318359375, -3.634521484375, -3.255859375, -2.877197265625, -2.49853515625, -2.119873046875, -1.7412109375, -1.362548828125, -0.98388671875, -0.605224609375, -0.2265625, 0.152099609375, 0.53076171875, 0.909423828125, 1.2880859375, 1.666748046875, 2.04541015625, 2.424072265625, 2.802734375, 3.181396484375, 3.56005859375, 3.938720703125, 4.3173828125, 4.696044921875, 5.07470703125, 5.453369140625, 5.83203125, 6.210693359375, 6.58935546875, 6.968017578125, 7.3466796875, 7.725341796875, 8.10400390625, 8.482666015625, 8.861328125, 9.239990234375, 9.61865234375, 9.997314453125, 10.3759765625, 10.754638671875, 11.13330078125, 11.511962890625, 11.890625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 3.0, 1.0, 6.0, 10.0, 9.0, 15.0, 27.0, 33.0, 49.0, 71.0, 85.0, 132.0, 187.0, 289.0, 373.0, 574.0, 879.0, 1289.0, 2114.0, 4025.0, 12751.0, 111367.0, 782249.0, 109257.0, 12656.0, 3947.0, 2062.0, 1318.0, 880.0, 610.0, 378.0, 271.0, 194.0, 124.0, 95.0, 63.0, 53.0, 28.0, 20.0, 21.0, 13.0, 12.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.28125, -30.2880859375, -29.294921875, -28.3017578125, -27.30859375, -26.3154296875, -25.322265625, -24.3291015625, -23.3359375, -22.3427734375, -21.349609375, -20.3564453125, -19.36328125, -18.3701171875, -17.376953125, -16.3837890625, -15.390625, -14.3974609375, -13.404296875, -12.4111328125, -11.41796875, -10.4248046875, -9.431640625, -8.4384765625, -7.4453125, -6.4521484375, -5.458984375, -4.4658203125, -3.47265625, -2.4794921875, -1.486328125, -0.4931640625, 0.5, 1.4931640625, 2.486328125, 3.4794921875, 4.47265625, 5.4658203125, 6.458984375, 7.4521484375, 8.4453125, 9.4384765625, 10.431640625, 11.4248046875, 12.41796875, 13.4111328125, 14.404296875, 15.3974609375, 16.390625, 17.3837890625, 18.376953125, 19.3701171875, 20.36328125, 21.3564453125, 22.349609375, 23.3427734375, 24.3359375, 25.3291015625, 26.322265625, 27.3154296875, 28.30859375, 29.3017578125, 30.294921875, 31.2880859375, 32.28125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 9.0, 13.0, 15.0, 19.0, 23.0, 27.0, 32.0, 42.0, 49.0, 70.0, 135.0, 359.0, 1757.0, 119.0, 87.0, 58.0, 59.0, 34.0, 34.0, 29.0, 16.0, 18.0, 10.0, 11.0, 6.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-54.21875, -52.4765625, -50.734375, -48.9921875, -47.25, -45.5078125, -43.765625, -42.0234375, -40.28125, -38.5390625, -36.796875, -35.0546875, -33.3125, -31.5703125, -29.828125, -28.0859375, -26.34375, -24.6015625, -22.859375, -21.1171875, -19.375, -17.6328125, -15.890625, -14.1484375, -12.40625, -10.6640625, -8.921875, -7.1796875, -5.4375, -3.6953125, -1.953125, -0.2109375, 1.53125, 3.2734375, 5.015625, 6.7578125, 8.5, 10.2421875, 11.984375, 13.7265625, 15.46875, 17.2109375, 18.953125, 20.6953125, 22.4375, 24.1796875, 25.921875, 27.6640625, 29.40625, 31.1484375, 32.890625, 34.6328125, 36.375, 38.1171875, 39.859375, 41.6015625, 43.34375, 45.0859375, 46.828125, 48.5703125, 50.3125, 52.0546875, 53.796875, 55.5390625, 57.28125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 9.0, 13.0, 14.0, 15.0, 49.0, 56.0, 82.0, 128.0, 226.0, 523.0, 2063.0, 3133531.0, 7569.0, 739.0, 251.0, 157.0, 99.0, 68.0, 39.0, 28.0, 16.0, 12.0, 8.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-186.0, -180.478515625, -174.95703125, -169.435546875, -163.9140625, -158.392578125, -152.87109375, -147.349609375, -141.828125, -136.306640625, -130.78515625, -125.263671875, -119.7421875, -114.220703125, -108.69921875, -103.177734375, -97.65625, -92.134765625, -86.61328125, -81.091796875, -75.5703125, -70.048828125, -64.52734375, -59.005859375, -53.484375, -47.962890625, -42.44140625, -36.919921875, -31.3984375, -25.876953125, -20.35546875, -14.833984375, -9.3125, -3.791015625, 1.73046875, 7.251953125, 12.7734375, 18.294921875, 23.81640625, 29.337890625, 34.859375, 40.380859375, 45.90234375, 51.423828125, 56.9453125, 62.466796875, 67.98828125, 73.509765625, 79.03125, 84.552734375, 90.07421875, 95.595703125, 101.1171875, 106.638671875, 112.16015625, 117.681640625, 123.203125, 128.724609375, 134.24609375, 139.767578125, 145.2890625, 150.810546875, 156.33203125, 161.853515625, 167.375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 98.0, 817.0, 95.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-659.046142578125, -645.7333984375, -632.4207153320312, -619.1079711914062, -605.7952270507812, -592.4825439453125, -579.1697998046875, -565.8570556640625, -552.5443725585938, -539.2316284179688, -525.9189453125, -512.606201171875, -499.2934875488281, -485.9807434082031, -472.66802978515625, -459.35528564453125, -446.04254150390625, -432.7298278808594, -419.4170837402344, -406.1043701171875, -392.7916564941406, -379.4789123535156, -366.16619873046875, -352.85345458984375, -339.540771484375, -326.2280578613281, -312.9153137207031, -299.60260009765625, -286.2898864746094, -272.9771423339844, -259.6644287109375, -246.35169982910156, -233.0389862060547, -219.72625732421875, -206.41354370117188, -193.10081481933594, -179.7880859375, -166.47537231445312, -153.1626434326172, -139.84991455078125, -126.53719329833984, -113.22447204589844, -99.9117431640625, -86.5990219116211, -73.28630065917969, -59.97357177734375, -46.660850524902344, -33.348121643066406, -20.035400390625, -6.7226762771606445, 6.590047836303711, 19.90277099609375, 33.21549606323242, 46.528221130371094, 59.8409423828125, 73.15367126464844, 86.46639251708984, 99.77911376953125, 113.09184265136719, 126.4045639038086, 139.71728515625, 153.03001403808594, 166.34274291992188, 179.65545654296875, 192.9681854248047]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 6.0, 2.0, 3.0, 6.0, 10.0, 7.0, 12.0, 15.0, 20.0, 18.0, 17.0, 22.0, 23.0, 25.0, 30.0, 34.0, 29.0, 27.0, 33.0, 27.0, 34.0, 45.0, 42.0, 47.0, 40.0, 45.0, 36.0, 33.0, 28.0, 38.0, 28.0, 30.0, 34.0, 34.0, 26.0, 18.0, 14.0, 14.0, 13.0, 10.0, 10.0, 5.0, 6.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-111.92774963378906, -108.70206451416016, -105.47638702392578, -102.25070190429688, -99.02501678466797, -95.79933166503906, -92.57365417480469, -89.34796905517578, -86.12228393554688, -82.89659881591797, -79.6709213256836, -76.44523620605469, -73.21955108642578, -69.99386596679688, -66.7681884765625, -63.542503356933594, -60.31682586669922, -57.09114456176758, -53.86545944213867, -50.63977813720703, -47.414093017578125, -44.188411712646484, -40.962730407714844, -37.73704528808594, -34.5113639831543, -31.285680770874023, -28.05999755859375, -24.83431625366211, -21.608633041381836, -18.382949829101562, -15.157268524169922, -11.931585311889648, -8.705902099609375, -5.48021936416626, -2.2545366287231445, 0.9711456298828125, 4.196828842163086, 7.422512054443359, 10.648193359375, 13.873876571655273, 17.099559783935547, 20.32524299621582, 23.550926208496094, 26.776607513427734, 30.002290725708008, 33.22797393798828, 36.45365524291992, 39.67933654785156, 42.90502166748047, 46.13070297241211, 49.356388092041016, 52.582069396972656, 55.80775451660156, 59.0334358215332, 62.259117126464844, 65.48480224609375, 68.71047973632812, 71.93616485595703, 75.1618423461914, 78.38752746582031, 81.61321258544922, 84.83889770507812, 88.0645751953125, 91.2902603149414, 94.51594543457031]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 7.0, 12.0, 11.0, 14.0, 14.0, 16.0, 21.0, 19.0, 18.0, 27.0, 42.0, 34.0, 26.0, 61.0, 55.0, 51.0, 49.0, 50.0, 51.0, 47.0, 46.0, 43.0, 41.0, 44.0, 36.0, 23.0, 27.0, 23.0, 16.0, 13.0, 16.0, 15.0, 5.0, 3.0, 5.0, 1.0, 4.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.4921875, -14.0443115234375, -13.596435546875, -13.1485595703125, -12.70068359375, -12.2528076171875, -11.804931640625, -11.3570556640625, -10.9091796875, -10.4613037109375, -10.013427734375, -9.5655517578125, -9.11767578125, -8.6697998046875, -8.221923828125, -7.7740478515625, -7.326171875, -6.8782958984375, -6.430419921875, -5.9825439453125, -5.53466796875, -5.0867919921875, -4.638916015625, -4.1910400390625, -3.7431640625, -3.2952880859375, -2.847412109375, -2.3995361328125, -1.95166015625, -1.5037841796875, -1.055908203125, -0.6080322265625, -0.16015625, 0.2877197265625, 0.735595703125, 1.1834716796875, 1.63134765625, 2.0792236328125, 2.527099609375, 2.9749755859375, 3.4228515625, 3.8707275390625, 4.318603515625, 4.7664794921875, 5.21435546875, 5.6622314453125, 6.110107421875, 6.5579833984375, 7.005859375, 7.4537353515625, 7.901611328125, 8.3494873046875, 8.79736328125, 9.2452392578125, 9.693115234375, 10.1409912109375, 10.5888671875, 11.0367431640625, 11.484619140625, 11.9324951171875, 12.38037109375, 12.8282470703125, 13.276123046875, 13.7239990234375, 14.171875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 6.0, 4.0, 8.0, 7.0, 11.0, 12.0, 17.0, 26.0, 32.0, 51.0, 63.0, 97.0, 144.0, 241.0, 342.0, 532.0, 1024.0, 2046.0, 4309.0, 11376.0, 44304.0, 280883.0, 1641934.0, 1809204.0, 328077.0, 48149.0, 12117.0, 4608.0, 2035.0, 997.0, 586.0, 342.0, 214.0, 143.0, 97.0, 65.0, 39.0, 51.0, 20.0, 18.0, 20.0, 8.0, 7.0, 7.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-22.09375, -21.463134765625, -20.83251953125, -20.201904296875, -19.5712890625, -18.940673828125, -18.31005859375, -17.679443359375, -17.048828125, -16.418212890625, -15.78759765625, -15.156982421875, -14.5263671875, -13.895751953125, -13.26513671875, -12.634521484375, -12.00390625, -11.373291015625, -10.74267578125, -10.112060546875, -9.4814453125, -8.850830078125, -8.22021484375, -7.589599609375, -6.958984375, -6.328369140625, -5.69775390625, -5.067138671875, -4.4365234375, -3.805908203125, -3.17529296875, -2.544677734375, -1.9140625, -1.283447265625, -0.65283203125, -0.022216796875, 0.6083984375, 1.239013671875, 1.86962890625, 2.500244140625, 3.130859375, 3.761474609375, 4.39208984375, 5.022705078125, 5.6533203125, 6.283935546875, 6.91455078125, 7.545166015625, 8.17578125, 8.806396484375, 9.43701171875, 10.067626953125, 10.6982421875, 11.328857421875, 11.95947265625, 12.590087890625, 13.220703125, 13.851318359375, 14.48193359375, 15.112548828125, 15.7431640625, 16.373779296875, 17.00439453125, 17.635009765625, 18.265625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 19.0, 100.0, 1099.0, 2500.0, 329.0, 26.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.375, -152.490234375, -147.60546875, -142.720703125, -137.8359375, -132.951171875, -128.06640625, -123.181640625, -118.296875, -113.412109375, -108.52734375, -103.642578125, -98.7578125, -93.873046875, -88.98828125, -84.103515625, -79.21875, -74.333984375, -69.44921875, -64.564453125, -59.6796875, -54.794921875, -49.91015625, -45.025390625, -40.140625, -35.255859375, -30.37109375, -25.486328125, -20.6015625, -15.716796875, -10.83203125, -5.947265625, -1.0625, 3.822265625, 8.70703125, 13.591796875, 18.4765625, 23.361328125, 28.24609375, 33.130859375, 38.015625, 42.900390625, 47.78515625, 52.669921875, 57.5546875, 62.439453125, 67.32421875, 72.208984375, 77.09375, 81.978515625, 86.86328125, 91.748046875, 96.6328125, 101.517578125, 106.40234375, 111.287109375, 116.171875, 121.056640625, 125.94140625, 130.826171875, 135.7109375, 140.595703125, 145.48046875, 150.365234375, 155.25]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 22.0, 44.0, 133.0, 577.0, 3372.0, 4184753.0, 4458.0, 670.0, 163.0, 41.0, 22.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-235.375, -227.912109375, -220.44921875, -212.986328125, -205.5234375, -198.060546875, -190.59765625, -183.134765625, -175.671875, -168.208984375, -160.74609375, -153.283203125, -145.8203125, -138.357421875, -130.89453125, -123.431640625, -115.96875, -108.505859375, -101.04296875, -93.580078125, -86.1171875, -78.654296875, -71.19140625, -63.728515625, -56.265625, -48.802734375, -41.33984375, -33.876953125, -26.4140625, -18.951171875, -11.48828125, -4.025390625, 3.4375, 10.900390625, 18.36328125, 25.826171875, 33.2890625, 40.751953125, 48.21484375, 55.677734375, 63.140625, 70.603515625, 78.06640625, 85.529296875, 92.9921875, 100.455078125, 107.91796875, 115.380859375, 122.84375, 130.306640625, 137.76953125, 145.232421875, 152.6953125, 160.158203125, 167.62109375, 175.083984375, 182.546875, 190.009765625, 197.47265625, 204.935546875, 212.3984375, 219.861328125, 227.32421875, 234.787109375, 242.25]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 16.0, 201.0, 654.0, 135.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-563.9052734375, -552.4888305664062, -541.0723266601562, -529.6558837890625, -518.2394409179688, -506.8229675292969, -495.406494140625, -483.99005126953125, -472.5736083984375, -461.1571350097656, -449.7406921386719, -438.32421875, -426.90777587890625, -415.4913024902344, -404.0748291015625, -392.65838623046875, -381.2419128417969, -369.825439453125, -358.40899658203125, -346.9925231933594, -335.5760803222656, -324.15960693359375, -312.7431640625, -301.3266906738281, -289.91021728515625, -278.4937438964844, -267.0773010253906, -255.66082763671875, -244.244384765625, -232.82791137695312, -221.4114532470703, -209.9949951171875, -198.57855224609375, -187.16209411621094, -175.74563598632812, -164.32916259765625, -152.9127197265625, -141.49624633789062, -130.0797882080078, -118.663330078125, -107.24687194824219, -95.83041381835938, -84.41395568847656, -72.99748992919922, -61.581031799316406, -50.164573669433594, -38.74810791015625, -27.331649780273438, -15.915191650390625, -4.49873161315918, 6.917728424072266, 18.334190368652344, 29.750648498535156, 41.16710662841797, 52.58357238769531, 64.00003051757812, 75.41648864746094, 86.83294677734375, 98.24940490722656, 109.6658706665039, 121.08232879638672, 132.498779296875, 143.91525268554688, 155.3317108154297, 166.7481689453125]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 3.0, 6.0, 6.0, 10.0, 8.0, 12.0, 19.0, 19.0, 16.0, 21.0, 28.0, 22.0, 33.0, 39.0, 38.0, 19.0, 31.0, 52.0, 48.0, 32.0, 43.0, 36.0, 48.0, 35.0, 46.0, 41.0, 36.0, 38.0, 32.0, 34.0, 23.0, 19.0, 15.0, 14.0, 17.0, 14.0, 9.0, 9.0, 11.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.65288543701172, -94.69966888427734, -91.74644470214844, -88.79322814941406, -85.84001159667969, -82.88679504394531, -79.93357849121094, -76.98035430908203, -74.02713775634766, -71.07392120361328, -68.12069702148438, -65.16748046875, -62.214263916015625, -59.26104736328125, -56.30782699584961, -53.35460662841797, -50.401390075683594, -47.44817352294922, -44.49495315551758, -41.54173278808594, -38.58851623535156, -35.63529968261719, -32.68207931518555, -29.72886085510254, -26.77564239501953, -23.822423934936523, -20.869205474853516, -17.915987014770508, -14.9627685546875, -12.009550094604492, -9.056331634521484, -6.103113174438477, -3.1498947143554688, -0.19667625427246094, 2.756542205810547, 5.709760665893555, 8.662979125976562, 11.61619758605957, 14.569416046142578, 17.522634506225586, 20.475852966308594, 23.4290714263916, 26.38228988647461, 29.335508346557617, 32.288726806640625, 35.241943359375, 38.19516372680664, 41.14838409423828, 44.101600646972656, 47.05481719970703, 50.00803756713867, 52.96125793457031, 55.91447448730469, 58.86769104003906, 61.8209114074707, 64.77413177490234, 67.72734832763672, 70.6805648803711, 73.6337890625, 76.58700561523438, 79.54022216796875, 82.49343872070312, 85.4466552734375, 88.3998794555664, 91.35309600830078]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 5.0, 10.0, 9.0, 17.0, 17.0, 14.0, 27.0, 27.0, 20.0, 30.0, 40.0, 42.0, 53.0, 36.0, 69.0, 50.0, 54.0, 41.0, 57.0, 40.0, 44.0, 43.0, 47.0, 33.0, 36.0, 32.0, 14.0, 20.0, 13.0, 9.0, 11.0, 4.0, 8.0, 6.0, 5.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-15.0234375, -14.613037109375, -14.20263671875, -13.792236328125, -13.3818359375, -12.971435546875, -12.56103515625, -12.150634765625, -11.740234375, -11.329833984375, -10.91943359375, -10.509033203125, -10.0986328125, -9.688232421875, -9.27783203125, -8.867431640625, -8.45703125, -8.046630859375, -7.63623046875, -7.225830078125, -6.8154296875, -6.405029296875, -5.99462890625, -5.584228515625, -5.173828125, -4.763427734375, -4.35302734375, -3.942626953125, -3.5322265625, -3.121826171875, -2.71142578125, -2.301025390625, -1.890625, -1.480224609375, -1.06982421875, -0.659423828125, -0.2490234375, 0.161376953125, 0.57177734375, 0.982177734375, 1.392578125, 1.802978515625, 2.21337890625, 2.623779296875, 3.0341796875, 3.444580078125, 3.85498046875, 4.265380859375, 4.67578125, 5.086181640625, 5.49658203125, 5.906982421875, 6.3173828125, 6.727783203125, 7.13818359375, 7.548583984375, 7.958984375, 8.369384765625, 8.77978515625, 9.190185546875, 9.6005859375, 10.010986328125, 10.42138671875, 10.831787109375, 11.2421875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 5.0, 11.0, 22.0, 27.0, 35.0, 60.0, 101.0, 144.0, 264.0, 337.0, 583.0, 839.0, 1415.0, 2162.0, 3492.0, 5685.0, 9726.0, 16448.0, 29034.0, 52710.0, 105408.0, 294536.0, 295838.0, 106076.0, 53253.0, 28679.0, 16369.0, 9734.0, 5918.0, 3619.0, 2225.0, 1364.0, 880.0, 523.0, 329.0, 229.0, 168.0, 89.0, 71.0, 46.0, 33.0, 19.0, 20.0, 9.0, 8.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.884765625, -2.7999267578125, -2.715087890625, -2.6302490234375, -2.54541015625, -2.4605712890625, -2.375732421875, -2.2908935546875, -2.2060546875, -2.1212158203125, -2.036376953125, -1.9515380859375, -1.86669921875, -1.7818603515625, -1.697021484375, -1.6121826171875, -1.52734375, -1.4425048828125, -1.357666015625, -1.2728271484375, -1.18798828125, -1.1031494140625, -1.018310546875, -0.9334716796875, -0.8486328125, -0.7637939453125, -0.678955078125, -0.5941162109375, -0.50927734375, -0.4244384765625, -0.339599609375, -0.2547607421875, -0.169921875, -0.0850830078125, -0.000244140625, 0.0845947265625, 0.16943359375, 0.2542724609375, 0.339111328125, 0.4239501953125, 0.5087890625, 0.5936279296875, 0.678466796875, 0.7633056640625, 0.84814453125, 0.9329833984375, 1.017822265625, 1.1026611328125, 1.1875, 1.2723388671875, 1.357177734375, 1.4420166015625, 1.52685546875, 1.6116943359375, 1.696533203125, 1.7813720703125, 1.8662109375, 1.9510498046875, 2.035888671875, 2.1207275390625, 2.20556640625, 2.2904052734375, 2.375244140625, 2.4600830078125, 2.544921875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 10.0, 9.0, 13.0, 14.0, 21.0, 20.0, 25.0, 29.0, 20.0, 31.0, 32.0, 43.0, 48.0, 52.0, 40.0, 38.0, 44.0, 1070.0, 38.0, 47.0, 33.0, 40.0, 37.0, 35.0, 37.0, 36.0, 26.0, 22.0, 20.0, 16.0, 20.0, 11.0, 7.0, 7.0, 3.0, 7.0, 6.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.6015625, -6.3673095703125, -6.133056640625, -5.8988037109375, -5.66455078125, -5.4302978515625, -5.196044921875, -4.9617919921875, -4.7275390625, -4.4932861328125, -4.259033203125, -4.0247802734375, -3.79052734375, -3.5562744140625, -3.322021484375, -3.0877685546875, -2.853515625, -2.6192626953125, -2.385009765625, -2.1507568359375, -1.91650390625, -1.6822509765625, -1.447998046875, -1.2137451171875, -0.9794921875, -0.7452392578125, -0.510986328125, -0.2767333984375, -0.04248046875, 0.1917724609375, 0.426025390625, 0.6602783203125, 0.89453125, 1.1287841796875, 1.363037109375, 1.5972900390625, 1.83154296875, 2.0657958984375, 2.300048828125, 2.5343017578125, 2.7685546875, 3.0028076171875, 3.237060546875, 3.4713134765625, 3.70556640625, 3.9398193359375, 4.174072265625, 4.4083251953125, 4.642578125, 4.8768310546875, 5.111083984375, 5.3453369140625, 5.57958984375, 5.8138427734375, 6.048095703125, 6.2823486328125, 6.5166015625, 6.7508544921875, 6.985107421875, 7.2193603515625, 7.45361328125, 7.6878662109375, 7.922119140625, 8.1563720703125, 8.390625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 9.0, 14.0, 21.0, 19.0, 30.0, 40.0, 64.0, 97.0, 156.0, 184.0, 305.0, 473.0, 734.0, 1070.0, 1656.0, 2645.0, 4258.0, 7127.0, 11700.0, 19798.0, 33381.0, 58458.0, 112982.0, 1355429.0, 252190.0, 102332.0, 54148.0, 30887.0, 18075.0, 11015.0, 6725.0, 4105.0, 2470.0, 1600.0, 1004.0, 656.0, 419.0, 294.0, 191.0, 127.0, 77.0, 48.0, 36.0, 24.0, 18.0, 14.0, 10.0, 9.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.525390625, -2.450958251953125, -2.37652587890625, -2.302093505859375, -2.2276611328125, -2.153228759765625, -2.07879638671875, -2.004364013671875, -1.929931640625, -1.855499267578125, -1.78106689453125, -1.706634521484375, -1.6322021484375, -1.557769775390625, -1.48333740234375, -1.408905029296875, -1.33447265625, -1.260040283203125, -1.18560791015625, -1.111175537109375, -1.0367431640625, -0.962310791015625, -0.88787841796875, -0.813446044921875, -0.739013671875, -0.664581298828125, -0.59014892578125, -0.515716552734375, -0.4412841796875, -0.366851806640625, -0.29241943359375, -0.217987060546875, -0.1435546875, -0.069122314453125, 0.00531005859375, 0.079742431640625, 0.1541748046875, 0.228607177734375, 0.30303955078125, 0.377471923828125, 0.451904296875, 0.526336669921875, 0.60076904296875, 0.675201416015625, 0.7496337890625, 0.824066162109375, 0.89849853515625, 0.972930908203125, 1.04736328125, 1.121795654296875, 1.19622802734375, 1.270660400390625, 1.3450927734375, 1.419525146484375, 1.49395751953125, 1.568389892578125, 1.642822265625, 1.717254638671875, 1.79168701171875, 1.866119384765625, 1.9405517578125, 2.014984130859375, 2.08941650390625, 2.163848876953125, 2.23828125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 9.0, 2.0, 14.0, 16.0, 22.0, 15.0, 23.0, 30.0, 39.0, 51.0, 70.0, 89.0, 121.0, 99.0, 103.0, 71.0, 44.0, 41.0, 30.0, 27.0, 16.0, 13.0, 15.0, 14.0, 11.0, 8.0, 8.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017290115356445312, -0.0016824603080749512, -0.001635909080505371, -0.001589357852935791, -0.001542806625366211, -0.0014962553977966309, -0.0014497041702270508, -0.0014031529426574707, -0.0013566017150878906, -0.0013100504875183105, -0.0012634992599487305, -0.0012169480323791504, -0.0011703968048095703, -0.0011238455772399902, -0.0010772943496704102, -0.00103074312210083, -0.00098419189453125, -0.0009376406669616699, -0.0008910894393920898, -0.0008445382118225098, -0.0007979869842529297, -0.0007514357566833496, -0.0007048845291137695, -0.0006583333015441895, -0.0006117820739746094, -0.0005652308464050293, -0.0005186796188354492, -0.00047212839126586914, -0.00042557716369628906, -0.000379025936126709, -0.0003324747085571289, -0.00028592348098754883, -0.00023937225341796875, -0.00019282102584838867, -0.0001462697982788086, -9.971857070922852e-05, -5.316734313964844e-05, -6.616115570068359e-06, 3.993511199951172e-05, 8.64863395690918e-05, 0.00013303756713867188, 0.00017958879470825195, 0.00022614002227783203, 0.0002726912498474121, 0.0003192424774169922, 0.00036579370498657227, 0.00041234493255615234, 0.0004588961601257324, 0.0005054473876953125, 0.0005519986152648926, 0.0005985498428344727, 0.0006451010704040527, 0.0006916522979736328, 0.0007382035255432129, 0.000784754753112793, 0.000831305980682373, 0.0008778572082519531, 0.0009244084358215332, 0.0009709596633911133, 0.0010175108909606934, 0.0010640621185302734, 0.0011106133460998535, 0.0011571645736694336, 0.0012037158012390137, 0.0012502670288085938]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 6.0, 5.0, 11.0, 19.0, 27.0, 29.0, 37.0, 55.0, 81.0, 101.0, 168.0, 245.0, 414.0, 758.0, 4905.0, 1038174.0, 1818.0, 671.0, 357.0, 222.0, 112.0, 91.0, 73.0, 44.0, 40.0, 20.0, 25.0, 12.0, 10.0, 6.0, 4.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.02886962890625, -0.027977466583251953, -0.027085304260253906, -0.02619314193725586, -0.025300979614257812, -0.024408817291259766, -0.02351665496826172, -0.022624492645263672, -0.021732330322265625, -0.020840167999267578, -0.01994800567626953, -0.019055843353271484, -0.018163681030273438, -0.01727151870727539, -0.016379356384277344, -0.015487194061279297, -0.01459503173828125, -0.013702869415283203, -0.012810707092285156, -0.01191854476928711, -0.011026382446289062, -0.010134220123291016, -0.009242057800292969, -0.008349895477294922, -0.007457733154296875, -0.006565570831298828, -0.005673408508300781, -0.004781246185302734, -0.0038890838623046875, -0.0029969215393066406, -0.0021047592163085938, -0.0012125968933105469, -0.0003204345703125, 0.0005717277526855469, 0.0014638900756835938, 0.0023560523986816406, 0.0032482147216796875, 0.004140377044677734, 0.005032539367675781, 0.005924701690673828, 0.006816864013671875, 0.007709026336669922, 0.008601188659667969, 0.009493350982666016, 0.010385513305664062, 0.01127767562866211, 0.012169837951660156, 0.013062000274658203, 0.01395416259765625, 0.014846324920654297, 0.015738487243652344, 0.01663064956665039, 0.017522811889648438, 0.018414974212646484, 0.01930713653564453, 0.020199298858642578, 0.021091461181640625, 0.021983623504638672, 0.02287578582763672, 0.023767948150634766, 0.024660110473632812, 0.02555227279663086, 0.026444435119628906, 0.027336597442626953, 0.028228759765625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 16.0, 867.0, 127.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016239110846072435, -0.0014713670825585723, -0.0013188229640945792, -0.001166278962045908, -0.001013734843581915, -0.0008611908415332437, -0.0007086468394845724, -0.0005561027210205793, -0.0004035587189719081, -0.00025101465871557593, -9.847062756307423e-05, 5.407340358942747e-05, 0.00020661746384575963, 0.0003591615241020918, 0.000511705526150763, 0.0006642496446147561, 0.0008167936466634274, 0.0009693377069197595, 0.0011218817671760917, 0.001274425769224763, 0.001426969887688756, 0.0015795138897374272, 0.0017320578917860985, 0.0018846020102500916, 0.0020371461287140846, 0.0021896902471780777, 0.002342234132811427, 0.00249477825127542, 0.0026473223697394133, 0.0027998662553727627, 0.0029524103738367558, 0.003104954492300749, 0.003257498610764742, 0.003410042729228735, 0.0035625866148620844, 0.0037151307333260775, 0.0038676748517900705, 0.00402021873742342, 0.004172762855887413, 0.004325306974351406, 0.004477851092815399, 0.004630395211279392, 0.004782939329743385, 0.004935483448207378, 0.005088027101010084, 0.005240571219474077, 0.00539311533793807, 0.005545659456402063, 0.005698203109204769, 0.005850747227668762, 0.006003291346132755, 0.006155835464596748, 0.006308379117399454, 0.006460923235863447, 0.00661346735432744, 0.006766011472791433, 0.006918555591255426, 0.0070710997097194195, 0.0072236438281834126, 0.007376187480986118, 0.007528731599450111, 0.0076812757179141045, 0.007833819836378098, 0.00798636395484209, 0.008138908073306084]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 0.0, 1.0, 9.0, 3.0, 6.0, 9.0, 14.0, 11.0, 24.0, 17.0, 17.0, 14.0, 14.0, 23.0, 20.0, 29.0, 27.0, 35.0, 38.0, 35.0, 33.0, 42.0, 31.0, 44.0, 42.0, 43.0, 45.0, 49.0, 34.0, 27.0, 33.0, 28.0, 32.0, 19.0, 22.0, 17.0, 14.0, 23.0, 16.0, 10.0, 10.0, 12.0, 6.0, 7.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.00047343969345092773, -0.0004579499363899231, -0.00044246017932891846, -0.0004269704222679138, -0.0004114806652069092, -0.00039599090814590454, -0.0003805011510848999, -0.00036501139402389526, -0.0003495216369628906, -0.000334031879901886, -0.00031854212284088135, -0.0003030523657798767, -0.00028756260871887207, -0.00027207285165786743, -0.0002565830945968628, -0.00024109333753585815, -0.00022560358047485352, -0.00021011382341384888, -0.00019462406635284424, -0.0001791343092918396, -0.00016364455223083496, -0.00014815479516983032, -0.00013266503810882568, -0.00011717528104782104, -0.0001016855239868164, -8.619576692581177e-05, -7.070600986480713e-05, -5.521625280380249e-05, -3.972649574279785e-05, -2.4236738681793213e-05, -8.746981620788574e-06, 6.7427754402160645e-06, 2.2232532501220703e-05, 3.772228956222534e-05, 5.321204662322998e-05, 6.870180368423462e-05, 8.419156074523926e-05, 9.96813178062439e-05, 0.00011517107486724854, 0.00013066083192825317, 0.0001461505889892578, 0.00016164034605026245, 0.0001771301031112671, 0.00019261986017227173, 0.00020810961723327637, 0.000223599374294281, 0.00023908913135528564, 0.0002545788884162903, 0.0002700686454772949, 0.00028555840253829956, 0.0003010481595993042, 0.00031653791666030884, 0.0003320276737213135, 0.0003475174307823181, 0.00036300718784332275, 0.0003784969449043274, 0.00039398670196533203, 0.00040947645902633667, 0.0004249662160873413, 0.00044045597314834595, 0.0004559457302093506, 0.0004714354872703552, 0.00048692524433135986, 0.0005024150013923645, 0.0005179047584533691]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 5.0, 10.0, 9.0, 17.0, 17.0, 14.0, 27.0, 27.0, 20.0, 30.0, 40.0, 42.0, 53.0, 36.0, 69.0, 50.0, 54.0, 41.0, 57.0, 40.0, 44.0, 43.0, 47.0, 33.0, 36.0, 32.0, 14.0, 20.0, 13.0, 9.0, 11.0, 4.0, 8.0, 6.0, 5.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-15.0234375, -14.613037109375, -14.20263671875, -13.792236328125, -13.3818359375, -12.971435546875, -12.56103515625, -12.150634765625, -11.740234375, -11.329833984375, -10.91943359375, -10.509033203125, -10.0986328125, -9.688232421875, -9.27783203125, -8.867431640625, -8.45703125, -8.046630859375, -7.63623046875, -7.225830078125, -6.8154296875, -6.405029296875, -5.99462890625, -5.584228515625, -5.173828125, -4.763427734375, -4.35302734375, -3.942626953125, -3.5322265625, -3.121826171875, -2.71142578125, -2.301025390625, -1.890625, -1.480224609375, -1.06982421875, -0.659423828125, -0.2490234375, 0.161376953125, 0.57177734375, 0.982177734375, 1.392578125, 1.802978515625, 2.21337890625, 2.623779296875, 3.0341796875, 3.444580078125, 3.85498046875, 4.265380859375, 4.67578125, 5.086181640625, 5.49658203125, 5.906982421875, 6.3173828125, 6.727783203125, 7.13818359375, 7.548583984375, 7.958984375, 8.369384765625, 8.77978515625, 9.190185546875, 9.6005859375, 10.010986328125, 10.42138671875, 10.831787109375, 11.2421875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 11.0, 16.0, 28.0, 33.0, 41.0, 54.0, 97.0, 130.0, 193.0, 261.0, 475.0, 782.0, 1480.0, 3265.0, 9356.0, 34469.0, 230826.0, 659684.0, 80030.0, 16932.0, 5396.0, 2198.0, 1093.0, 615.0, 375.0, 210.0, 162.0, 94.0, 67.0, 38.0, 36.0, 24.0, 16.0, 10.0, 10.0, 16.0, 8.0, 6.0, 0.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-27.59375, -26.83251953125, -26.0712890625, -25.31005859375, -24.548828125, -23.78759765625, -23.0263671875, -22.26513671875, -21.50390625, -20.74267578125, -19.9814453125, -19.22021484375, -18.458984375, -17.69775390625, -16.9365234375, -16.17529296875, -15.4140625, -14.65283203125, -13.8916015625, -13.13037109375, -12.369140625, -11.60791015625, -10.8466796875, -10.08544921875, -9.32421875, -8.56298828125, -7.8017578125, -7.04052734375, -6.279296875, -5.51806640625, -4.7568359375, -3.99560546875, -3.234375, -2.47314453125, -1.7119140625, -0.95068359375, -0.189453125, 0.57177734375, 1.3330078125, 2.09423828125, 2.85546875, 3.61669921875, 4.3779296875, 5.13916015625, 5.900390625, 6.66162109375, 7.4228515625, 8.18408203125, 8.9453125, 9.70654296875, 10.4677734375, 11.22900390625, 11.990234375, 12.75146484375, 13.5126953125, 14.27392578125, 15.03515625, 15.79638671875, 16.5576171875, 17.31884765625, 18.080078125, 18.84130859375, 19.6025390625, 20.36376953125, 21.125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 6.0, 12.0, 24.0, 23.0, 34.0, 41.0, 52.0, 54.0, 72.0, 93.0, 272.0, 1878.0, 111.0, 82.0, 66.0, 63.0, 46.0, 30.0, 17.0, 14.0, 15.0, 4.0, 11.0, 5.0, 2.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.46875, -48.7998046875, -47.130859375, -45.4619140625, -43.79296875, -42.1240234375, -40.455078125, -38.7861328125, -37.1171875, -35.4482421875, -33.779296875, -32.1103515625, -30.44140625, -28.7724609375, -27.103515625, -25.4345703125, -23.765625, -22.0966796875, -20.427734375, -18.7587890625, -17.08984375, -15.4208984375, -13.751953125, -12.0830078125, -10.4140625, -8.7451171875, -7.076171875, -5.4072265625, -3.73828125, -2.0693359375, -0.400390625, 1.2685546875, 2.9375, 4.6064453125, 6.275390625, 7.9443359375, 9.61328125, 11.2822265625, 12.951171875, 14.6201171875, 16.2890625, 17.9580078125, 19.626953125, 21.2958984375, 22.96484375, 24.6337890625, 26.302734375, 27.9716796875, 29.640625, 31.3095703125, 32.978515625, 34.6474609375, 36.31640625, 37.9853515625, 39.654296875, 41.3232421875, 42.9921875, 44.6611328125, 46.330078125, 47.9990234375, 49.66796875, 51.3369140625, 53.005859375, 54.6748046875, 56.34375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 5.0, 3.0, 10.0, 15.0, 13.0, 19.0, 40.0, 61.0, 71.0, 155.0, 317.0, 993.0, 75863.0, 3065961.0, 1294.0, 427.0, 169.0, 87.0, 64.0, 37.0, 32.0, 26.0, 16.0, 5.0, 6.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-165.375, -160.525390625, -155.67578125, -150.826171875, -145.9765625, -141.126953125, -136.27734375, -131.427734375, -126.578125, -121.728515625, -116.87890625, -112.029296875, -107.1796875, -102.330078125, -97.48046875, -92.630859375, -87.78125, -82.931640625, -78.08203125, -73.232421875, -68.3828125, -63.533203125, -58.68359375, -53.833984375, -48.984375, -44.134765625, -39.28515625, -34.435546875, -29.5859375, -24.736328125, -19.88671875, -15.037109375, -10.1875, -5.337890625, -0.48828125, 4.361328125, 9.2109375, 14.060546875, 18.91015625, 23.759765625, 28.609375, 33.458984375, 38.30859375, 43.158203125, 48.0078125, 52.857421875, 57.70703125, 62.556640625, 67.40625, 72.255859375, 77.10546875, 81.955078125, 86.8046875, 91.654296875, 96.50390625, 101.353515625, 106.203125, 111.052734375, 115.90234375, 120.751953125, 125.6015625, 130.451171875, 135.30078125, 140.150390625, 145.0]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 16.0, 154.0, 718.0, 115.0, 12.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-300.0871887207031, -293.89129638671875, -287.6954040527344, -281.4995422363281, -275.30364990234375, -269.1077575683594, -262.911865234375, -256.7159729003906, -250.5200958251953, -244.32420349121094, -238.12832641601562, -231.93243408203125, -225.73654174804688, -219.54066467285156, -213.3447723388672, -207.14889526367188, -200.9530029296875, -194.75711059570312, -188.5612335205078, -182.36534118652344, -176.16946411132812, -169.97357177734375, -163.77767944335938, -157.581787109375, -151.3859100341797, -145.1900177001953, -138.994140625, -132.79824829101562, -126.60236358642578, -120.40647888183594, -114.21058654785156, -108.01470184326172, -101.81880950927734, -95.6229248046875, -89.42703247070312, -83.23114776611328, -77.03526306152344, -70.8393783569336, -64.64349365234375, -58.447601318359375, -52.25171661376953, -46.05583190917969, -39.85994338989258, -33.66405487060547, -27.468170166015625, -21.27228355407715, -15.076396942138672, -8.880508422851562, -2.6846237182617188, 3.511262893676758, 9.707149505615234, 15.903036117553711, 22.098922729492188, 28.294809341430664, 34.49069595336914, 40.68658447265625, 46.882469177246094, 53.07835388183594, 59.27424240112305, 65.47013092041016, 71.666015625, 77.86190032958984, 84.05778503417969, 90.25367736816406, 96.4495620727539]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 1.0, 7.0, 4.0, 5.0, 4.0, 5.0, 7.0, 12.0, 11.0, 16.0, 12.0, 16.0, 19.0, 18.0, 22.0, 27.0, 22.0, 42.0, 33.0, 35.0, 33.0, 43.0, 37.0, 39.0, 33.0, 35.0, 42.0, 31.0, 39.0, 35.0, 24.0, 31.0, 31.0, 21.0, 22.0, 27.0, 36.0, 24.0, 19.0, 17.0, 15.0, 7.0, 9.0, 11.0, 5.0, 3.0, 8.0, 2.0, 6.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-88.22542572021484, -85.53599548339844, -82.8465576171875, -80.1571273803711, -77.46769714355469, -74.77825927734375, -72.08882904052734, -69.39939880371094, -66.7099609375, -64.0205307006836, -61.331092834472656, -58.64166259765625, -55.95222854614258, -53.262794494628906, -50.5733642578125, -47.88393020629883, -45.194496154785156, -42.505062103271484, -39.81562805175781, -37.126197814941406, -34.436763763427734, -31.747329711914062, -29.057897567749023, -26.368465423583984, -23.679031372070312, -20.98959732055664, -18.3001651763916, -15.610732078552246, -12.92129898071289, -10.231865882873535, -7.54243278503418, -4.853000640869141, -2.1635665893554688, 0.5258665084838867, 3.215299606323242, 5.904732704162598, 8.594165802001953, 11.283598899841309, 13.973031997680664, 16.662464141845703, 19.351898193359375, 22.041332244873047, 24.730764389038086, 27.420196533203125, 30.109630584716797, 32.79906463623047, 35.488494873046875, 38.17792892456055, 40.86736297607422, 43.55679702758789, 46.24623107910156, 48.93566131591797, 51.62509536743164, 54.31452941894531, 57.00395965576172, 59.69339370727539, 62.38282775878906, 65.07225799560547, 67.7616958618164, 70.45112609863281, 73.14056396484375, 75.82999420166016, 78.51942443847656, 81.2088623046875, 83.8982925415039]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 6.0, 9.0, 11.0, 21.0, 14.0, 24.0, 23.0, 38.0, 26.0, 43.0, 45.0, 48.0, 54.0, 50.0, 45.0, 59.0, 50.0, 40.0, 36.0, 40.0, 45.0, 41.0, 42.0, 38.0, 23.0, 16.0, 25.0, 16.0, 17.0, 16.0, 6.0, 10.0, 8.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.09375, -17.5595703125, -17.025390625, -16.4912109375, -15.95703125, -15.4228515625, -14.888671875, -14.3544921875, -13.8203125, -13.2861328125, -12.751953125, -12.2177734375, -11.68359375, -11.1494140625, -10.615234375, -10.0810546875, -9.546875, -9.0126953125, -8.478515625, -7.9443359375, -7.41015625, -6.8759765625, -6.341796875, -5.8076171875, -5.2734375, -4.7392578125, -4.205078125, -3.6708984375, -3.13671875, -2.6025390625, -2.068359375, -1.5341796875, -1.0, -0.4658203125, 0.068359375, 0.6025390625, 1.13671875, 1.6708984375, 2.205078125, 2.7392578125, 3.2734375, 3.8076171875, 4.341796875, 4.8759765625, 5.41015625, 5.9443359375, 6.478515625, 7.0126953125, 7.546875, 8.0810546875, 8.615234375, 9.1494140625, 9.68359375, 10.2177734375, 10.751953125, 11.2861328125, 11.8203125, 12.3544921875, 12.888671875, 13.4228515625, 13.95703125, 14.4912109375, 15.025390625, 15.5595703125, 16.09375]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 4.0, 4.0, 2.0, 4.0, 7.0, 11.0, 15.0, 18.0, 21.0, 31.0, 25.0, 40.0, 34.0, 41.0, 54.0, 86.0, 92.0, 127.0, 199.0, 230.0, 334.0, 446.0, 763.0, 1747.0, 7357.0, 2462960.0, 1709612.0, 5967.0, 1528.0, 745.0, 441.0, 309.0, 228.0, 171.0, 120.0, 108.0, 78.0, 59.0, 39.0, 52.0, 24.0, 29.0, 27.0, 30.0, 10.0, 12.0, 19.0, 6.0, 2.0, 7.0, 4.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0], "bins": [-89.8125, -87.0869140625, -84.361328125, -81.6357421875, -78.91015625, -76.1845703125, -73.458984375, -70.7333984375, -68.0078125, -65.2822265625, -62.556640625, -59.8310546875, -57.10546875, -54.3798828125, -51.654296875, -48.9287109375, -46.203125, -43.4775390625, -40.751953125, -38.0263671875, -35.30078125, -32.5751953125, -29.849609375, -27.1240234375, -24.3984375, -21.6728515625, -18.947265625, -16.2216796875, -13.49609375, -10.7705078125, -8.044921875, -5.3193359375, -2.59375, 0.1318359375, 2.857421875, 5.5830078125, 8.30859375, 11.0341796875, 13.759765625, 16.4853515625, 19.2109375, 21.9365234375, 24.662109375, 27.3876953125, 30.11328125, 32.8388671875, 35.564453125, 38.2900390625, 41.015625, 43.7412109375, 46.466796875, 49.1923828125, 51.91796875, 54.6435546875, 57.369140625, 60.0947265625, 62.8203125, 65.5458984375, 68.271484375, 70.9970703125, 73.72265625, 76.4482421875, 79.173828125, 81.8994140625, 84.625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 12.0, 16.0, 27.0, 65.0, 155.0, 456.0, 1062.0, 1302.0, 576.0, 232.0, 89.0, 41.0, 19.0, 12.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-68.9375, -67.442626953125, -65.94775390625, -64.452880859375, -62.9580078125, -61.463134765625, -59.96826171875, -58.473388671875, -56.978515625, -55.483642578125, -53.98876953125, -52.493896484375, -50.9990234375, -49.504150390625, -48.00927734375, -46.514404296875, -45.01953125, -43.524658203125, -42.02978515625, -40.534912109375, -39.0400390625, -37.545166015625, -36.05029296875, -34.555419921875, -33.060546875, -31.565673828125, -30.07080078125, -28.575927734375, -27.0810546875, -25.586181640625, -24.09130859375, -22.596435546875, -21.1015625, -19.606689453125, -18.11181640625, -16.616943359375, -15.1220703125, -13.627197265625, -12.13232421875, -10.637451171875, -9.142578125, -7.647705078125, -6.15283203125, -4.657958984375, -3.1630859375, -1.668212890625, -0.17333984375, 1.321533203125, 2.81640625, 4.311279296875, 5.80615234375, 7.301025390625, 8.7958984375, 10.290771484375, 11.78564453125, 13.280517578125, 14.775390625, 16.270263671875, 17.76513671875, 19.260009765625, 20.7548828125, 22.249755859375, 23.74462890625, 25.239501953125, 26.734375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 13.0, 29.0, 54.0, 109.0, 276.0, 1307.0, 25468.0, 4122565.0, 42314.0, 1610.0, 322.0, 116.0, 39.0, 27.0, 15.0, 5.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.6875, -90.080078125, -87.47265625, -84.865234375, -82.2578125, -79.650390625, -77.04296875, -74.435546875, -71.828125, -69.220703125, -66.61328125, -64.005859375, -61.3984375, -58.791015625, -56.18359375, -53.576171875, -50.96875, -48.361328125, -45.75390625, -43.146484375, -40.5390625, -37.931640625, -35.32421875, -32.716796875, -30.109375, -27.501953125, -24.89453125, -22.287109375, -19.6796875, -17.072265625, -14.46484375, -11.857421875, -9.25, -6.642578125, -4.03515625, -1.427734375, 1.1796875, 3.787109375, 6.39453125, 9.001953125, 11.609375, 14.216796875, 16.82421875, 19.431640625, 22.0390625, 24.646484375, 27.25390625, 29.861328125, 32.46875, 35.076171875, 37.68359375, 40.291015625, 42.8984375, 45.505859375, 48.11328125, 50.720703125, 53.328125, 55.935546875, 58.54296875, 61.150390625, 63.7578125, 66.365234375, 68.97265625, 71.580078125, 74.1875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 7.0, 13.0, 40.0, 80.0, 147.0, 261.0, 226.0, 127.0, 61.0, 28.0, 10.0, 8.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-424.3914794921875, -416.0339050292969, -407.6763610839844, -399.31878662109375, -390.96124267578125, -382.6036682128906, -374.24609375, -365.8885498046875, -357.5309753417969, -349.17340087890625, -340.81585693359375, -332.4582824707031, -324.1007080078125, -315.7431640625, -307.3855895996094, -299.0280456542969, -290.67047119140625, -282.3128967285156, -273.9553527832031, -265.5977783203125, -257.240234375, -248.88265991210938, -240.52508544921875, -232.1675262451172, -223.80996704101562, -215.45240783691406, -207.0948486328125, -198.73727416992188, -190.3797149658203, -182.02215576171875, -173.66458129882812, -165.30702209472656, -156.94949340820312, -148.59193420410156, -140.234375, -131.87680053710938, -123.51924133300781, -115.16168212890625, -106.80411529541016, -98.44654846191406, -90.08898162841797, -81.73141479492188, -73.37385559082031, -65.01629638671875, -56.658729553222656, -48.30116653442383, -39.943603515625, -31.586040496826172, -23.228477478027344, -14.870914459228516, -6.5133514404296875, 1.8442115783691406, 10.201774597167969, 18.559337615966797, 26.916900634765625, 35.27446365356445, 43.63202667236328, 51.98958969116211, 60.34715270996094, 68.7047119140625, 77.0622787475586, 85.41984558105469, 93.77740478515625, 102.13496398925781, 110.4925308227539]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 2.0, 4.0, 6.0, 5.0, 8.0, 11.0, 8.0, 10.0, 9.0, 14.0, 16.0, 24.0, 19.0, 26.0, 30.0, 40.0, 38.0, 29.0, 48.0, 32.0, 43.0, 38.0, 34.0, 37.0, 38.0, 45.0, 37.0, 31.0, 33.0, 32.0, 42.0, 32.0, 23.0, 30.0, 19.0, 23.0, 14.0, 13.0, 10.0, 12.0, 10.0, 11.0, 5.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.222496032714844, -57.05686569213867, -54.8912353515625, -52.725608825683594, -50.55997848510742, -48.39434814453125, -46.228721618652344, -44.06309127807617, -41.8974609375, -39.73183059692383, -37.566200256347656, -35.40057373046875, -33.23494338989258, -31.069313049316406, -28.903684616088867, -26.738056182861328, -24.572425842285156, -22.406795501708984, -20.241167068481445, -18.075538635253906, -15.909908294677734, -13.744278907775879, -11.578649520874023, -9.413020133972168, -7.2473907470703125, -5.081761360168457, -2.9161319732666016, -0.7505025863647461, 1.4151268005371094, 3.580756187438965, 5.74638557434082, 7.912014961242676, 10.07763671875, 12.243266105651855, 14.408895492553711, 16.57452392578125, 18.740154266357422, 20.905784606933594, 23.071413040161133, 25.237041473388672, 27.402671813964844, 29.568302154541016, 31.733930587768555, 33.899559020996094, 36.065189361572266, 38.23081970214844, 40.396446228027344, 42.562076568603516, 44.72770690917969, 46.89333724975586, 49.05896759033203, 51.22459411621094, 53.39022445678711, 55.55585479736328, 57.72148132324219, 59.88711166381836, 62.05274200439453, 64.21836853027344, 66.38400268554688, 68.54962921142578, 70.71525573730469, 72.88088989257812, 75.04651641845703, 77.21215057373047, 79.37777709960938]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 4.0, 5.0, 9.0, 4.0, 13.0, 11.0, 18.0, 17.0, 16.0, 27.0, 29.0, 23.0, 34.0, 29.0, 38.0, 46.0, 50.0, 45.0, 48.0, 35.0, 41.0, 47.0, 44.0, 41.0, 32.0, 44.0, 32.0, 37.0, 30.0, 28.0, 12.0, 15.0, 17.0, 15.0, 14.0, 10.0, 9.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.75, -97.125, -93.5, -89.875, -86.25, -82.625, -79.0, -75.375, -71.75, -68.125, -64.5, -60.875, -57.25, -53.625, -50.0, -46.375, -42.75, -39.125, -35.5, -31.875, -28.25, -24.625, -21.0, -17.375, -13.75, -10.125, -6.5, -2.875, 0.75, 4.375, 8.0, 11.625, 15.25, 18.875, 22.5, 26.125, 29.75, 33.375, 37.0, 40.625, 44.25, 47.875, 51.5, 55.125, 58.75, 62.375, 66.0, 69.625, 73.25, 76.875, 80.5, 84.125, 87.75, 91.375, 95.0, 98.625, 102.25, 105.875, 109.5, 113.125, 116.75, 120.375, 124.0, 127.625, 131.25]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 14.0, 9.0, 8.0, 22.0, 33.0, 59.0, 67.0, 127.0, 157.0, 275.0, 399.0, 586.0, 944.0, 1574.0, 2616.0, 4349.0, 7266.0, 12151.0, 21433.0, 39361.0, 75465.0, 169558.0, 395390.0, 157410.0, 71996.0, 37178.0, 20514.0, 11824.0, 6963.0, 4040.0, 2517.0, 1569.0, 964.0, 622.0, 386.0, 246.0, 137.0, 111.0, 74.0, 40.0, 32.0, 23.0, 21.0, 10.0, 3.0, 7.0, 5.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.640625, -25.844482421875, -25.04833984375, -24.252197265625, -23.4560546875, -22.659912109375, -21.86376953125, -21.067626953125, -20.271484375, -19.475341796875, -18.67919921875, -17.883056640625, -17.0869140625, -16.290771484375, -15.49462890625, -14.698486328125, -13.90234375, -13.106201171875, -12.31005859375, -11.513916015625, -10.7177734375, -9.921630859375, -9.12548828125, -8.329345703125, -7.533203125, -6.737060546875, -5.94091796875, -5.144775390625, -4.3486328125, -3.552490234375, -2.75634765625, -1.960205078125, -1.1640625, -0.367919921875, 0.42822265625, 1.224365234375, 2.0205078125, 2.816650390625, 3.61279296875, 4.408935546875, 5.205078125, 6.001220703125, 6.79736328125, 7.593505859375, 8.3896484375, 9.185791015625, 9.98193359375, 10.778076171875, 11.57421875, 12.370361328125, 13.16650390625, 13.962646484375, 14.7587890625, 15.554931640625, 16.35107421875, 17.147216796875, 17.943359375, 18.739501953125, 19.53564453125, 20.331787109375, 21.1279296875, 21.924072265625, 22.72021484375, 23.516357421875, 24.3125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 4.0, 8.0, 8.0, 4.0, 4.0, 10.0, 18.0, 9.0, 17.0, 20.0, 18.0, 24.0, 34.0, 33.0, 27.0, 24.0, 31.0, 32.0, 43.0, 38.0, 40.0, 50.0, 1066.0, 34.0, 40.0, 40.0, 38.0, 39.0, 37.0, 30.0, 23.0, 33.0, 37.0, 18.0, 16.0, 18.0, 13.0, 9.0, 10.0, 7.0, 7.0, 4.0, 7.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0], "bins": [-80.25, -78.0869140625, -75.923828125, -73.7607421875, -71.59765625, -69.4345703125, -67.271484375, -65.1083984375, -62.9453125, -60.7822265625, -58.619140625, -56.4560546875, -54.29296875, -52.1298828125, -49.966796875, -47.8037109375, -45.640625, -43.4775390625, -41.314453125, -39.1513671875, -36.98828125, -34.8251953125, -32.662109375, -30.4990234375, -28.3359375, -26.1728515625, -24.009765625, -21.8466796875, -19.68359375, -17.5205078125, -15.357421875, -13.1943359375, -11.03125, -8.8681640625, -6.705078125, -4.5419921875, -2.37890625, -0.2158203125, 1.947265625, 4.1103515625, 6.2734375, 8.4365234375, 10.599609375, 12.7626953125, 14.92578125, 17.0888671875, 19.251953125, 21.4150390625, 23.578125, 25.7412109375, 27.904296875, 30.0673828125, 32.23046875, 34.3935546875, 36.556640625, 38.7197265625, 40.8828125, 43.0458984375, 45.208984375, 47.3720703125, 49.53515625, 51.6982421875, 53.861328125, 56.0244140625, 58.1875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 11.0, 20.0, 26.0, 34.0, 48.0, 80.0, 111.0, 166.0, 256.0, 408.0, 650.0, 1104.0, 1690.0, 2756.0, 4362.0, 6897.0, 11354.0, 19010.0, 31018.0, 52097.0, 93557.0, 217019.0, 1379101.0, 118586.0, 62252.0, 36663.0, 22319.0, 13522.0, 8159.0, 5157.0, 3188.0, 2006.0, 1264.0, 767.0, 524.0, 329.0, 187.0, 124.0, 116.0, 68.0, 43.0, 28.0, 18.0, 15.0, 8.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.484375, -20.772216796875, -20.06005859375, -19.347900390625, -18.6357421875, -17.923583984375, -17.21142578125, -16.499267578125, -15.787109375, -15.074951171875, -14.36279296875, -13.650634765625, -12.9384765625, -12.226318359375, -11.51416015625, -10.802001953125, -10.08984375, -9.377685546875, -8.66552734375, -7.953369140625, -7.2412109375, -6.529052734375, -5.81689453125, -5.104736328125, -4.392578125, -3.680419921875, -2.96826171875, -2.256103515625, -1.5439453125, -0.831787109375, -0.11962890625, 0.592529296875, 1.3046875, 2.016845703125, 2.72900390625, 3.441162109375, 4.1533203125, 4.865478515625, 5.57763671875, 6.289794921875, 7.001953125, 7.714111328125, 8.42626953125, 9.138427734375, 9.8505859375, 10.562744140625, 11.27490234375, 11.987060546875, 12.69921875, 13.411376953125, 14.12353515625, 14.835693359375, 15.5478515625, 16.260009765625, 16.97216796875, 17.684326171875, 18.396484375, 19.108642578125, 19.82080078125, 20.532958984375, 21.2451171875, 21.957275390625, 22.66943359375, 23.381591796875, 24.09375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 0.0, 5.0, 6.0, 9.0, 6.0, 7.0, 13.0, 12.0, 14.0, 26.0, 22.0, 37.0, 48.0, 65.0, 74.0, 87.0, 100.0, 91.0, 85.0, 68.0, 55.0, 32.0, 28.0, 24.0, 16.0, 7.0, 17.0, 15.0, 6.0, 1.0, 5.0, 2.0, 1.0, 5.0, 1.0, 2.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.020294189453125, -0.019688129425048828, -0.019082069396972656, -0.018476009368896484, -0.017869949340820312, -0.01726388931274414, -0.01665782928466797, -0.016051769256591797, -0.015445709228515625, -0.014839649200439453, -0.014233589172363281, -0.01362752914428711, -0.013021469116210938, -0.012415409088134766, -0.011809349060058594, -0.011203289031982422, -0.01059722900390625, -0.009991168975830078, -0.009385108947753906, -0.008779048919677734, -0.008172988891601562, -0.007566928863525391, -0.006960868835449219, -0.006354808807373047, -0.005748748779296875, -0.005142688751220703, -0.004536628723144531, -0.003930568695068359, -0.0033245086669921875, -0.0027184486389160156, -0.0021123886108398438, -0.0015063285827636719, -0.0009002685546875, -0.0002942085266113281, 0.00031185150146484375, 0.0009179115295410156, 0.0015239715576171875, 0.0021300315856933594, 0.0027360916137695312, 0.003342151641845703, 0.003948211669921875, 0.004554271697998047, 0.005160331726074219, 0.005766391754150391, 0.0063724517822265625, 0.006978511810302734, 0.007584571838378906, 0.008190631866455078, 0.00879669189453125, 0.009402751922607422, 0.010008811950683594, 0.010614871978759766, 0.011220932006835938, 0.01182699203491211, 0.012433052062988281, 0.013039112091064453, 0.013645172119140625, 0.014251232147216797, 0.014857292175292969, 0.01546335220336914, 0.016069412231445312, 0.016675472259521484, 0.017281532287597656, 0.017887592315673828, 0.01849365234375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 7.0, 7.0, 7.0, 19.0, 19.0, 32.0, 21.0, 34.0, 47.0, 52.0, 75.0, 109.0, 174.0, 240.0, 412.0, 705.0, 1641.0, 4188.0, 16207.0, 99898.0, 672665.0, 213497.0, 27620.0, 6275.0, 2115.0, 950.0, 514.0, 327.0, 180.0, 134.0, 87.0, 59.0, 60.0, 47.0, 27.0, 24.0, 18.0, 9.0, 8.0, 8.0, 14.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.1268310546875, -0.12294864654541016, -0.11906623840332031, -0.11518383026123047, -0.11130142211914062, -0.10741901397705078, -0.10353660583496094, -0.0996541976928711, -0.09577178955078125, -0.0918893814086914, -0.08800697326660156, -0.08412456512451172, -0.08024215698242188, -0.07635974884033203, -0.07247734069824219, -0.06859493255615234, -0.0647125244140625, -0.060830116271972656, -0.05694770812988281, -0.05306529998779297, -0.049182891845703125, -0.04530048370361328, -0.04141807556152344, -0.037535667419433594, -0.03365325927734375, -0.029770851135253906, -0.025888442993164062, -0.02200603485107422, -0.018123626708984375, -0.014241218566894531, -0.010358810424804688, -0.006476402282714844, -0.002593994140625, 0.0012884140014648438, 0.0051708221435546875, 0.009053230285644531, 0.012935638427734375, 0.01681804656982422, 0.020700454711914062, 0.024582862854003906, 0.02846527099609375, 0.032347679138183594, 0.03623008728027344, 0.04011249542236328, 0.043994903564453125, 0.04787731170654297, 0.05175971984863281, 0.055642127990722656, 0.0595245361328125, 0.06340694427490234, 0.06728935241699219, 0.07117176055908203, 0.07505416870117188, 0.07893657684326172, 0.08281898498535156, 0.0867013931274414, 0.09058380126953125, 0.0944662094116211, 0.09834861755371094, 0.10223102569580078, 0.10611343383789062, 0.10999584197998047, 0.11387825012207031, 0.11776065826416016, 0.12164306640625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 26.0, 55.0, 122.0, 239.0, 267.0, 184.0, 75.0, 21.0, 11.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.016790717840194702, -0.01568986475467682, -0.01458901260048151, -0.013488160446286201, -0.012387307360768318, -0.011286454275250435, -0.010185602121055126, -0.009084749966859818, -0.007983896881341934, -0.006883044261485338, -0.005782191641628742, -0.004681339021772146, -0.0035804864019155502, -0.0024796337820589542, -0.0013787811622023582, -0.00027792854234576225, 0.0008229240775108337, 0.0019237766973674297, 0.0030246293172240257, 0.004125481937080622, 0.005226334556937218, 0.006327187176793814, 0.00742803979665041, 0.008528891950845718, 0.009629745036363602, 0.010730598121881485, 0.011831450276076794, 0.012932302430272102, 0.014033155515789986, 0.015134008601307869, 0.016234859824180603, 0.017335712909698486, 0.01843656226992607, 0.019537415355443954, 0.020638268440961838, 0.021739119663834572, 0.022839972749352455, 0.02394082583487034, 0.025041677057743073, 0.026142530143260956, 0.02724338322877884, 0.028344236314296722, 0.029445089399814606, 0.03054594062268734, 0.03164679557085037, 0.03274764493107796, 0.03384849801659584, 0.034949351102113724, 0.03605020418763161, 0.03715105727314949, 0.038251910358667374, 0.03935276344418526, 0.04045361280441284, 0.041554465889930725, 0.04265531897544861, 0.04375617206096649, 0.044857025146484375, 0.04595787823200226, 0.04705873131752014, 0.048159584403038025, 0.04926043748855591, 0.05036128684878349, 0.051462139934301376, 0.05256299301981926, 0.05366384610533714]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 7.0, 3.0, 9.0, 4.0, 10.0, 14.0, 17.0, 15.0, 9.0, 24.0, 25.0, 34.0, 24.0, 28.0, 33.0, 38.0, 38.0, 41.0, 41.0, 43.0, 47.0, 41.0, 62.0, 47.0, 38.0, 24.0, 39.0, 27.0, 30.0, 23.0, 24.0, 20.0, 18.0, 25.0, 14.0, 14.0, 20.0, 11.0, 4.0, 6.0, 6.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.008380234241485596, -0.008100881241261959, -0.007821528241038322, -0.007542175240814686, -0.007262822240591049, -0.006983469240367413, -0.006704116240143776, -0.006424763239920139, -0.006145410239696503, -0.005866057239472866, -0.005586704239249229, -0.005307351239025593, -0.005027998238801956, -0.0047486452385783195, -0.004469292238354683, -0.004189939238131046, -0.00391058623790741, -0.003631233237683773, -0.0033518802374601364, -0.0030725272372365, -0.002793174237012863, -0.0025138212367892265, -0.00223446823656559, -0.0019551152363419533, -0.0016757622361183167, -0.00139640923589468, -0.0011170562356710434, -0.0008377032354474068, -0.0005583502352237701, -0.0002789972350001335, 3.557652235031128e-07, 0.00027970876544713974, 0.0005590617656707764, 0.000838414765894413, 0.0011177677661180496, 0.0013971207663416862, 0.0016764737665653229, 0.0019558267667889595, 0.002235179767012596, 0.0025145327672362328, 0.0027938857674598694, 0.003073238767683506, 0.0033525917679071426, 0.0036319447681307793, 0.003911297768354416, 0.0041906507685780525, 0.004470003768801689, 0.004749356769025326, 0.005028709769248962, 0.005308062769472599, 0.005587415769696236, 0.005866768769919872, 0.006146121770143509, 0.0064254747703671455, 0.006704827770590782, 0.006984180770814419, 0.007263533771038055, 0.007542886771261692, 0.007822239771485329, 0.008101592771708965, 0.008380945771932602, 0.008660298772156239, 0.008939651772379875, 0.009219004772603512, 0.009498357772827148]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 4.0, 5.0, 9.0, 4.0, 13.0, 10.0, 19.0, 17.0, 17.0, 26.0, 29.0, 23.0, 33.0, 30.0, 38.0, 46.0, 50.0, 45.0, 49.0, 34.0, 41.0, 47.0, 44.0, 41.0, 32.0, 44.0, 32.0, 37.0, 30.0, 28.0, 12.0, 15.0, 17.0, 15.0, 14.0, 10.0, 9.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.75, -97.125, -93.5, -89.875, -86.25, -82.625, -79.0, -75.375, -71.75, -68.125, -64.5, -60.875, -57.25, -53.625, -50.0, -46.375, -42.75, -39.125, -35.5, -31.875, -28.25, -24.625, -21.0, -17.375, -13.75, -10.125, -6.5, -2.875, 0.75, 4.375, 8.0, 11.625, 15.25, 18.875, 22.5, 26.125, 29.75, 33.375, 37.0, 40.625, 44.25, 47.875, 51.5, 55.125, 58.75, 62.375, 66.0, 69.625, 73.25, 76.875, 80.5, 84.125, 87.75, 91.375, 95.0, 98.625, 102.25, 105.875, 109.5, 113.125, 116.75, 120.375, 124.0, 127.625, 131.25]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 6.0, 17.0, 15.0, 18.0, 17.0, 30.0, 44.0, 59.0, 101.0, 144.0, 226.0, 376.0, 610.0, 1115.0, 2082.0, 4272.0, 10346.0, 34536.0, 190027.0, 631234.0, 130109.0, 26356.0, 8805.0, 3714.0, 1803.0, 1003.0, 555.0, 301.0, 180.0, 115.0, 85.0, 69.0, 45.0, 35.0, 18.0, 24.0, 15.0, 10.0, 9.0, 4.0, 6.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.796875, -29.783935546875, -28.77099609375, -27.758056640625, -26.7451171875, -25.732177734375, -24.71923828125, -23.706298828125, -22.693359375, -21.680419921875, -20.66748046875, -19.654541015625, -18.6416015625, -17.628662109375, -16.61572265625, -15.602783203125, -14.58984375, -13.576904296875, -12.56396484375, -11.551025390625, -10.5380859375, -9.525146484375, -8.51220703125, -7.499267578125, -6.486328125, -5.473388671875, -4.46044921875, -3.447509765625, -2.4345703125, -1.421630859375, -0.40869140625, 0.604248046875, 1.6171875, 2.630126953125, 3.64306640625, 4.656005859375, 5.6689453125, 6.681884765625, 7.69482421875, 8.707763671875, 9.720703125, 10.733642578125, 11.74658203125, 12.759521484375, 13.7724609375, 14.785400390625, 15.79833984375, 16.811279296875, 17.82421875, 18.837158203125, 19.85009765625, 20.863037109375, 21.8759765625, 22.888916015625, 23.90185546875, 24.914794921875, 25.927734375, 26.940673828125, 27.95361328125, 28.966552734375, 29.9794921875, 30.992431640625, 32.00537109375, 33.018310546875, 34.03125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 10.0, 9.0, 20.0, 19.0, 15.0, 22.0, 47.0, 46.0, 63.0, 71.0, 87.0, 1949.0, 288.0, 73.0, 93.0, 56.0, 48.0, 36.0, 30.0, 20.0, 13.0, 7.0, 10.0, 3.0, 7.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-308.75, -299.0859375, -289.421875, -279.7578125, -270.09375, -260.4296875, -250.765625, -241.1015625, -231.4375, -221.7734375, -212.109375, -202.4453125, -192.78125, -183.1171875, -173.453125, -163.7890625, -154.125, -144.4609375, -134.796875, -125.1328125, -115.46875, -105.8046875, -96.140625, -86.4765625, -76.8125, -67.1484375, -57.484375, -47.8203125, -38.15625, -28.4921875, -18.828125, -9.1640625, 0.5, 10.1640625, 19.828125, 29.4921875, 39.15625, 48.8203125, 58.484375, 68.1484375, 77.8125, 87.4765625, 97.140625, 106.8046875, 116.46875, 126.1328125, 135.796875, 145.4609375, 155.125, 164.7890625, 174.453125, 184.1171875, 193.78125, 203.4453125, 213.109375, 222.7734375, 232.4375, 242.1015625, 251.765625, 261.4296875, 271.09375, 280.7578125, 290.421875, 300.0859375, 309.75]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 10.0, 24.0, 28.0, 54.0, 80.0, 143.0, 278.0, 589.0, 1489.0, 6931.0, 377698.0, 2746131.0, 9218.0, 1666.0, 641.0, 319.0, 157.0, 92.0, 57.0, 37.0, 15.0, 15.0, 2.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.25, -79.513671875, -76.77734375, -74.041015625, -71.3046875, -68.568359375, -65.83203125, -63.095703125, -60.359375, -57.623046875, -54.88671875, -52.150390625, -49.4140625, -46.677734375, -43.94140625, -41.205078125, -38.46875, -35.732421875, -32.99609375, -30.259765625, -27.5234375, -24.787109375, -22.05078125, -19.314453125, -16.578125, -13.841796875, -11.10546875, -8.369140625, -5.6328125, -2.896484375, -0.16015625, 2.576171875, 5.3125, 8.048828125, 10.78515625, 13.521484375, 16.2578125, 18.994140625, 21.73046875, 24.466796875, 27.203125, 29.939453125, 32.67578125, 35.412109375, 38.1484375, 40.884765625, 43.62109375, 46.357421875, 49.09375, 51.830078125, 54.56640625, 57.302734375, 60.0390625, 62.775390625, 65.51171875, 68.248046875, 70.984375, 73.720703125, 76.45703125, 79.193359375, 81.9296875, 84.666015625, 87.40234375, 90.138671875, 92.875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 7.0, 8.0, 9.0, 18.0, 46.0, 127.0, 306.0, 321.0, 113.0, 30.0, 12.0, 10.0, 4.0, 3.0, 0.0, 1.0], "bins": [-1013.841796875, -995.455322265625, -977.0689086914062, -958.6824951171875, -940.2960205078125, -921.9095458984375, -903.5231323242188, -885.13671875, -866.750244140625, -848.36376953125, -829.9773559570312, -811.5909423828125, -793.2044677734375, -774.8179931640625, -756.4315795898438, -738.045166015625, -719.65869140625, -701.272216796875, -682.8858032226562, -664.4993896484375, -646.1129150390625, -627.7264404296875, -609.3400268554688, -590.95361328125, -572.567138671875, -554.1806640625, -535.7942504882812, -517.4078369140625, -499.0213623046875, -480.6349182128906, -462.24847412109375, -443.8620300292969, -425.47552490234375, -407.0890808105469, -388.70263671875, -370.3161926269531, -351.92974853515625, -333.5433044433594, -315.1568603515625, -296.7704162597656, -278.38397216796875, -259.9975280761719, -241.611083984375, -223.22463989257812, -204.83819580078125, -186.45175170898438, -168.0653076171875, -149.67886352539062, -131.29241943359375, -112.90597534179688, -94.51953125, -76.13308715820312, -57.74664306640625, -39.360198974609375, -20.9737548828125, -2.587310791015625, 15.79913330078125, 34.185577392578125, 52.572021484375, 70.95846557617188, 89.34490966796875, 107.73135375976562, 126.1177978515625, 144.50424194335938, 162.89068603515625]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 7.0, 6.0, 7.0, 6.0, 16.0, 19.0, 12.0, 16.0, 27.0, 31.0, 31.0, 43.0, 36.0, 38.0, 58.0, 59.0, 56.0, 53.0, 51.0, 49.0, 58.0, 48.0, 47.0, 44.0, 36.0, 32.0, 25.0, 19.0, 17.0, 17.0, 9.0, 5.0, 3.0, 9.0, 6.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-298.53338623046875, -289.53375244140625, -280.53411865234375, -271.5345153808594, -262.5348815917969, -253.53524780273438, -244.53562927246094, -235.5360107421875, -226.536376953125, -217.5367431640625, -208.53712463378906, -199.53750610351562, -190.53787231445312, -181.53823852539062, -172.5386199951172, -163.53900146484375, -154.53936767578125, -145.53973388671875, -136.5401153564453, -127.54048919677734, -118.54086303710938, -109.5412368774414, -100.54161071777344, -91.54198455810547, -82.5423583984375, -73.54273223876953, -64.54310607910156, -55.543479919433594, -46.543853759765625, -37.544227600097656, -28.544601440429688, -19.54497528076172, -10.54534912109375, -1.5457229614257812, 7.4539031982421875, 16.453529357910156, 25.453155517578125, 34.452781677246094, 43.45240783691406, 52.45203399658203, 61.45166015625, 70.45128631591797, 79.45091247558594, 88.4505386352539, 97.45016479492188, 106.44979095458984, 115.44941711425781, 124.44904327392578, 133.44866943359375, 142.44830322265625, 151.4479217529297, 160.44754028320312, 169.44717407226562, 178.44680786132812, 187.44642639160156, 196.446044921875, 205.4456787109375, 214.4453125, 223.44493103027344, 232.44454956054688, 241.44418334960938, 250.44381713867188, 259.44342041015625, 268.44305419921875, 277.44268798828125]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 8.0, 5.0, 13.0, 14.0, 15.0, 23.0, 18.0, 25.0, 34.0, 50.0, 57.0, 77.0, 98.0, 125.0, 198.0, 236.0, 315.0, 401.0, 586.0, 785.0, 1380.0, 1040866.0, 803.0, 597.0, 439.0, 337.0, 238.0, 200.0, 121.0, 119.0, 81.0, 71.0, 45.0, 35.0, 33.0, 24.0, 16.0, 12.0, 13.0, 11.0, 9.0, 9.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.40814971923828, -65.09004211425781, -62.771942138671875, -60.453834533691406, -58.1357307434082, -55.817626953125, -53.49951934814453, -51.18141555786133, -48.863311767578125, -46.54520797729492, -44.22710418701172, -41.90899658203125, -39.59089279174805, -37.272789001464844, -34.954681396484375, -32.63657760620117, -30.31847381591797, -28.000370025634766, -25.68226432800293, -23.364158630371094, -21.04605484008789, -18.727951049804688, -16.40984535217285, -14.091739654541016, -11.773635864257812, -9.455531120300293, -7.137426376342773, -4.819321632385254, -2.5012168884277344, -0.18311214447021484, 2.1349925994873047, 4.453098297119141, 6.771209716796875, 9.089314460754395, 11.407419204711914, 13.725523948669434, 16.043628692626953, 18.361732482910156, 20.679838180541992, 22.997943878173828, 25.31604766845703, 27.634151458740234, 29.95225715637207, 32.270362854003906, 34.58846664428711, 36.90657043457031, 39.22467803955078, 41.542781829833984, 43.86088562011719, 46.17898941040039, 48.497093200683594, 50.81520080566406, 53.133304595947266, 55.45140838623047, 57.76951599121094, 60.08761978149414, 62.405723571777344, 64.72383117675781, 67.04193115234375, 69.36003875732422, 71.67814636230469, 73.99624633789062, 76.3143539428711, 78.63246154785156, 80.9505615234375]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 8.0, 8.0, 3.0, 8.0, 11.0, 19.0, 44.0, 166.0, 51462608.0, 153.0, 42.0, 17.0, 16.0, 10.0, 5.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 7.0, 5.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8952.0, -8471.625, -7991.25, -7510.875, -7030.5, -6550.125, -6069.75, -5589.375, -5109.0, -4628.625, -4148.25, -3667.875, -3187.5, -2707.125, -2226.75, -1746.375, -1266.0, -785.625, -305.25, 175.125, 655.5, 1135.875, 1616.25, 2096.625, 2577.0, 3057.375, 3537.75, 4018.125, 4498.5, 4978.875, 5459.25, 5939.625, 6420.0, 6900.375, 7380.75, 7861.125, 8341.5, 8821.875, 9302.25, 9782.625, 10263.0, 10743.375, 11223.75, 11704.125, 12184.5, 12664.875, 13145.25, 13625.625, 14106.0, 14586.375, 15066.75, 15547.125, 16027.5, 16507.875, 16988.25, 17468.625, 17949.0, 18429.375, 18909.75, 19390.125, 19870.5, 20350.875, 20831.25, 21311.625, 21792.0]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 10.0, 11.0, 15.0, 37.0, 34.0, 53.0, 95.0, 109.0, 170.0, 273.0, 394.0, 485.0, 635.0, 900.0, 1391.0, 1971.0, 2718.0, 3655.0, 5374.0, 7637.0, 10253.0, 15038.0, 21520.0, 31603.0, 46989.0, 70647.0, 107675.0, 170125.0, 295742.0, 1078032.0, 3499804.0, 356905.0, 195192.0, 120321.0, 78792.0, 52073.0, 34985.0, 24122.0, 16753.0, 11462.0, 7986.0, 5681.0, 3894.0, 2807.0, 2131.0, 1477.0, 1022.0, 741.0, 526.0, 358.0, 280.0, 186.0, 100.0, 86.0, 57.0, 35.0, 31.0, 22.0, 15.0, 8.0, 5.0, 3.0, 3.0], "bins": [-8.640625, -8.363037109375, -8.08544921875, -7.807861328125, -7.5302734375, -7.252685546875, -6.97509765625, -6.697509765625, -6.419921875, -6.142333984375, -5.86474609375, -5.587158203125, -5.3095703125, -5.031982421875, -4.75439453125, -4.476806640625, -4.19921875, -3.921630859375, -3.64404296875, -3.366455078125, -3.0888671875, -2.811279296875, -2.53369140625, -2.256103515625, -1.978515625, -1.700927734375, -1.42333984375, -1.145751953125, -0.8681640625, -0.590576171875, -0.31298828125, -0.035400390625, 0.2421875, 0.519775390625, 0.79736328125, 1.074951171875, 1.3525390625, 1.630126953125, 1.90771484375, 2.185302734375, 2.462890625, 2.740478515625, 3.01806640625, 3.295654296875, 3.5732421875, 3.850830078125, 4.12841796875, 4.406005859375, 4.68359375, 4.961181640625, 5.23876953125, 5.516357421875, 5.7939453125, 6.071533203125, 6.34912109375, 6.626708984375, 6.904296875, 7.181884765625, 7.45947265625, 7.737060546875, 8.0146484375, 8.292236328125, 8.56982421875, 8.847412109375, 9.125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 8.0, 7.0, 8.0, 4.0, 1.0, 12.0, 11.0, 9.0, 8.0, 13.0, 15.0, 20.0, 24.0, 17.0, 33.0, 31.0, 31.0, 35.0, 24.0, 26.0, 36.0, 49.0, 111.0, 548.0, 383.0, 111.0, 56.0, 42.0, 47.0, 26.0, 33.0, 30.0, 30.0, 29.0, 18.0, 30.0, 16.0, 26.0, 12.0, 12.0, 14.0, 5.0, 9.0, 4.0, 4.0, 6.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.53125, -21.802734375, -21.07421875, -20.345703125, -19.6171875, -18.888671875, -18.16015625, -17.431640625, -16.703125, -15.974609375, -15.24609375, -14.517578125, -13.7890625, -13.060546875, -12.33203125, -11.603515625, -10.875, -10.146484375, -9.41796875, -8.689453125, -7.9609375, -7.232421875, -6.50390625, -5.775390625, -5.046875, -4.318359375, -3.58984375, -2.861328125, -2.1328125, -1.404296875, -0.67578125, 0.052734375, 0.78125, 1.509765625, 2.23828125, 2.966796875, 3.6953125, 4.423828125, 5.15234375, 5.880859375, 6.609375, 7.337890625, 8.06640625, 8.794921875, 9.5234375, 10.251953125, 10.98046875, 11.708984375, 12.4375, 13.166015625, 13.89453125, 14.623046875, 15.3515625, 16.080078125, 16.80859375, 17.537109375, 18.265625, 18.994140625, 19.72265625, 20.451171875, 21.1796875, 21.908203125, 22.63671875, 23.365234375, 24.09375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [6.0, 5.0, 1.0, 1.0, 8.0, 11.0, 19.0, 14.0, 26.0, 34.0, 51.0, 66.0, 86.0, 152.0, 187.0, 311.0, 401.0, 615.0, 921.0, 1304.0, 2103.0, 3152.0, 4902.0, 7676.0, 12374.0, 20184.0, 33796.0, 56552.0, 100078.0, 183828.0, 368932.0, 3281751.0, 1484884.0, 330557.0, 168263.0, 92350.0, 52866.0, 31476.0, 18776.0, 11648.0, 7235.0, 4782.0, 3007.0, 1998.0, 1291.0, 867.0, 613.0, 388.0, 269.0, 202.0, 134.0, 83.0, 69.0, 54.0, 37.0, 17.0, 14.0, 10.0, 8.0, 2.0, 2.0, 4.0, 0.0, 3.0], "bins": [-13.2578125, -12.8426513671875, -12.427490234375, -12.0123291015625, -11.59716796875, -11.1820068359375, -10.766845703125, -10.3516845703125, -9.9365234375, -9.5213623046875, -9.106201171875, -8.6910400390625, -8.27587890625, -7.8607177734375, -7.445556640625, -7.0303955078125, -6.615234375, -6.2000732421875, -5.784912109375, -5.3697509765625, -4.95458984375, -4.5394287109375, -4.124267578125, -3.7091064453125, -3.2939453125, -2.8787841796875, -2.463623046875, -2.0484619140625, -1.63330078125, -1.2181396484375, -0.802978515625, -0.3878173828125, 0.02734375, 0.4425048828125, 0.857666015625, 1.2728271484375, 1.68798828125, 2.1031494140625, 2.518310546875, 2.9334716796875, 3.3486328125, 3.7637939453125, 4.178955078125, 4.5941162109375, 5.00927734375, 5.4244384765625, 5.839599609375, 6.2547607421875, 6.669921875, 7.0850830078125, 7.500244140625, 7.9154052734375, 8.33056640625, 8.7457275390625, 9.160888671875, 9.5760498046875, 9.9912109375, 10.4063720703125, 10.821533203125, 11.2366943359375, 11.65185546875, 12.0670166015625, 12.482177734375, 12.8973388671875, 13.3125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 7.0, 6.0, 10.0, 11.0, 13.0, 15.0, 17.0, 16.0, 27.0, 17.0, 25.0, 35.0, 34.0, 37.0, 25.0, 29.0, 49.0, 63.0, 134.0, 452.0, 380.0, 128.0, 79.0, 53.0, 37.0, 49.0, 31.0, 30.0, 35.0, 20.0, 31.0, 20.0, 14.0, 22.0, 14.0, 12.0, 10.0, 9.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-17.609375, -17.05810546875, -16.5068359375, -15.95556640625, -15.404296875, -14.85302734375, -14.3017578125, -13.75048828125, -13.19921875, -12.64794921875, -12.0966796875, -11.54541015625, -10.994140625, -10.44287109375, -9.8916015625, -9.34033203125, -8.7890625, -8.23779296875, -7.6865234375, -7.13525390625, -6.583984375, -6.03271484375, -5.4814453125, -4.93017578125, -4.37890625, -3.82763671875, -3.2763671875, -2.72509765625, -2.173828125, -1.62255859375, -1.0712890625, -0.52001953125, 0.03125, 0.58251953125, 1.1337890625, 1.68505859375, 2.236328125, 2.78759765625, 3.3388671875, 3.89013671875, 4.44140625, 4.99267578125, 5.5439453125, 6.09521484375, 6.646484375, 7.19775390625, 7.7490234375, 8.30029296875, 8.8515625, 9.40283203125, 9.9541015625, 10.50537109375, 11.056640625, 11.60791015625, 12.1591796875, 12.71044921875, 13.26171875, 13.81298828125, 14.3642578125, 14.91552734375, 15.466796875, 16.01806640625, 16.5693359375, 17.12060546875, 17.671875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 6.0, 0.0, 0.0, 3.0, 16.0, 8.0, 10.0, 33.0, 22.0, 32.0, 57.0, 52.0, 70.0, 94.0, 125.0, 126.0, 201.0, 231.0, 324.0, 500.0, 633.0, 880.0, 1304.0, 1974.0, 3274.0, 5749.0, 11084.0, 26250.0, 86892.0, 5916174.0, 163718.0, 38125.0, 14580.0, 7245.0, 3787.0, 2417.0, 1597.0, 984.0, 722.0, 521.0, 426.0, 305.0, 213.0, 169.0, 129.0, 68.0, 70.0, 54.0, 59.0, 29.0, 26.0, 30.0, 18.0, 4.0, 15.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-36.53125, -35.34033203125, -34.1494140625, -32.95849609375, -31.767578125, -30.57666015625, -29.3857421875, -28.19482421875, -27.00390625, -25.81298828125, -24.6220703125, -23.43115234375, -22.240234375, -21.04931640625, -19.8583984375, -18.66748046875, -17.4765625, -16.28564453125, -15.0947265625, -13.90380859375, -12.712890625, -11.52197265625, -10.3310546875, -9.14013671875, -7.94921875, -6.75830078125, -5.5673828125, -4.37646484375, -3.185546875, -1.99462890625, -0.8037109375, 0.38720703125, 1.578125, 2.76904296875, 3.9599609375, 5.15087890625, 6.341796875, 7.53271484375, 8.7236328125, 9.91455078125, 11.10546875, 12.29638671875, 13.4873046875, 14.67822265625, 15.869140625, 17.06005859375, 18.2509765625, 19.44189453125, 20.6328125, 21.82373046875, 23.0146484375, 24.20556640625, 25.396484375, 26.58740234375, 27.7783203125, 28.96923828125, 30.16015625, 31.35107421875, 32.5419921875, 33.73291015625, 34.923828125, 36.11474609375, 37.3056640625, 38.49658203125, 39.6875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 3.0, 6.0, 5.0, 10.0, 13.0, 10.0, 15.0, 17.0, 14.0, 18.0, 36.0, 21.0, 48.0, 32.0, 42.0, 47.0, 47.0, 93.0, 161.0, 425.0, 323.0, 132.0, 99.0, 51.0, 53.0, 41.0, 39.0, 30.0, 27.0, 22.0, 26.0, 19.0, 22.0, 6.0, 16.0, 3.0, 9.0, 10.0, 5.0, 8.0, 5.0, 6.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8125, -12.3973388671875, -11.982177734375, -11.5670166015625, -11.15185546875, -10.7366943359375, -10.321533203125, -9.9063720703125, -9.4912109375, -9.0760498046875, -8.660888671875, -8.2457275390625, -7.83056640625, -7.4154052734375, -7.000244140625, -6.5850830078125, -6.169921875, -5.7547607421875, -5.339599609375, -4.9244384765625, -4.50927734375, -4.0941162109375, -3.678955078125, -3.2637939453125, -2.8486328125, -2.4334716796875, -2.018310546875, -1.6031494140625, -1.18798828125, -0.7728271484375, -0.357666015625, 0.0574951171875, 0.47265625, 0.8878173828125, 1.302978515625, 1.7181396484375, 2.13330078125, 2.5484619140625, 2.963623046875, 3.3787841796875, 3.7939453125, 4.2091064453125, 4.624267578125, 5.0394287109375, 5.45458984375, 5.8697509765625, 6.284912109375, 6.7000732421875, 7.115234375, 7.5303955078125, 7.945556640625, 8.3607177734375, 8.77587890625, 9.1910400390625, 9.606201171875, 10.0213623046875, 10.4365234375, 10.8516845703125, 11.266845703125, 11.6820068359375, 12.09716796875, 12.5123291015625, 12.927490234375, 13.3426513671875, 13.7578125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 9.0, 9.0, 13.0, 30.0, 55.0, 125.0, 435.0, 190.0, 58.0, 39.0, 14.0, 9.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.762855529785156, -22.805233001708984, -20.847612380981445, -18.889989852905273, -16.9323673248291, -14.974745750427246, -13.01712417602539, -11.059501647949219, -9.101880073547363, -7.14425802230835, -5.186635971069336, -3.2290143966674805, -1.2713923454284668, 0.6862297058105469, 2.6438512802124023, 4.601473808288574, 6.55909538269043, 8.516716957092285, 10.474339485168457, 12.431961059570312, 14.389583587646484, 16.347206115722656, 18.304826736450195, 20.262449264526367, 22.220069885253906, 24.177692413330078, 26.135313034057617, 28.09293556213379, 30.05055809020996, 32.0081787109375, 33.96580123901367, 35.923423767089844, 37.881046295166016, 39.83866882324219, 41.79629135131836, 43.75391387939453, 45.71153259277344, 47.66915512084961, 49.62677764892578, 51.58440017700195, 53.542022705078125, 55.4996452331543, 57.45726776123047, 59.414886474609375, 61.37250900268555, 63.33013153076172, 65.28775024414062, 67.24537658691406, 69.20299530029297, 71.16061401367188, 73.11824035644531, 75.07585906982422, 77.03348541259766, 78.99110412597656, 80.94873046875, 82.9063491821289, 84.86397552490234, 86.82159423828125, 88.77922058105469, 90.7368392944336, 92.69446563720703, 94.65208435058594, 96.60971069335938, 98.56732940673828, 100.52494812011719]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 2.0, 6.0, 7.0, 6.0, 9.0, 5.0, 14.0, 11.0, 9.0, 14.0, 15.0, 10.0, 12.0, 24.0, 24.0, 22.0, 21.0, 31.0, 36.0, 46.0, 34.0, 35.0, 33.0, 40.0, 37.0, 47.0, 44.0, 44.0, 32.0, 32.0, 33.0, 32.0, 22.0, 29.0, 21.0, 23.0, 15.0, 19.0, 19.0, 15.0, 12.0, 13.0, 7.0, 10.0, 11.0, 10.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-17.156578063964844, -16.627605438232422, -16.098630905151367, -15.569657325744629, -15.04068374633789, -14.511711120605469, -13.98273754119873, -13.453763961791992, -12.924790382385254, -12.395816802978516, -11.866843223571777, -11.337869644165039, -10.808897018432617, -10.279922485351562, -9.75094985961914, -9.221976280212402, -8.693002700805664, -8.164029121398926, -7.6350555419921875, -7.106082439422607, -6.577108860015869, -6.048135280609131, -5.519162178039551, -4.9901885986328125, -4.461215019226074, -3.932241439819336, -3.4032680988311768, -2.8742947578430176, -2.3453211784362793, -1.816347599029541, -1.2873742580413818, -0.7584009170532227, -0.2294292449951172, 0.29954421520233154, 0.8285176753997803, 1.357491135597229, 1.8864645957946777, 2.415438175201416, 2.944411516189575, 3.4733848571777344, 4.002358436584473, 4.531332015991211, 5.060305595397949, 5.589278697967529, 6.118252277374268, 6.647225856781006, 7.176198959350586, 7.705172538757324, 8.234146118164062, 8.7631196975708, 9.292093276977539, 9.821066856384277, 10.350040435791016, 10.879013061523438, 11.407986640930176, 11.936960220336914, 12.465933799743652, 12.99490737915039, 13.523880958557129, 14.052854537963867, 14.581827163696289, 15.110801696777344, 15.639774322509766, 16.168746948242188, 16.697721481323242]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 6.0, 6.0, 5.0, 5.0, 10.0, 12.0, 14.0, 16.0, 24.0, 35.0, 46.0, 49.0, 70.0, 106.0, 139.0, 175.0, 246.0, 373.0, 503.0, 725.0, 1098.0, 1705.0, 2889.0, 4884.0, 9743.0, 23589.0, 114503.0, 3953316.0, 46831.0, 15541.0, 7290.0, 3850.0, 2123.0, 1420.0, 906.0, 606.0, 436.0, 274.0, 208.0, 128.0, 106.0, 73.0, 57.0, 39.0, 33.0, 11.0, 19.0, 13.0, 8.0, 7.0, 4.0, 4.0, 4.0, 6.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.04913330078125, -0.047655582427978516, -0.04617786407470703, -0.04470014572143555, -0.04322242736816406, -0.04174470901489258, -0.040266990661621094, -0.03878927230834961, -0.037311553955078125, -0.03583383560180664, -0.034356117248535156, -0.03287839889526367, -0.03140068054199219, -0.029922962188720703, -0.02844524383544922, -0.026967525482177734, -0.02548980712890625, -0.024012088775634766, -0.02253437042236328, -0.021056652069091797, -0.019578933715820312, -0.018101215362548828, -0.016623497009277344, -0.01514577865600586, -0.013668060302734375, -0.01219034194946289, -0.010712623596191406, -0.009234905242919922, -0.0077571868896484375, -0.006279468536376953, -0.004801750183105469, -0.0033240318298339844, -0.0018463134765625, -0.0003685951232910156, 0.0011091232299804688, 0.002586841583251953, 0.0040645599365234375, 0.005542278289794922, 0.007019996643066406, 0.00849771499633789, 0.009975433349609375, 0.01145315170288086, 0.012930870056152344, 0.014408588409423828, 0.015886306762695312, 0.017364025115966797, 0.01884174346923828, 0.020319461822509766, 0.02179718017578125, 0.023274898529052734, 0.02475261688232422, 0.026230335235595703, 0.027708053588867188, 0.029185771942138672, 0.030663490295410156, 0.03214120864868164, 0.033618927001953125, 0.03509664535522461, 0.036574363708496094, 0.03805208206176758, 0.03952980041503906, 0.04100751876831055, 0.04248523712158203, 0.043962955474853516, 0.045440673828125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 9.0, 4.0, 8.0, 6.0, 8.0, 6.0, 5.0, 8.0, 13.0, 17.0, 24.0, 777.0, 18.0, 11.0, 13.0, 11.0, 8.0, 8.0, 3.0, 8.0, 9.0, 7.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006343841552734375, -0.0061419010162353516, -0.005939960479736328, -0.005738019943237305, -0.005536079406738281, -0.005334138870239258, -0.005132198333740234, -0.004930257797241211, -0.0047283172607421875, -0.004526376724243164, -0.004324436187744141, -0.004122495651245117, -0.003920555114746094, -0.0037186145782470703, -0.003516674041748047, -0.0033147335052490234, -0.00311279296875, -0.0029108524322509766, -0.002708911895751953, -0.0025069713592529297, -0.0023050308227539062, -0.002103090286254883, -0.0019011497497558594, -0.001699209213256836, -0.0014972686767578125, -0.001295328140258789, -0.0010933876037597656, -0.0008914470672607422, -0.0006895065307617188, -0.0004875659942626953, -0.0002856254577636719, -8.368492126464844e-05, 0.000118255615234375, 0.00032019615173339844, 0.0005221366882324219, 0.0007240772247314453, 0.0009260177612304688, 0.0011279582977294922, 0.0013298988342285156, 0.001531839370727539, 0.0017337799072265625, 0.001935720443725586, 0.0021376609802246094, 0.002339601516723633, 0.0025415420532226562, 0.0027434825897216797, 0.002945423126220703, 0.0031473636627197266, 0.00334930419921875, 0.0035512447357177734, 0.003753185272216797, 0.00395512580871582, 0.004157066345214844, 0.004359006881713867, 0.004560947418212891, 0.004762887954711914, 0.0049648284912109375, 0.005166769027709961, 0.005368709564208984, 0.005570650100708008, 0.005772590637207031, 0.005974531173706055, 0.006176471710205078, 0.0063784122467041016, 0.006580352783203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 9.0, 6.0, 13.0, 13.0, 21.0, 21.0, 43.0, 64.0, 83.0, 111.0, 149.0, 257.0, 389.0, 629.0, 1174.0, 2631.0, 8485.0, 47466.0, 788289.0, 3247372.0, 78512.0, 11734.0, 3394.0, 1367.0, 757.0, 433.0, 256.0, 190.0, 108.0, 91.0, 60.0, 43.0, 30.0, 20.0, 20.0, 15.0, 9.0, 5.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0667724609375, -0.06455516815185547, -0.06233787536621094, -0.060120582580566406, -0.057903289794921875, -0.055685997009277344, -0.05346870422363281, -0.05125141143798828, -0.04903411865234375, -0.04681682586669922, -0.04459953308105469, -0.042382240295410156, -0.040164947509765625, -0.037947654724121094, -0.03573036193847656, -0.03351306915283203, -0.0312957763671875, -0.02907848358154297, -0.026861190795898438, -0.024643898010253906, -0.022426605224609375, -0.020209312438964844, -0.017992019653320312, -0.01577472686767578, -0.01355743408203125, -0.011340141296386719, -0.009122848510742188, -0.006905555725097656, -0.004688262939453125, -0.0024709701538085938, -0.0002536773681640625, 0.0019636154174804688, 0.004180908203125, 0.006398200988769531, 0.008615493774414062, 0.010832786560058594, 0.013050079345703125, 0.015267372131347656, 0.017484664916992188, 0.01970195770263672, 0.02191925048828125, 0.02413654327392578, 0.026353836059570312, 0.028571128845214844, 0.030788421630859375, 0.033005714416503906, 0.03522300720214844, 0.03744029998779297, 0.0396575927734375, 0.04187488555908203, 0.04409217834472656, 0.046309471130371094, 0.048526763916015625, 0.050744056701660156, 0.05296134948730469, 0.05517864227294922, 0.05739593505859375, 0.05961322784423828, 0.06183052062988281, 0.06404781341552734, 0.06626510620117188, 0.0684823989868164, 0.07069969177246094, 0.07291698455810547, 0.07513427734375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 2.0, 6.0, 10.0, 10.0, 13.0, 12.0, 12.0, 19.0, 18.0, 21.0, 39.0, 49.0, 59.0, 69.0, 95.0, 136.0, 150.0, 165.0, 337.0, 1063.0, 668.0, 264.0, 181.0, 141.0, 93.0, 99.0, 68.0, 67.0, 38.0, 43.0, 19.0, 18.0, 22.0, 11.0, 10.0, 12.0, 11.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00740814208984375, -0.007132172584533691, -0.006856203079223633, -0.006580233573913574, -0.006304264068603516, -0.006028294563293457, -0.0057523250579833984, -0.00547635555267334, -0.005200386047363281, -0.004924416542053223, -0.004648447036743164, -0.0043724775314331055, -0.004096508026123047, -0.0038205385208129883, -0.0035445690155029297, -0.003268599510192871, -0.0029926300048828125, -0.002716660499572754, -0.0024406909942626953, -0.0021647214889526367, -0.0018887519836425781, -0.0016127824783325195, -0.001336812973022461, -0.0010608434677124023, -0.0007848739624023438, -0.0005089044570922852, -0.00023293495178222656, 4.303455352783203e-05, 0.0003190040588378906, 0.0005949735641479492, 0.0008709430694580078, 0.0011469125747680664, 0.001422882080078125, 0.0016988515853881836, 0.001974821090698242, 0.0022507905960083008, 0.0025267601013183594, 0.002802729606628418, 0.0030786991119384766, 0.003354668617248535, 0.0036306381225585938, 0.003906607627868652, 0.004182577133178711, 0.0044585466384887695, 0.004734516143798828, 0.005010485649108887, 0.005286455154418945, 0.005562424659729004, 0.0058383941650390625, 0.006114363670349121, 0.00639033317565918, 0.006666302680969238, 0.006942272186279297, 0.0072182416915893555, 0.007494211196899414, 0.007770180702209473, 0.008046150207519531, 0.00832211971282959, 0.008598089218139648, 0.008874058723449707, 0.009150028228759766, 0.009425997734069824, 0.009701967239379883, 0.009977936744689941, 0.01025390625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 17.0, 33.0, 89.0, 214.0, 353.0, 174.0, 73.0, 20.0, 10.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07552838325500488, -0.07091432809829712, -0.06630027294158936, -0.06168622151017189, -0.057072170078754425, -0.05245811492204666, -0.0478440597653389, -0.04323000833392143, -0.03861595317721367, -0.034001898020505905, -0.02938784658908844, -0.024773791432380676, -0.020159738138318062, -0.015545684844255447, -0.010931629687547684, -0.0063175782561302185, -0.0017035230994224548, 0.002910530660301447, 0.007524584420025349, 0.012138638645410538, 0.016752691939473152, 0.021366745233535767, 0.02598080039024353, 0.030594851821660995, 0.03520890697836876, 0.03982296213507652, 0.04443701356649399, 0.04905106872320175, 0.053665123879909515, 0.05827917531132698, 0.06289322674274445, 0.06750728189945221, 0.07212133705615997, 0.07673539221286774, 0.0813494473695755, 0.08596350252628326, 0.09057755023241043, 0.0951916053891182, 0.09980566054582596, 0.10441970825195312, 0.10903376340866089, 0.11364781856536865, 0.11826187372207642, 0.12287592887878418, 0.12748998403549194, 0.1321040391921997, 0.13671809434890747, 0.14133213460445404, 0.145946204662323, 0.15056025981903076, 0.15517431497573853, 0.1597883701324463, 0.16440242528915405, 0.16901648044586182, 0.17363053560256958, 0.17824457585811615, 0.1828586310148239, 0.18747268617153168, 0.19208674132823944, 0.1967007964849472, 0.20131485164165497, 0.20592889189720154, 0.2105429470539093, 0.21515700221061707, 0.21977105736732483]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 3.0, 11.0, 5.0, 11.0, 12.0, 21.0, 21.0, 21.0, 29.0, 30.0, 42.0, 40.0, 40.0, 47.0, 66.0, 57.0, 64.0, 58.0, 41.0, 48.0, 48.0, 41.0, 36.0, 39.0, 25.0, 30.0, 28.0, 15.0, 14.0, 11.0, 14.0, 9.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038662850856781006, -0.03730905055999756, -0.03595525026321411, -0.034601449966430664, -0.03324764966964722, -0.03189384937286377, -0.030540049076080322, -0.029186248779296875, -0.027832448482513428, -0.02647864818572998, -0.025124847888946533, -0.023771047592163086, -0.02241724729537964, -0.02106344699859619, -0.019709646701812744, -0.018355846405029297, -0.01700204610824585, -0.015648245811462402, -0.014294445514678955, -0.012940645217895508, -0.01158684492111206, -0.010233044624328613, -0.008879244327545166, -0.007525444030761719, -0.0061716437339782715, -0.004817843437194824, -0.003464043140411377, -0.0021102428436279297, -0.0007564425468444824, 0.0005973577499389648, 0.0019511580467224121, 0.0033049583435058594, 0.004658758640289307, 0.006012558937072754, 0.007366359233856201, 0.008720159530639648, 0.010073959827423096, 0.011427760124206543, 0.01278156042098999, 0.014135360717773438, 0.015489161014556885, 0.016842961311340332, 0.01819676160812378, 0.019550561904907227, 0.020904362201690674, 0.02225816249847412, 0.02361196279525757, 0.024965763092041016, 0.026319563388824463, 0.02767336368560791, 0.029027163982391357, 0.030380964279174805, 0.03173476457595825, 0.0330885648727417, 0.034442365169525146, 0.035796165466308594, 0.03714996576309204, 0.03850376605987549, 0.039857566356658936, 0.04121136665344238, 0.04256516695022583, 0.04391896724700928, 0.045272767543792725, 0.04662656784057617, 0.04798036813735962]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 7.0, 15.0, 7.0, 22.0, 31.0, 42.0, 42.0, 60.0, 84.0, 118.0, 158.0, 191.0, 248.0, 368.0, 519.0, 729.0, 977.0, 1423.0, 2212.0, 3449.0, 5493.0, 10155.0, 21172.0, 183726.0, 761162.0, 26370.0, 11645.0, 6416.0, 3797.0, 2381.0, 1660.0, 1088.0, 762.0, 507.0, 403.0, 304.0, 196.0, 153.0, 126.0, 102.0, 47.0, 41.0, 32.0, 42.0, 30.0, 9.0, 11.0, 7.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.05352783203125, -0.051860809326171875, -0.05019378662109375, -0.048526763916015625, -0.0468597412109375, -0.045192718505859375, -0.04352569580078125, -0.041858673095703125, -0.040191650390625, -0.038524627685546875, -0.03685760498046875, -0.035190582275390625, -0.0335235595703125, -0.031856536865234375, -0.03018951416015625, -0.028522491455078125, -0.02685546875, -0.025188446044921875, -0.02352142333984375, -0.021854400634765625, -0.0201873779296875, -0.018520355224609375, -0.01685333251953125, -0.015186309814453125, -0.013519287109375, -0.011852264404296875, -0.01018524169921875, -0.008518218994140625, -0.0068511962890625, -0.005184173583984375, -0.00351715087890625, -0.001850128173828125, -0.00018310546875, 0.001483917236328125, 0.00315093994140625, 0.004817962646484375, 0.0064849853515625, 0.008152008056640625, 0.00981903076171875, 0.011486053466796875, 0.013153076171875, 0.014820098876953125, 0.01648712158203125, 0.018154144287109375, 0.0198211669921875, 0.021488189697265625, 0.02315521240234375, 0.024822235107421875, 0.0264892578125, 0.028156280517578125, 0.02982330322265625, 0.031490325927734375, 0.0331573486328125, 0.034824371337890625, 0.03649139404296875, 0.038158416748046875, 0.039825439453125, 0.041492462158203125, 0.04315948486328125, 0.044826507568359375, 0.0464935302734375, 0.048160552978515625, 0.04982757568359375, 0.051494598388671875, 0.05316162109375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 4.0, 5.0, 8.0, 8.0, 8.0, 7.0, 20.0, 90.0, 335.0, 315.0, 85.0, 16.0, 11.0, 14.0, 9.0, 4.0, 5.0, 7.0, 7.0, 8.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0061492919921875, -0.005951344966888428, -0.0057533979415893555, -0.005555450916290283, -0.005357503890991211, -0.005159556865692139, -0.004961609840393066, -0.004763662815093994, -0.004565715789794922, -0.00436776876449585, -0.004169821739196777, -0.003971874713897705, -0.003773927688598633, -0.0035759806632995605, -0.0033780336380004883, -0.003180086612701416, -0.0029821395874023438, -0.0027841925621032715, -0.0025862455368041992, -0.002388298511505127, -0.0021903514862060547, -0.0019924044609069824, -0.0017944574356079102, -0.0015965104103088379, -0.0013985633850097656, -0.0012006163597106934, -0.001002669334411621, -0.0008047223091125488, -0.0006067752838134766, -0.0004088282585144043, -0.00021088123321533203, -1.2934207916259766e-05, 0.0001850128173828125, 0.00038295984268188477, 0.000580906867980957, 0.0007788538932800293, 0.0009768009185791016, 0.0011747479438781738, 0.001372694969177246, 0.0015706419944763184, 0.0017685890197753906, 0.001966536045074463, 0.002164483070373535, 0.0023624300956726074, 0.0025603771209716797, 0.002758324146270752, 0.0029562711715698242, 0.0031542181968688965, 0.0033521652221679688, 0.003550112247467041, 0.0037480592727661133, 0.0039460062980651855, 0.004143953323364258, 0.00434190034866333, 0.004539847373962402, 0.004737794399261475, 0.004935741424560547, 0.005133688449859619, 0.005331635475158691, 0.005529582500457764, 0.005727529525756836, 0.005925476551055908, 0.0061234235763549805, 0.006321370601654053, 0.006519317626953125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 5.0, 11.0, 18.0, 22.0, 19.0, 25.0, 42.0, 64.0, 93.0, 115.0, 159.0, 236.0, 346.0, 564.0, 870.0, 1415.0, 2688.0, 5817.0, 17034.0, 151925.0, 806225.0, 42175.0, 9442.0, 4019.0, 1968.0, 1089.0, 737.0, 419.0, 274.0, 198.0, 146.0, 118.0, 81.0, 46.0, 40.0, 23.0, 20.0, 22.0, 10.0, 11.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08587646484375, -0.08283805847167969, -0.07979965209960938, -0.07676124572753906, -0.07372283935546875, -0.07068443298339844, -0.06764602661132812, -0.06460762023925781, -0.0615692138671875, -0.05853080749511719, -0.055492401123046875, -0.05245399475097656, -0.04941558837890625, -0.04637718200683594, -0.043338775634765625, -0.04030036926269531, -0.037261962890625, -0.03422355651855469, -0.031185150146484375, -0.028146743774414062, -0.02510833740234375, -0.022069931030273438, -0.019031524658203125, -0.015993118286132812, -0.0129547119140625, -0.009916305541992188, -0.006877899169921875, -0.0038394927978515625, -0.00080108642578125, 0.0022373199462890625, 0.005275726318359375, 0.008314132690429688, 0.0113525390625, 0.014390945434570312, 0.017429351806640625, 0.020467758178710938, 0.02350616455078125, 0.026544570922851562, 0.029582977294921875, 0.03262138366699219, 0.0356597900390625, 0.03869819641113281, 0.041736602783203125, 0.04477500915527344, 0.04781341552734375, 0.05085182189941406, 0.053890228271484375, 0.05692863464355469, 0.059967041015625, 0.06300544738769531, 0.06604385375976562, 0.06908226013183594, 0.07212066650390625, 0.07515907287597656, 0.07819747924804688, 0.08123588562011719, 0.0842742919921875, 0.08731269836425781, 0.09035110473632812, 0.09338951110839844, 0.09642791748046875, 0.09946632385253906, 0.10250473022460938, 0.10554313659667969, 0.10858154296875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 4.0, 3.0, 12.0, 8.0, 11.0, 9.0, 9.0, 14.0, 15.0, 19.0, 21.0, 22.0, 26.0, 29.0, 39.0, 36.0, 39.0, 38.0, 35.0, 34.0, 33.0, 43.0, 39.0, 31.0, 39.0, 38.0, 38.0, 25.0, 33.0, 43.0, 38.0, 21.0, 21.0, 15.0, 17.0, 12.0, 19.0, 12.0, 16.0, 9.0, 8.0, 5.0, 4.0, 6.0, 6.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0231475830078125, -0.022372007369995117, -0.021596431732177734, -0.02082085609436035, -0.02004528045654297, -0.019269704818725586, -0.018494129180908203, -0.01771855354309082, -0.016942977905273438, -0.016167402267456055, -0.015391826629638672, -0.014616250991821289, -0.013840675354003906, -0.013065099716186523, -0.01228952407836914, -0.011513948440551758, -0.010738372802734375, -0.009962797164916992, -0.00918722152709961, -0.008411645889282227, -0.007636070251464844, -0.006860494613647461, -0.006084918975830078, -0.005309343338012695, -0.0045337677001953125, -0.0037581920623779297, -0.002982616424560547, -0.002207040786743164, -0.0014314651489257812, -0.0006558895111083984, 0.00011968612670898438, 0.0008952617645263672, 0.00167083740234375, 0.002446413040161133, 0.0032219886779785156, 0.0039975643157958984, 0.004773139953613281, 0.005548715591430664, 0.006324291229248047, 0.00709986686706543, 0.007875442504882812, 0.008651018142700195, 0.009426593780517578, 0.010202169418334961, 0.010977745056152344, 0.011753320693969727, 0.01252889633178711, 0.013304471969604492, 0.014080047607421875, 0.014855623245239258, 0.01563119888305664, 0.016406774520874023, 0.017182350158691406, 0.01795792579650879, 0.018733501434326172, 0.019509077072143555, 0.020284652709960938, 0.02106022834777832, 0.021835803985595703, 0.022611379623413086, 0.02338695526123047, 0.02416253089904785, 0.024938106536865234, 0.025713682174682617, 0.0264892578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 7.0, 10.0, 8.0, 8.0, 27.0, 34.0, 51.0, 65.0, 101.0, 181.0, 281.0, 593.0, 1306.0, 3519.0, 17059.0, 947592.0, 67436.0, 6433.0, 1999.0, 835.0, 401.0, 220.0, 129.0, 86.0, 48.0, 47.0, 26.0, 16.0, 9.0, 10.0, 5.0, 1.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1224365234375, -0.11900997161865234, -0.11558341979980469, -0.11215686798095703, -0.10873031616210938, -0.10530376434326172, -0.10187721252441406, -0.0984506607055664, -0.09502410888671875, -0.0915975570678711, -0.08817100524902344, -0.08474445343017578, -0.08131790161132812, -0.07789134979248047, -0.07446479797363281, -0.07103824615478516, -0.0676116943359375, -0.06418514251708984, -0.06075859069824219, -0.05733203887939453, -0.053905487060546875, -0.05047893524169922, -0.04705238342285156, -0.043625831604003906, -0.04019927978515625, -0.036772727966308594, -0.03334617614746094, -0.02991962432861328, -0.026493072509765625, -0.02306652069091797, -0.019639968872070312, -0.016213417053222656, -0.012786865234375, -0.009360313415527344, -0.0059337615966796875, -0.0025072097778320312, 0.000919342041015625, 0.004345893859863281, 0.0077724456787109375, 0.011198997497558594, 0.01462554931640625, 0.018052101135253906, 0.021478652954101562, 0.02490520477294922, 0.028331756591796875, 0.03175830841064453, 0.03518486022949219, 0.038611412048339844, 0.0420379638671875, 0.045464515686035156, 0.04889106750488281, 0.05231761932373047, 0.055744171142578125, 0.05917072296142578, 0.06259727478027344, 0.0660238265991211, 0.06945037841796875, 0.0728769302368164, 0.07630348205566406, 0.07973003387451172, 0.08315658569335938, 0.08658313751220703, 0.09000968933105469, 0.09343624114990234, 0.09686279296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 7.0, 8.0, 9.0, 11.0, 13.0, 14.0, 21.0, 45.0, 41.0, 61.0, 54.0, 72.0, 116.0, 93.0, 62.0, 81.0, 60.0, 46.0, 42.0, 31.0, 28.0, 15.0, 14.0, 12.0, 11.0, 2.0, 4.0, 7.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-9.834766387939453e-06, -9.57585871219635e-06, -9.316951036453247e-06, -9.058043360710144e-06, -8.799135684967041e-06, -8.540228009223938e-06, -8.281320333480835e-06, -8.022412657737732e-06, -7.763504981994629e-06, -7.504597306251526e-06, -7.245689630508423e-06, -6.98678195476532e-06, -6.727874279022217e-06, -6.468966603279114e-06, -6.210058927536011e-06, -5.951151251792908e-06, -5.692243576049805e-06, -5.433335900306702e-06, -5.174428224563599e-06, -4.915520548820496e-06, -4.656612873077393e-06, -4.3977051973342896e-06, -4.1387975215911865e-06, -3.8798898458480835e-06, -3.6209821701049805e-06, -3.3620744943618774e-06, -3.1031668186187744e-06, -2.8442591428756714e-06, -2.5853514671325684e-06, -2.3264437913894653e-06, -2.0675361156463623e-06, -1.8086284399032593e-06, -1.5497207641601562e-06, -1.2908130884170532e-06, -1.0319054126739502e-06, -7.729977369308472e-07, -5.140900611877441e-07, -2.551823854446411e-07, 3.725290298461914e-09, 2.6263296604156494e-07, 5.21540641784668e-07, 7.80448317527771e-07, 1.039355993270874e-06, 1.298263669013977e-06, 1.55717134475708e-06, 1.816079020500183e-06, 2.074986696243286e-06, 2.333894371986389e-06, 2.592802047729492e-06, 2.8517097234725952e-06, 3.1106173992156982e-06, 3.3695250749588013e-06, 3.6284327507019043e-06, 3.887340426445007e-06, 4.14624810218811e-06, 4.405155777931213e-06, 4.664063453674316e-06, 4.9229711294174194e-06, 5.1818788051605225e-06, 5.4407864809036255e-06, 5.6996941566467285e-06, 5.9586018323898315e-06, 6.2175095081329346e-06, 6.476417183876038e-06, 6.735324859619141e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 3.0, 3.0, 3.0, 8.0, 16.0, 30.0, 28.0, 32.0, 50.0, 79.0, 147.0, 246.0, 415.0, 878.0, 1830.0, 5526.0, 28361.0, 947938.0, 50779.0, 7694.0, 2305.0, 1001.0, 461.0, 283.0, 128.0, 109.0, 81.0, 39.0, 20.0, 20.0, 12.0, 11.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2144775390625, -0.20845603942871094, -0.20243453979492188, -0.1964130401611328, -0.19039154052734375, -0.1843700408935547, -0.17834854125976562, -0.17232704162597656, -0.1663055419921875, -0.16028404235839844, -0.15426254272460938, -0.1482410430908203, -0.14221954345703125, -0.1361980438232422, -0.13017654418945312, -0.12415504455566406, -0.118133544921875, -0.11211204528808594, -0.10609054565429688, -0.10006904602050781, -0.09404754638671875, -0.08802604675292969, -0.08200454711914062, -0.07598304748535156, -0.0699615478515625, -0.06394004821777344, -0.057918548583984375, -0.05189704895019531, -0.04587554931640625, -0.03985404968261719, -0.033832550048828125, -0.027811050415039062, -0.02178955078125, -0.015768051147460938, -0.009746551513671875, -0.0037250518798828125, 0.00229644775390625, 0.008317947387695312, 0.014339447021484375, 0.020360946655273438, 0.0263824462890625, 0.03240394592285156, 0.038425445556640625, 0.04444694519042969, 0.05046844482421875, 0.05648994445800781, 0.06251144409179688, 0.06853294372558594, 0.074554443359375, 0.08057594299316406, 0.08659744262695312, 0.09261894226074219, 0.09864044189453125, 0.10466194152832031, 0.11068344116210938, 0.11670494079589844, 0.1227264404296875, 0.12874794006347656, 0.13476943969726562, 0.1407909393310547, 0.14681243896484375, 0.1528339385986328, 0.15885543823242188, 0.16487693786621094, 0.1708984375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 4.0, 6.0, 5.0, 11.0, 10.0, 2.0, 9.0, 17.0, 12.0, 7.0, 20.0, 26.0, 65.0, 116.0, 441.0, 90.0, 41.0, 34.0, 23.0, 14.0, 7.0, 7.0, 6.0, 4.0, 3.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10614013671875, -0.10286331176757812, -0.09958648681640625, -0.09630966186523438, -0.0930328369140625, -0.08975601196289062, -0.08647918701171875, -0.08320236206054688, -0.079925537109375, -0.07664871215820312, -0.07337188720703125, -0.07009506225585938, -0.0668182373046875, -0.06354141235351562, -0.06026458740234375, -0.056987762451171875, -0.0537109375, -0.050434112548828125, -0.04715728759765625, -0.043880462646484375, -0.0406036376953125, -0.037326812744140625, -0.03404998779296875, -0.030773162841796875, -0.027496337890625, -0.024219512939453125, -0.02094268798828125, -0.017665863037109375, -0.0143890380859375, -0.011112213134765625, -0.00783538818359375, -0.004558563232421875, -0.00128173828125, 0.001995086669921875, 0.00527191162109375, 0.008548736572265625, 0.0118255615234375, 0.015102386474609375, 0.01837921142578125, 0.021656036376953125, 0.024932861328125, 0.028209686279296875, 0.03148651123046875, 0.034763336181640625, 0.0380401611328125, 0.041316986083984375, 0.04459381103515625, 0.047870635986328125, 0.0511474609375, 0.054424285888671875, 0.05770111083984375, 0.060977935791015625, 0.0642547607421875, 0.06753158569335938, 0.07080841064453125, 0.07408523559570312, 0.077362060546875, 0.08063888549804688, 0.08391571044921875, 0.08719253540039062, 0.0904693603515625, 0.09374618530273438, 0.09702301025390625, 0.10029983520507812, 0.10357666015625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 9.0, 6.0, 19.0, 30.0, 171.0, 565.0, 129.0, 28.0, 18.0, 12.0, 3.0, 3.0, 3.0, 5.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5227593183517456, -1.4849562644958496, -1.4471532106399536, -1.4093501567840576, -1.3715471029281616, -1.3337440490722656, -1.2959409952163696, -1.2581379413604736, -1.220334768295288, -1.182531714439392, -1.144728660583496, -1.1069256067276, -1.069122552871704, -1.031319499015808, -0.9935163855552673, -0.9557133316993713, -0.9179103374481201, -0.8801072835922241, -0.8423042297363281, -0.8045011758804321, -0.7666981220245361, -0.7288950681686401, -0.6910919547080994, -0.6532889008522034, -0.6154858469963074, -0.5776827931404114, -0.5398797392845154, -0.5020766854286194, -0.464273601770401, -0.426470547914505, -0.3886674642562866, -0.3508644104003906, -0.31306129693984985, -0.27525824308395386, -0.23745517432689667, -0.19965210556983948, -0.16184905171394348, -0.12404599785804749, -0.0862429291009903, -0.048439860343933105, -0.01063680648803711, 0.027166254818439484, 0.06496931612491608, 0.10277237743139267, 0.14057543873786926, 0.17837849259376526, 0.21618156135082245, 0.25398463010787964, 0.29178768396377563, 0.32959073781967163, 0.3673937916755676, 0.405196875333786, 0.442999929189682, 0.480802983045578, 0.5186060667037964, 0.5564091205596924, 0.5942121744155884, 0.6320152282714844, 0.6698182821273804, 0.7076213359832764, 0.7454243898391724, 0.7832274436950684, 0.8210305571556091, 0.8588336110115051, 0.8966366648674011]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 2.0, 0.0, 0.0, 4.0, 3.0, 5.0, 3.0, 5.0, 9.0, 6.0, 21.0, 22.0, 33.0, 58.0, 71.0, 137.0, 137.0, 124.0, 122.0, 88.0, 50.0, 38.0, 25.0, 8.0, 11.0, 3.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6240644454956055, -0.6043663024902344, -0.5846681594848633, -0.5649700164794922, -0.5452718734741211, -0.52557373046875, -0.5058755874633789, -0.4861774444580078, -0.4664793014526367, -0.4467811584472656, -0.42708301544189453, -0.40738487243652344, -0.38768672943115234, -0.36798858642578125, -0.34829044342041016, -0.32859230041503906, -0.30889415740966797, -0.2891960144042969, -0.2694978713989258, -0.2497997283935547, -0.2301015853881836, -0.2104034423828125, -0.1907052993774414, -0.1710071563720703, -0.15130901336669922, -0.13161087036132812, -0.11191272735595703, -0.09221458435058594, -0.07251644134521484, -0.05281829833984375, -0.033120155334472656, -0.013422012329101562, 0.006276071071624756, 0.02597421407699585, 0.04567235708236694, 0.06537050008773804, 0.08506864309310913, 0.10476678609848022, 0.12446492910385132, 0.1441630721092224, 0.1638612151145935, 0.1835593581199646, 0.2032575011253357, 0.2229556441307068, 0.24265378713607788, 0.262351930141449, 0.28205007314682007, 0.30174821615219116, 0.32144635915756226, 0.34114450216293335, 0.36084264516830444, 0.38054078817367554, 0.40023893117904663, 0.4199370741844177, 0.4396352171897888, 0.4593333601951599, 0.479031503200531, 0.4987296462059021, 0.5184277892112732, 0.5381259322166443, 0.5578240752220154, 0.5775222182273865, 0.5972203612327576, 0.6169185042381287, 0.6366166472434998]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 10.0, 9.0, 12.0, 13.0, 11.0, 17.0, 35.0, 40.0, 125.0, 1086.0, 42800.0, 4146638.0, 3044.0, 189.0, 74.0, 36.0, 22.0, 22.0, 21.0, 13.0, 8.0, 5.0, 5.0, 4.0, 7.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.390625, -5.2232666015625, -5.055908203125, -4.8885498046875, -4.72119140625, -4.5538330078125, -4.386474609375, -4.2191162109375, -4.0517578125, -3.8843994140625, -3.717041015625, -3.5496826171875, -3.38232421875, -3.2149658203125, -3.047607421875, -2.8802490234375, -2.712890625, -2.5455322265625, -2.378173828125, -2.2108154296875, -2.04345703125, -1.8760986328125, -1.708740234375, -1.5413818359375, -1.3740234375, -1.2066650390625, -1.039306640625, -0.8719482421875, -0.70458984375, -0.5372314453125, -0.369873046875, -0.2025146484375, -0.03515625, 0.1322021484375, 0.299560546875, 0.4669189453125, 0.63427734375, 0.8016357421875, 0.968994140625, 1.1363525390625, 1.3037109375, 1.4710693359375, 1.638427734375, 1.8057861328125, 1.97314453125, 2.1405029296875, 2.307861328125, 2.4752197265625, 2.642578125, 2.8099365234375, 2.977294921875, 3.1446533203125, 3.31201171875, 3.4793701171875, 3.646728515625, 3.8140869140625, 3.9814453125, 4.1488037109375, 4.316162109375, 4.4835205078125, 4.65087890625, 4.8182373046875, 4.985595703125, 5.1529541015625, 5.3203125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 4.0, 5.0, 4.0, 6.0, 5.0, 6.0, 13.0, 21.0, 42.0, 80.0, 139.0, 194.0, 171.0, 113.0, 62.0, 24.0, 22.0, 11.0, 6.0, 6.0, 8.0, 8.0, 5.0, 4.0, 6.0, 3.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004169464111328125, -0.004033923149108887, -0.0038983821868896484, -0.00376284122467041, -0.003627300262451172, -0.0034917593002319336, -0.0033562183380126953, -0.003220677375793457, -0.0030851364135742188, -0.0029495954513549805, -0.002814054489135742, -0.002678513526916504, -0.0025429725646972656, -0.0024074316024780273, -0.002271890640258789, -0.0021363496780395508, -0.0020008087158203125, -0.0018652677536010742, -0.001729726791381836, -0.0015941858291625977, -0.0014586448669433594, -0.001323103904724121, -0.0011875629425048828, -0.0010520219802856445, -0.0009164810180664062, -0.000780940055847168, -0.0006453990936279297, -0.0005098581314086914, -0.0003743171691894531, -0.00023877620697021484, -0.00010323524475097656, 3.230571746826172e-05, 0.0001678466796875, 0.0003033876419067383, 0.00043892860412597656, 0.0005744695663452148, 0.0007100105285644531, 0.0008455514907836914, 0.0009810924530029297, 0.001116633415222168, 0.0012521743774414062, 0.0013877153396606445, 0.0015232563018798828, 0.001658797264099121, 0.0017943382263183594, 0.0019298791885375977, 0.002065420150756836, 0.0022009611129760742, 0.0023365020751953125, 0.0024720430374145508, 0.002607583999633789, 0.0027431249618530273, 0.0028786659240722656, 0.003014206886291504, 0.003149747848510742, 0.0032852888107299805, 0.0034208297729492188, 0.003556370735168457, 0.0036919116973876953, 0.0038274526596069336, 0.003962993621826172, 0.00409853458404541, 0.0042340755462646484, 0.004369616508483887, 0.004505157470703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 11.0, 7.0, 6.0, 10.0, 9.0, 14.0, 23.0, 25.0, 32.0, 40.0, 50.0, 67.0, 89.0, 87.0, 141.0, 125.0, 199.0, 527.0, 15317.0, 4174204.0, 2606.0, 209.0, 119.0, 105.0, 78.0, 53.0, 36.0, 36.0, 18.0, 16.0, 8.0, 1.0, 2.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.447265625, -1.4104843139648438, -1.3737030029296875, -1.3369216918945312, -1.300140380859375, -1.2633590698242188, -1.2265777587890625, -1.1897964477539062, -1.15301513671875, -1.1162338256835938, -1.0794525146484375, -1.0426712036132812, -1.005889892578125, -0.9691085815429688, -0.9323272705078125, -0.8955459594726562, -0.8587646484375, -0.8219833374023438, -0.7852020263671875, -0.7484207153320312, -0.711639404296875, -0.6748580932617188, -0.6380767822265625, -0.6012954711914062, -0.56451416015625, -0.5277328491210938, -0.4909515380859375, -0.45417022705078125, -0.417388916015625, -0.38060760498046875, -0.3438262939453125, -0.30704498291015625, -0.270263671875, -0.23348236083984375, -0.1967010498046875, -0.15991973876953125, -0.123138427734375, -0.08635711669921875, -0.0495758056640625, -0.01279449462890625, 0.02398681640625, 0.06076812744140625, 0.0975494384765625, 0.13433074951171875, 0.171112060546875, 0.20789337158203125, 0.2446746826171875, 0.28145599365234375, 0.3182373046875, 0.35501861572265625, 0.3917999267578125, 0.42858123779296875, 0.465362548828125, 0.5021438598632812, 0.5389251708984375, 0.5757064819335938, 0.61248779296875, 0.6492691040039062, 0.6860504150390625, 0.7228317260742188, 0.759613037109375, 0.7963943481445312, 0.8331756591796875, 0.8699569702148438, 0.90673828125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 6.0, 3.0, 3.0, 6.0, 5.0, 10.0, 12.0, 12.0, 13.0, 11.0, 13.0, 29.0, 27.0, 34.0, 52.0, 62.0, 80.0, 105.0, 118.0, 149.0, 157.0, 185.0, 266.0, 350.0, 1104.0, 327.0, 216.0, 153.0, 139.0, 120.0, 86.0, 62.0, 51.0, 31.0, 30.0, 14.0, 7.0, 4.0, 13.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.011260986328125, -0.01097559928894043, -0.01069021224975586, -0.010404825210571289, -0.010119438171386719, -0.009834051132202148, -0.009548664093017578, -0.009263277053833008, -0.008977890014648438, -0.008692502975463867, -0.008407115936279297, -0.008121728897094727, -0.007836341857910156, -0.007550954818725586, -0.007265567779541016, -0.006980180740356445, -0.006694793701171875, -0.006409406661987305, -0.006124019622802734, -0.005838632583618164, -0.005553245544433594, -0.0052678585052490234, -0.004982471466064453, -0.004697084426879883, -0.0044116973876953125, -0.004126310348510742, -0.003840923309326172, -0.0035555362701416016, -0.0032701492309570312, -0.002984762191772461, -0.0026993751525878906, -0.0024139881134033203, -0.00212860107421875, -0.0018432140350341797, -0.0015578269958496094, -0.001272439956665039, -0.0009870529174804688, -0.0007016658782958984, -0.0004162788391113281, -0.0001308917999267578, 0.0001544952392578125, 0.0004398822784423828, 0.0007252693176269531, 0.0010106563568115234, 0.0012960433959960938, 0.001581430435180664, 0.0018668174743652344, 0.0021522045135498047, 0.002437591552734375, 0.0027229785919189453, 0.0030083656311035156, 0.003293752670288086, 0.0035791397094726562, 0.0038645267486572266, 0.004149913787841797, 0.004435300827026367, 0.0047206878662109375, 0.005006074905395508, 0.005291461944580078, 0.0055768489837646484, 0.005862236022949219, 0.006147623062133789, 0.006433010101318359, 0.00671839714050293, 0.0070037841796875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 13.0, 106.0, 894.0, 5.0, 2.0], "bins": [-6.651535511016846, -6.543209552764893, -6.4348835945129395, -6.326557159423828, -6.218231201171875, -6.109905242919922, -6.001579284667969, -5.893253326416016, -5.784926891326904, -5.676600933074951, -5.568274974822998, -5.459948539733887, -5.351622581481934, -5.2432966232299805, -5.134970664978027, -5.026644706726074, -4.918318748474121, -4.809992790222168, -4.701666831970215, -4.5933403968811035, -4.48501443862915, -4.376688480377197, -4.268362522125244, -4.160036563873291, -4.05171012878418, -3.9433841705322266, -3.8350579738616943, -3.726732015609741, -3.618405818939209, -3.510079860687256, -3.4017539024353027, -3.2934277057647705, -3.1851015090942383, -3.076775550842285, -2.968449354171753, -2.8601233959198, -2.7517971992492676, -2.6434712409973145, -2.5351452827453613, -2.426819086074829, -2.318493127822876, -2.210167169570923, -2.1018409729003906, -1.9935150146484375, -1.8851889371871948, -1.7768628597259521, -1.6685367822647095, -1.5602107048034668, -1.4518847465515137, -1.343558669090271, -1.2352325916290283, -1.1269066333770752, -1.0185805559158325, -0.9102544784545898, -0.8019284009933472, -0.6936023831367493, -0.5852762460708618, -0.47695019841194153, -0.36862415075302124, -0.26029807329177856, -0.15197202563285828, -0.04364597797393799, 0.06468009948730469, 0.1730061173439026, 0.28133219480514526]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 9.0, 6.0, 14.0, 18.0, 31.0, 60.0, 78.0, 88.0, 93.0, 108.0, 115.0, 111.0, 66.0, 67.0, 44.0, 32.0, 19.0, 18.0, 11.0, 8.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4141967296600342, -0.4048404395580292, -0.39548414945602417, -0.3861278295516968, -0.3767715394496918, -0.36741524934768677, -0.35805895924568176, -0.34870266914367676, -0.33934634923934937, -0.32999005913734436, -0.32063376903533936, -0.31127744913101196, -0.30192115902900696, -0.29256486892700195, -0.28320857882499695, -0.27385228872299194, -0.26449596881866455, -0.25513967871665955, -0.24578337371349335, -0.23642708361148834, -0.22707077860832214, -0.21771448850631714, -0.20835819840431213, -0.19900189340114594, -0.18964561820030212, -0.18028932809829712, -0.17093302309513092, -0.16157673299312592, -0.15222042798995972, -0.1428641378879547, -0.1335078477859497, -0.12415154278278351, -0.11479523777961731, -0.10543894022703171, -0.0960826426744461, -0.0867263525724411, -0.0773700475692749, -0.0680137574672699, -0.058657459914684296, -0.049301162362098694, -0.03994486480951309, -0.03058856725692749, -0.021232271566987038, -0.011875975877046585, -0.0025196783244609833, 0.0068366192281246185, 0.016192913055419922, 0.025549210608005524, 0.034905508160591125, 0.04426180571317673, 0.05361810326576233, 0.06297439336776733, 0.07233069837093353, 0.08168698847293854, 0.09104328602552414, 0.10039958357810974, 0.10975588113069534, 0.11911217868328094, 0.12846846878528595, 0.13782477378845215, 0.14718106389045715, 0.15653736889362335, 0.16589365899562836, 0.17524996399879456, 0.18460625410079956]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 0.0, 14.0, 18.0, 16.0, 19.0, 21.0, 33.0, 54.0, 85.0, 95.0, 122.0, 178.0, 247.0, 284.0, 399.0, 502.0, 667.0, 902.0, 1194.0, 1662.0, 2390.0, 3443.0, 5186.0, 8465.0, 15311.0, 38231.0, 333120.0, 542105.0, 48661.0, 17290.0, 9126.0, 5578.0, 3665.0, 2486.0, 1711.0, 1323.0, 979.0, 709.0, 546.0, 388.0, 321.0, 252.0, 203.0, 155.0, 101.0, 78.0, 55.0, 49.0, 39.0, 27.0, 15.0, 6.0, 11.0, 13.0, 4.0, 4.0, 3.0, 5.0], "bins": [-0.045074462890625, -0.04371213912963867, -0.042349815368652344, -0.040987491607666016, -0.03962516784667969, -0.03826284408569336, -0.03690052032470703, -0.0355381965637207, -0.034175872802734375, -0.03281354904174805, -0.03145122528076172, -0.03008890151977539, -0.028726577758789062, -0.027364253997802734, -0.026001930236816406, -0.024639606475830078, -0.02327728271484375, -0.021914958953857422, -0.020552635192871094, -0.019190311431884766, -0.017827987670898438, -0.01646566390991211, -0.015103340148925781, -0.013741016387939453, -0.012378692626953125, -0.011016368865966797, -0.009654045104980469, -0.00829172134399414, -0.0069293975830078125, -0.005567073822021484, -0.004204750061035156, -0.002842426300048828, -0.0014801025390625, -0.00011777877807617188, 0.0012445449829101562, 0.0026068687438964844, 0.0039691925048828125, 0.005331516265869141, 0.006693840026855469, 0.008056163787841797, 0.009418487548828125, 0.010780811309814453, 0.012143135070800781, 0.01350545883178711, 0.014867782592773438, 0.016230106353759766, 0.017592430114746094, 0.018954753875732422, 0.02031707763671875, 0.021679401397705078, 0.023041725158691406, 0.024404048919677734, 0.025766372680664062, 0.02712869644165039, 0.02849102020263672, 0.029853343963623047, 0.031215667724609375, 0.0325779914855957, 0.03394031524658203, 0.03530263900756836, 0.03666496276855469, 0.038027286529541016, 0.039389610290527344, 0.04075193405151367, 0.0421142578125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 2.0, 4.0, 2.0, 5.0, 5.0, 4.0, 7.0, 8.0, 10.0, 15.0, 23.0, 41.0, 55.0, 101.0, 137.0, 159.0, 139.0, 97.0, 63.0, 30.0, 21.0, 12.0, 10.0, 6.0, 6.0, 5.0, 6.0, 6.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004032135009765625, -0.003899216651916504, -0.003766298294067383, -0.0036333799362182617, -0.0035004615783691406, -0.0033675432205200195, -0.0032346248626708984, -0.0031017065048217773, -0.0029687881469726562, -0.002835869789123535, -0.002702951431274414, -0.002570033073425293, -0.002437114715576172, -0.0023041963577270508, -0.0021712779998779297, -0.0020383596420288086, -0.0019054412841796875, -0.0017725229263305664, -0.0016396045684814453, -0.0015066862106323242, -0.0013737678527832031, -0.001240849494934082, -0.001107931137084961, -0.0009750127792358398, -0.0008420944213867188, -0.0007091760635375977, -0.0005762577056884766, -0.00044333934783935547, -0.0003104209899902344, -0.00017750263214111328, -4.458427429199219e-05, 8.83340835571289e-05, 0.00022125244140625, 0.0003541707992553711, 0.0004870891571044922, 0.0006200075149536133, 0.0007529258728027344, 0.0008858442306518555, 0.0010187625885009766, 0.0011516809463500977, 0.0012845993041992188, 0.0014175176620483398, 0.001550436019897461, 0.001683354377746582, 0.0018162727355957031, 0.0019491910934448242, 0.0020821094512939453, 0.0022150278091430664, 0.0023479461669921875, 0.0024808645248413086, 0.0026137828826904297, 0.0027467012405395508, 0.002879619598388672, 0.003012537956237793, 0.003145456314086914, 0.003278374671936035, 0.0034112930297851562, 0.0035442113876342773, 0.0036771297454833984, 0.0038100481033325195, 0.003942966461181641, 0.004075884819030762, 0.004208803176879883, 0.004341721534729004, 0.004474639892578125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 7.0, 5.0, 4.0, 8.0, 12.0, 17.0, 21.0, 19.0, 12.0, 29.0, 24.0, 39.0, 42.0, 65.0, 174.0, 618.0, 5640.0, 836429.0, 201485.0, 3037.0, 395.0, 125.0, 74.0, 56.0, 38.0, 26.0, 35.0, 22.0, 17.0, 10.0, 14.0, 9.0, 8.0, 9.0, 9.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.204345703125, -0.19865036010742188, -0.19295501708984375, -0.18725967407226562, -0.1815643310546875, -0.17586898803710938, -0.17017364501953125, -0.16447830200195312, -0.158782958984375, -0.15308761596679688, -0.14739227294921875, -0.14169692993164062, -0.1360015869140625, -0.13030624389648438, -0.12461090087890625, -0.11891555786132812, -0.11322021484375, -0.10752487182617188, -0.10182952880859375, -0.09613418579101562, -0.0904388427734375, -0.08474349975585938, -0.07904815673828125, -0.07335281372070312, -0.067657470703125, -0.061962127685546875, -0.05626678466796875, -0.050571441650390625, -0.0448760986328125, -0.039180755615234375, -0.03348541259765625, -0.027790069580078125, -0.0220947265625, -0.016399383544921875, -0.01070404052734375, -0.005008697509765625, 0.0006866455078125, 0.006381988525390625, 0.01207733154296875, 0.017772674560546875, 0.023468017578125, 0.029163360595703125, 0.03485870361328125, 0.040554046630859375, 0.0462493896484375, 0.051944732666015625, 0.05764007568359375, 0.06333541870117188, 0.06903076171875, 0.07472610473632812, 0.08042144775390625, 0.08611679077148438, 0.0918121337890625, 0.09750747680664062, 0.10320281982421875, 0.10889816284179688, 0.114593505859375, 0.12028884887695312, 0.12598419189453125, 0.13167953491210938, 0.1373748779296875, 0.14307022094726562, 0.14876556396484375, 0.15446090698242188, 0.16015625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 9.0, 5.0, 11.0, 12.0, 20.0, 21.0, 37.0, 18.0, 30.0, 18.0, 40.0, 27.0, 43.0, 45.0, 34.0, 23.0, 43.0, 46.0, 43.0, 45.0, 45.0, 43.0, 33.0, 49.0, 32.0, 29.0, 30.0, 21.0, 27.0, 22.0, 10.0, 14.0, 8.0, 14.0, 12.0, 13.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.019287109375, -0.01876676082611084, -0.01824641227722168, -0.01772606372833252, -0.01720571517944336, -0.0166853666305542, -0.01616501808166504, -0.01564466953277588, -0.015124320983886719, -0.014603972434997559, -0.014083623886108398, -0.013563275337219238, -0.013042926788330078, -0.012522578239440918, -0.012002229690551758, -0.011481881141662598, -0.010961532592773438, -0.010441184043884277, -0.009920835494995117, -0.009400486946105957, -0.008880138397216797, -0.008359789848327637, -0.007839441299438477, -0.007319092750549316, -0.006798744201660156, -0.006278395652770996, -0.005758047103881836, -0.005237698554992676, -0.004717350006103516, -0.0041970014572143555, -0.0036766529083251953, -0.003156304359436035, -0.002635955810546875, -0.002115607261657715, -0.0015952587127685547, -0.0010749101638793945, -0.0005545616149902344, -3.421306610107422e-05, 0.00048613548278808594, 0.001006484031677246, 0.0015268325805664062, 0.0020471811294555664, 0.0025675296783447266, 0.0030878782272338867, 0.003608226776123047, 0.004128575325012207, 0.004648923873901367, 0.005169272422790527, 0.0056896209716796875, 0.006209969520568848, 0.006730318069458008, 0.007250666618347168, 0.007771015167236328, 0.008291363716125488, 0.008811712265014648, 0.009332060813903809, 0.009852409362792969, 0.010372757911682129, 0.010893106460571289, 0.01141345500946045, 0.01193380355834961, 0.01245415210723877, 0.01297450065612793, 0.01349484920501709, 0.01401519775390625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 10.0, 33.0, 105.0, 1003.0, 1046138.0, 1105.0, 105.0, 25.0, 12.0, 6.0, 7.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.36328125, -1.32489013671875, -1.2864990234375, -1.24810791015625, -1.209716796875, -1.17132568359375, -1.1329345703125, -1.09454345703125, -1.05615234375, -1.01776123046875, -0.9793701171875, -0.94097900390625, -0.902587890625, -0.86419677734375, -0.8258056640625, -0.78741455078125, -0.7490234375, -0.71063232421875, -0.6722412109375, -0.63385009765625, -0.595458984375, -0.55706787109375, -0.5186767578125, -0.48028564453125, -0.44189453125, -0.40350341796875, -0.3651123046875, -0.32672119140625, -0.288330078125, -0.24993896484375, -0.2115478515625, -0.17315673828125, -0.134765625, -0.09637451171875, -0.0579833984375, -0.01959228515625, 0.018798828125, 0.05718994140625, 0.0955810546875, 0.13397216796875, 0.17236328125, 0.21075439453125, 0.2491455078125, 0.28753662109375, 0.325927734375, 0.36431884765625, 0.4027099609375, 0.44110107421875, 0.4794921875, 0.51788330078125, 0.5562744140625, 0.59466552734375, 0.633056640625, 0.67144775390625, 0.7098388671875, 0.74822998046875, 0.78662109375, 0.82501220703125, 0.8634033203125, 0.90179443359375, 0.940185546875, 0.97857666015625, 1.0169677734375, 1.05535888671875, 1.09375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 7.0, 8.0, 9.0, 12.0, 32.0, 106.0, 474.0, 219.0, 39.0, 20.0, 18.0, 15.0, 10.0, 5.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00021576881408691406, -0.0002103373408317566, -0.00020490586757659912, -0.00019947439432144165, -0.00019404292106628418, -0.0001886114478111267, -0.00018317997455596924, -0.00017774850130081177, -0.0001723170280456543, -0.00016688555479049683, -0.00016145408153533936, -0.00015602260828018188, -0.00015059113502502441, -0.00014515966176986694, -0.00013972818851470947, -0.000134296715259552, -0.00012886524200439453, -0.00012343376874923706, -0.00011800229549407959, -0.00011257082223892212, -0.00010713934898376465, -0.00010170787572860718, -9.627640247344971e-05, -9.084492921829224e-05, -8.541345596313477e-05, -7.99819827079773e-05, -7.455050945281982e-05, -6.911903619766235e-05, -6.368756294250488e-05, -5.825608968734741e-05, -5.282461643218994e-05, -4.739314317703247e-05, -4.1961669921875e-05, -3.653019666671753e-05, -3.109872341156006e-05, -2.5667250156402588e-05, -2.0235776901245117e-05, -1.4804303646087646e-05, -9.372830390930176e-06, -3.941357135772705e-06, 1.4901161193847656e-06, 6.921589374542236e-06, 1.2353062629699707e-05, 1.7784535884857178e-05, 2.321600914001465e-05, 2.864748239517212e-05, 3.407895565032959e-05, 3.951042890548706e-05, 4.494190216064453e-05, 5.0373375415802e-05, 5.580484867095947e-05, 6.123632192611694e-05, 6.666779518127441e-05, 7.209926843643188e-05, 7.753074169158936e-05, 8.296221494674683e-05, 8.83936882019043e-05, 9.382516145706177e-05, 9.925663471221924e-05, 0.00010468810796737671, 0.00011011958122253418, 0.00011555105447769165, 0.00012098252773284912, 0.0001264140009880066, 0.00013184547424316406]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 5.0, 26.0, 55.0, 124.0, 858.0, 22344.0, 1022825.0, 1933.0, 249.0, 67.0, 27.0, 12.0, 6.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7568359375, -0.7317581176757812, -0.7066802978515625, -0.6816024780273438, -0.656524658203125, -0.6314468383789062, -0.6063690185546875, -0.5812911987304688, -0.55621337890625, -0.5311355590820312, -0.5060577392578125, -0.48097991943359375, -0.455902099609375, -0.43082427978515625, -0.4057464599609375, -0.38066864013671875, -0.3555908203125, -0.33051300048828125, -0.3054351806640625, -0.28035736083984375, -0.255279541015625, -0.23020172119140625, -0.2051239013671875, -0.18004608154296875, -0.15496826171875, -0.12989044189453125, -0.1048126220703125, -0.07973480224609375, -0.054656982421875, -0.02957916259765625, -0.0045013427734375, 0.02057647705078125, 0.045654296875, 0.07073211669921875, 0.0958099365234375, 0.12088775634765625, 0.145965576171875, 0.17104339599609375, 0.1961212158203125, 0.22119903564453125, 0.24627685546875, 0.27135467529296875, 0.2964324951171875, 0.32151031494140625, 0.346588134765625, 0.37166595458984375, 0.3967437744140625, 0.42182159423828125, 0.4468994140625, 0.47197723388671875, 0.4970550537109375, 0.5221328735351562, 0.547210693359375, 0.5722885131835938, 0.5973663330078125, 0.6224441528320312, 0.64752197265625, 0.6725997924804688, 0.6976776123046875, 0.7227554321289062, 0.747833251953125, 0.7729110717773438, 0.7979888916015625, 0.8230667114257812, 0.84814453125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 4.0, 7.0, 18.0, 56.0, 596.0, 237.0, 39.0, 14.0, 4.0, 6.0, 2.0, 4.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1358642578125, -0.1313037872314453, -0.12674331665039062, -0.12218284606933594, -0.11762237548828125, -0.11306190490722656, -0.10850143432617188, -0.10394096374511719, -0.0993804931640625, -0.09482002258300781, -0.09025955200195312, -0.08569908142089844, -0.08113861083984375, -0.07657814025878906, -0.07201766967773438, -0.06745719909667969, -0.062896728515625, -0.05833625793457031, -0.053775787353515625, -0.04921531677246094, -0.04465484619140625, -0.04009437561035156, -0.035533905029296875, -0.030973434448242188, -0.0264129638671875, -0.021852493286132812, -0.017292022705078125, -0.012731552124023438, -0.00817108154296875, -0.0036106109619140625, 0.000949859619140625, 0.0055103302001953125, 0.01007080078125, 0.014631271362304688, 0.019191741943359375, 0.023752212524414062, 0.02831268310546875, 0.03287315368652344, 0.037433624267578125, 0.04199409484863281, 0.0465545654296875, 0.05111503601074219, 0.055675506591796875, 0.06023597717285156, 0.06479644775390625, 0.06935691833496094, 0.07391738891601562, 0.07847785949707031, 0.083038330078125, 0.08759880065917969, 0.09215927124023438, 0.09671974182128906, 0.10128021240234375, 0.10584068298339844, 0.11040115356445312, 0.11496162414550781, 0.1195220947265625, 0.12408256530761719, 0.12864303588867188, 0.13320350646972656, 0.13776397705078125, 0.14232444763183594, 0.14688491821289062, 0.1514453887939453, 0.156005859375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 13.0, 14.0, 60.0, 208.0, 474.0, 176.0, 42.0, 12.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43253469467163086, -0.4124159812927246, -0.39229729771614075, -0.3721785843372345, -0.35205990076065063, -0.3319411873817444, -0.31182247400283813, -0.2917037606239319, -0.271585077047348, -0.2514663636684418, -0.2313476800918579, -0.21122896671295166, -0.1911102682352066, -0.17099156975746155, -0.1508728563785553, -0.13075415790081024, -0.11063545942306519, -0.09051676094532013, -0.07039805501699448, -0.05027935281395912, -0.030160650610923767, -0.010041952133178711, 0.010076753795146942, 0.030195459723472595, 0.05031415820121765, 0.07043285667896271, 0.09055156260728836, 0.11067026853561401, 0.13078896701335907, 0.15090766549110413, 0.17102637887001038, 0.19114507734775543, 0.2112637758255005, 0.23138247430324554, 0.2515011727809906, 0.27161988615989685, 0.2917385697364807, 0.31185728311538696, 0.3319759964942932, 0.35209470987319946, 0.3722133934497833, 0.3923321068286896, 0.41245079040527344, 0.4325695037841797, 0.45268821716308594, 0.4728069007396698, 0.49292561411857605, 0.5130442976951599, 0.5331630110740662, 0.5532817244529724, 0.5734004378318787, 0.5935190916061401, 0.6136378049850464, 0.6337565183639526, 0.6538752317428589, 0.6739939451217651, 0.6941126585006714, 0.7142313718795776, 0.7343500852584839, 0.7544687390327454, 0.7745874524116516, 0.7947061657905579, 0.8148248791694641, 0.8349435925483704, 0.8550622463226318]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 9.0, 18.0, 10.0, 16.0, 24.0, 27.0, 29.0, 39.0, 69.0, 63.0, 84.0, 93.0, 96.0, 77.0, 81.0, 68.0, 49.0, 42.0, 30.0, 14.0, 16.0, 7.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20982682704925537, -0.20254981517791748, -0.1952728033065796, -0.1879957914352417, -0.1807187795639038, -0.17344176769256592, -0.16616475582122803, -0.15888774394989014, -0.15161073207855225, -0.14433372020721436, -0.13705670833587646, -0.12977969646453857, -0.12250268459320068, -0.11522567272186279, -0.1079486608505249, -0.10067164897918701, -0.09339463710784912, -0.08611762523651123, -0.07884061336517334, -0.07156360149383545, -0.06428658962249756, -0.05700957775115967, -0.04973256587982178, -0.04245555400848389, -0.035178542137145996, -0.027901530265808105, -0.020624518394470215, -0.013347506523132324, -0.006070494651794434, 0.001206517219543457, 0.008483529090881348, 0.01576054096221924, 0.02303755283355713, 0.03031456470489502, 0.03759157657623291, 0.0448685884475708, 0.05214560031890869, 0.05942261219024658, 0.06669962406158447, 0.07397663593292236, 0.08125364780426025, 0.08853065967559814, 0.09580767154693604, 0.10308468341827393, 0.11036169528961182, 0.11763870716094971, 0.1249157190322876, 0.1321927309036255, 0.13946974277496338, 0.14674675464630127, 0.15402376651763916, 0.16130077838897705, 0.16857779026031494, 0.17585480213165283, 0.18313181400299072, 0.1904088258743286, 0.1976858377456665, 0.2049628496170044, 0.21223986148834229, 0.21951687335968018, 0.22679388523101807, 0.23407089710235596, 0.24134790897369385, 0.24862492084503174, 0.25590193271636963]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 8.0, 4.0, 10.0, 4.0, 8.0, 6.0, 4.0, 12.0, 8.0, 8.0, 6.0, 18.0, 16.0, 26.0, 22.0, 86.0, 2524.0, 4191077.0, 193.0, 30.0, 18.0, 32.0, 20.0, 12.0, 20.0, 12.0, 16.0, 16.0, 0.0, 6.0, 8.0, 4.0, 6.0, 4.0, 6.0, 0.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0], "bins": [-3.44140625, -3.343597412109375, -3.24578857421875, -3.147979736328125, -3.0501708984375, -2.952362060546875, -2.85455322265625, -2.756744384765625, -2.658935546875, -2.561126708984375, -2.46331787109375, -2.365509033203125, -2.2677001953125, -2.169891357421875, -2.07208251953125, -1.974273681640625, -1.87646484375, -1.778656005859375, -1.68084716796875, -1.583038330078125, -1.4852294921875, -1.387420654296875, -1.28961181640625, -1.191802978515625, -1.093994140625, -0.996185302734375, -0.89837646484375, -0.800567626953125, -0.7027587890625, -0.604949951171875, -0.50714111328125, -0.409332275390625, -0.3115234375, -0.213714599609375, -0.11590576171875, -0.018096923828125, 0.0797119140625, 0.177520751953125, 0.27532958984375, 0.373138427734375, 0.470947265625, 0.568756103515625, 0.66656494140625, 0.764373779296875, 0.8621826171875, 0.959991455078125, 1.05780029296875, 1.155609130859375, 1.25341796875, 1.351226806640625, 1.44903564453125, 1.546844482421875, 1.6446533203125, 1.742462158203125, 1.84027099609375, 1.938079833984375, 2.035888671875, 2.133697509765625, 2.23150634765625, 2.329315185546875, 2.4271240234375, 2.524932861328125, 2.62274169921875, 2.720550537109375, 2.818359375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 5.0, 6.0, 9.0, 2.0, 10.0, 12.0, 14.0, 34.0, 38.0, 36.0, 68.0, 95.0, 118.0, 110.0, 110.0, 89.0, 62.0, 46.0, 44.0, 18.0, 13.0, 9.0, 11.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031795501708984375, -0.003062635660171509, -0.00294572114944458, -0.0028288066387176514, -0.0027118921279907227, -0.002594977617263794, -0.0024780631065368652, -0.0023611485958099365, -0.002244234085083008, -0.002127319574356079, -0.0020104050636291504, -0.0018934905529022217, -0.001776576042175293, -0.0016596615314483643, -0.0015427470207214355, -0.0014258325099945068, -0.0013089179992675781, -0.0011920034885406494, -0.0010750889778137207, -0.000958174467086792, -0.0008412599563598633, -0.0007243454456329346, -0.0006074309349060059, -0.0004905164241790771, -0.00037360191345214844, -0.0002566874027252197, -0.00013977289199829102, -2.2858381271362305e-05, 9.40561294555664e-05, 0.00021097064018249512, 0.00032788515090942383, 0.00044479966163635254, 0.0005617141723632812, 0.00067862868309021, 0.0007955431938171387, 0.0009124577045440674, 0.001029372215270996, 0.0011462867259979248, 0.0012632012367248535, 0.0013801157474517822, 0.001497030258178711, 0.0016139447689056396, 0.0017308592796325684, 0.001847773790359497, 0.0019646883010864258, 0.0020816028118133545, 0.002198517322540283, 0.002315431833267212, 0.0024323463439941406, 0.0025492608547210693, 0.002666175365447998, 0.0027830898761749268, 0.0029000043869018555, 0.003016918897628784, 0.003133833408355713, 0.0032507479190826416, 0.0033676624298095703, 0.003484576940536499, 0.0036014914512634277, 0.0037184059619903564, 0.003835320472717285, 0.003952234983444214, 0.004069149494171143, 0.004186064004898071, 0.004302978515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 11.0, 30.0, 51.0, 185.0, 2760.0, 4190839.0, 265.0, 82.0, 28.0, 14.0, 10.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.87353515625, -0.8017501831054688, -0.7299652099609375, -0.6581802368164062, -0.586395263671875, -0.5146102905273438, -0.4428253173828125, -0.37104034423828125, -0.29925537109375, -0.22747039794921875, -0.1556854248046875, -0.08390045166015625, -0.012115478515625, 0.05966949462890625, 0.1314544677734375, 0.20323944091796875, 0.2750244140625, 0.34680938720703125, 0.4185943603515625, 0.49037933349609375, 0.562164306640625, 0.6339492797851562, 0.7057342529296875, 0.7775192260742188, 0.84930419921875, 0.9210891723632812, 0.9928741455078125, 1.0646591186523438, 1.136444091796875, 1.2082290649414062, 1.2800140380859375, 1.3517990112304688, 1.423583984375, 1.4953689575195312, 1.5671539306640625, 1.6389389038085938, 1.710723876953125, 1.7825088500976562, 1.8542938232421875, 1.9260787963867188, 1.99786376953125, 2.0696487426757812, 2.1414337158203125, 2.2132186889648438, 2.285003662109375, 2.3567886352539062, 2.4285736083984375, 2.5003585815429688, 2.5721435546875, 2.6439285278320312, 2.7157135009765625, 2.7874984741210938, 2.859283447265625, 2.9310684204101562, 3.0028533935546875, 3.0746383666992188, 3.14642333984375, 3.2182083129882812, 3.2899932861328125, 3.3617782592773438, 3.433563232421875, 3.5053482055664062, 3.5771331787109375, 3.6489181518554688, 3.720703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0, 5.0, 10.0, 7.0, 11.0, 10.0, 20.0, 34.0, 43.0, 55.0, 82.0, 121.0, 212.0, 335.0, 1063.0, 1059.0, 346.0, 182.0, 132.0, 79.0, 76.0, 49.0, 35.0, 28.0, 20.0, 15.0, 8.0, 4.0, 13.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.007320404052734375, -0.007015407085418701, -0.006710410118103027, -0.0064054131507873535, -0.00610041618347168, -0.005795419216156006, -0.005490422248840332, -0.005185425281524658, -0.004880428314208984, -0.0045754313468933105, -0.004270434379577637, -0.003965437412261963, -0.003660440444946289, -0.0033554434776306152, -0.0030504465103149414, -0.0027454495429992676, -0.0024404525756835938, -0.00213545560836792, -0.001830458641052246, -0.0015254616737365723, -0.0012204647064208984, -0.0009154677391052246, -0.0006104707717895508, -0.00030547380447387695, -4.76837158203125e-07, 0.0003045201301574707, 0.0006095170974731445, 0.0009145140647888184, 0.0012195110321044922, 0.001524507999420166, 0.0018295049667358398, 0.0021345019340515137, 0.0024394989013671875, 0.0027444958686828613, 0.003049492835998535, 0.003354489803314209, 0.003659486770629883, 0.003964483737945557, 0.0042694807052612305, 0.004574477672576904, 0.004879474639892578, 0.005184471607208252, 0.005489468574523926, 0.0057944655418396, 0.0060994625091552734, 0.006404459476470947, 0.006709456443786621, 0.007014453411102295, 0.007319450378417969, 0.007624447345733643, 0.007929444313049316, 0.00823444128036499, 0.008539438247680664, 0.008844435214996338, 0.009149432182312012, 0.009454429149627686, 0.00975942611694336, 0.010064423084259033, 0.010369420051574707, 0.01067441701889038, 0.010979413986206055, 0.011284410953521729, 0.011589407920837402, 0.011894404888153076, 0.01219940185546875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 1014.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5046516060829163, -0.3558255434036255, -0.20699948072433472, -0.058173418045043945, 0.09065264463424683, 0.2394787073135376, 0.38830476999282837, 0.5371307730674744, 0.6859568953514099, 0.8347829580307007, 0.9836090207099915, 1.1324350833892822, 1.2812612056732178, 1.4300872087478638, 1.5789132118225098, 1.7277393341064453, 1.8765654563903809, 2.0253915786743164, 2.174217700958252, 2.3230435848236084, 2.471869707107544, 2.6206958293914795, 2.769521713256836, 2.9183478355407715, 3.067173957824707, 3.2160000801086426, 3.364826202392578, 3.5136520862579346, 3.66247820854187, 3.8113043308258057, 3.960130214691162, 4.108956336975098, 4.257781982421875, 4.4066081047058105, 4.555434226989746, 4.704260349273682, 4.853086471557617, 5.0019121170043945, 5.15073823928833, 5.299564361572266, 5.448390483856201, 5.597216606140137, 5.746042728424072, 5.894868850708008, 6.043694496154785, 6.192520618438721, 6.341346740722656, 6.490172863006592, 6.638998985290527, 6.787825107574463, 6.936651229858398, 7.085477352142334, 7.2343034744262695, 7.383129119873047, 7.531955242156982, 7.680781364440918, 7.8296074867248535, 7.978433609008789, 8.127259254455566, 8.27608585357666, 8.424911499023438, 8.573738098144531, 8.722563743591309, 8.871389389038086, 9.02021598815918]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 9.0, 16.0, 38.0, 69.0, 116.0, 169.0, 192.0, 174.0, 105.0, 66.0, 34.0, 14.0, 5.0, 6.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08072179555892944, -0.0755595788359642, -0.07039736211299896, -0.06523513793945312, -0.060072921216487885, -0.054910704493522644, -0.049748484045267105, -0.044586263597011566, -0.039424046874046326, -0.034261830151081085, -0.029099609702825546, -0.023937391117215157, -0.018775172531604767, -0.013612953945994377, -0.008450735360383987, -0.0032885149121284485, 0.001873701810836792, 0.007035920396447182, 0.012198138982057571, 0.01736035756766796, 0.02252257615327835, 0.02768479473888874, 0.03284701332449913, 0.03800923377275467, 0.04317145049571991, 0.04833366721868515, 0.05349588766694069, 0.05865810811519623, 0.06382032483816147, 0.06898254156112671, 0.07414476573467255, 0.07930698245763779, 0.08446919918060303, 0.08963141590356827, 0.09479363262653351, 0.09995585680007935, 0.10511807352304459, 0.11028029024600983, 0.11544251441955566, 0.1206047311425209, 0.12576694786548615, 0.13092917203903198, 0.13609138131141663, 0.14125360548496246, 0.1464158296585083, 0.15157803893089294, 0.15674026310443878, 0.16190248727798462, 0.16706469655036926, 0.1722269207239151, 0.17738912999629974, 0.18255135416984558, 0.18771356344223022, 0.19287578761577606, 0.1980380117893219, 0.20320022106170654, 0.20836244523525238, 0.21352466940879822, 0.21868687868118286, 0.2238491028547287, 0.22901132702827454, 0.23417353630065918, 0.23933576047420502, 0.24449798464775085, 0.2496601939201355]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 10.0, 14.0, 8.0, 17.0, 17.0, 19.0, 22.0, 29.0, 38.0, 37.0, 59.0, 44.0, 60.0, 182.0, 958337.0, 89129.0, 126.0, 56.0, 53.0, 63.0, 29.0, 36.0, 29.0, 18.0, 15.0, 19.0, 9.0, 12.0, 8.0, 9.0, 5.0, 7.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.6328125, -0.610137939453125, -0.58746337890625, -0.564788818359375, -0.5421142578125, -0.519439697265625, -0.49676513671875, -0.474090576171875, -0.451416015625, -0.428741455078125, -0.40606689453125, -0.383392333984375, -0.3607177734375, -0.338043212890625, -0.31536865234375, -0.292694091796875, -0.27001953125, -0.247344970703125, -0.22467041015625, -0.201995849609375, -0.1793212890625, -0.156646728515625, -0.13397216796875, -0.111297607421875, -0.088623046875, -0.065948486328125, -0.04327392578125, -0.020599365234375, 0.0020751953125, 0.024749755859375, 0.04742431640625, 0.070098876953125, 0.0927734375, 0.115447998046875, 0.13812255859375, 0.160797119140625, 0.1834716796875, 0.206146240234375, 0.22882080078125, 0.251495361328125, 0.274169921875, 0.296844482421875, 0.31951904296875, 0.342193603515625, 0.3648681640625, 0.387542724609375, 0.41021728515625, 0.432891845703125, 0.45556640625, 0.478240966796875, 0.50091552734375, 0.523590087890625, 0.5462646484375, 0.568939208984375, 0.59161376953125, 0.614288330078125, 0.636962890625, 0.659637451171875, 0.68231201171875, 0.704986572265625, 0.7276611328125, 0.750335693359375, 0.77301025390625, 0.795684814453125, 0.818359375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 15.0, 51.0, 154.0, 267.0, 264.0, 171.0, 71.0, 15.0, 10.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0204620361328125, -0.019614458084106445, -0.01876688003540039, -0.017919301986694336, -0.01707172393798828, -0.016224145889282227, -0.015376567840576172, -0.014528989791870117, -0.013681411743164062, -0.012833833694458008, -0.011986255645751953, -0.011138677597045898, -0.010291099548339844, -0.009443521499633789, -0.008595943450927734, -0.00774836540222168, -0.006900787353515625, -0.00605320930480957, -0.005205631256103516, -0.004358053207397461, -0.0035104751586914062, -0.0026628971099853516, -0.0018153190612792969, -0.0009677410125732422, -0.0001201629638671875, 0.0007274150848388672, 0.0015749931335449219, 0.0024225711822509766, 0.0032701492309570312, 0.004117727279663086, 0.004965305328369141, 0.005812883377075195, 0.00666046142578125, 0.007508039474487305, 0.00835561752319336, 0.009203195571899414, 0.010050773620605469, 0.010898351669311523, 0.011745929718017578, 0.012593507766723633, 0.013441085815429688, 0.014288663864135742, 0.015136241912841797, 0.01598381996154785, 0.016831398010253906, 0.01767897605895996, 0.018526554107666016, 0.01937413215637207, 0.020221710205078125, 0.02106928825378418, 0.021916866302490234, 0.02276444435119629, 0.023612022399902344, 0.0244596004486084, 0.025307178497314453, 0.026154756546020508, 0.027002334594726562, 0.027849912643432617, 0.028697490692138672, 0.029545068740844727, 0.03039264678955078, 0.031240224838256836, 0.03208780288696289, 0.032935380935668945, 0.033782958984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 10.0, 13.0, 7.0, 9.0, 16.0, 26.0, 22.0, 34.0, 55.0, 80.0, 140.0, 182.0, 320.0, 704.0, 1813.0, 7097.0, 63665.0, 840180.0, 119461.0, 10590.0, 2301.0, 761.0, 377.0, 237.0, 139.0, 75.0, 56.0, 52.0, 47.0, 24.0, 9.0, 10.0, 6.0, 7.0, 7.0, 5.0, 3.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2342529296875, -0.22659873962402344, -0.21894454956054688, -0.2112903594970703, -0.20363616943359375, -0.1959819793701172, -0.18832778930664062, -0.18067359924316406, -0.1730194091796875, -0.16536521911621094, -0.15771102905273438, -0.1500568389892578, -0.14240264892578125, -0.1347484588623047, -0.12709426879882812, -0.11944007873535156, -0.111785888671875, -0.10413169860839844, -0.09647750854492188, -0.08882331848144531, -0.08116912841796875, -0.07351493835449219, -0.06586074829101562, -0.05820655822753906, -0.0505523681640625, -0.04289817810058594, -0.035243988037109375, -0.027589797973632812, -0.01993560791015625, -0.012281417846679688, -0.004627227783203125, 0.0030269622802734375, 0.01068115234375, 0.018335342407226562, 0.025989532470703125, 0.03364372253417969, 0.04129791259765625, 0.04895210266113281, 0.056606292724609375, 0.06426048278808594, 0.0719146728515625, 0.07956886291503906, 0.08722305297851562, 0.09487724304199219, 0.10253143310546875, 0.11018562316894531, 0.11783981323242188, 0.12549400329589844, 0.133148193359375, 0.14080238342285156, 0.14845657348632812, 0.1561107635498047, 0.16376495361328125, 0.1714191436767578, 0.17907333374023438, 0.18672752380371094, 0.1943817138671875, 0.20203590393066406, 0.20969009399414062, 0.2173442840576172, 0.22499847412109375, 0.2326526641845703, 0.24030685424804688, 0.24796104431152344, 0.255615234375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 11.0, 10.0, 17.0, 19.0, 22.0, 39.0, 44.0, 42.0, 42.0, 49.0, 63.0, 65.0, 59.0, 64.0, 76.0, 58.0, 56.0, 45.0, 27.0, 25.0, 30.0, 24.0, 28.0, 10.0, 19.0, 12.0, 7.0, 3.0, 9.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.060516357421875, -0.058802127838134766, -0.05708789825439453, -0.0553736686706543, -0.05365943908691406, -0.05194520950317383, -0.050230979919433594, -0.04851675033569336, -0.046802520751953125, -0.04508829116821289, -0.043374061584472656, -0.04165983200073242, -0.03994560241699219, -0.03823137283325195, -0.03651714324951172, -0.034802913665771484, -0.03308868408203125, -0.031374454498291016, -0.02966022491455078, -0.027945995330810547, -0.026231765747070312, -0.024517536163330078, -0.022803306579589844, -0.02108907699584961, -0.019374847412109375, -0.01766061782836914, -0.015946388244628906, -0.014232158660888672, -0.012517929077148438, -0.010803699493408203, -0.009089469909667969, -0.007375240325927734, -0.0056610107421875, -0.003946781158447266, -0.0022325515747070312, -0.0005183219909667969, 0.0011959075927734375, 0.002910137176513672, 0.004624366760253906, 0.006338596343994141, 0.008052825927734375, 0.00976705551147461, 0.011481285095214844, 0.013195514678955078, 0.014909744262695312, 0.016623973846435547, 0.01833820343017578, 0.020052433013916016, 0.02176666259765625, 0.023480892181396484, 0.02519512176513672, 0.026909351348876953, 0.028623580932617188, 0.030337810516357422, 0.032052040100097656, 0.03376626968383789, 0.035480499267578125, 0.03719472885131836, 0.038908958435058594, 0.04062318801879883, 0.04233741760253906, 0.0440516471862793, 0.04576587677001953, 0.047480106353759766, 0.0491943359375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 7.0, 3.0, 9.0, 7.0, 8.0, 7.0, 11.0, 19.0, 27.0, 34.0, 62.0, 172.0, 648.0, 3626.0, 134186.0, 901492.0, 6802.0, 922.0, 255.0, 92.0, 29.0, 30.0, 21.0, 22.0, 9.0, 9.0, 7.0, 6.0, 9.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52294921875, -0.5066757202148438, -0.4904022216796875, -0.47412872314453125, -0.457855224609375, -0.44158172607421875, -0.4253082275390625, -0.40903472900390625, -0.39276123046875, -0.37648773193359375, -0.3602142333984375, -0.34394073486328125, -0.327667236328125, -0.31139373779296875, -0.2951202392578125, -0.27884674072265625, -0.2625732421875, -0.24629974365234375, -0.2300262451171875, -0.21375274658203125, -0.197479248046875, -0.18120574951171875, -0.1649322509765625, -0.14865875244140625, -0.13238525390625, -0.11611175537109375, -0.0998382568359375, -0.08356475830078125, -0.067291259765625, -0.05101776123046875, -0.0347442626953125, -0.01847076416015625, -0.002197265625, 0.01407623291015625, 0.0303497314453125, 0.04662322998046875, 0.062896728515625, 0.07917022705078125, 0.0954437255859375, 0.11171722412109375, 0.12799072265625, 0.14426422119140625, 0.1605377197265625, 0.17681121826171875, 0.193084716796875, 0.20935821533203125, 0.2256317138671875, 0.24190521240234375, 0.2581787109375, 0.27445220947265625, 0.2907257080078125, 0.30699920654296875, 0.323272705078125, 0.33954620361328125, 0.3558197021484375, 0.37209320068359375, 0.38836669921875, 0.40464019775390625, 0.4209136962890625, 0.43718719482421875, 0.453460693359375, 0.46973419189453125, 0.4860076904296875, 0.5022811889648438, 0.5185546875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 1.0, 3.0, 5.0, 8.0, 5.0, 4.0, 6.0, 17.0, 22.0, 42.0, 50.0, 122.0, 213.0, 199.0, 100.0, 59.0, 40.0, 37.0, 19.0, 13.0, 12.0, 6.0, 12.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5643577575683594e-05, -3.4594908356666565e-05, -3.3546239137649536e-05, -3.249756991863251e-05, -3.144890069961548e-05, -3.040023148059845e-05, -2.935156226158142e-05, -2.8302893042564392e-05, -2.7254223823547363e-05, -2.6205554604530334e-05, -2.5156885385513306e-05, -2.4108216166496277e-05, -2.3059546947479248e-05, -2.201087772846222e-05, -2.096220850944519e-05, -1.991353929042816e-05, -1.8864870071411133e-05, -1.7816200852394104e-05, -1.6767531633377075e-05, -1.5718862414360046e-05, -1.4670193195343018e-05, -1.3621523976325989e-05, -1.257285475730896e-05, -1.1524185538291931e-05, -1.0475516319274902e-05, -9.426847100257874e-06, -8.378177881240845e-06, -7.329508662223816e-06, -6.280839443206787e-06, -5.232170224189758e-06, -4.1835010051727295e-06, -3.1348317861557007e-06, -2.086162567138672e-06, -1.037493348121643e-06, 1.1175870895385742e-08, 1.0598450899124146e-06, 2.1085143089294434e-06, 3.157183527946472e-06, 4.205852746963501e-06, 5.25452196598053e-06, 6.303191184997559e-06, 7.351860404014587e-06, 8.400529623031616e-06, 9.449198842048645e-06, 1.0497868061065674e-05, 1.1546537280082703e-05, 1.2595206499099731e-05, 1.364387571811676e-05, 1.4692544937133789e-05, 1.5741214156150818e-05, 1.6789883375167847e-05, 1.7838552594184875e-05, 1.8887221813201904e-05, 1.9935891032218933e-05, 2.0984560251235962e-05, 2.203322947025299e-05, 2.308189868927002e-05, 2.413056790828705e-05, 2.5179237127304077e-05, 2.6227906346321106e-05, 2.7276575565338135e-05, 2.8325244784355164e-05, 2.9373914003372192e-05, 3.042258322238922e-05, 3.147125244140625e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 10.0, 23.0, 38.0, 84.0, 269.0, 1156.0, 12707.0, 945622.0, 84122.0, 3717.0, 523.0, 146.0, 51.0, 27.0, 12.0, 10.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5205078125, -0.504119873046875, -0.48773193359375, -0.471343994140625, -0.4549560546875, -0.438568115234375, -0.42218017578125, -0.405792236328125, -0.389404296875, -0.373016357421875, -0.35662841796875, -0.340240478515625, -0.3238525390625, -0.307464599609375, -0.29107666015625, -0.274688720703125, -0.25830078125, -0.241912841796875, -0.22552490234375, -0.209136962890625, -0.1927490234375, -0.176361083984375, -0.15997314453125, -0.143585205078125, -0.127197265625, -0.110809326171875, -0.09442138671875, -0.078033447265625, -0.0616455078125, -0.045257568359375, -0.02886962890625, -0.012481689453125, 0.00390625, 0.020294189453125, 0.03668212890625, 0.053070068359375, 0.0694580078125, 0.085845947265625, 0.10223388671875, 0.118621826171875, 0.135009765625, 0.151397705078125, 0.16778564453125, 0.184173583984375, 0.2005615234375, 0.216949462890625, 0.23333740234375, 0.249725341796875, 0.26611328125, 0.282501220703125, 0.29888916015625, 0.315277099609375, 0.3316650390625, 0.348052978515625, 0.36444091796875, 0.380828857421875, 0.397216796875, 0.413604736328125, 0.42999267578125, 0.446380615234375, 0.4627685546875, 0.479156494140625, 0.49554443359375, 0.511932373046875, 0.5283203125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 6.0, 3.0, 11.0, 10.0, 20.0, 37.0, 47.0, 102.0, 264.0, 230.0, 109.0, 47.0, 36.0, 25.0, 16.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.170654296875, -0.1651325225830078, -0.15961074829101562, -0.15408897399902344, -0.14856719970703125, -0.14304542541503906, -0.13752365112304688, -0.1320018768310547, -0.1264801025390625, -0.12095832824707031, -0.11543655395507812, -0.10991477966308594, -0.10439300537109375, -0.09887123107910156, -0.09334945678710938, -0.08782768249511719, -0.082305908203125, -0.07678413391113281, -0.07126235961914062, -0.06574058532714844, -0.06021881103515625, -0.05469703674316406, -0.049175262451171875, -0.04365348815917969, -0.0381317138671875, -0.03260993957519531, -0.027088165283203125, -0.021566390991210938, -0.01604461669921875, -0.010522842407226562, -0.005001068115234375, 0.0005207061767578125, 0.00604248046875, 0.011564254760742188, 0.017086029052734375, 0.022607803344726562, 0.02812957763671875, 0.03365135192871094, 0.039173126220703125, 0.04469490051269531, 0.0502166748046875, 0.05573844909667969, 0.061260223388671875, 0.06678199768066406, 0.07230377197265625, 0.07782554626464844, 0.08334732055664062, 0.08886909484863281, 0.094390869140625, 0.09991264343261719, 0.10543441772460938, 0.11095619201660156, 0.11647796630859375, 0.12199974060058594, 0.12752151489257812, 0.1330432891845703, 0.1385650634765625, 0.1440868377685547, 0.14960861206054688, 0.15513038635253906, 0.16065216064453125, 0.16617393493652344, 0.17169570922851562, 0.1772174835205078, 0.1827392578125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 960.0, 51.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2916741371154785, -1.698075532913208, -1.104476809501648, -0.5108780860900879, 0.08272051811218262, 0.6763191223144531, 1.2699179649353027, 1.8635163307189941, 2.4571151733398438, 3.0507137775421143, 3.6443123817443848, 4.237911224365234, 4.831509590148926, 5.425108432769775, 6.018707275390625, 6.612305641174316, 7.205904483795166, 7.799503326416016, 8.393101692199707, 8.986700057983398, 9.580299377441406, 10.173897743225098, 10.767496109008789, 11.361095428466797, 11.954693794250488, 12.54829216003418, 13.141891479492188, 13.735489845275879, 14.32908821105957, 14.922687530517578, 15.51628589630127, 16.10988426208496, 16.703481674194336, 17.297080993652344, 17.89067840576172, 18.484277725219727, 19.077877044677734, 19.67147445678711, 20.265073776245117, 20.858673095703125, 21.4522705078125, 22.045869827270508, 22.639467239379883, 23.23306655883789, 23.8266658782959, 24.420263290405273, 25.01386260986328, 25.607460021972656, 26.201061248779297, 26.794660568237305, 27.38825798034668, 27.981857299804688, 28.575456619262695, 29.16905403137207, 29.762653350830078, 30.356250762939453, 30.94985008239746, 31.54344940185547, 32.137046813964844, 32.73064422607422, 33.32424545288086, 33.917842864990234, 34.511444091796875, 35.10504150390625, 35.698638916015625]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 10.0, 17.0, 34.0, 67.0, 140.0, 158.0, 178.0, 175.0, 116.0, 64.0, 43.0, 9.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8802896738052368, -0.8288059234619141, -0.7773221135139465, -0.7258383631706238, -0.6743545532226562, -0.6228708028793335, -0.5713870525360107, -0.519903302192688, -0.46841949224472046, -0.4169357120990753, -0.3654519319534302, -0.3139681816101074, -0.2624844014644623, -0.21100062131881714, -0.15951687097549438, -0.10803309082984924, -0.0565493106842041, -0.005065537989139557, 0.04641823470592499, 0.09790199995040894, 0.14938578009605408, 0.20086956024169922, 0.252353310585022, 0.3038370907306671, 0.35532087087631226, 0.4068046510219574, 0.45828843116760254, 0.5097721815109253, 0.561255931854248, 0.6127397418022156, 0.6642234921455383, 0.7157073020935059, 0.7671909332275391, 0.8186746835708618, 0.8701584935188293, 0.9216422438621521, 0.9731260538101196, 1.0246098041534424, 1.0760935544967651, 1.127577304840088, 1.1790611743927002, 1.230544924736023, 1.2820286750793457, 1.333512544631958, 1.3849962949752808, 1.4364800453186035, 1.4879637956619263, 1.539447546005249, 1.5909312963485718, 1.6424150466918945, 1.6938987970352173, 1.74538254737854, 1.7968664169311523, 1.848350167274475, 1.8998339176177979, 1.9513176679611206, 2.0028014183044434, 2.0542852878570557, 2.105768918991089, 2.157252788543701, 2.2087364196777344, 2.2602202892303467, 2.311704158782959, 2.363187789916992, 2.4146716594696045]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 13.0, 7.0, 10.0, 13.0, 19.0, 21.0, 33.0, 30.0, 39.0, 48.0, 82.0, 258.0, 38990.0, 4153547.0, 836.0, 210.0, 74.0, 21.0, 13.0, 12.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6943359375, -1.6240692138671875, -1.553802490234375, -1.4835357666015625, -1.41326904296875, -1.3430023193359375, -1.272735595703125, -1.2024688720703125, -1.1322021484375, -1.0619354248046875, -0.991668701171875, -0.9214019775390625, -0.85113525390625, -0.7808685302734375, -0.710601806640625, -0.6403350830078125, -0.570068359375, -0.4998016357421875, -0.429534912109375, -0.3592681884765625, -0.28900146484375, -0.2187347412109375, -0.148468017578125, -0.0782012939453125, -0.0079345703125, 0.0623321533203125, 0.132598876953125, 0.2028656005859375, 0.27313232421875, 0.3433990478515625, 0.413665771484375, 0.4839324951171875, 0.55419921875, 0.6244659423828125, 0.694732666015625, 0.7649993896484375, 0.83526611328125, 0.9055328369140625, 0.975799560546875, 1.0460662841796875, 1.1163330078125, 1.1865997314453125, 1.256866455078125, 1.3271331787109375, 1.39739990234375, 1.4676666259765625, 1.537933349609375, 1.6082000732421875, 1.678466796875, 1.7487335205078125, 1.819000244140625, 1.8892669677734375, 1.95953369140625, 2.0298004150390625, 2.100067138671875, 2.1703338623046875, 2.2406005859375, 2.3108673095703125, 2.381134033203125, 2.4514007568359375, 2.52166748046875, 2.5919342041015625, 2.662200927734375, 2.7324676513671875, 2.802734375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 24.0, 42.0, 141.0, 214.0, 263.0, 182.0, 99.0, 31.0, 9.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0265350341796875, -0.025227785110473633, -0.023920536041259766, -0.0226132869720459, -0.02130603790283203, -0.019998788833618164, -0.018691539764404297, -0.01738429069519043, -0.016077041625976562, -0.014769792556762695, -0.013462543487548828, -0.012155294418334961, -0.010848045349121094, -0.009540796279907227, -0.00823354721069336, -0.006926298141479492, -0.005619049072265625, -0.004311800003051758, -0.0030045509338378906, -0.0016973018646240234, -0.00039005279541015625, 0.0009171962738037109, 0.002224445343017578, 0.0035316944122314453, 0.0048389434814453125, 0.00614619255065918, 0.007453441619873047, 0.008760690689086914, 0.010067939758300781, 0.011375188827514648, 0.012682437896728516, 0.013989686965942383, 0.01529693603515625, 0.016604185104370117, 0.017911434173583984, 0.01921868324279785, 0.02052593231201172, 0.021833181381225586, 0.023140430450439453, 0.02444767951965332, 0.025754928588867188, 0.027062177658081055, 0.028369426727294922, 0.02967667579650879, 0.030983924865722656, 0.03229117393493652, 0.03359842300415039, 0.03490567207336426, 0.036212921142578125, 0.03752017021179199, 0.03882741928100586, 0.04013466835021973, 0.041441917419433594, 0.04274916648864746, 0.04405641555786133, 0.045363664627075195, 0.04667091369628906, 0.04797816276550293, 0.0492854118347168, 0.050592660903930664, 0.05189990997314453, 0.0532071590423584, 0.054514408111572266, 0.05582165718078613, 0.05712890625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 9.0, 40.0, 35.0, 51.0, 72.0, 73.0, 121.0, 174.0, 226.0, 2806.0, 4188492.0, 1382.0, 184.0, 175.0, 112.0, 89.0, 82.0, 53.0, 36.0, 33.0, 15.0, 9.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.1328125, -3.96368408203125, -3.7945556640625, -3.62542724609375, -3.456298828125, -3.28717041015625, -3.1180419921875, -2.94891357421875, -2.77978515625, -2.61065673828125, -2.4415283203125, -2.27239990234375, -2.103271484375, -1.93414306640625, -1.7650146484375, -1.59588623046875, -1.4267578125, -1.25762939453125, -1.0885009765625, -0.91937255859375, -0.750244140625, -0.58111572265625, -0.4119873046875, -0.24285888671875, -0.07373046875, 0.09539794921875, 0.2645263671875, 0.43365478515625, 0.602783203125, 0.77191162109375, 0.9410400390625, 1.11016845703125, 1.279296875, 1.44842529296875, 1.6175537109375, 1.78668212890625, 1.955810546875, 2.12493896484375, 2.2940673828125, 2.46319580078125, 2.63232421875, 2.80145263671875, 2.9705810546875, 3.13970947265625, 3.308837890625, 3.47796630859375, 3.6470947265625, 3.81622314453125, 3.9853515625, 4.15447998046875, 4.3236083984375, 4.49273681640625, 4.661865234375, 4.83099365234375, 5.0001220703125, 5.16925048828125, 5.33837890625, 5.50750732421875, 5.6766357421875, 5.84576416015625, 6.014892578125, 6.18402099609375, 6.3531494140625, 6.52227783203125, 6.69140625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 13.0, 25.0, 73.0, 172.0, 1171.0, 2341.0, 173.0, 60.0, 19.0, 10.0, 11.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13671875, -0.13184547424316406, -0.12697219848632812, -0.12209892272949219, -0.11722564697265625, -0.11235237121582031, -0.10747909545898438, -0.10260581970214844, -0.0977325439453125, -0.09285926818847656, -0.08798599243164062, -0.08311271667480469, -0.07823944091796875, -0.07336616516113281, -0.06849288940429688, -0.06361961364746094, -0.058746337890625, -0.05387306213378906, -0.048999786376953125, -0.04412651062011719, -0.03925323486328125, -0.03437995910644531, -0.029506683349609375, -0.024633407592773438, -0.0197601318359375, -0.014886856079101562, -0.010013580322265625, -0.0051403045654296875, -0.00026702880859375, 0.0046062469482421875, 0.009479522705078125, 0.014352798461914062, 0.01922607421875, 0.024099349975585938, 0.028972625732421875, 0.03384590148925781, 0.03871917724609375, 0.04359245300292969, 0.048465728759765625, 0.05333900451660156, 0.0582122802734375, 0.06308555603027344, 0.06795883178710938, 0.07283210754394531, 0.07770538330078125, 0.08257865905761719, 0.08745193481445312, 0.09232521057128906, 0.097198486328125, 0.10207176208496094, 0.10694503784179688, 0.11181831359863281, 0.11669158935546875, 0.12156486511230469, 0.12643814086914062, 0.13131141662597656, 0.1361846923828125, 0.14105796813964844, 0.14593124389648438, 0.1508045196533203, 0.15567779541015625, 0.1605510711669922, 0.16542434692382812, 0.17029762268066406, 0.1751708984375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 34.0, 257.0, 635.0, 57.0, 14.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6357803344726562, -2.3764028549194336, -2.11702561378479, -1.857648253440857, -1.5982708930969238, -1.3388935327529907, -1.0795161724090576, -0.8201388120651245, -0.5607614517211914, -0.3013840913772583, -0.042006731033325195, 0.2173706293106079, 0.476747989654541, 0.7361253499984741, 0.9955027103424072, 1.2548800706863403, 1.5142574310302734, 1.7736347913742065, 2.0330121517181396, 2.292389392852783, 2.551766872406006, 2.8111443519592285, 3.070521593093872, 3.3298988342285156, 3.5892763137817383, 3.848653793334961, 4.108031272888184, 4.367408275604248, 4.626785755157471, 4.886163234710693, 5.145540237426758, 5.4049177169799805, 5.6642961502075195, 5.923673629760742, 6.183051109313965, 6.442428112030029, 6.701805591583252, 6.961183071136475, 7.220560073852539, 7.479937553405762, 7.739315032958984, 7.998692512512207, 8.25806999206543, 8.517447471618652, 8.776824951171875, 9.036201477050781, 9.295578956604004, 9.554956436157227, 9.81433391571045, 10.073711395263672, 10.333088874816895, 10.592466354370117, 10.851842880249023, 11.111220359802246, 11.370597839355469, 11.629975318908691, 11.889352798461914, 12.148730278015137, 12.40810775756836, 12.667485237121582, 12.926862716674805, 13.186239242553711, 13.445616722106934, 13.704994201660156, 13.964371681213379]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 5.0, 9.0, 23.0, 23.0, 51.0, 95.0, 120.0, 139.0, 132.0, 112.0, 93.0, 81.0, 53.0, 27.0, 11.0, 8.0, 6.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7741677761077881, -0.7501190304756165, -0.7260702848434448, -0.7020215392112732, -0.6779727935791016, -0.6539240479469299, -0.6298753023147583, -0.6058265566825867, -0.581777811050415, -0.5577290654182434, -0.5336803197860718, -0.5096315741539001, -0.4855828285217285, -0.4615340828895569, -0.43748533725738525, -0.4134365916252136, -0.389387845993042, -0.36533910036087036, -0.34129035472869873, -0.3172416090965271, -0.29319286346435547, -0.26914411783218384, -0.2450953722000122, -0.22104662656784058, -0.19699788093566895, -0.17294913530349731, -0.14890038967132568, -0.12485164403915405, -0.10080289840698242, -0.07675415277481079, -0.05270540714263916, -0.02865666151046753, -0.0046079158782958984, 0.019440829753875732, 0.04348957538604736, 0.067538321018219, 0.09158706665039062, 0.11563581228256226, 0.1396845579147339, 0.16373330354690552, 0.18778204917907715, 0.21183079481124878, 0.2358795404434204, 0.25992828607559204, 0.28397703170776367, 0.3080257773399353, 0.33207452297210693, 0.35612326860427856, 0.3801720142364502, 0.4042207598686218, 0.42826950550079346, 0.4523182511329651, 0.4763669967651367, 0.5004157423973083, 0.52446448802948, 0.5485132336616516, 0.5725619792938232, 0.5966107249259949, 0.6206594705581665, 0.6447082161903381, 0.6687569618225098, 0.6928057074546814, 0.716854453086853, 0.7409031987190247, 0.7649519443511963]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 7.0, 5.0, 8.0, 14.0, 10.0, 23.0, 36.0, 50.0, 88.0, 125.0, 215.0, 395.0, 846.0, 2584.0, 13266.0, 203358.0, 789076.0, 31498.0, 4486.0, 1256.0, 499.0, 281.0, 146.0, 94.0, 53.0, 51.0, 15.0, 17.0, 10.0, 8.0, 4.0, 7.0, 8.0, 3.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84765625, -0.8164825439453125, -0.785308837890625, -0.7541351318359375, -0.72296142578125, -0.6917877197265625, -0.660614013671875, -0.6294403076171875, -0.5982666015625, -0.5670928955078125, -0.535919189453125, -0.5047454833984375, -0.47357177734375, -0.4423980712890625, -0.411224365234375, -0.3800506591796875, -0.348876953125, -0.3177032470703125, -0.286529541015625, -0.2553558349609375, -0.22418212890625, -0.1930084228515625, -0.161834716796875, -0.1306610107421875, -0.0994873046875, -0.0683135986328125, -0.037139892578125, -0.0059661865234375, 0.02520751953125, 0.0563812255859375, 0.087554931640625, 0.1187286376953125, 0.14990234375, 0.1810760498046875, 0.212249755859375, 0.2434234619140625, 0.27459716796875, 0.3057708740234375, 0.336944580078125, 0.3681182861328125, 0.3992919921875, 0.4304656982421875, 0.461639404296875, 0.4928131103515625, 0.52398681640625, 0.5551605224609375, 0.586334228515625, 0.6175079345703125, 0.648681640625, 0.6798553466796875, 0.711029052734375, 0.7422027587890625, 0.77337646484375, 0.8045501708984375, 0.835723876953125, 0.8668975830078125, 0.8980712890625, 0.9292449951171875, 0.960418701171875, 0.9915924072265625, 1.02276611328125, 1.0539398193359375, 1.085113525390625, 1.1162872314453125, 1.1474609375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 13.0, 30.0, 60.0, 118.0, 137.0, 204.0, 164.0, 123.0, 87.0, 38.0, 15.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045013427734375, -0.043263912200927734, -0.04151439666748047, -0.0397648811340332, -0.03801536560058594, -0.03626585006713867, -0.034516334533691406, -0.03276681900024414, -0.031017303466796875, -0.02926778793334961, -0.027518272399902344, -0.025768756866455078, -0.024019241333007812, -0.022269725799560547, -0.02052021026611328, -0.018770694732666016, -0.01702117919921875, -0.015271663665771484, -0.013522148132324219, -0.011772632598876953, -0.010023117065429688, -0.008273601531982422, -0.006524085998535156, -0.004774570465087891, -0.003025054931640625, -0.0012755393981933594, 0.00047397613525390625, 0.002223491668701172, 0.0039730072021484375, 0.005722522735595703, 0.007472038269042969, 0.009221553802490234, 0.0109710693359375, 0.012720584869384766, 0.014470100402832031, 0.016219615936279297, 0.017969131469726562, 0.019718647003173828, 0.021468162536621094, 0.02321767807006836, 0.024967193603515625, 0.02671670913696289, 0.028466224670410156, 0.030215740203857422, 0.03196525573730469, 0.03371477127075195, 0.03546428680419922, 0.037213802337646484, 0.03896331787109375, 0.040712833404541016, 0.04246234893798828, 0.04421186447143555, 0.04596138000488281, 0.04771089553833008, 0.049460411071777344, 0.05120992660522461, 0.052959442138671875, 0.05470895767211914, 0.056458473205566406, 0.05820798873901367, 0.05995750427246094, 0.0617070198059082, 0.06345653533935547, 0.06520605087280273, 0.06695556640625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 7.0, 4.0, 6.0, 4.0, 11.0, 14.0, 21.0, 46.0, 75.0, 84.0, 127.0, 206.0, 425.0, 790.0, 1892.0, 6354.0, 32250.0, 321924.0, 613742.0, 56300.0, 9443.0, 2667.0, 1013.0, 465.0, 236.0, 153.0, 106.0, 59.0, 43.0, 29.0, 18.0, 12.0, 10.0, 9.0, 4.0, 3.0, 0.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.432861328125, -0.4205436706542969, -0.40822601318359375, -0.3959083557128906, -0.3835906982421875, -0.3712730407714844, -0.35895538330078125, -0.3466377258300781, -0.334320068359375, -0.3220024108886719, -0.30968475341796875, -0.2973670959472656, -0.2850494384765625, -0.2727317810058594, -0.26041412353515625, -0.24809646606445312, -0.23577880859375, -0.22346115112304688, -0.21114349365234375, -0.19882583618164062, -0.1865081787109375, -0.17419052124023438, -0.16187286376953125, -0.14955520629882812, -0.137237548828125, -0.12491989135742188, -0.11260223388671875, -0.10028457641601562, -0.0879669189453125, -0.07564926147460938, -0.06333160400390625, -0.051013946533203125, -0.0386962890625, -0.026378631591796875, -0.01406097412109375, -0.001743316650390625, 0.0105743408203125, 0.022891998291015625, 0.03520965576171875, 0.047527313232421875, 0.059844970703125, 0.07216262817382812, 0.08448028564453125, 0.09679794311523438, 0.1091156005859375, 0.12143325805664062, 0.13375091552734375, 0.14606857299804688, 0.15838623046875, 0.17070388793945312, 0.18302154541015625, 0.19533920288085938, 0.2076568603515625, 0.21997451782226562, 0.23229217529296875, 0.24460983276367188, 0.256927490234375, 0.2692451477050781, 0.28156280517578125, 0.2938804626464844, 0.3061981201171875, 0.3185157775878906, 0.33083343505859375, 0.3431510925292969, 0.35546875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 3.0, 1.0, 2.0, 4.0, 11.0, 10.0, 13.0, 25.0, 21.0, 31.0, 30.0, 52.0, 56.0, 38.0, 50.0, 53.0, 57.0, 48.0, 46.0, 50.0, 57.0, 56.0, 39.0, 44.0, 41.0, 37.0, 25.0, 28.0, 22.0, 12.0, 8.0, 8.0, 6.0, 9.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1385498046875, -0.13428306579589844, -0.13001632690429688, -0.1257495880126953, -0.12148284912109375, -0.11721611022949219, -0.11294937133789062, -0.10868263244628906, -0.1044158935546875, -0.10014915466308594, -0.09588241577148438, -0.09161567687988281, -0.08734893798828125, -0.08308219909667969, -0.07881546020507812, -0.07454872131347656, -0.070281982421875, -0.06601524353027344, -0.061748504638671875, -0.05748176574707031, -0.05321502685546875, -0.04894828796386719, -0.044681549072265625, -0.04041481018066406, -0.0361480712890625, -0.03188133239746094, -0.027614593505859375, -0.023347854614257812, -0.01908111572265625, -0.014814376831054688, -0.010547637939453125, -0.0062808990478515625, -0.00201416015625, 0.0022525787353515625, 0.006519317626953125, 0.010786056518554688, 0.01505279541015625, 0.019319534301757812, 0.023586273193359375, 0.027853012084960938, 0.0321197509765625, 0.03638648986816406, 0.040653228759765625, 0.04491996765136719, 0.04918670654296875, 0.05345344543457031, 0.057720184326171875, 0.06198692321777344, 0.066253662109375, 0.07052040100097656, 0.07478713989257812, 0.07905387878417969, 0.08332061767578125, 0.08758735656738281, 0.09185409545898438, 0.09612083435058594, 0.1003875732421875, 0.10465431213378906, 0.10892105102539062, 0.11318778991699219, 0.11745452880859375, 0.12172126770019531, 0.12598800659179688, 0.13025474548339844, 0.134521484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 8.0, 4.0, 2.0, 10.0, 9.0, 11.0, 23.0, 28.0, 46.0, 60.0, 86.0, 108.0, 216.0, 414.0, 925.0, 2677.0, 9986.0, 65724.0, 853162.0, 97217.0, 12481.0, 3209.0, 1094.0, 447.0, 214.0, 115.0, 76.0, 56.0, 38.0, 26.0, 25.0, 13.0, 12.0, 7.0, 8.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.416259765625, -0.40348052978515625, -0.3907012939453125, -0.37792205810546875, -0.365142822265625, -0.35236358642578125, -0.3395843505859375, -0.32680511474609375, -0.31402587890625, -0.30124664306640625, -0.2884674072265625, -0.27568817138671875, -0.262908935546875, -0.25012969970703125, -0.2373504638671875, -0.22457122802734375, -0.2117919921875, -0.19901275634765625, -0.1862335205078125, -0.17345428466796875, -0.160675048828125, -0.14789581298828125, -0.1351165771484375, -0.12233734130859375, -0.10955810546875, -0.09677886962890625, -0.0839996337890625, -0.07122039794921875, -0.058441162109375, -0.04566192626953125, -0.0328826904296875, -0.02010345458984375, -0.00732421875, 0.00545501708984375, 0.0182342529296875, 0.03101348876953125, 0.043792724609375, 0.05657196044921875, 0.0693511962890625, 0.08213043212890625, 0.09490966796875, 0.10768890380859375, 0.1204681396484375, 0.13324737548828125, 0.146026611328125, 0.15880584716796875, 0.1715850830078125, 0.18436431884765625, 0.1971435546875, 0.20992279052734375, 0.2227020263671875, 0.23548126220703125, 0.248260498046875, 0.26103973388671875, 0.2738189697265625, 0.28659820556640625, 0.29937744140625, 0.31215667724609375, 0.3249359130859375, 0.33771514892578125, 0.350494384765625, 0.36327362060546875, 0.3760528564453125, 0.38883209228515625, 0.401611328125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 7.0, 4.0, 4.0, 5.0, 10.0, 13.0, 23.0, 39.0, 43.0, 63.0, 126.0, 179.0, 190.0, 111.0, 67.0, 28.0, 18.0, 27.0, 13.0, 5.0, 8.0, 9.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.073713302612305e-05, -5.9001147747039795e-05, -5.726516246795654e-05, -5.552917718887329e-05, -5.379319190979004e-05, -5.205720663070679e-05, -5.0321221351623535e-05, -4.858523607254028e-05, -4.684925079345703e-05, -4.511326551437378e-05, -4.337728023529053e-05, -4.1641294956207275e-05, -3.9905309677124023e-05, -3.816932439804077e-05, -3.643333911895752e-05, -3.469735383987427e-05, -3.2961368560791016e-05, -3.1225383281707764e-05, -2.9489398002624512e-05, -2.775341272354126e-05, -2.6017427444458008e-05, -2.4281442165374756e-05, -2.2545456886291504e-05, -2.0809471607208252e-05, -1.9073486328125e-05, -1.7337501049041748e-05, -1.5601515769958496e-05, -1.3865530490875244e-05, -1.2129545211791992e-05, -1.039355993270874e-05, -8.657574653625488e-06, -6.921589374542236e-06, -5.185604095458984e-06, -3.4496188163757324e-06, -1.7136335372924805e-06, 2.2351741790771484e-08, 1.7583370208740234e-06, 3.4943222999572754e-06, 5.230307579040527e-06, 6.966292858123779e-06, 8.702278137207031e-06, 1.0438263416290283e-05, 1.2174248695373535e-05, 1.3910233974456787e-05, 1.564621925354004e-05, 1.738220453262329e-05, 1.9118189811706543e-05, 2.0854175090789795e-05, 2.2590160369873047e-05, 2.43261456489563e-05, 2.606213092803955e-05, 2.7798116207122803e-05, 2.9534101486206055e-05, 3.127008676528931e-05, 3.300607204437256e-05, 3.474205732345581e-05, 3.647804260253906e-05, 3.8214027881622314e-05, 3.9950013160705566e-05, 4.168599843978882e-05, 4.342198371887207e-05, 4.515796899795532e-05, 4.6893954277038574e-05, 4.8629939556121826e-05, 5.036592483520508e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 3.0, 2.0, 10.0, 32.0, 56.0, 95.0, 158.0, 344.0, 769.0, 2595.0, 17406.0, 766726.0, 246799.0, 10265.0, 2005.0, 666.0, 288.0, 163.0, 71.0, 44.0, 18.0, 20.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6162109375, -0.5955886840820312, -0.5749664306640625, -0.5543441772460938, -0.533721923828125, -0.5130996704101562, -0.4924774169921875, -0.47185516357421875, -0.45123291015625, -0.43061065673828125, -0.4099884033203125, -0.38936614990234375, -0.368743896484375, -0.34812164306640625, -0.3274993896484375, -0.30687713623046875, -0.2862548828125, -0.26563262939453125, -0.2450103759765625, -0.22438812255859375, -0.203765869140625, -0.18314361572265625, -0.1625213623046875, -0.14189910888671875, -0.12127685546875, -0.10065460205078125, -0.0800323486328125, -0.05941009521484375, -0.038787841796875, -0.01816558837890625, 0.0024566650390625, 0.02307891845703125, 0.043701171875, 0.06432342529296875, 0.0849456787109375, 0.10556793212890625, 0.126190185546875, 0.14681243896484375, 0.1674346923828125, 0.18805694580078125, 0.20867919921875, 0.22930145263671875, 0.2499237060546875, 0.27054595947265625, 0.291168212890625, 0.31179046630859375, 0.3324127197265625, 0.35303497314453125, 0.3736572265625, 0.39427947998046875, 0.4149017333984375, 0.43552398681640625, 0.456146240234375, 0.47676849365234375, 0.4973907470703125, 0.5180130004882812, 0.53863525390625, 0.5592575073242188, 0.5798797607421875, 0.6005020141601562, 0.621124267578125, 0.6417465209960938, 0.6623687744140625, 0.6829910278320312, 0.70361328125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 8.0, 4.0, 24.0, 23.0, 39.0, 76.0, 140.0, 141.0, 166.0, 147.0, 81.0, 46.0, 40.0, 18.0, 12.0, 10.0, 8.0, 9.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1651611328125, -0.1583271026611328, -0.15149307250976562, -0.14465904235839844, -0.13782501220703125, -0.13099098205566406, -0.12415695190429688, -0.11732292175292969, -0.1104888916015625, -0.10365486145019531, -0.09682083129882812, -0.08998680114746094, -0.08315277099609375, -0.07631874084472656, -0.06948471069335938, -0.06265068054199219, -0.055816650390625, -0.04898262023925781, -0.042148590087890625, -0.03531455993652344, -0.02848052978515625, -0.021646499633789062, -0.014812469482421875, -0.007978439331054688, -0.0011444091796875, 0.0056896209716796875, 0.012523651123046875, 0.019357681274414062, 0.02619171142578125, 0.03302574157714844, 0.039859771728515625, 0.04669380187988281, 0.05352783203125, 0.06036186218261719, 0.06719589233398438, 0.07402992248535156, 0.08086395263671875, 0.08769798278808594, 0.09453201293945312, 0.10136604309082031, 0.1082000732421875, 0.11503410339355469, 0.12186813354492188, 0.12870216369628906, 0.13553619384765625, 0.14237022399902344, 0.14920425415039062, 0.1560382843017578, 0.162872314453125, 0.1697063446044922, 0.17654037475585938, 0.18337440490722656, 0.19020843505859375, 0.19704246520996094, 0.20387649536132812, 0.2107105255126953, 0.2175445556640625, 0.2243785858154297, 0.23121261596679688, 0.23804664611816406, 0.24488067626953125, 0.25171470642089844, 0.2585487365722656, 0.2653827667236328, 0.272216796875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 72.0, 613.0, 309.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0145845413208, -10.752126693725586, -10.489669799804688, -10.227212905883789, -9.964755058288574, -9.70229721069336, -9.439840316772461, -9.177383422851562, -8.914925575256348, -8.652467727661133, -8.390010833740234, -8.127553939819336, -7.865096092224121, -7.6026387214660645, -7.340181350708008, -7.077723979949951, -6.8152666091918945, -6.552809238433838, -6.290351867675781, -6.027894496917725, -5.765437126159668, -5.502979755401611, -5.240522384643555, -4.978065013885498, -4.715607643127441, -4.453150272369385, -4.190692901611328, -3.9282355308532715, -3.665778160095215, -3.403320789337158, -3.1408634185791016, -2.878406047821045, -2.6159486770629883, -2.3534913063049316, -2.091033935546875, -1.8285765647888184, -1.5661191940307617, -1.303661823272705, -1.0412044525146484, -0.7787470817565918, -0.5162897109985352, -0.2538323402404785, 0.008625030517578125, 0.27108240127563477, 0.5335397720336914, 0.795997142791748, 1.0584545135498047, 1.3209118843078613, 1.583369255065918, 1.8458266258239746, 2.1082839965820312, 2.370741367340088, 2.6331987380981445, 2.895656108856201, 3.158113479614258, 3.4205708503723145, 3.683028221130371, 3.9454855918884277, 4.207942962646484, 4.470400333404541, 4.732857704162598, 4.995315074920654, 5.257772445678711, 5.520229816436768, 5.782687187194824]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 6.0, 4.0, 10.0, 3.0, 14.0, 6.0, 15.0, 22.0, 16.0, 19.0, 32.0, 39.0, 44.0, 49.0, 57.0, 55.0, 56.0, 61.0, 60.0, 51.0, 46.0, 58.0, 47.0, 38.0, 44.0, 28.0, 27.0, 26.0, 24.0, 13.0, 9.0, 8.0, 7.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.860492467880249, -0.8258423209190369, -0.7911921739578247, -0.7565420269966125, -0.7218918800354004, -0.687241792678833, -0.6525916457176208, -0.6179414987564087, -0.5832913517951965, -0.5486412048339844, -0.5139910578727722, -0.47934094071388245, -0.4446907937526703, -0.41004064679145813, -0.37539052963256836, -0.3407403826713562, -0.30609023571014404, -0.2714400887489319, -0.23678995668888092, -0.20213982462882996, -0.1674896776676178, -0.13283953070640564, -0.09818939864635468, -0.06353926658630371, -0.028889119625091553, 0.0057610198855400085, 0.04041115939617157, 0.07506129890680313, 0.10971143841743469, 0.14436158537864685, 0.17901171743869781, 0.21366184949874878, 0.24831199645996094, 0.2829621434211731, 0.31761229038238525, 0.352262407541275, 0.3869125545024872, 0.42156270146369934, 0.4562128186225891, 0.49086296558380127, 0.5255131125450134, 0.5601632595062256, 0.5948134064674377, 0.6294635534286499, 0.6641136407852173, 0.6987638473510742, 0.7334139347076416, 0.7680640816688538, 0.8027142286300659, 0.8373643755912781, 0.8720145225524902, 0.9066646695137024, 0.9413148164749146, 0.9759649038314819, 1.0106151103973389, 1.0452651977539062, 1.0799152851104736, 1.114565372467041, 1.149215579032898, 1.1838656663894653, 1.2185158729553223, 1.2531659603118896, 1.2878161668777466, 1.322466254234314, 1.357116460800171]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 1.0, 1.0, 5.0, 9.0, 11.0, 8.0, 9.0, 36.0, 42.0, 44.0, 109.0, 113.0, 275.0, 591.0, 2180.0, 15450.0, 4037533.0, 128686.0, 6916.0, 1449.0, 406.0, 189.0, 104.0, 59.0, 24.0, 17.0, 4.0, 8.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.576171875, -2.502105712890625, -2.42803955078125, -2.353973388671875, -2.2799072265625, -2.205841064453125, -2.13177490234375, -2.057708740234375, -1.983642578125, -1.909576416015625, -1.83551025390625, -1.761444091796875, -1.6873779296875, -1.613311767578125, -1.53924560546875, -1.465179443359375, -1.39111328125, -1.317047119140625, -1.24298095703125, -1.168914794921875, -1.0948486328125, -1.020782470703125, -0.94671630859375, -0.872650146484375, -0.798583984375, -0.724517822265625, -0.65045166015625, -0.576385498046875, -0.5023193359375, -0.428253173828125, -0.35418701171875, -0.280120849609375, -0.2060546875, -0.131988525390625, -0.05792236328125, 0.016143798828125, 0.0902099609375, 0.164276123046875, 0.23834228515625, 0.312408447265625, 0.386474609375, 0.460540771484375, 0.53460693359375, 0.608673095703125, 0.6827392578125, 0.756805419921875, 0.83087158203125, 0.904937744140625, 0.97900390625, 1.053070068359375, 1.12713623046875, 1.201202392578125, 1.2752685546875, 1.349334716796875, 1.42340087890625, 1.497467041015625, 1.571533203125, 1.645599365234375, 1.71966552734375, 1.793731689453125, 1.8677978515625, 1.941864013671875, 2.01593017578125, 2.089996337890625, 2.1640625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 7.0, 10.0, 15.0, 24.0, 46.0, 83.0, 103.0, 108.0, 139.0, 143.0, 91.0, 100.0, 63.0, 37.0, 17.0, 9.0, 6.0, 5.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0251007080078125, -0.023402929306030273, -0.021705150604248047, -0.02000737190246582, -0.018309593200683594, -0.016611814498901367, -0.01491403579711914, -0.013216257095336914, -0.011518478393554688, -0.009820699691772461, -0.008122920989990234, -0.006425142288208008, -0.004727363586425781, -0.0030295848846435547, -0.0013318061828613281, 0.00036597251892089844, 0.002063751220703125, 0.0037615299224853516, 0.005459308624267578, 0.007157087326049805, 0.008854866027832031, 0.010552644729614258, 0.012250423431396484, 0.013948202133178711, 0.015645980834960938, 0.017343759536743164, 0.01904153823852539, 0.020739316940307617, 0.022437095642089844, 0.02413487434387207, 0.025832653045654297, 0.027530431747436523, 0.02922821044921875, 0.030925989151000977, 0.0326237678527832, 0.03432154655456543, 0.036019325256347656, 0.03771710395812988, 0.03941488265991211, 0.041112661361694336, 0.04281044006347656, 0.04450821876525879, 0.046205997467041016, 0.04790377616882324, 0.04960155487060547, 0.051299333572387695, 0.05299711227416992, 0.05469489097595215, 0.056392669677734375, 0.0580904483795166, 0.05978822708129883, 0.061486005783081055, 0.06318378448486328, 0.06488156318664551, 0.06657934188842773, 0.06827712059020996, 0.06997489929199219, 0.07167267799377441, 0.07337045669555664, 0.07506823539733887, 0.0767660140991211, 0.07846379280090332, 0.08016157150268555, 0.08185935020446777, 0.08355712890625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 13.0, 35.0, 136.0, 552.0, 10451.0, 4175157.0, 7169.0, 553.0, 150.0, 33.0, 17.0, 10.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.69921875, -2.49835205078125, -2.2974853515625, -2.09661865234375, -1.895751953125, -1.69488525390625, -1.4940185546875, -1.29315185546875, -1.09228515625, -0.89141845703125, -0.6905517578125, -0.48968505859375, -0.288818359375, -0.08795166015625, 0.1129150390625, 0.31378173828125, 0.5146484375, 0.71551513671875, 0.9163818359375, 1.11724853515625, 1.318115234375, 1.51898193359375, 1.7198486328125, 1.92071533203125, 2.12158203125, 2.32244873046875, 2.5233154296875, 2.72418212890625, 2.925048828125, 3.12591552734375, 3.3267822265625, 3.52764892578125, 3.728515625, 3.92938232421875, 4.1302490234375, 4.33111572265625, 4.531982421875, 4.73284912109375, 4.9337158203125, 5.13458251953125, 5.33544921875, 5.53631591796875, 5.7371826171875, 5.93804931640625, 6.138916015625, 6.33978271484375, 6.5406494140625, 6.74151611328125, 6.9423828125, 7.14324951171875, 7.3441162109375, 7.54498291015625, 7.745849609375, 7.94671630859375, 8.1475830078125, 8.34844970703125, 8.54931640625, 8.75018310546875, 8.9510498046875, 9.15191650390625, 9.352783203125, 9.55364990234375, 9.7545166015625, 9.95538330078125, 10.15625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 6.0, 5.0, 10.0, 28.0, 69.0, 181.0, 2766.0, 837.0, 109.0, 34.0, 12.0, 5.0, 6.0, 7.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1463623046875, -0.13147926330566406, -0.11659622192382812, -0.10171318054199219, -0.08683013916015625, -0.07194709777832031, -0.057064056396484375, -0.04218101501464844, -0.0272979736328125, -0.012414932250976562, 0.002468109130859375, 0.017351150512695312, 0.03223419189453125, 0.04711723327636719, 0.062000274658203125, 0.07688331604003906, 0.091766357421875, 0.10664939880371094, 0.12153244018554688, 0.1364154815673828, 0.15129852294921875, 0.1661815643310547, 0.18106460571289062, 0.19594764709472656, 0.2108306884765625, 0.22571372985839844, 0.24059677124023438, 0.2554798126220703, 0.27036285400390625, 0.2852458953857422, 0.3001289367675781, 0.31501197814941406, 0.32989501953125, 0.34477806091308594, 0.3596611022949219, 0.3745441436767578, 0.38942718505859375, 0.4043102264404297, 0.4191932678222656, 0.43407630920410156, 0.4489593505859375, 0.46384239196777344, 0.4787254333496094, 0.4936084747314453, 0.5084915161132812, 0.5233745574951172, 0.5382575988769531, 0.5531406402587891, 0.568023681640625, 0.5829067230224609, 0.5977897644042969, 0.6126728057861328, 0.6275558471679688, 0.6424388885498047, 0.6573219299316406, 0.6722049713134766, 0.6870880126953125, 0.7019710540771484, 0.7168540954589844, 0.7317371368408203, 0.7466201782226562, 0.7615032196044922, 0.7763862609863281, 0.7912693023681641, 0.80615234375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 84.0, 712.0, 177.0, 25.0, 10.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.265885353088379, -11.024155616760254, -10.782425880432129, -10.540696144104004, -10.298966407775879, -10.057236671447754, -9.815506935119629, -9.573777198791504, -9.332047462463379, -9.090317726135254, -8.848587989807129, -8.606858253479004, -8.365128517150879, -8.123398780822754, -7.881669044494629, -7.639939308166504, -7.398210048675537, -7.156480312347412, -6.914750576019287, -6.673020839691162, -6.431291103363037, -6.189561367034912, -5.947832107543945, -5.70610237121582, -5.464372634887695, -5.22264289855957, -4.980913162231445, -4.73918342590332, -4.497453689575195, -4.25572395324707, -4.013994216918945, -3.7722647190093994, -3.5305352210998535, -3.2888054847717285, -3.0470757484436035, -2.8053460121154785, -2.5636162757873535, -2.3218865394592285, -2.0801570415496826, -1.8384273052215576, -1.5966975688934326, -1.3549678325653076, -1.1132380962371826, -0.8715084791183472, -0.6297787427902222, -0.38804900646209717, -0.14631938934326172, 0.09541034698486328, 0.3371400833129883, 0.5788698196411133, 0.8205994963645935, 1.0623291730880737, 1.3040589094161987, 1.5457886457443237, 1.7875182628631592, 2.029247999191284, 2.270977735519409, 2.512707471847534, 2.754437208175659, 2.996166706085205, 3.23789644241333, 3.479626178741455, 3.72135591506958, 3.963085651397705, 4.20481538772583]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 10.0, 10.0, 20.0, 36.0, 44.0, 47.0, 73.0, 88.0, 87.0, 101.0, 97.0, 99.0, 64.0, 54.0, 40.0, 50.0, 32.0, 20.0, 17.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4191651344299316, -1.3642014265060425, -1.3092378377914429, -1.2542741298675537, -1.199310541152954, -1.144346833229065, -1.0893831253051758, -1.0344195365905762, -0.979455828666687, -0.9244921803474426, -0.8695285320281982, -0.8145648241043091, -0.7596011757850647, -0.7046375274658203, -0.6496738195419312, -0.5947101712226868, -0.5397465229034424, -0.484782874584198, -0.4298191964626312, -0.37485551834106445, -0.31989187002182007, -0.2649282217025757, -0.2099645435810089, -0.15500086545944214, -0.10003721714019775, -0.045073553919792175, 0.009890109300613403, 0.06485377252101898, 0.11981743574142456, 0.17478108406066895, 0.22974476218223572, 0.2847084403038025, 0.3396720886230469, 0.39463573694229126, 0.44959941506385803, 0.5045630931854248, 0.5595267415046692, 0.6144903898239136, 0.6694540977478027, 0.7244177460670471, 0.7793813943862915, 0.8343450427055359, 0.8893086910247803, 0.9442723989486694, 0.9992360472679138, 1.0541996955871582, 1.1091634035110474, 1.1641271114349365, 1.2190907001495361, 1.2740544080734253, 1.329017996788025, 1.383981704711914, 1.4389452934265137, 1.4939090013504028, 1.548872709274292, 1.6038362979888916, 1.6588000059127808, 1.71376371383667, 1.7687273025512695, 1.8236910104751587, 1.8786547183990479, 1.9336183071136475, 1.9885820150375366, 2.043545722961426, 2.0985093116760254]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 4.0, 8.0, 3.0, 9.0, 17.0, 14.0, 31.0, 41.0, 40.0, 76.0, 109.0, 158.0, 263.0, 475.0, 843.0, 1975.0, 5832.0, 25956.0, 174307.0, 689127.0, 121359.0, 19674.0, 4770.0, 1609.0, 716.0, 414.0, 249.0, 136.0, 102.0, 66.0, 43.0, 49.0, 16.0, 16.0, 12.0, 12.0, 7.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.57275390625, -0.5525970458984375, -0.532440185546875, -0.5122833251953125, -0.49212646484375, -0.4719696044921875, -0.451812744140625, -0.4316558837890625, -0.4114990234375, -0.3913421630859375, -0.371185302734375, -0.3510284423828125, -0.33087158203125, -0.3107147216796875, -0.290557861328125, -0.2704010009765625, -0.250244140625, -0.2300872802734375, -0.209930419921875, -0.1897735595703125, -0.16961669921875, -0.1494598388671875, -0.129302978515625, -0.1091461181640625, -0.0889892578125, -0.0688323974609375, -0.048675537109375, -0.0285186767578125, -0.00836181640625, 0.0117950439453125, 0.031951904296875, 0.0521087646484375, 0.072265625, 0.0924224853515625, 0.112579345703125, 0.1327362060546875, 0.15289306640625, 0.1730499267578125, 0.193206787109375, 0.2133636474609375, 0.2335205078125, 0.2536773681640625, 0.273834228515625, 0.2939910888671875, 0.31414794921875, 0.3343048095703125, 0.354461669921875, 0.3746185302734375, 0.394775390625, 0.4149322509765625, 0.435089111328125, 0.4552459716796875, 0.47540283203125, 0.4955596923828125, 0.515716552734375, 0.5358734130859375, 0.5560302734375, 0.5761871337890625, 0.596343994140625, 0.6165008544921875, 0.63665771484375, 0.6568145751953125, 0.676971435546875, 0.6971282958984375, 0.71728515625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 6.0, 16.0, 7.0, 12.0, 25.0, 24.0, 38.0, 50.0, 55.0, 56.0, 72.0, 76.0, 89.0, 88.0, 73.0, 70.0, 51.0, 46.0, 31.0, 38.0, 30.0, 14.0, 18.0, 11.0, 2.0, 6.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0667724609375, -0.06397819519042969, -0.061183929443359375, -0.05838966369628906, -0.05559539794921875, -0.05280113220214844, -0.050006866455078125, -0.04721260070800781, -0.0444183349609375, -0.04162406921386719, -0.038829803466796875, -0.03603553771972656, -0.03324127197265625, -0.030447006225585938, -0.027652740478515625, -0.024858474731445312, -0.022064208984375, -0.019269943237304688, -0.016475677490234375, -0.013681411743164062, -0.01088714599609375, -0.008092880249023438, -0.005298614501953125, -0.0025043487548828125, 0.0002899169921875, 0.0030841827392578125, 0.005878448486328125, 0.008672714233398438, 0.01146697998046875, 0.014261245727539062, 0.017055511474609375, 0.019849777221679688, 0.02264404296875, 0.025438308715820312, 0.028232574462890625, 0.031026840209960938, 0.03382110595703125, 0.03661537170410156, 0.039409637451171875, 0.04220390319824219, 0.0449981689453125, 0.04779243469238281, 0.050586700439453125, 0.05338096618652344, 0.05617523193359375, 0.05896949768066406, 0.061763763427734375, 0.06455802917480469, 0.067352294921875, 0.07014656066894531, 0.07294082641601562, 0.07573509216308594, 0.07852935791015625, 0.08132362365722656, 0.08411788940429688, 0.08691215515136719, 0.0897064208984375, 0.09250068664550781, 0.09529495239257812, 0.09808921813964844, 0.10088348388671875, 0.10367774963378906, 0.10647201538085938, 0.10926628112792969, 0.112060546875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 6.0, 16.0, 16.0, 24.0, 44.0, 62.0, 78.0, 171.0, 359.0, 950.0, 3213.0, 18640.0, 370516.0, 620325.0, 28041.0, 4129.0, 1091.0, 385.0, 173.0, 119.0, 54.0, 45.0, 30.0, 25.0, 14.0, 13.0, 0.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.89990234375, -0.8762741088867188, -0.8526458740234375, -0.8290176391601562, -0.805389404296875, -0.7817611694335938, -0.7581329345703125, -0.7345046997070312, -0.71087646484375, -0.6872482299804688, -0.6636199951171875, -0.6399917602539062, -0.616363525390625, -0.5927352905273438, -0.5691070556640625, -0.5454788208007812, -0.5218505859375, -0.49822235107421875, -0.4745941162109375, -0.45096588134765625, -0.427337646484375, -0.40370941162109375, -0.3800811767578125, -0.35645294189453125, -0.33282470703125, -0.30919647216796875, -0.2855682373046875, -0.26194000244140625, -0.238311767578125, -0.21468353271484375, -0.1910552978515625, -0.16742706298828125, -0.143798828125, -0.12017059326171875, -0.0965423583984375, -0.07291412353515625, -0.049285888671875, -0.02565765380859375, -0.0020294189453125, 0.02159881591796875, 0.04522705078125, 0.06885528564453125, 0.0924835205078125, 0.11611175537109375, 0.139739990234375, 0.16336822509765625, 0.1869964599609375, 0.21062469482421875, 0.2342529296875, 0.25788116455078125, 0.2815093994140625, 0.30513763427734375, 0.328765869140625, 0.35239410400390625, 0.3760223388671875, 0.39965057373046875, 0.42327880859375, 0.44690704345703125, 0.4705352783203125, 0.49416351318359375, 0.517791748046875, 0.5414199829101562, 0.5650482177734375, 0.5886764526367188, 0.6123046875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 10.0, 11.0, 11.0, 12.0, 22.0, 23.0, 25.0, 31.0, 54.0, 58.0, 74.0, 60.0, 83.0, 70.0, 75.0, 72.0, 72.0, 63.0, 40.0, 30.0, 24.0, 14.0, 23.0, 10.0, 6.0, 7.0, 11.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.5615234375, -0.5478935241699219, -0.5342636108398438, -0.5206336975097656, -0.5070037841796875, -0.4933738708496094, -0.47974395751953125, -0.4661140441894531, -0.452484130859375, -0.4388542175292969, -0.42522430419921875, -0.4115943908691406, -0.3979644775390625, -0.3843345642089844, -0.37070465087890625, -0.3570747375488281, -0.34344482421875, -0.3298149108886719, -0.31618499755859375, -0.3025550842285156, -0.2889251708984375, -0.2752952575683594, -0.26166534423828125, -0.24803543090820312, -0.234405517578125, -0.22077560424804688, -0.20714569091796875, -0.19351577758789062, -0.1798858642578125, -0.16625595092773438, -0.15262603759765625, -0.13899612426757812, -0.1253662109375, -0.11173629760742188, -0.09810638427734375, -0.08447647094726562, -0.0708465576171875, -0.057216644287109375, -0.04358673095703125, -0.029956817626953125, -0.016326904296875, -0.002696990966796875, 0.01093292236328125, 0.024562835693359375, 0.0381927490234375, 0.051822662353515625, 0.06545257568359375, 0.07908248901367188, 0.09271240234375, 0.10634231567382812, 0.11997222900390625, 0.13360214233398438, 0.1472320556640625, 0.16086196899414062, 0.17449188232421875, 0.18812179565429688, 0.201751708984375, 0.21538162231445312, 0.22901153564453125, 0.24264144897460938, 0.2562713623046875, 0.2699012756347656, 0.28353118896484375, 0.2971611022949219, 0.310791015625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 5.0, 16.0, 6.0, 20.0, 24.0, 52.0, 76.0, 152.0, 298.0, 652.0, 1517.0, 4253.0, 16111.0, 200558.0, 777018.0, 36786.0, 6938.0, 2305.0, 880.0, 400.0, 196.0, 91.0, 75.0, 37.0, 21.0, 19.0, 13.0, 7.0, 4.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.44580078125, -0.4319610595703125, -0.418121337890625, -0.4042816162109375, -0.39044189453125, -0.3766021728515625, -0.362762451171875, -0.3489227294921875, -0.3350830078125, -0.3212432861328125, -0.307403564453125, -0.2935638427734375, -0.27972412109375, -0.2658843994140625, -0.252044677734375, -0.2382049560546875, -0.224365234375, -0.2105255126953125, -0.196685791015625, -0.1828460693359375, -0.16900634765625, -0.1551666259765625, -0.141326904296875, -0.1274871826171875, -0.1136474609375, -0.0998077392578125, -0.085968017578125, -0.0721282958984375, -0.05828857421875, -0.0444488525390625, -0.030609130859375, -0.0167694091796875, -0.0029296875, 0.0109100341796875, 0.024749755859375, 0.0385894775390625, 0.05242919921875, 0.0662689208984375, 0.080108642578125, 0.0939483642578125, 0.1077880859375, 0.1216278076171875, 0.135467529296875, 0.1493072509765625, 0.16314697265625, 0.1769866943359375, 0.190826416015625, 0.2046661376953125, 0.218505859375, 0.2323455810546875, 0.246185302734375, 0.2600250244140625, 0.27386474609375, 0.2877044677734375, 0.301544189453125, 0.3153839111328125, 0.3292236328125, 0.3430633544921875, 0.356903076171875, 0.3707427978515625, 0.38458251953125, 0.3984222412109375, 0.412261962890625, 0.4261016845703125, 0.43994140625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 10.0, 6.0, 5.0, 6.0, 8.0, 20.0, 27.0, 53.0, 68.0, 119.0, 224.0, 163.0, 109.0, 52.0, 35.0, 19.0, 12.0, 13.0, 7.0, 8.0, 7.0, 5.0, 5.0, 5.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.979703903198242e-05, -6.760004907846451e-05, -6.54030591249466e-05, -6.320606917142868e-05, -6.1009079217910767e-05, -5.881208926439285e-05, -5.661509931087494e-05, -5.4418109357357025e-05, -5.222111940383911e-05, -5.00241294503212e-05, -4.7827139496803284e-05, -4.563014954328537e-05, -4.3433159589767456e-05, -4.123616963624954e-05, -3.903917968273163e-05, -3.6842189729213715e-05, -3.46451997756958e-05, -3.244820982217789e-05, -3.0251219868659973e-05, -2.805422991514206e-05, -2.5857239961624146e-05, -2.366025000810623e-05, -2.1463260054588318e-05, -1.9266270101070404e-05, -1.706928014755249e-05, -1.4872290194034576e-05, -1.2675300240516663e-05, -1.0478310286998749e-05, -8.281320333480835e-06, -6.084330379962921e-06, -3.887340426445007e-06, -1.6903504729270935e-06, 5.066394805908203e-07, 2.703629434108734e-06, 4.900619387626648e-06, 7.097609341144562e-06, 9.294599294662476e-06, 1.149158924818039e-05, 1.3688579201698303e-05, 1.5885569155216217e-05, 1.808255910873413e-05, 2.0279549062252045e-05, 2.247653901576996e-05, 2.4673528969287872e-05, 2.6870518922805786e-05, 2.90675088763237e-05, 3.1264498829841614e-05, 3.346148878335953e-05, 3.565847873687744e-05, 3.7855468690395355e-05, 4.005245864391327e-05, 4.224944859743118e-05, 4.44464385509491e-05, 4.664342850446701e-05, 4.8840418457984924e-05, 5.103740841150284e-05, 5.323439836502075e-05, 5.5431388318538666e-05, 5.762837827205658e-05, 5.9825368225574493e-05, 6.202235817909241e-05, 6.421934813261032e-05, 6.641633808612823e-05, 6.861332803964615e-05, 7.081031799316406e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 5.0, 6.0, 11.0, 22.0, 30.0, 62.0, 89.0, 174.0, 298.0, 602.0, 1322.0, 3023.0, 8837.0, 40019.0, 549565.0, 398511.0, 33020.0, 7851.0, 2688.0, 1192.0, 548.0, 301.0, 158.0, 85.0, 45.0, 28.0, 16.0, 11.0, 6.0, 3.0, 5.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33447265625, -0.3229179382324219, -0.31136322021484375, -0.2998085021972656, -0.2882537841796875, -0.2766990661621094, -0.26514434814453125, -0.2535896301269531, -0.242034912109375, -0.23048019409179688, -0.21892547607421875, -0.20737075805664062, -0.1958160400390625, -0.18426132202148438, -0.17270660400390625, -0.16115188598632812, -0.14959716796875, -0.13804244995117188, -0.12648773193359375, -0.11493301391601562, -0.1033782958984375, -0.09182357788085938, -0.08026885986328125, -0.06871414184570312, -0.057159423828125, -0.045604705810546875, -0.03404998779296875, -0.022495269775390625, -0.0109405517578125, 0.000614166259765625, 0.01216888427734375, 0.023723602294921875, 0.0352783203125, 0.046833038330078125, 0.05838775634765625, 0.06994247436523438, 0.0814971923828125, 0.09305191040039062, 0.10460662841796875, 0.11616134643554688, 0.127716064453125, 0.13927078247070312, 0.15082550048828125, 0.16238021850585938, 0.1739349365234375, 0.18548965454101562, 0.19704437255859375, 0.20859909057617188, 0.22015380859375, 0.23170852661132812, 0.24326324462890625, 0.2548179626464844, 0.2663726806640625, 0.2779273986816406, 0.28948211669921875, 0.3010368347167969, 0.312591552734375, 0.3241462707519531, 0.33570098876953125, 0.3472557067871094, 0.3588104248046875, 0.3703651428222656, 0.38191986083984375, 0.3934745788574219, 0.405029296875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 8.0, 10.0, 11.0, 13.0, 8.0, 16.0, 18.0, 33.0, 23.0, 38.0, 45.0, 48.0, 70.0, 65.0, 69.0, 74.0, 65.0, 54.0, 61.0, 40.0, 37.0, 28.0, 29.0, 34.0, 22.0, 16.0, 8.0, 12.0, 4.0, 7.0, 0.0, 9.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.11669921875, -0.11297798156738281, -0.10925674438476562, -0.10553550720214844, -0.10181427001953125, -0.09809303283691406, -0.09437179565429688, -0.09065055847167969, -0.0869293212890625, -0.08320808410644531, -0.07948684692382812, -0.07576560974121094, -0.07204437255859375, -0.06832313537597656, -0.06460189819335938, -0.06088066101074219, -0.057159423828125, -0.05343818664550781, -0.049716949462890625, -0.04599571228027344, -0.04227447509765625, -0.03855323791503906, -0.034832000732421875, -0.031110763549804688, -0.0273895263671875, -0.023668289184570312, -0.019947052001953125, -0.016225814819335938, -0.01250457763671875, -0.008783340454101562, -0.005062103271484375, -0.0013408660888671875, 0.00238037109375, 0.0061016082763671875, 0.009822845458984375, 0.013544082641601562, 0.01726531982421875, 0.020986557006835938, 0.024707794189453125, 0.028429031372070312, 0.0321502685546875, 0.03587150573730469, 0.039592742919921875, 0.04331398010253906, 0.04703521728515625, 0.05075645446777344, 0.054477691650390625, 0.05819892883300781, 0.061920166015625, 0.06564140319824219, 0.06936264038085938, 0.07308387756347656, 0.07680511474609375, 0.08052635192871094, 0.08424758911132812, 0.08796882629394531, 0.0916900634765625, 0.09541130065917969, 0.09913253784179688, 0.10285377502441406, 0.10657501220703125, 0.11029624938964844, 0.11401748657226562, 0.11773872375488281, 0.1214599609375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 10.0, 35.0, 120.0, 410.0, 301.0, 97.0, 23.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-10.70315933227539, -10.504842758178711, -10.306526184082031, -10.108210563659668, -9.909893989562988, -9.711577415466309, -9.513260841369629, -9.31494426727295, -9.116628646850586, -8.918312072753906, -8.719995498657227, -8.521679878234863, -8.323363304138184, -8.125046730041504, -7.926730155944824, -7.728414058685303, -7.530097007751465, -7.331780433654785, -7.133464336395264, -6.935147762298584, -6.7368316650390625, -6.538515090942383, -6.340198516845703, -6.141882419586182, -5.94356632232666, -5.7452497482299805, -5.546933650970459, -5.348617076873779, -5.150300979614258, -4.951984405517578, -4.753667831420898, -4.555351734161377, -4.357034683227539, -4.158718109130859, -3.960402011871338, -3.762085437774658, -3.5637691020965576, -3.365452766418457, -3.1671364307403564, -2.968820095062256, -2.7705037593841553, -2.5721874237060547, -2.373871088027954, -2.1755547523498535, -1.9772381782531738, -1.7789218425750732, -1.5806055068969727, -1.3822890520095825, -1.183972716331482, -0.9856563210487366, -0.7873399257659912, -0.5890235900878906, -0.39070719480514526, -0.1923907995223999, 0.005925536155700684, 0.20424199104309082, 0.4025583267211914, 0.6008747220039368, 0.7991911172866821, 0.9975074529647827, 1.1958239078521729, 1.3941402435302734, 1.592456579208374, 1.7907730340957642, 1.9890893697738647]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 9.0, 9.0, 12.0, 19.0, 17.0, 46.0, 42.0, 46.0, 69.0, 60.0, 77.0, 57.0, 65.0, 71.0, 66.0, 59.0, 55.0, 47.0, 42.0, 34.0, 25.0, 21.0, 17.0, 15.0, 4.0, 6.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9832431077957153, -1.9075418710708618, -1.8318407535552979, -1.7561395168304443, -1.6804382801055908, -1.6047370433807373, -1.5290359258651733, -1.4533346891403198, -1.3776335716247559, -1.3019323348999023, -1.2262312173843384, -1.1505299806594849, -1.0748287439346313, -0.9991275668144226, -0.9234263896942139, -0.8477251529693604, -0.7720239162445068, -0.6963227391242981, -0.6206215023994446, -0.5449203252792358, -0.4692191183567047, -0.3935179114341736, -0.31781673431396484, -0.24211549758911133, -0.1664143204689026, -0.09071312099695206, -0.015011921525001526, 0.06068927049636841, 0.13639047741889954, 0.21209168434143066, 0.2877928614616394, 0.3634940981864929, 0.4391953945159912, 0.5148965716362, 0.5905978083610535, 0.6662989854812622, 0.7420002222061157, 0.8177013993263245, 0.8934025764465332, 0.9691038131713867, 1.0448050498962402, 1.1205062866210938, 1.1962074041366577, 1.2719086408615112, 1.3476098775863647, 1.4233109951019287, 1.4990122318267822, 1.5747134685516357, 1.6504145860671997, 1.7261158227920532, 1.8018169403076172, 1.8775181770324707, 1.9532194137573242, 2.0289206504821777, 2.1046218872070312, 2.1803231239318848, 2.256024122238159, 2.3317253589630127, 2.407426595687866, 2.4831275939941406, 2.558828830718994, 2.6345300674438477, 2.710231304168701, 2.7859325408935547, 2.861633777618408]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 5.0, 6.0, 14.0, 19.0, 10.0, 13.0, 29.0, 43.0, 50.0, 87.0, 159.0, 234.0, 569.0, 1412.0, 4421.0, 27290.0, 4066457.0, 81711.0, 7900.0, 2244.0, 828.0, 356.0, 181.0, 74.0, 59.0, 30.0, 27.0, 9.0, 10.0, 10.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.279296875, -2.221832275390625, -2.16436767578125, -2.106903076171875, -2.0494384765625, -1.991973876953125, -1.93450927734375, -1.877044677734375, -1.819580078125, -1.762115478515625, -1.70465087890625, -1.647186279296875, -1.5897216796875, -1.532257080078125, -1.47479248046875, -1.417327880859375, -1.35986328125, -1.302398681640625, -1.24493408203125, -1.187469482421875, -1.1300048828125, -1.072540283203125, -1.01507568359375, -0.957611083984375, -0.900146484375, -0.842681884765625, -0.78521728515625, -0.727752685546875, -0.6702880859375, -0.612823486328125, -0.55535888671875, -0.497894287109375, -0.4404296875, -0.382965087890625, -0.32550048828125, -0.268035888671875, -0.2105712890625, -0.153106689453125, -0.09564208984375, -0.038177490234375, 0.019287109375, 0.076751708984375, 0.13421630859375, 0.191680908203125, 0.2491455078125, 0.306610107421875, 0.36407470703125, 0.421539306640625, 0.47900390625, 0.536468505859375, 0.59393310546875, 0.651397705078125, 0.7088623046875, 0.766326904296875, 0.82379150390625, 0.881256103515625, 0.938720703125, 0.996185302734375, 1.05364990234375, 1.111114501953125, 1.1685791015625, 1.226043701171875, 1.28350830078125, 1.340972900390625, 1.3984375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 1.0, 10.0, 8.0, 10.0, 21.0, 35.0, 35.0, 60.0, 63.0, 69.0, 83.0, 107.0, 100.0, 90.0, 79.0, 64.0, 51.0, 40.0, 31.0, 18.0, 8.0, 10.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08355712890625, -0.08021259307861328, -0.07686805725097656, -0.07352352142333984, -0.07017898559570312, -0.0668344497680664, -0.06348991394042969, -0.06014537811279297, -0.05680084228515625, -0.05345630645751953, -0.05011177062988281, -0.046767234802246094, -0.043422698974609375, -0.040078163146972656, -0.03673362731933594, -0.03338909149169922, -0.0300445556640625, -0.02670001983642578, -0.023355484008789062, -0.020010948181152344, -0.016666412353515625, -0.013321876525878906, -0.009977340698242188, -0.006632804870605469, -0.00328826904296875, 5.626678466796875e-05, 0.0034008026123046875, 0.006745338439941406, 0.010089874267578125, 0.013434410095214844, 0.016778945922851562, 0.02012348175048828, 0.023468017578125, 0.02681255340576172, 0.030157089233398438, 0.033501625061035156, 0.036846160888671875, 0.040190696716308594, 0.04353523254394531, 0.04687976837158203, 0.05022430419921875, 0.05356884002685547, 0.05691337585449219, 0.060257911682128906, 0.06360244750976562, 0.06694698333740234, 0.07029151916503906, 0.07363605499267578, 0.0769805908203125, 0.08032512664794922, 0.08366966247558594, 0.08701419830322266, 0.09035873413085938, 0.0937032699584961, 0.09704780578613281, 0.10039234161376953, 0.10373687744140625, 0.10708141326904297, 0.11042594909667969, 0.1137704849243164, 0.11711502075195312, 0.12045955657958984, 0.12380409240722656, 0.12714862823486328, 0.1304931640625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 11.0, 28.0, 64.0, 202.0, 581.0, 2259.0, 4098789.0, 89888.0, 1739.0, 487.0, 153.0, 51.0, 15.0, 8.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.90625, -8.7122802734375, -8.518310546875, -8.3243408203125, -8.13037109375, -7.9364013671875, -7.742431640625, -7.5484619140625, -7.3544921875, -7.1605224609375, -6.966552734375, -6.7725830078125, -6.57861328125, -6.3846435546875, -6.190673828125, -5.9967041015625, -5.802734375, -5.6087646484375, -5.414794921875, -5.2208251953125, -5.02685546875, -4.8328857421875, -4.638916015625, -4.4449462890625, -4.2509765625, -4.0570068359375, -3.863037109375, -3.6690673828125, -3.47509765625, -3.2811279296875, -3.087158203125, -2.8931884765625, -2.69921875, -2.5052490234375, -2.311279296875, -2.1173095703125, -1.92333984375, -1.7293701171875, -1.535400390625, -1.3414306640625, -1.1474609375, -0.9534912109375, -0.759521484375, -0.5655517578125, -0.37158203125, -0.1776123046875, 0.016357421875, 0.2103271484375, 0.404296875, 0.5982666015625, 0.792236328125, 0.9862060546875, 1.18017578125, 1.3741455078125, 1.568115234375, 1.7620849609375, 1.9560546875, 2.1500244140625, 2.343994140625, 2.5379638671875, 2.73193359375, 2.9259033203125, 3.119873046875, 3.3138427734375, 3.5078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 51.0, 421.0, 3474.0, 98.0, 18.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.404296875, -1.3745613098144531, -1.3448257446289062, -1.3150901794433594, -1.2853546142578125, -1.2556190490722656, -1.2258834838867188, -1.1961479187011719, -1.166412353515625, -1.1366767883300781, -1.1069412231445312, -1.0772056579589844, -1.0474700927734375, -1.0177345275878906, -0.9879989624023438, -0.9582633972167969, -0.92852783203125, -0.8987922668457031, -0.8690567016601562, -0.8393211364746094, -0.8095855712890625, -0.7798500061035156, -0.7501144409179688, -0.7203788757324219, -0.690643310546875, -0.6609077453613281, -0.6311721801757812, -0.6014366149902344, -0.5717010498046875, -0.5419654846191406, -0.5122299194335938, -0.4824943542480469, -0.4527587890625, -0.4230232238769531, -0.39328765869140625, -0.3635520935058594, -0.3338165283203125, -0.3040809631347656, -0.27434539794921875, -0.24460983276367188, -0.214874267578125, -0.18513870239257812, -0.15540313720703125, -0.12566757202148438, -0.0959320068359375, -0.06619644165039062, -0.03646087646484375, -0.006725311279296875, 0.02301025390625, 0.052745819091796875, 0.08248138427734375, 0.11221694946289062, 0.1419525146484375, 0.17168807983398438, 0.20142364501953125, 0.23115921020507812, 0.260894775390625, 0.2906303405761719, 0.32036590576171875, 0.3501014709472656, 0.3798370361328125, 0.4095726013183594, 0.43930816650390625, 0.4690437316894531, 0.498779296875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 149.0, 837.0, 19.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.259843826293945, -10.728723526000977, -10.197602272033691, -9.666481018066406, -9.135360717773438, -8.604240417480469, -8.073119163513184, -7.541998386383057, -7.01087760925293, -6.479756832122803, -5.948636054992676, -5.417515277862549, -4.886394500732422, -4.355273723602295, -3.824152946472168, -3.293032169342041, -2.761911392211914, -2.230790615081787, -1.6996698379516602, -1.1685490608215332, -0.6374282836914062, -0.1063075065612793, 0.42481327056884766, 0.9559340476989746, 1.4870548248291016, 2.0181756019592285, 2.5492963790893555, 3.0804171562194824, 3.6115379333496094, 4.142658710479736, 4.673779487609863, 5.20490026473999, 5.73602294921875, 6.267143726348877, 6.798264503479004, 7.329385280609131, 7.860506057739258, 8.391626358032227, 8.922747611999512, 9.453868865966797, 9.984989166259766, 10.516109466552734, 11.04723072052002, 11.578351974487305, 12.109472274780273, 12.640592575073242, 13.171713829040527, 13.702835083007812, 14.233955383300781, 14.76507568359375, 15.296196937561035, 15.82731819152832, 16.35843849182129, 16.889558792114258, 17.42068099975586, 17.951801300048828, 18.482921600341797, 19.014041900634766, 19.545162200927734, 20.076284408569336, 20.607404708862305, 21.138525009155273, 21.669647216796875, 22.200767517089844, 22.731887817382812]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 14.0, 19.0, 41.0, 85.0, 114.0, 166.0, 170.0, 151.0, 112.0, 59.0, 38.0, 17.0, 11.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1737537384033203, -2.0916032791137695, -2.0094528198242188, -1.927302360534668, -1.8451519012451172, -1.7630014419555664, -1.6808509826660156, -1.5987005233764648, -1.516550064086914, -1.4343996047973633, -1.3522491455078125, -1.2700986862182617, -1.187948226928711, -1.1057977676391602, -1.0236473083496094, -0.9414967894554138, -0.8593462705612183, -0.7771958112716675, -0.6950453519821167, -0.6128948926925659, -0.5307444334030151, -0.44859394431114197, -0.3664434552192688, -0.284292995929718, -0.20214253664016724, -0.11999206990003586, -0.03784160315990448, 0.044308871030807495, 0.12645933032035828, 0.20860978960990906, 0.2907602787017822, 0.372910737991333, 0.4550611972808838, 0.5372116565704346, 0.6193621158599854, 0.7015125751495361, 0.7836630344390869, 0.8658134937286377, 0.9479640126228333, 1.0301144123077393, 1.11226487159729, 1.1944153308868408, 1.2765657901763916, 1.3587162494659424, 1.4408667087554932, 1.523017168045044, 1.6051676273345947, 1.6873180866241455, 1.7694686651229858, 1.8516191244125366, 1.9337695837020874, 2.0159201622009277, 2.0980706214904785, 2.1802210807800293, 2.26237154006958, 2.344521999359131, 2.4266724586486816, 2.5088229179382324, 2.590973377227783, 2.673123836517334, 2.7552742958068848, 2.8374247550964355, 2.9195752143859863, 3.001725673675537, 3.083876132965088]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 9.0, 6.0, 12.0, 11.0, 21.0, 33.0, 41.0, 75.0, 123.0, 178.0, 329.0, 670.0, 1606.0, 4312.0, 19014.0, 180778.0, 744886.0, 79471.0, 11341.0, 3113.0, 1225.0, 571.0, 307.0, 158.0, 90.0, 66.0, 38.0, 20.0, 18.0, 8.0, 11.0, 5.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.90283203125, -0.87799072265625, -0.8531494140625, -0.82830810546875, -0.803466796875, -0.77862548828125, -0.7537841796875, -0.72894287109375, -0.7041015625, -0.67926025390625, -0.6544189453125, -0.62957763671875, -0.604736328125, -0.57989501953125, -0.5550537109375, -0.53021240234375, -0.50537109375, -0.48052978515625, -0.4556884765625, -0.43084716796875, -0.406005859375, -0.38116455078125, -0.3563232421875, -0.33148193359375, -0.306640625, -0.28179931640625, -0.2569580078125, -0.23211669921875, -0.207275390625, -0.18243408203125, -0.1575927734375, -0.13275146484375, -0.10791015625, -0.08306884765625, -0.0582275390625, -0.03338623046875, -0.008544921875, 0.01629638671875, 0.0411376953125, 0.06597900390625, 0.0908203125, 0.11566162109375, 0.1405029296875, 0.16534423828125, 0.190185546875, 0.21502685546875, 0.2398681640625, 0.26470947265625, 0.28955078125, 0.31439208984375, 0.3392333984375, 0.36407470703125, 0.388916015625, 0.41375732421875, 0.4385986328125, 0.46343994140625, 0.48828125, 0.51312255859375, 0.5379638671875, 0.56280517578125, 0.587646484375, 0.61248779296875, 0.6373291015625, 0.66217041015625, 0.68701171875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 7.0, 15.0, 15.0, 27.0, 19.0, 33.0, 44.0, 62.0, 56.0, 59.0, 61.0, 64.0, 77.0, 93.0, 70.0, 64.0, 45.0, 47.0, 31.0, 23.0, 31.0, 19.0, 13.0, 5.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08294677734375, -0.08010578155517578, -0.07726478576660156, -0.07442378997802734, -0.07158279418945312, -0.0687417984008789, -0.06590080261230469, -0.06305980682373047, -0.06021881103515625, -0.05737781524658203, -0.05453681945800781, -0.051695823669433594, -0.048854827880859375, -0.046013832092285156, -0.04317283630371094, -0.04033184051513672, -0.0374908447265625, -0.03464984893798828, -0.03180885314941406, -0.028967857360839844, -0.026126861572265625, -0.023285865783691406, -0.020444869995117188, -0.01760387420654297, -0.01476287841796875, -0.011921882629394531, -0.009080886840820312, -0.006239891052246094, -0.003398895263671875, -0.0005578994750976562, 0.0022830963134765625, 0.005124092102050781, 0.007965087890625, 0.010806083679199219, 0.013647079467773438, 0.016488075256347656, 0.019329071044921875, 0.022170066833496094, 0.025011062622070312, 0.02785205841064453, 0.03069305419921875, 0.03353404998779297, 0.03637504577636719, 0.039216041564941406, 0.042057037353515625, 0.044898033142089844, 0.04773902893066406, 0.05058002471923828, 0.0534210205078125, 0.05626201629638672, 0.05910301208496094, 0.061944007873535156, 0.06478500366210938, 0.0676259994506836, 0.07046699523925781, 0.07330799102783203, 0.07614898681640625, 0.07898998260498047, 0.08183097839355469, 0.0846719741821289, 0.08751296997070312, 0.09035396575927734, 0.09319496154785156, 0.09603595733642578, 0.098876953125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 13.0, 8.0, 16.0, 28.0, 28.0, 40.0, 75.0, 88.0, 172.0, 293.0, 536.0, 1112.0, 2982.0, 10614.0, 63208.0, 585161.0, 337194.0, 35841.0, 6924.0, 2162.0, 905.0, 497.0, 223.0, 144.0, 89.0, 58.0, 43.0, 29.0, 14.0, 13.0, 11.0, 7.0, 3.0, 4.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.398193359375, -0.3815040588378906, -0.36481475830078125, -0.3481254577636719, -0.3314361572265625, -0.3147468566894531, -0.29805755615234375, -0.2813682556152344, -0.264678955078125, -0.24798965454101562, -0.23130035400390625, -0.21461105346679688, -0.1979217529296875, -0.18123245239257812, -0.16454315185546875, -0.14785385131835938, -0.13116455078125, -0.11447525024414062, -0.09778594970703125, -0.08109664916992188, -0.0644073486328125, -0.047718048095703125, -0.03102874755859375, -0.014339447021484375, 0.002349853515625, 0.019039154052734375, 0.03572845458984375, 0.052417755126953125, 0.0691070556640625, 0.08579635620117188, 0.10248565673828125, 0.11917495727539062, 0.1358642578125, 0.15255355834960938, 0.16924285888671875, 0.18593215942382812, 0.2026214599609375, 0.21931076049804688, 0.23600006103515625, 0.2526893615722656, 0.269378662109375, 0.2860679626464844, 0.30275726318359375, 0.3194465637207031, 0.3361358642578125, 0.3528251647949219, 0.36951446533203125, 0.3862037658691406, 0.40289306640625, 0.4195823669433594, 0.43627166748046875, 0.4529609680175781, 0.4696502685546875, 0.4863395690917969, 0.5030288696289062, 0.5197181701660156, 0.536407470703125, 0.5530967712402344, 0.5697860717773438, 0.5864753723144531, 0.6031646728515625, 0.6198539733886719, 0.6365432739257812, 0.6532325744628906, 0.669921875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 2.0, 5.0, 1.0, 5.0, 8.0, 12.0, 9.0, 12.0, 21.0, 13.0, 19.0, 24.0, 34.0, 41.0, 41.0, 45.0, 53.0, 51.0, 61.0, 55.0, 46.0, 64.0, 39.0, 43.0, 39.0, 36.0, 40.0, 41.0, 25.0, 20.0, 24.0, 18.0, 19.0, 7.0, 10.0, 13.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2274169921875, -0.21751976013183594, -0.20762252807617188, -0.1977252960205078, -0.18782806396484375, -0.1779308319091797, -0.16803359985351562, -0.15813636779785156, -0.1482391357421875, -0.13834190368652344, -0.12844467163085938, -0.11854743957519531, -0.10865020751953125, -0.09875297546386719, -0.08885574340820312, -0.07895851135253906, -0.069061279296875, -0.05916404724121094, -0.049266815185546875, -0.03936958312988281, -0.02947235107421875, -0.019575119018554688, -0.009677886962890625, 0.0002193450927734375, 0.0101165771484375, 0.020013809204101562, 0.029911041259765625, 0.03980827331542969, 0.04970550537109375, 0.05960273742675781, 0.06949996948242188, 0.07939720153808594, 0.08929443359375, 0.09919166564941406, 0.10908889770507812, 0.11898612976074219, 0.12888336181640625, 0.1387805938720703, 0.14867782592773438, 0.15857505798339844, 0.1684722900390625, 0.17836952209472656, 0.18826675415039062, 0.1981639862060547, 0.20806121826171875, 0.2179584503173828, 0.22785568237304688, 0.23775291442871094, 0.247650146484375, 0.25754737854003906, 0.2674446105957031, 0.2773418426513672, 0.28723907470703125, 0.2971363067626953, 0.3070335388183594, 0.31693077087402344, 0.3268280029296875, 0.33672523498535156, 0.3466224670410156, 0.3565196990966797, 0.36641693115234375, 0.3763141632080078, 0.3862113952636719, 0.39610862731933594, 0.406005859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 4.0, 5.0, 7.0, 11.0, 19.0, 22.0, 33.0, 56.0, 116.0, 199.0, 485.0, 1235.0, 3776.0, 16793.0, 220592.0, 759400.0, 36372.0, 6171.0, 1878.0, 693.0, 286.0, 153.0, 82.0, 67.0, 24.0, 13.0, 16.0, 13.0, 7.0, 4.0, 2.0, 4.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3544921875, -0.3419189453125, -0.329345703125, -0.3167724609375, -0.30419921875, -0.2916259765625, -0.279052734375, -0.2664794921875, -0.25390625, -0.2413330078125, -0.228759765625, -0.2161865234375, -0.20361328125, -0.1910400390625, -0.178466796875, -0.1658935546875, -0.1533203125, -0.1407470703125, -0.128173828125, -0.1156005859375, -0.10302734375, -0.0904541015625, -0.077880859375, -0.0653076171875, -0.052734375, -0.0401611328125, -0.027587890625, -0.0150146484375, -0.00244140625, 0.0101318359375, 0.022705078125, 0.0352783203125, 0.0478515625, 0.0604248046875, 0.072998046875, 0.0855712890625, 0.09814453125, 0.1107177734375, 0.123291015625, 0.1358642578125, 0.1484375, 0.1610107421875, 0.173583984375, 0.1861572265625, 0.19873046875, 0.2113037109375, 0.223876953125, 0.2364501953125, 0.2490234375, 0.2615966796875, 0.274169921875, 0.2867431640625, 0.29931640625, 0.3118896484375, 0.324462890625, 0.3370361328125, 0.349609375, 0.3621826171875, 0.374755859375, 0.3873291015625, 0.39990234375, 0.4124755859375, 0.425048828125, 0.4376220703125, 0.4501953125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 5.0, 5.0, 5.0, 11.0, 8.0, 17.0, 25.0, 30.0, 39.0, 58.0, 79.0, 102.0, 126.0, 133.0, 91.0, 63.0, 64.0, 34.0, 23.0, 17.0, 10.0, 9.0, 10.0, 9.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.4286251068115234e-05, -4.311557859182358e-05, -4.194490611553192e-05, -4.0774233639240265e-05, -3.960356116294861e-05, -3.843288868665695e-05, -3.7262216210365295e-05, -3.609154373407364e-05, -3.492087125778198e-05, -3.3750198781490326e-05, -3.257952630519867e-05, -3.140885382890701e-05, -3.0238181352615356e-05, -2.90675088763237e-05, -2.7896836400032043e-05, -2.6726163923740387e-05, -2.555549144744873e-05, -2.4384818971157074e-05, -2.3214146494865417e-05, -2.204347401857376e-05, -2.0872801542282104e-05, -1.9702129065990448e-05, -1.853145658969879e-05, -1.7360784113407135e-05, -1.619011163711548e-05, -1.5019439160823822e-05, -1.3848766684532166e-05, -1.2678094208240509e-05, -1.1507421731948853e-05, -1.0336749255657196e-05, -9.16607677936554e-06, -7.995404303073883e-06, -6.8247318267822266e-06, -5.65405935049057e-06, -4.4833868741989136e-06, -3.312714397907257e-06, -2.1420419216156006e-06, -9.71369445323944e-07, 1.993030309677124e-07, 1.369975507259369e-06, 2.5406479835510254e-06, 3.711320459842682e-06, 4.881992936134338e-06, 6.052665412425995e-06, 7.223337888717651e-06, 8.394010365009308e-06, 9.564682841300964e-06, 1.0735355317592621e-05, 1.1906027793884277e-05, 1.3076700270175934e-05, 1.424737274646759e-05, 1.5418045222759247e-05, 1.6588717699050903e-05, 1.775939017534256e-05, 1.8930062651634216e-05, 2.0100735127925873e-05, 2.127140760421753e-05, 2.2442080080509186e-05, 2.3612752556800842e-05, 2.47834250330925e-05, 2.5954097509384155e-05, 2.7124769985675812e-05, 2.8295442461967468e-05, 2.9466114938259125e-05, 3.063678741455078e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 9.0, 7.0, 11.0, 13.0, 23.0, 26.0, 45.0, 73.0, 120.0, 227.0, 440.0, 976.0, 2706.0, 10761.0, 121170.0, 865714.0, 37037.0, 5914.0, 1756.0, 701.0, 349.0, 172.0, 114.0, 76.0, 40.0, 19.0, 19.0, 12.0, 8.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4287109375, -0.41241455078125, -0.3961181640625, -0.37982177734375, -0.363525390625, -0.34722900390625, -0.3309326171875, -0.31463623046875, -0.29833984375, -0.28204345703125, -0.2657470703125, -0.24945068359375, -0.233154296875, -0.21685791015625, -0.2005615234375, -0.18426513671875, -0.16796875, -0.15167236328125, -0.1353759765625, -0.11907958984375, -0.102783203125, -0.08648681640625, -0.0701904296875, -0.05389404296875, -0.03759765625, -0.02130126953125, -0.0050048828125, 0.01129150390625, 0.027587890625, 0.04388427734375, 0.0601806640625, 0.07647705078125, 0.0927734375, 0.10906982421875, 0.1253662109375, 0.14166259765625, 0.157958984375, 0.17425537109375, 0.1905517578125, 0.20684814453125, 0.22314453125, 0.23944091796875, 0.2557373046875, 0.27203369140625, 0.288330078125, 0.30462646484375, 0.3209228515625, 0.33721923828125, 0.353515625, 0.36981201171875, 0.3861083984375, 0.40240478515625, 0.418701171875, 0.43499755859375, 0.4512939453125, 0.46759033203125, 0.48388671875, 0.50018310546875, 0.5164794921875, 0.53277587890625, 0.549072265625, 0.56536865234375, 0.5816650390625, 0.59796142578125, 0.6142578125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 13.0, 13.0, 8.0, 19.0, 34.0, 38.0, 72.0, 88.0, 123.0, 134.0, 120.0, 94.0, 70.0, 68.0, 26.0, 16.0, 19.0, 6.0, 6.0, 11.0, 5.0, 1.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.150634765625, -0.14421463012695312, -0.13779449462890625, -0.13137435913085938, -0.1249542236328125, -0.11853408813476562, -0.11211395263671875, -0.10569381713867188, -0.099273681640625, -0.09285354614257812, -0.08643341064453125, -0.08001327514648438, -0.0735931396484375, -0.06717300415039062, -0.06075286865234375, -0.054332733154296875, -0.04791259765625, -0.041492462158203125, -0.03507232666015625, -0.028652191162109375, -0.0222320556640625, -0.015811920166015625, -0.00939178466796875, -0.002971649169921875, 0.003448486328125, 0.009868621826171875, 0.01628875732421875, 0.022708892822265625, 0.0291290283203125, 0.035549163818359375, 0.04196929931640625, 0.048389434814453125, 0.0548095703125, 0.061229705810546875, 0.06764984130859375, 0.07406997680664062, 0.0804901123046875, 0.08691024780273438, 0.09333038330078125, 0.09975051879882812, 0.106170654296875, 0.11259078979492188, 0.11901092529296875, 0.12543106079101562, 0.1318511962890625, 0.13827133178710938, 0.14469146728515625, 0.15111160278320312, 0.15753173828125, 0.16395187377929688, 0.17037200927734375, 0.17679214477539062, 0.1832122802734375, 0.18963241577148438, 0.19605255126953125, 0.20247268676757812, 0.208892822265625, 0.21531295776367188, 0.22173309326171875, 0.22815322875976562, 0.2345733642578125, 0.24099349975585938, 0.24741363525390625, 0.2538337707519531, 0.26025390625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 5.0, 15.0, 18.0, 32.0, 83.0, 161.0, 192.0, 197.0, 138.0, 76.0, 38.0, 18.0, 13.0, 10.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.616629123687744, -3.518491506576538, -3.420354127883911, -3.322216510772705, -3.224079132080078, -3.125941514968872, -3.027804136276245, -2.929666519165039, -2.831529140472412, -2.733391523361206, -2.635254144668579, -2.537116527557373, -2.438979148864746, -2.34084153175354, -2.242704153060913, -2.144566535949707, -2.04642915725708, -1.9482916593551636, -1.850154161453247, -1.7520166635513306, -1.653879165649414, -1.5557416677474976, -1.457604169845581, -1.359466552734375, -1.261328935623169, -1.1631914377212524, -1.065053939819336, -0.9669164419174194, -0.8687789440155029, -0.7706414461135864, -0.6725038886070251, -0.5743663907051086, -0.4762289524078369, -0.3780914545059204, -0.2799539566040039, -0.18181642889976501, -0.08367893099784851, 0.014458566904067993, 0.11259609460830688, 0.2107335925102234, 0.3088710904121399, 0.4070085883140564, 0.5051460862159729, 0.6032836437225342, 0.7014211416244507, 0.7995586395263672, 0.8976961374282837, 0.9958336353302002, 1.0939711332321167, 1.1921086311340332, 1.2902461290359497, 1.3883836269378662, 1.4865211248397827, 1.5846586227416992, 1.6827962398529053, 1.7809336185455322, 1.8790712356567383, 1.9772087335586548, 2.0753462314605713, 2.1734838485717773, 2.2716212272644043, 2.3697588443756104, 2.4678962230682373, 2.5660338401794434, 2.6641712188720703]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 9.0, 4.0, 5.0, 8.0, 7.0, 13.0, 10.0, 22.0, 17.0, 15.0, 25.0, 30.0, 47.0, 28.0, 38.0, 49.0, 47.0, 54.0, 43.0, 48.0, 55.0, 42.0, 43.0, 46.0, 38.0, 44.0, 35.0, 27.0, 25.0, 28.0, 20.0, 16.0, 9.0, 12.0, 12.0, 5.0, 11.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0], "bins": [-1.9739840030670166, -1.9223936796188354, -1.8708032369613647, -1.8192129135131836, -1.767622470855713, -1.7160321474075317, -1.664441704750061, -1.6128513813018799, -1.5612609386444092, -1.509670615196228, -1.4580801725387573, -1.4064898490905762, -1.3548994064331055, -1.3033090829849243, -1.2517186403274536, -1.2001283168792725, -1.1485378742218018, -1.0969475507736206, -1.04535710811615, -0.993766725063324, -0.942176342010498, -0.8905860185623169, -0.8389955759048462, -0.787405252456665, -0.7358149290084839, -0.684224545955658, -0.632634162902832, -0.5810437798500061, -0.5294533967971802, -0.47786304354667664, -0.4262726604938507, -0.3746822774410248, -0.32309186458587646, -0.27150148153305054, -0.2199110984802246, -0.16832073032855988, -0.11673034727573395, -0.06513997912406921, -0.013549596071243286, 0.03804078698158264, 0.08963117003440857, 0.1412215530872345, 0.19281193614006042, 0.24440230429172516, 0.2959926724433899, 0.3475830554962158, 0.39917343854904175, 0.4507638216018677, 0.5023542046546936, 0.5539445877075195, 0.6055349707603455, 0.6571253538131714, 0.7087157368659973, 0.7603061199188232, 0.8118964433670044, 0.8634868860244751, 0.9150772094726562, 0.9666675925254822, 1.018257975578308, 1.0698482990264893, 1.12143874168396, 1.1730290651321411, 1.2246195077896118, 1.276209831237793, 1.3278002738952637]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 5.0, 4.0, 3.0, 10.0, 5.0, 12.0, 18.0, 30.0, 34.0, 49.0, 57.0, 68.0, 115.0, 192.0, 324.0, 582.0, 1234.0, 2980.0, 10494.0, 59118.0, 3926299.0, 164523.0, 19108.0, 5294.0, 1919.0, 847.0, 417.0, 211.0, 120.0, 76.0, 45.0, 39.0, 15.0, 14.0, 9.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.7197265625, -1.6794281005859375, -1.639129638671875, -1.5988311767578125, -1.55853271484375, -1.5182342529296875, -1.477935791015625, -1.4376373291015625, -1.3973388671875, -1.3570404052734375, -1.316741943359375, -1.2764434814453125, -1.23614501953125, -1.1958465576171875, -1.155548095703125, -1.1152496337890625, -1.074951171875, -1.0346527099609375, -0.994354248046875, -0.9540557861328125, -0.91375732421875, -0.8734588623046875, -0.833160400390625, -0.7928619384765625, -0.7525634765625, -0.7122650146484375, -0.671966552734375, -0.6316680908203125, -0.59136962890625, -0.5510711669921875, -0.510772705078125, -0.4704742431640625, -0.43017578125, -0.3898773193359375, -0.349578857421875, -0.3092803955078125, -0.26898193359375, -0.2286834716796875, -0.188385009765625, -0.1480865478515625, -0.1077880859375, -0.0674896240234375, -0.027191162109375, 0.0131072998046875, 0.05340576171875, 0.0937042236328125, 0.134002685546875, 0.1743011474609375, 0.214599609375, 0.2548980712890625, 0.295196533203125, 0.3354949951171875, 0.37579345703125, 0.4160919189453125, 0.456390380859375, 0.4966888427734375, 0.5369873046875, 0.5772857666015625, 0.617584228515625, 0.6578826904296875, 0.69818115234375, 0.7384796142578125, 0.778778076171875, 0.8190765380859375, 0.859375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 15.0, 6.0, 6.0, 22.0, 23.0, 17.0, 37.0, 41.0, 35.0, 42.0, 45.0, 55.0, 45.0, 59.0, 85.0, 67.0, 66.0, 57.0, 61.0, 44.0, 41.0, 28.0, 33.0, 14.0, 16.0, 10.0, 7.0, 10.0, 10.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0675048828125, -0.06503582000732422, -0.06256675720214844, -0.060097694396972656, -0.057628631591796875, -0.055159568786621094, -0.05269050598144531, -0.05022144317626953, -0.04775238037109375, -0.04528331756591797, -0.04281425476074219, -0.040345191955566406, -0.037876129150390625, -0.035407066345214844, -0.03293800354003906, -0.03046894073486328, -0.0279998779296875, -0.02553081512451172, -0.023061752319335938, -0.020592689514160156, -0.018123626708984375, -0.015654563903808594, -0.013185501098632812, -0.010716438293457031, -0.00824737548828125, -0.005778312683105469, -0.0033092498779296875, -0.0008401870727539062, 0.001628875732421875, 0.004097938537597656, 0.0065670013427734375, 0.009036064147949219, 0.011505126953125, 0.013974189758300781, 0.016443252563476562, 0.018912315368652344, 0.021381378173828125, 0.023850440979003906, 0.026319503784179688, 0.02878856658935547, 0.03125762939453125, 0.03372669219970703, 0.03619575500488281, 0.038664817810058594, 0.041133880615234375, 0.043602943420410156, 0.04607200622558594, 0.04854106903076172, 0.0510101318359375, 0.05347919464111328, 0.05594825744628906, 0.058417320251464844, 0.060886383056640625, 0.0633554458618164, 0.06582450866699219, 0.06829357147216797, 0.07076263427734375, 0.07323169708251953, 0.07570075988769531, 0.0781698226928711, 0.08063888549804688, 0.08310794830322266, 0.08557701110839844, 0.08804607391357422, 0.09051513671875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 13.0, 23.0, 20.0, 51.0, 101.0, 192.0, 763.0, 7729.0, 4177451.0, 6677.0, 744.0, 236.0, 113.0, 75.0, 39.0, 20.0, 15.0, 13.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.60546875, -3.37274169921875, -3.1400146484375, -2.90728759765625, -2.674560546875, -2.44183349609375, -2.2091064453125, -1.97637939453125, -1.74365234375, -1.51092529296875, -1.2781982421875, -1.04547119140625, -0.812744140625, -0.58001708984375, -0.3472900390625, -0.11456298828125, 0.1181640625, 0.35089111328125, 0.5836181640625, 0.81634521484375, 1.049072265625, 1.28179931640625, 1.5145263671875, 1.74725341796875, 1.97998046875, 2.21270751953125, 2.4454345703125, 2.67816162109375, 2.910888671875, 3.14361572265625, 3.3763427734375, 3.60906982421875, 3.841796875, 4.07452392578125, 4.3072509765625, 4.53997802734375, 4.772705078125, 5.00543212890625, 5.2381591796875, 5.47088623046875, 5.70361328125, 5.93634033203125, 6.1690673828125, 6.40179443359375, 6.634521484375, 6.86724853515625, 7.0999755859375, 7.33270263671875, 7.5654296875, 7.79815673828125, 8.0308837890625, 8.26361083984375, 8.496337890625, 8.72906494140625, 8.9617919921875, 9.19451904296875, 9.42724609375, 9.65997314453125, 9.8927001953125, 10.12542724609375, 10.358154296875, 10.59088134765625, 10.8236083984375, 11.05633544921875, 11.2890625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 6.0, 3.0, 9.0, 17.0, 40.0, 99.0, 925.0, 2762.0, 157.0, 40.0, 11.0, 8.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.391357421875, -0.3562049865722656, -0.32105255126953125, -0.2859001159667969, -0.2507476806640625, -0.21559524536132812, -0.18044281005859375, -0.14529037475585938, -0.110137939453125, -0.07498550415039062, -0.03983306884765625, -0.004680633544921875, 0.0304718017578125, 0.06562423706054688, 0.10077667236328125, 0.13592910766601562, 0.17108154296875, 0.20623397827148438, 0.24138641357421875, 0.2765388488769531, 0.3116912841796875, 0.3468437194824219, 0.38199615478515625, 0.4171485900878906, 0.452301025390625, 0.4874534606933594, 0.5226058959960938, 0.5577583312988281, 0.5929107666015625, 0.6280632019042969, 0.6632156372070312, 0.6983680725097656, 0.7335205078125, 0.7686729431152344, 0.8038253784179688, 0.8389778137207031, 0.8741302490234375, 0.9092826843261719, 0.9444351196289062, 0.9795875549316406, 1.014739990234375, 1.0498924255371094, 1.0850448608398438, 1.1201972961425781, 1.1553497314453125, 1.1905021667480469, 1.2256546020507812, 1.2608070373535156, 1.29595947265625, 1.3311119079589844, 1.3662643432617188, 1.4014167785644531, 1.4365692138671875, 1.4717216491699219, 1.5068740844726562, 1.5420265197753906, 1.577178955078125, 1.6123313903808594, 1.6474838256835938, 1.6826362609863281, 1.7177886962890625, 1.7529411315917969, 1.7880935668945312, 1.8232460021972656, 1.8583984375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 12.0, 125.0, 784.0, 72.0, 11.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.818769454956055, -22.293041229248047, -21.76731300354004, -21.24158477783203, -20.715858459472656, -20.19013023376465, -19.66440200805664, -19.138673782348633, -18.612945556640625, -18.087217330932617, -17.56148910522461, -17.0357608795166, -16.510032653808594, -15.984305381774902, -15.458578109741211, -14.932849884033203, -14.407121658325195, -13.881393432617188, -13.35566520690918, -12.829937934875488, -12.30420970916748, -11.778481483459473, -11.252754211425781, -10.727025985717773, -10.201297760009766, -9.675569534301758, -9.14984130859375, -8.624114036560059, -8.09838581085205, -7.572657585144043, -7.046929836273193, -6.521202087402344, -5.9954729080200195, -5.469744682312012, -4.944016933441162, -4.4182891845703125, -3.8925609588623047, -3.366832971572876, -2.8411049842834473, -2.3153769969940186, -1.7896490097045898, -1.2639210224151611, -0.7381930351257324, -0.2124650478363037, 0.313262939453125, 0.8389909267425537, 1.3647189140319824, 1.8904469013214111, 2.41617488861084, 2.9419028759002686, 3.4676308631896973, 3.993358850479126, 4.519086837768555, 5.0448150634765625, 5.570542812347412, 6.096270561218262, 6.6219987869262695, 7.147727012634277, 7.673454761505127, 8.199182510375977, 8.724910736083984, 9.250638961791992, 9.7763671875, 10.302094459533691, 10.8278226852417]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 1.0, 0.0, 8.0, 19.0, 17.0, 42.0, 49.0, 52.0, 94.0, 107.0, 114.0, 109.0, 87.0, 83.0, 71.0, 48.0, 37.0, 19.0, 20.0, 7.0, 8.0, 4.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7925572395324707, -3.6911697387695312, -3.589782238006592, -3.4883947372436523, -3.387007474899292, -3.2856199741363525, -3.184232473373413, -3.0828449726104736, -2.981457471847534, -2.8800699710845947, -2.7786824703216553, -2.677295207977295, -2.5759077072143555, -2.474520206451416, -2.3731327056884766, -2.271745204925537, -2.1703577041625977, -2.068970203399658, -1.9675828218460083, -1.8661953210830688, -1.7648078203201294, -1.6634204387664795, -1.56203293800354, -1.4606454372406006, -1.3592581748962402, -1.2578706741333008, -1.1564832925796509, -1.0550957918167114, -0.953708291053772, -0.8523208498954773, -0.7509334087371826, -0.6495459079742432, -0.5481584072113037, -0.44677093625068665, -0.3453834652900696, -0.2439960241317749, -0.14260855317115784, -0.04122108221054077, 0.060166358947753906, 0.16155385971069336, 0.26294130086898804, 0.3643287718296051, 0.46571624279022217, 0.5671036839485168, 0.6684911251068115, 0.769878625869751, 0.8712660670280457, 0.9726535677909851, 1.0740410089492798, 1.1754285097122192, 1.2768158912658691, 1.3782033920288086, 1.479590892791748, 1.5809783935546875, 1.6823657751083374, 1.7837532758712769, 1.8851406574249268, 1.9865281581878662, 2.0879156589508057, 2.189302921295166, 2.2906904220581055, 2.392077922821045, 2.4934654235839844, 2.594852924346924, 2.6962404251098633]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 10.0, 14.0, 23.0, 26.0, 35.0, 63.0, 91.0, 122.0, 201.0, 309.0, 514.0, 836.0, 1654.0, 4183.0, 15312.0, 100504.0, 711979.0, 180031.0, 22427.0, 5466.0, 2207.0, 1014.0, 580.0, 350.0, 203.0, 141.0, 90.0, 48.0, 31.0, 31.0, 19.0, 10.0, 8.0, 7.0, 3.0, 6.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80810546875, -0.7817153930664062, -0.7553253173828125, -0.7289352416992188, -0.702545166015625, -0.6761550903320312, -0.6497650146484375, -0.6233749389648438, -0.59698486328125, -0.5705947875976562, -0.5442047119140625, -0.5178146362304688, -0.491424560546875, -0.46503448486328125, -0.4386444091796875, -0.41225433349609375, -0.3858642578125, -0.35947418212890625, -0.3330841064453125, -0.30669403076171875, -0.280303955078125, -0.25391387939453125, -0.2275238037109375, -0.20113372802734375, -0.17474365234375, -0.14835357666015625, -0.1219635009765625, -0.09557342529296875, -0.069183349609375, -0.04279327392578125, -0.0164031982421875, 0.00998687744140625, 0.036376953125, 0.06276702880859375, 0.0891571044921875, 0.11554718017578125, 0.141937255859375, 0.16832733154296875, 0.1947174072265625, 0.22110748291015625, 0.24749755859375, 0.27388763427734375, 0.3002777099609375, 0.32666778564453125, 0.353057861328125, 0.37944793701171875, 0.4058380126953125, 0.43222808837890625, 0.4586181640625, 0.48500823974609375, 0.5113983154296875, 0.5377883911132812, 0.564178466796875, 0.5905685424804688, 0.6169586181640625, 0.6433486938476562, 0.66973876953125, 0.6961288452148438, 0.7225189208984375, 0.7489089965820312, 0.775299072265625, 0.8016891479492188, 0.8280792236328125, 0.8544692993164062, 0.880859375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 3.0, 4.0, 13.0, 16.0, 27.0, 36.0, 40.0, 52.0, 55.0, 67.0, 81.0, 72.0, 71.0, 93.0, 68.0, 58.0, 42.0, 58.0, 46.0, 24.0, 21.0, 13.0, 15.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.154052734375, -0.1501312255859375, -0.146209716796875, -0.1422882080078125, -0.13836669921875, -0.1344451904296875, -0.130523681640625, -0.1266021728515625, -0.1226806640625, -0.1187591552734375, -0.114837646484375, -0.1109161376953125, -0.10699462890625, -0.1030731201171875, -0.099151611328125, -0.0952301025390625, -0.09130859375, -0.0873870849609375, -0.083465576171875, -0.0795440673828125, -0.07562255859375, -0.0717010498046875, -0.067779541015625, -0.0638580322265625, -0.0599365234375, -0.0560150146484375, -0.052093505859375, -0.0481719970703125, -0.04425048828125, -0.0403289794921875, -0.036407470703125, -0.0324859619140625, -0.028564453125, -0.0246429443359375, -0.020721435546875, -0.0167999267578125, -0.01287841796875, -0.0089569091796875, -0.005035400390625, -0.0011138916015625, 0.0028076171875, 0.0067291259765625, 0.010650634765625, 0.0145721435546875, 0.01849365234375, 0.0224151611328125, 0.026336669921875, 0.0302581787109375, 0.0341796875, 0.0381011962890625, 0.042022705078125, 0.0459442138671875, 0.04986572265625, 0.0537872314453125, 0.057708740234375, 0.0616302490234375, 0.0655517578125, 0.0694732666015625, 0.073394775390625, 0.0773162841796875, 0.08123779296875, 0.0851593017578125, 0.089080810546875, 0.0930023193359375, 0.096923828125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 4.0, 4.0, 3.0, 4.0, 9.0, 9.0, 16.0, 16.0, 28.0, 42.0, 62.0, 100.0, 185.0, 391.0, 924.0, 2826.0, 10762.0, 57871.0, 397164.0, 486332.0, 73604.0, 12921.0, 3345.0, 991.0, 405.0, 209.0, 97.0, 68.0, 31.0, 29.0, 31.0, 16.0, 13.0, 10.0, 8.0, 11.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.402587890625, -0.3887367248535156, -0.37488555908203125, -0.3610343933105469, -0.3471832275390625, -0.3333320617675781, -0.31948089599609375, -0.3056297302246094, -0.291778564453125, -0.2779273986816406, -0.26407623291015625, -0.2502250671386719, -0.2363739013671875, -0.22252273559570312, -0.20867156982421875, -0.19482040405273438, -0.18096923828125, -0.16711807250976562, -0.15326690673828125, -0.13941574096679688, -0.1255645751953125, -0.11171340942382812, -0.09786224365234375, -0.08401107788085938, -0.070159912109375, -0.056308746337890625, -0.04245758056640625, -0.028606414794921875, -0.0147552490234375, -0.000904083251953125, 0.01294708251953125, 0.026798248291015625, 0.0406494140625, 0.054500579833984375, 0.06835174560546875, 0.08220291137695312, 0.0960540771484375, 0.10990524291992188, 0.12375640869140625, 0.13760757446289062, 0.151458740234375, 0.16530990600585938, 0.17916107177734375, 0.19301223754882812, 0.2068634033203125, 0.22071456909179688, 0.23456573486328125, 0.24841690063476562, 0.26226806640625, 0.2761192321777344, 0.28997039794921875, 0.3038215637207031, 0.3176727294921875, 0.3315238952636719, 0.34537506103515625, 0.3592262268066406, 0.373077392578125, 0.3869285583496094, 0.40077972412109375, 0.4146308898925781, 0.4284820556640625, 0.4423332214355469, 0.45618438720703125, 0.4700355529785156, 0.48388671875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 2.0, 5.0, 3.0, 3.0, 8.0, 13.0, 9.0, 9.0, 17.0, 16.0, 22.0, 23.0, 20.0, 20.0, 30.0, 26.0, 25.0, 31.0, 35.0, 44.0, 48.0, 45.0, 43.0, 35.0, 37.0, 46.0, 40.0, 33.0, 34.0, 32.0, 29.0, 27.0, 30.0, 27.0, 20.0, 10.0, 13.0, 14.0, 17.0, 10.0, 13.0, 8.0, 7.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.2548828125, -0.24712562561035156, -0.23936843872070312, -0.2316112518310547, -0.22385406494140625, -0.2160968780517578, -0.20833969116210938, -0.20058250427246094, -0.1928253173828125, -0.18506813049316406, -0.17731094360351562, -0.1695537567138672, -0.16179656982421875, -0.1540393829345703, -0.14628219604492188, -0.13852500915527344, -0.130767822265625, -0.12301063537597656, -0.11525344848632812, -0.10749626159667969, -0.09973907470703125, -0.09198188781738281, -0.08422470092773438, -0.07646751403808594, -0.0687103271484375, -0.06095314025878906, -0.053195953369140625, -0.04543876647949219, -0.03768157958984375, -0.029924392700195312, -0.022167205810546875, -0.014410018920898438, -0.00665283203125, 0.0011043548583984375, 0.008861541748046875, 0.016618728637695312, 0.02437591552734375, 0.03213310241699219, 0.039890289306640625, 0.04764747619628906, 0.0554046630859375, 0.06316184997558594, 0.07091903686523438, 0.07867622375488281, 0.08643341064453125, 0.09419059753417969, 0.10194778442382812, 0.10970497131347656, 0.117462158203125, 0.12521934509277344, 0.13297653198242188, 0.1407337188720703, 0.14849090576171875, 0.1562480926513672, 0.16400527954101562, 0.17176246643066406, 0.1795196533203125, 0.18727684020996094, 0.19503402709960938, 0.2027912139892578, 0.21054840087890625, 0.2183055877685547, 0.22606277465820312, 0.23381996154785156, 0.2415771484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 7.0, 7.0, 16.0, 19.0, 37.0, 86.0, 143.0, 261.0, 496.0, 974.0, 1945.0, 4602.0, 14531.0, 81412.0, 760116.0, 152719.0, 20445.0, 5928.0, 2392.0, 1118.0, 600.0, 302.0, 192.0, 90.0, 50.0, 26.0, 17.0, 7.0, 8.0, 6.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.30615234375, -0.2975578308105469, -0.28896331787109375, -0.2803688049316406, -0.2717742919921875, -0.2631797790527344, -0.25458526611328125, -0.24599075317382812, -0.237396240234375, -0.22880172729492188, -0.22020721435546875, -0.21161270141601562, -0.2030181884765625, -0.19442367553710938, -0.18582916259765625, -0.17723464965820312, -0.16864013671875, -0.16004562377929688, -0.15145111083984375, -0.14285659790039062, -0.1342620849609375, -0.12566757202148438, -0.11707305908203125, -0.10847854614257812, -0.099884033203125, -0.09128952026367188, -0.08269500732421875, -0.07410049438476562, -0.0655059814453125, -0.056911468505859375, -0.04831695556640625, -0.039722442626953125, -0.0311279296875, -0.022533416748046875, -0.01393890380859375, -0.005344390869140625, 0.0032501220703125, 0.011844635009765625, 0.02043914794921875, 0.029033660888671875, 0.037628173828125, 0.046222686767578125, 0.05481719970703125, 0.06341171264648438, 0.0720062255859375, 0.08060073852539062, 0.08919525146484375, 0.09778976440429688, 0.10638427734375, 0.11497879028320312, 0.12357330322265625, 0.13216781616210938, 0.1407623291015625, 0.14935684204101562, 0.15795135498046875, 0.16654586791992188, 0.175140380859375, 0.18373489379882812, 0.19232940673828125, 0.20092391967773438, 0.2095184326171875, 0.21811294555664062, 0.22670745849609375, 0.23530197143554688, 0.243896484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 10.0, 15.0, 25.0, 28.0, 37.0, 90.0, 169.0, 219.0, 154.0, 103.0, 43.0, 29.0, 19.0, 19.0, 10.0, 9.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4776668548583984e-05, -5.263276398181915e-05, -5.048885941505432e-05, -4.834495484828949e-05, -4.620105028152466e-05, -4.405714571475983e-05, -4.1913241147994995e-05, -3.9769336581230164e-05, -3.762543201446533e-05, -3.54815274477005e-05, -3.333762288093567e-05, -3.119371831417084e-05, -2.9049813747406006e-05, -2.6905909180641174e-05, -2.4762004613876343e-05, -2.261810004711151e-05, -2.047419548034668e-05, -1.8330290913581848e-05, -1.6186386346817017e-05, -1.4042481780052185e-05, -1.1898577213287354e-05, -9.754672646522522e-06, -7.6107680797576904e-06, -5.466863512992859e-06, -3.3229589462280273e-06, -1.1790543794631958e-06, 9.648501873016357e-07, 3.1087547540664673e-06, 5.252659320831299e-06, 7.39656388759613e-06, 9.540468454360962e-06, 1.1684373021125793e-05, 1.3828277587890625e-05, 1.5972182154655457e-05, 1.8116086721420288e-05, 2.025999128818512e-05, 2.240389585494995e-05, 2.4547800421714783e-05, 2.6691704988479614e-05, 2.8835609555244446e-05, 3.097951412200928e-05, 3.312341868877411e-05, 3.526732325553894e-05, 3.741122782230377e-05, 3.9555132389068604e-05, 4.1699036955833435e-05, 4.3842941522598267e-05, 4.59868460893631e-05, 4.813075065612793e-05, 5.027465522289276e-05, 5.241855978965759e-05, 5.4562464356422424e-05, 5.6706368923187256e-05, 5.885027348995209e-05, 6.099417805671692e-05, 6.313808262348175e-05, 6.528198719024658e-05, 6.742589175701141e-05, 6.956979632377625e-05, 7.171370089054108e-05, 7.385760545730591e-05, 7.600151002407074e-05, 7.814541459083557e-05, 8.02893191576004e-05, 8.243322372436523e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 8.0, 4.0, 12.0, 15.0, 29.0, 45.0, 105.0, 229.0, 464.0, 1066.0, 2613.0, 7386.0, 35376.0, 758713.0, 216877.0, 17233.0, 4962.0, 1922.0, 803.0, 369.0, 158.0, 77.0, 39.0, 15.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34521484375, -0.3327980041503906, -0.32038116455078125, -0.3079643249511719, -0.2955474853515625, -0.2831306457519531, -0.27071380615234375, -0.2582969665527344, -0.245880126953125, -0.23346328735351562, -0.22104644775390625, -0.20862960815429688, -0.1962127685546875, -0.18379592895507812, -0.17137908935546875, -0.15896224975585938, -0.14654541015625, -0.13412857055664062, -0.12171173095703125, -0.10929489135742188, -0.0968780517578125, -0.08446121215820312, -0.07204437255859375, -0.059627532958984375, -0.047210693359375, -0.034793853759765625, -0.02237701416015625, -0.009960174560546875, 0.0024566650390625, 0.014873504638671875, 0.02729034423828125, 0.039707183837890625, 0.0521240234375, 0.06454086303710938, 0.07695770263671875, 0.08937454223632812, 0.1017913818359375, 0.11420822143554688, 0.12662506103515625, 0.13904190063476562, 0.151458740234375, 0.16387557983398438, 0.17629241943359375, 0.18870925903320312, 0.2011260986328125, 0.21354293823242188, 0.22595977783203125, 0.23837661743164062, 0.25079345703125, 0.2632102966308594, 0.27562713623046875, 0.2880439758300781, 0.3004608154296875, 0.3128776550292969, 0.32529449462890625, 0.3377113342285156, 0.350128173828125, 0.3625450134277344, 0.37496185302734375, 0.3873786926269531, 0.3997955322265625, 0.4122123718261719, 0.42462921142578125, 0.4370460510253906, 0.449462890625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 5.0, 7.0, 7.0, 8.0, 6.0, 10.0, 17.0, 32.0, 30.0, 59.0, 88.0, 92.0, 128.0, 147.0, 103.0, 71.0, 59.0, 43.0, 25.0, 10.0, 10.0, 8.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.172119140625, -0.16617584228515625, -0.1602325439453125, -0.15428924560546875, -0.148345947265625, -0.14240264892578125, -0.1364593505859375, -0.13051605224609375, -0.12457275390625, -0.11862945556640625, -0.1126861572265625, -0.10674285888671875, -0.100799560546875, -0.09485626220703125, -0.0889129638671875, -0.08296966552734375, -0.0770263671875, -0.07108306884765625, -0.0651397705078125, -0.05919647216796875, -0.053253173828125, -0.04730987548828125, -0.0413665771484375, -0.03542327880859375, -0.02947998046875, -0.02353668212890625, -0.0175933837890625, -0.01165008544921875, -0.005706787109375, 0.00023651123046875, 0.0061798095703125, 0.01212310791015625, 0.01806640625, 0.02400970458984375, 0.0299530029296875, 0.03589630126953125, 0.041839599609375, 0.04778289794921875, 0.0537261962890625, 0.05966949462890625, 0.06561279296875, 0.07155609130859375, 0.0774993896484375, 0.08344268798828125, 0.089385986328125, 0.09532928466796875, 0.1012725830078125, 0.10721588134765625, 0.1131591796875, 0.11910247802734375, 0.1250457763671875, 0.13098907470703125, 0.136932373046875, 0.14287567138671875, 0.1488189697265625, 0.15476226806640625, 0.16070556640625, 0.16664886474609375, 0.1725921630859375, 0.17853546142578125, 0.184478759765625, 0.19042205810546875, 0.1963653564453125, 0.20230865478515625, 0.208251953125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 13.0, 34.0, 199.0, 498.0, 213.0, 43.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.953251838684082, -12.691709518432617, -12.430166244506836, -12.168623924255371, -11.90708065032959, -11.645538330078125, -11.383995056152344, -11.122452735900879, -10.860910415649414, -10.59936809539795, -10.337824821472168, -10.076282501220703, -9.814739227294922, -9.553196907043457, -9.291653633117676, -9.030111312866211, -8.76856803894043, -8.507025718688965, -8.245482444763184, -7.9839396476745605, -7.7223968505859375, -7.460854530334473, -7.19931173324585, -6.937768936157227, -6.6762261390686035, -6.4146833419799805, -6.153140544891357, -5.891597747802734, -5.6300554275512695, -5.368512153625488, -5.106969833374023, -4.8454270362854, -4.583883285522461, -4.322340488433838, -4.060797691345215, -3.799255132675171, -3.537712335586548, -3.276169538497925, -3.014626979827881, -2.753084182739258, -2.4915413856506348, -2.2299985885620117, -1.9684559106826782, -1.7069132328033447, -1.4453704357147217, -1.1838276386260986, -0.9222849607467651, -0.6607422828674316, -0.3991994857788086, -0.13765674829483032, 0.12388598918914795, 0.3854287266731262, 0.6469714641571045, 0.9085142612457275, 1.170056939125061, 1.4315996170043945, 1.6931424140930176, 1.9546852111816406, 2.2162280082702637, 2.4777705669403076, 2.7393133640289307, 3.0008561611175537, 3.2623987197875977, 3.5239415168762207, 3.7854843139648438]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 9.0, 7.0, 18.0, 11.0, 8.0, 18.0, 17.0, 20.0, 32.0, 38.0, 32.0, 45.0, 32.0, 33.0, 56.0, 46.0, 50.0, 39.0, 55.0, 52.0, 49.0, 46.0, 45.0, 43.0, 34.0, 39.0, 33.0, 16.0, 18.0, 13.0, 8.0, 5.0, 11.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.314886450767517, -1.2609148025512695, -1.2069432735443115, -1.152971625328064, -1.0989999771118164, -1.0450284481048584, -0.9910567998886108, -0.9370852112770081, -0.8831136226654053, -0.8291420340538025, -0.7751704454421997, -0.7211987972259521, -0.6672272086143494, -0.6132556200027466, -0.559283971786499, -0.5053123831748962, -0.45134079456329346, -0.3973692059516907, -0.3433975875377655, -0.28942596912384033, -0.23545438051223755, -0.18148279190063477, -0.1275111734867096, -0.07353955507278442, -0.01956796646118164, 0.034403637051582336, 0.08837524056434631, 0.1423468440771103, 0.19631844758987427, 0.25029003620147705, 0.3042616546154022, 0.3582332730293274, 0.4122049808502197, 0.4661765694618225, 0.5201481580734253, 0.5741198062896729, 0.6280913949012756, 0.6820629835128784, 0.736034631729126, 0.7900062203407288, 0.8439778089523315, 0.8979493975639343, 0.9519209861755371, 1.0058926343917847, 1.0598642826080322, 1.1138358116149902, 1.1678074598312378, 1.2217791080474854, 1.2757506370544434, 1.329722285270691, 1.383693814277649, 1.4376654624938965, 1.4916369915008545, 1.545608639717102, 1.5995802879333496, 1.6535518169403076, 1.7075234651565552, 1.7614951133728027, 1.8154666423797607, 1.8694382905960083, 1.9234099388122559, 1.9773814678192139, 2.031352996826172, 2.085324764251709, 2.139296293258667]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 2.0, 7.0, 17.0, 24.0, 24.0, 26.0, 31.0, 49.0, 63.0, 45.0, 82.0, 108.0, 152.0, 198.0, 289.0, 498.0, 1018.0, 2326.0, 6708.0, 29136.0, 4042306.0, 92702.0, 11167.0, 3820.0, 1609.0, 774.0, 390.0, 222.0, 129.0, 101.0, 51.0, 44.0, 35.0, 34.0, 14.0, 18.0, 17.0, 8.0, 10.0, 7.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.16796875, -1.128631591796875, -1.08929443359375, -1.049957275390625, -1.0106201171875, -0.971282958984375, -0.93194580078125, -0.892608642578125, -0.853271484375, -0.813934326171875, -0.77459716796875, -0.735260009765625, -0.6959228515625, -0.656585693359375, -0.61724853515625, -0.577911376953125, -0.53857421875, -0.499237060546875, -0.45989990234375, -0.420562744140625, -0.3812255859375, -0.341888427734375, -0.30255126953125, -0.263214111328125, -0.223876953125, -0.184539794921875, -0.14520263671875, -0.105865478515625, -0.0665283203125, -0.027191162109375, 0.01214599609375, 0.051483154296875, 0.0908203125, 0.130157470703125, 0.16949462890625, 0.208831787109375, 0.2481689453125, 0.287506103515625, 0.32684326171875, 0.366180419921875, 0.405517578125, 0.444854736328125, 0.48419189453125, 0.523529052734375, 0.5628662109375, 0.602203369140625, 0.64154052734375, 0.680877685546875, 0.72021484375, 0.759552001953125, 0.79888916015625, 0.838226318359375, 0.8775634765625, 0.916900634765625, 0.95623779296875, 0.995574951171875, 1.034912109375, 1.074249267578125, 1.11358642578125, 1.152923583984375, 1.1922607421875, 1.231597900390625, 1.27093505859375, 1.310272216796875, 1.349609375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 9.0, 6.0, 14.0, 17.0, 29.0, 35.0, 44.0, 56.0, 51.0, 58.0, 73.0, 73.0, 77.0, 59.0, 65.0, 75.0, 49.0, 41.0, 43.0, 38.0, 16.0, 11.0, 16.0, 13.0, 12.0, 3.0, 2.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1444091796875, -0.14074325561523438, -0.13707733154296875, -0.13341140747070312, -0.1297454833984375, -0.12607955932617188, -0.12241363525390625, -0.11874771118164062, -0.115081787109375, -0.11141586303710938, -0.10774993896484375, -0.10408401489257812, -0.1004180908203125, -0.09675216674804688, -0.09308624267578125, -0.08942031860351562, -0.08575439453125, -0.08208847045898438, -0.07842254638671875, -0.07475662231445312, -0.0710906982421875, -0.06742477416992188, -0.06375885009765625, -0.060092926025390625, -0.056427001953125, -0.052761077880859375, -0.04909515380859375, -0.045429229736328125, -0.0417633056640625, -0.038097381591796875, -0.03443145751953125, -0.030765533447265625, -0.027099609375, -0.023433685302734375, -0.01976776123046875, -0.016101837158203125, -0.0124359130859375, -0.008769989013671875, -0.00510406494140625, -0.001438140869140625, 0.002227783203125, 0.005893707275390625, 0.00955963134765625, 0.013225555419921875, 0.0168914794921875, 0.020557403564453125, 0.02422332763671875, 0.027889251708984375, 0.03155517578125, 0.035221099853515625, 0.03888702392578125, 0.042552947998046875, 0.0462188720703125, 0.049884796142578125, 0.05355072021484375, 0.057216644287109375, 0.060882568359375, 0.06454849243164062, 0.06821441650390625, 0.07188034057617188, 0.0755462646484375, 0.07921218872070312, 0.08287811279296875, 0.08654403686523438, 0.0902099609375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 11.0, 10.0, 24.0, 29.0, 66.0, 88.0, 154.0, 330.0, 1178.0, 16566.0, 4159722.0, 14200.0, 1124.0, 355.0, 151.0, 111.0, 63.0, 40.0, 22.0, 16.0, 14.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.048828125, -1.943634033203125, -1.83843994140625, -1.733245849609375, -1.6280517578125, -1.522857666015625, -1.41766357421875, -1.312469482421875, -1.207275390625, -1.102081298828125, -0.99688720703125, -0.891693115234375, -0.7864990234375, -0.681304931640625, -0.57611083984375, -0.470916748046875, -0.36572265625, -0.260528564453125, -0.15533447265625, -0.050140380859375, 0.0550537109375, 0.160247802734375, 0.26544189453125, 0.370635986328125, 0.475830078125, 0.581024169921875, 0.68621826171875, 0.791412353515625, 0.8966064453125, 1.001800537109375, 1.10699462890625, 1.212188720703125, 1.3173828125, 1.422576904296875, 1.52777099609375, 1.632965087890625, 1.7381591796875, 1.843353271484375, 1.94854736328125, 2.053741455078125, 2.158935546875, 2.264129638671875, 2.36932373046875, 2.474517822265625, 2.5797119140625, 2.684906005859375, 2.79010009765625, 2.895294189453125, 3.00048828125, 3.105682373046875, 3.21087646484375, 3.316070556640625, 3.4212646484375, 3.526458740234375, 3.63165283203125, 3.736846923828125, 3.842041015625, 3.947235107421875, 4.05242919921875, 4.157623291015625, 4.2628173828125, 4.368011474609375, 4.47320556640625, 4.578399658203125, 4.68359375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 4.0, 11.0, 24.0, 53.0, 119.0, 1270.0, 2355.0, 129.0, 47.0, 28.0, 14.0, 13.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40673828125, -0.38910675048828125, -0.3714752197265625, -0.35384368896484375, -0.336212158203125, -0.31858062744140625, -0.3009490966796875, -0.28331756591796875, -0.26568603515625, -0.24805450439453125, -0.2304229736328125, -0.21279144287109375, -0.195159912109375, -0.17752838134765625, -0.1598968505859375, -0.14226531982421875, -0.1246337890625, -0.10700225830078125, -0.0893707275390625, -0.07173919677734375, -0.054107666015625, -0.03647613525390625, -0.0188446044921875, -0.00121307373046875, 0.01641845703125, 0.03404998779296875, 0.0516815185546875, 0.06931304931640625, 0.086944580078125, 0.10457611083984375, 0.1222076416015625, 0.13983917236328125, 0.157470703125, 0.17510223388671875, 0.1927337646484375, 0.21036529541015625, 0.227996826171875, 0.24562835693359375, 0.2632598876953125, 0.28089141845703125, 0.29852294921875, 0.31615447998046875, 0.3337860107421875, 0.35141754150390625, 0.369049072265625, 0.38668060302734375, 0.4043121337890625, 0.42194366455078125, 0.4395751953125, 0.45720672607421875, 0.4748382568359375, 0.49246978759765625, 0.510101318359375, 0.5277328491210938, 0.5453643798828125, 0.5629959106445312, 0.58062744140625, 0.5982589721679688, 0.6158905029296875, 0.6335220336914062, 0.651153564453125, 0.6687850952148438, 0.6864166259765625, 0.7040481567382812, 0.7216796875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 13.0, 54.0, 432.0, 425.0, 64.0, 18.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.034736633300781, -8.842652320861816, -8.650568962097168, -8.458484649658203, -8.266400337219238, -8.07431697845459, -7.882232666015625, -7.69014835357666, -7.4980645179748535, -7.305980682373047, -7.113896369934082, -6.921812534332275, -6.729728698730469, -6.537644386291504, -6.345560550689697, -6.153476715087891, -5.961392402648926, -5.769308567047119, -5.577224254608154, -5.385140419006348, -5.193056583404541, -5.000972270965576, -4.8088884353637695, -4.616804122924805, -4.424720764160156, -4.23263692855835, -4.040552616119385, -3.848468780517578, -3.6563847064971924, -3.4643006324768066, -3.272216796875, -3.0801327228546143, -2.8880486488342285, -2.6959645748138428, -2.503880739212036, -2.3117966651916504, -2.1197125911712646, -1.9276286363601685, -1.7355446815490723, -1.5434606075286865, -1.3513766527175903, -1.1592926979064941, -0.9672086238861084, -0.7751246690750122, -0.5830406546592712, -0.3909566402435303, -0.19887268543243408, -0.00678861141204834, 0.18529534339904785, 0.3773793578147888, 0.5694633722305298, 0.761547327041626, 0.9536313414573669, 1.145715355873108, 1.337799310684204, 1.5298833847045898, 1.721967339515686, 1.9140512943267822, 2.106135368347168, 2.2982192039489746, 2.4903032779693604, 2.682387351989746, 2.8744711875915527, 3.0665555000305176, 3.258639335632324]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 10.0, 7.0, 5.0, 10.0, 9.0, 10.0, 17.0, 12.0, 27.0, 26.0, 34.0, 41.0, 45.0, 46.0, 45.0, 43.0, 41.0, 48.0, 60.0, 56.0, 49.0, 51.0, 47.0, 35.0, 40.0, 30.0, 31.0, 29.0, 21.0, 15.0, 15.0, 7.0, 11.0, 13.0, 3.0, 4.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8361718058586121, -0.8124577403068542, -0.7887436747550964, -0.7650296688079834, -0.7413156032562256, -0.7176015377044678, -0.69388747215271, -0.6701734066009521, -0.6464593410491943, -0.6227452754974365, -0.5990312099456787, -0.5753171443939209, -0.5516031384468079, -0.52788907289505, -0.5041750073432922, -0.4804609417915344, -0.456746906042099, -0.4330328404903412, -0.40931880474090576, -0.38560473918914795, -0.36189067363739014, -0.3381766080856323, -0.3144625723361969, -0.2907485067844391, -0.26703447103500366, -0.24332042038440704, -0.21960635483264923, -0.1958923041820526, -0.1721782386302948, -0.14846418797969818, -0.12475013732910156, -0.10103607177734375, -0.07732200622558594, -0.05360794812440872, -0.029893893748521805, -0.006179839372634888, 0.017534218728542328, 0.04124827682971954, 0.06496232748031616, 0.08867639303207397, 0.1123904436826706, 0.1361044943332672, 0.15981855988502502, 0.18353261053562164, 0.20724666118621826, 0.23096072673797607, 0.2546747922897339, 0.2783888578414917, 0.3021028935909271, 0.32581695914268494, 0.34953099489212036, 0.3732450604438782, 0.396959125995636, 0.4206731915473938, 0.4443872272968292, 0.46810129284858704, 0.49181532859802246, 0.5155293941497803, 0.5392434597015381, 0.5629575252532959, 0.5866715312004089, 0.6103855967521667, 0.6340996623039246, 0.6578137278556824, 0.6815277934074402]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 7.0, 8.0, 8.0, 12.0, 16.0, 23.0, 31.0, 36.0, 33.0, 48.0, 72.0, 120.0, 147.0, 186.0, 277.0, 493.0, 907.0, 1815.0, 4184.0, 11022.0, 40240.0, 285683.0, 594000.0, 80031.0, 17722.0, 5865.0, 2494.0, 1182.0, 697.0, 397.0, 229.0, 161.0, 125.0, 66.0, 65.0, 39.0, 28.0, 21.0, 22.0, 14.0, 14.0, 6.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64208984375, -0.6201019287109375, -0.598114013671875, -0.5761260986328125, -0.55413818359375, -0.5321502685546875, -0.510162353515625, -0.4881744384765625, -0.4661865234375, -0.4441986083984375, -0.422210693359375, -0.4002227783203125, -0.37823486328125, -0.3562469482421875, -0.334259033203125, -0.3122711181640625, -0.290283203125, -0.2682952880859375, -0.246307373046875, -0.2243194580078125, -0.20233154296875, -0.1803436279296875, -0.158355712890625, -0.1363677978515625, -0.1143798828125, -0.0923919677734375, -0.070404052734375, -0.0484161376953125, -0.02642822265625, -0.0044403076171875, 0.017547607421875, 0.0395355224609375, 0.0615234375, 0.0835113525390625, 0.105499267578125, 0.1274871826171875, 0.14947509765625, 0.1714630126953125, 0.193450927734375, 0.2154388427734375, 0.2374267578125, 0.2594146728515625, 0.281402587890625, 0.3033905029296875, 0.32537841796875, 0.3473663330078125, 0.369354248046875, 0.3913421630859375, 0.413330078125, 0.4353179931640625, 0.457305908203125, 0.4792938232421875, 0.50128173828125, 0.5232696533203125, 0.545257568359375, 0.5672454833984375, 0.5892333984375, 0.6112213134765625, 0.633209228515625, 0.6551971435546875, 0.67718505859375, 0.6991729736328125, 0.721160888671875, 0.7431488037109375, 0.76513671875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 8.0, 3.0, 9.0, 13.0, 26.0, 25.0, 38.0, 42.0, 57.0, 58.0, 69.0, 68.0, 75.0, 62.0, 78.0, 68.0, 61.0, 56.0, 44.0, 34.0, 27.0, 22.0, 12.0, 10.0, 7.0, 8.0, 6.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.139892578125, -0.1357889175415039, -0.1316852569580078, -0.12758159637451172, -0.12347793579101562, -0.11937427520751953, -0.11527061462402344, -0.11116695404052734, -0.10706329345703125, -0.10295963287353516, -0.09885597229003906, -0.09475231170654297, -0.09064865112304688, -0.08654499053955078, -0.08244132995605469, -0.0783376693725586, -0.0742340087890625, -0.0701303482055664, -0.06602668762207031, -0.06192302703857422, -0.057819366455078125, -0.05371570587158203, -0.04961204528808594, -0.045508384704589844, -0.04140472412109375, -0.037301063537597656, -0.03319740295410156, -0.02909374237060547, -0.024990081787109375, -0.02088642120361328, -0.016782760620117188, -0.012679100036621094, -0.008575439453125, -0.004471778869628906, -0.0003681182861328125, 0.0037355422973632812, 0.007839202880859375, 0.011942863464355469, 0.016046524047851562, 0.020150184631347656, 0.02425384521484375, 0.028357505798339844, 0.03246116638183594, 0.03656482696533203, 0.040668487548828125, 0.04477214813232422, 0.04887580871582031, 0.052979469299316406, 0.0570831298828125, 0.061186790466308594, 0.06529045104980469, 0.06939411163330078, 0.07349777221679688, 0.07760143280029297, 0.08170509338378906, 0.08580875396728516, 0.08991241455078125, 0.09401607513427734, 0.09811973571777344, 0.10222339630126953, 0.10632705688476562, 0.11043071746826172, 0.11453437805175781, 0.1186380386352539, 0.12274169921875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 3.0, 10.0, 13.0, 17.0, 23.0, 28.0, 54.0, 89.0, 143.0, 303.0, 567.0, 1224.0, 2864.0, 7981.0, 30044.0, 185754.0, 648301.0, 135860.0, 23909.0, 6661.0, 2497.0, 1013.0, 541.0, 281.0, 140.0, 82.0, 44.0, 35.0, 22.0, 17.0, 8.0, 6.0, 8.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.372314453125, -0.3576698303222656, -0.34302520751953125, -0.3283805847167969, -0.3137359619140625, -0.2990913391113281, -0.28444671630859375, -0.2698020935058594, -0.255157470703125, -0.24051284790039062, -0.22586822509765625, -0.21122360229492188, -0.1965789794921875, -0.18193435668945312, -0.16728973388671875, -0.15264511108398438, -0.13800048828125, -0.12335586547851562, -0.10871124267578125, -0.09406661987304688, -0.0794219970703125, -0.06477737426757812, -0.05013275146484375, -0.035488128662109375, -0.020843505859375, -0.006198883056640625, 0.00844573974609375, 0.023090362548828125, 0.0377349853515625, 0.052379608154296875, 0.06702423095703125, 0.08166885375976562, 0.0963134765625, 0.11095809936523438, 0.12560272216796875, 0.14024734497070312, 0.1548919677734375, 0.16953659057617188, 0.18418121337890625, 0.19882583618164062, 0.213470458984375, 0.22811508178710938, 0.24275970458984375, 0.2574043273925781, 0.2720489501953125, 0.2866935729980469, 0.30133819580078125, 0.3159828186035156, 0.33062744140625, 0.3452720642089844, 0.35991668701171875, 0.3745613098144531, 0.3892059326171875, 0.4038505554199219, 0.41849517822265625, 0.4331398010253906, 0.447784423828125, 0.4624290466308594, 0.47707366943359375, 0.4917182922363281, 0.5063629150390625, 0.5210075378417969, 0.5356521606445312, 0.5502967834472656, 0.56494140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 11.0, 11.0, 13.0, 6.0, 13.0, 21.0, 20.0, 22.0, 29.0, 29.0, 32.0, 50.0, 48.0, 56.0, 53.0, 51.0, 50.0, 59.0, 54.0, 48.0, 37.0, 32.0, 47.0, 33.0, 27.0, 25.0, 24.0, 18.0, 15.0, 21.0, 11.0, 7.0, 3.0, 6.0, 8.0, 4.0, 6.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.354248046875, -0.3427276611328125, -0.331207275390625, -0.3196868896484375, -0.30816650390625, -0.2966461181640625, -0.285125732421875, -0.2736053466796875, -0.2620849609375, -0.2505645751953125, -0.239044189453125, -0.2275238037109375, -0.21600341796875, -0.2044830322265625, -0.192962646484375, -0.1814422607421875, -0.169921875, -0.1584014892578125, -0.146881103515625, -0.1353607177734375, -0.12384033203125, -0.1123199462890625, -0.100799560546875, -0.0892791748046875, -0.0777587890625, -0.0662384033203125, -0.054718017578125, -0.0431976318359375, -0.03167724609375, -0.0201568603515625, -0.008636474609375, 0.0028839111328125, 0.014404296875, 0.0259246826171875, 0.037445068359375, 0.0489654541015625, 0.06048583984375, 0.0720062255859375, 0.083526611328125, 0.0950469970703125, 0.1065673828125, 0.1180877685546875, 0.129608154296875, 0.1411285400390625, 0.15264892578125, 0.1641693115234375, 0.175689697265625, 0.1872100830078125, 0.19873046875, 0.2102508544921875, 0.221771240234375, 0.2332916259765625, 0.24481201171875, 0.2563323974609375, 0.267852783203125, 0.2793731689453125, 0.2908935546875, 0.3024139404296875, 0.313934326171875, 0.3254547119140625, 0.33697509765625, 0.3484954833984375, 0.360015869140625, 0.3715362548828125, 0.383056640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 6.0, 7.0, 8.0, 6.0, 11.0, 24.0, 38.0, 51.0, 87.0, 139.0, 249.0, 449.0, 942.0, 1792.0, 3885.0, 10321.0, 34301.0, 199144.0, 637847.0, 120248.0, 24589.0, 7910.0, 3269.0, 1495.0, 739.0, 392.0, 251.0, 129.0, 83.0, 54.0, 28.0, 24.0, 18.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.21630859375, -0.21052169799804688, -0.20473480224609375, -0.19894790649414062, -0.1931610107421875, -0.18737411499023438, -0.18158721923828125, -0.17580032348632812, -0.170013427734375, -0.16422653198242188, -0.15843963623046875, -0.15265274047851562, -0.1468658447265625, -0.14107894897460938, -0.13529205322265625, -0.12950515747070312, -0.12371826171875, -0.11793136596679688, -0.11214447021484375, -0.10635757446289062, -0.1005706787109375, -0.09478378295898438, -0.08899688720703125, -0.08320999145507812, -0.077423095703125, -0.07163619995117188, -0.06584930419921875, -0.060062408447265625, -0.0542755126953125, -0.048488616943359375, -0.04270172119140625, -0.036914825439453125, -0.0311279296875, -0.025341033935546875, -0.01955413818359375, -0.013767242431640625, -0.0079803466796875, -0.002193450927734375, 0.00359344482421875, 0.009380340576171875, 0.015167236328125, 0.020954132080078125, 0.02674102783203125, 0.032527923583984375, 0.0383148193359375, 0.044101715087890625, 0.04988861083984375, 0.055675506591796875, 0.06146240234375, 0.06724929809570312, 0.07303619384765625, 0.07882308959960938, 0.0846099853515625, 0.09039688110351562, 0.09618377685546875, 0.10197067260742188, 0.107757568359375, 0.11354446411132812, 0.11933135986328125, 0.12511825561523438, 0.1309051513671875, 0.13669204711914062, 0.14247894287109375, 0.14826583862304688, 0.154052734375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 11.0, 5.0, 9.0, 16.0, 15.0, 32.0, 48.0, 60.0, 100.0, 118.0, 167.0, 142.0, 88.0, 51.0, 25.0, 30.0, 13.0, 18.0, 10.0, 5.0, 5.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.4226646423339844e-05, -4.282314330339432e-05, -4.141964018344879e-05, -4.0016137063503265e-05, -3.861263394355774e-05, -3.720913082361221e-05, -3.580562770366669e-05, -3.440212458372116e-05, -3.2998621463775635e-05, -3.159511834383011e-05, -3.0191615223884583e-05, -2.8788112103939056e-05, -2.738460898399353e-05, -2.5981105864048004e-05, -2.4577602744102478e-05, -2.3174099624156952e-05, -2.1770596504211426e-05, -2.03670933842659e-05, -1.8963590264320374e-05, -1.7560087144374847e-05, -1.615658402442932e-05, -1.4753080904483795e-05, -1.3349577784538269e-05, -1.1946074664592743e-05, -1.0542571544647217e-05, -9.13906842470169e-06, -7.735565304756165e-06, -6.3320621848106384e-06, -4.928559064865112e-06, -3.525055944919586e-06, -2.12155282497406e-06, -7.180497050285339e-07, 6.854534149169922e-07, 2.0889565348625183e-06, 3.4924596548080444e-06, 4.8959627747535706e-06, 6.299465894699097e-06, 7.702969014644623e-06, 9.106472134590149e-06, 1.0509975254535675e-05, 1.1913478374481201e-05, 1.3316981494426727e-05, 1.4720484614372253e-05, 1.612398773431778e-05, 1.7527490854263306e-05, 1.8930993974208832e-05, 2.0334497094154358e-05, 2.1738000214099884e-05, 2.314150333404541e-05, 2.4545006453990936e-05, 2.5948509573936462e-05, 2.735201269388199e-05, 2.8755515813827515e-05, 3.015901893377304e-05, 3.156252205371857e-05, 3.296602517366409e-05, 3.436952829360962e-05, 3.5773031413555145e-05, 3.717653453350067e-05, 3.85800376534462e-05, 3.9983540773391724e-05, 4.138704389333725e-05, 4.2790547013282776e-05, 4.41940501332283e-05, 4.559755325317383e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 9.0, 14.0, 16.0, 25.0, 48.0, 64.0, 125.0, 204.0, 439.0, 993.0, 2119.0, 6202.0, 29211.0, 452437.0, 513959.0, 31665.0, 6812.0, 2261.0, 930.0, 467.0, 248.0, 119.0, 71.0, 41.0, 31.0, 11.0, 15.0, 9.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.28173828125, -0.2723541259765625, -0.262969970703125, -0.2535858154296875, -0.24420166015625, -0.2348175048828125, -0.225433349609375, -0.2160491943359375, -0.2066650390625, -0.1972808837890625, -0.187896728515625, -0.1785125732421875, -0.16912841796875, -0.1597442626953125, -0.150360107421875, -0.1409759521484375, -0.131591796875, -0.1222076416015625, -0.112823486328125, -0.1034393310546875, -0.09405517578125, -0.0846710205078125, -0.075286865234375, -0.0659027099609375, -0.0565185546875, -0.0471343994140625, -0.037750244140625, -0.0283660888671875, -0.01898193359375, -0.0095977783203125, -0.000213623046875, 0.0091705322265625, 0.0185546875, 0.0279388427734375, 0.037322998046875, 0.0467071533203125, 0.05609130859375, 0.0654754638671875, 0.074859619140625, 0.0842437744140625, 0.0936279296875, 0.1030120849609375, 0.112396240234375, 0.1217803955078125, 0.13116455078125, 0.1405487060546875, 0.149932861328125, 0.1593170166015625, 0.168701171875, 0.1780853271484375, 0.187469482421875, 0.1968536376953125, 0.20623779296875, 0.2156219482421875, 0.225006103515625, 0.2343902587890625, 0.2437744140625, 0.2531585693359375, 0.262542724609375, 0.2719268798828125, 0.28131103515625, 0.2906951904296875, 0.300079345703125, 0.3094635009765625, 0.31884765625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 5.0, 8.0, 11.0, 14.0, 11.0, 24.0, 28.0, 37.0, 57.0, 56.0, 89.0, 138.0, 112.0, 88.0, 106.0, 54.0, 37.0, 20.0, 31.0, 19.0, 10.0, 10.0, 6.0, 3.0, 5.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.159912109375, -0.15479278564453125, -0.1496734619140625, -0.14455413818359375, -0.139434814453125, -0.13431549072265625, -0.1291961669921875, -0.12407684326171875, -0.11895751953125, -0.11383819580078125, -0.1087188720703125, -0.10359954833984375, -0.098480224609375, -0.09336090087890625, -0.0882415771484375, -0.08312225341796875, -0.0780029296875, -0.07288360595703125, -0.0677642822265625, -0.06264495849609375, -0.057525634765625, -0.05240631103515625, -0.0472869873046875, -0.04216766357421875, -0.03704833984375, -0.03192901611328125, -0.0268096923828125, -0.02169036865234375, -0.016571044921875, -0.01145172119140625, -0.0063323974609375, -0.00121307373046875, 0.00390625, 0.00902557373046875, 0.0141448974609375, 0.01926422119140625, 0.024383544921875, 0.02950286865234375, 0.0346221923828125, 0.03974151611328125, 0.04486083984375, 0.04998016357421875, 0.0550994873046875, 0.06021881103515625, 0.065338134765625, 0.07045745849609375, 0.0755767822265625, 0.08069610595703125, 0.0858154296875, 0.09093475341796875, 0.0960540771484375, 0.10117340087890625, 0.106292724609375, 0.11141204833984375, 0.1165313720703125, 0.12165069580078125, 0.12677001953125, 0.13188934326171875, 0.1370086669921875, 0.14212799072265625, 0.147247314453125, 0.15236663818359375, 0.1574859619140625, 0.16260528564453125, 0.167724609375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 16.0, 41.0, 137.0, 375.0, 307.0, 103.0, 18.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7570672035217285, -4.540345668792725, -4.3236236572265625, -4.106902122497559, -3.8901805877685547, -3.6734588146209717, -3.4567370414733887, -3.2400155067443848, -3.0232937335968018, -2.8065719604492188, -2.589850425720215, -2.373128652572632, -2.156406879425049, -1.939685344696045, -1.722963571548462, -1.5062419176101685, -1.289520263671875, -1.0727986097335815, -0.8560768961906433, -0.6393551826477051, -0.4226335287094116, -0.20591187477111816, 0.010809898376464844, 0.2275315523147583, 0.44425320625305176, 0.6609748601913452, 0.8776965737342834, 1.0944182872772217, 1.3111399412155151, 1.5278615951538086, 1.7445833683013916, 1.961305022239685, 2.1780261993408203, 2.3947479724884033, 2.6114695072174072, 2.8281912803649902, 3.044912815093994, 3.261634588241577, 3.47835636138916, 3.695077896118164, 3.911799669265747, 4.12852144241333, 4.345242977142334, 4.561964988708496, 4.7786865234375, 4.995408058166504, 5.212129592895508, 5.42885160446167, 5.645573139190674, 5.862294673919678, 6.07901668548584, 6.295738220214844, 6.512459754943848, 6.729181289672852, 6.945903301239014, 7.162624835968018, 7.37934684753418, 7.596068382263184, 7.812790393829346, 8.029512405395508, 8.246233940124512, 8.462955474853516, 8.67967700958252, 8.896398544311523, 9.113120079040527]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 10.0, 10.0, 14.0, 7.0, 7.0, 18.0, 21.0, 15.0, 20.0, 21.0, 27.0, 40.0, 36.0, 39.0, 41.0, 39.0, 44.0, 42.0, 45.0, 46.0, 31.0, 40.0, 36.0, 37.0, 27.0, 35.0, 29.0, 30.0, 29.0, 22.0, 18.0, 18.0, 11.0, 18.0, 12.0, 12.0, 11.0, 11.0, 7.0, 3.0, 1.0, 1.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7789396047592163, -1.7249284982681274, -1.6709175109863281, -1.6169064044952393, -1.56289541721344, -1.508884310722351, -1.4548733234405518, -1.400862216949463, -1.346851110458374, -1.2928400039672852, -1.2388290166854858, -1.184817910194397, -1.1308069229125977, -1.0767958164215088, -1.02278470993042, -0.9687737226486206, -0.9147627353668213, -0.8607516884803772, -0.8067406415939331, -0.7527295351028442, -0.6987185478210449, -0.644707441329956, -0.590696394443512, -0.5366853475570679, -0.4826743006706238, -0.4286632537841797, -0.3746522068977356, -0.3206411302089691, -0.266630083322525, -0.21261903643608093, -0.15860795974731445, -0.10459691286087036, -0.05058574676513672, 0.00342530757188797, 0.05743636190891266, 0.11144742369651794, 0.16545847058296204, 0.21946951746940613, 0.2734805941581726, 0.3274916410446167, 0.3815026879310608, 0.4355137348175049, 0.489524781703949, 0.5435358285903931, 0.5975469350814819, 0.6515579223632812, 0.7055690288543701, 0.7595800757408142, 0.8135911226272583, 0.8676021695137024, 0.9216132164001465, 0.9756243228912354, 1.0296353101730347, 1.0836464166641235, 1.1376574039459229, 1.1916685104370117, 1.2456796169281006, 1.2996907234191895, 1.3537017107009888, 1.4077128171920776, 1.461723804473877, 1.5157349109649658, 1.5697460174560547, 1.623757004737854, 1.6777679920196533]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 10.0, 8.0, 12.0, 15.0, 22.0, 27.0, 43.0, 66.0, 97.0, 150.0, 262.0, 465.0, 905.0, 2345.0, 8555.0, 126287.0, 4029817.0, 18685.0, 3931.0, 1322.0, 568.0, 277.0, 127.0, 106.0, 58.0, 29.0, 22.0, 22.0, 13.0, 7.0, 7.0, 3.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4267578125, -1.377899169921875, -1.32904052734375, -1.280181884765625, -1.2313232421875, -1.182464599609375, -1.13360595703125, -1.084747314453125, -1.035888671875, -0.987030029296875, -0.93817138671875, -0.889312744140625, -0.8404541015625, -0.791595458984375, -0.74273681640625, -0.693878173828125, -0.64501953125, -0.596160888671875, -0.54730224609375, -0.498443603515625, -0.4495849609375, -0.400726318359375, -0.35186767578125, -0.303009033203125, -0.254150390625, -0.205291748046875, -0.15643310546875, -0.107574462890625, -0.0587158203125, -0.009857177734375, 0.03900146484375, 0.087860107421875, 0.13671875, 0.185577392578125, 0.23443603515625, 0.283294677734375, 0.3321533203125, 0.381011962890625, 0.42987060546875, 0.478729248046875, 0.527587890625, 0.576446533203125, 0.62530517578125, 0.674163818359375, 0.7230224609375, 0.771881103515625, 0.82073974609375, 0.869598388671875, 0.91845703125, 0.967315673828125, 1.01617431640625, 1.065032958984375, 1.1138916015625, 1.162750244140625, 1.21160888671875, 1.260467529296875, 1.309326171875, 1.358184814453125, 1.40704345703125, 1.455902099609375, 1.5047607421875, 1.553619384765625, 1.60247802734375, 1.651336669921875, 1.7001953125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 5.0, 8.0, 9.0, 11.0, 13.0, 18.0, 32.0, 47.0, 47.0, 39.0, 51.0, 71.0, 62.0, 72.0, 71.0, 53.0, 59.0, 50.0, 52.0, 40.0, 45.0, 36.0, 25.0, 26.0, 6.0, 11.0, 10.0, 6.0, 6.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.13330078125, -0.12950611114501953, -0.12571144104003906, -0.1219167709350586, -0.11812210083007812, -0.11432743072509766, -0.11053276062011719, -0.10673809051513672, -0.10294342041015625, -0.09914875030517578, -0.09535408020019531, -0.09155941009521484, -0.08776473999023438, -0.0839700698852539, -0.08017539978027344, -0.07638072967529297, -0.0725860595703125, -0.06879138946533203, -0.06499671936035156, -0.061202049255371094, -0.057407379150390625, -0.053612709045410156, -0.04981803894042969, -0.04602336883544922, -0.04222869873046875, -0.03843402862548828, -0.03463935852050781, -0.030844688415527344, -0.027050018310546875, -0.023255348205566406, -0.019460678100585938, -0.01566600799560547, -0.011871337890625, -0.008076667785644531, -0.0042819976806640625, -0.00048732757568359375, 0.003307342529296875, 0.007102012634277344, 0.010896682739257812, 0.014691352844238281, 0.01848602294921875, 0.02228069305419922, 0.026075363159179688, 0.029870033264160156, 0.033664703369140625, 0.037459373474121094, 0.04125404357910156, 0.04504871368408203, 0.0488433837890625, 0.05263805389404297, 0.05643272399902344, 0.060227394104003906, 0.06402206420898438, 0.06781673431396484, 0.07161140441894531, 0.07540607452392578, 0.07920074462890625, 0.08299541473388672, 0.08679008483886719, 0.09058475494384766, 0.09437942504882812, 0.0981740951538086, 0.10196876525878906, 0.10576343536376953, 0.10955810546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 8.0, 8.0, 30.0, 44.0, 75.0, 130.0, 267.0, 728.0, 4631.0, 4083887.0, 101117.0, 2356.0, 506.0, 207.0, 123.0, 63.0, 50.0, 20.0, 13.0, 9.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.330078125, -2.223480224609375, -2.11688232421875, -2.010284423828125, -1.9036865234375, -1.797088623046875, -1.69049072265625, -1.583892822265625, -1.477294921875, -1.370697021484375, -1.26409912109375, -1.157501220703125, -1.0509033203125, -0.944305419921875, -0.83770751953125, -0.731109619140625, -0.62451171875, -0.517913818359375, -0.41131591796875, -0.304718017578125, -0.1981201171875, -0.091522216796875, 0.01507568359375, 0.121673583984375, 0.228271484375, 0.334869384765625, 0.44146728515625, 0.548065185546875, 0.6546630859375, 0.761260986328125, 0.86785888671875, 0.974456787109375, 1.0810546875, 1.187652587890625, 1.29425048828125, 1.400848388671875, 1.5074462890625, 1.614044189453125, 1.72064208984375, 1.827239990234375, 1.933837890625, 2.040435791015625, 2.14703369140625, 2.253631591796875, 2.3602294921875, 2.466827392578125, 2.57342529296875, 2.680023193359375, 2.78662109375, 2.893218994140625, 2.99981689453125, 3.106414794921875, 3.2130126953125, 3.319610595703125, 3.42620849609375, 3.532806396484375, 3.639404296875, 3.746002197265625, 3.85260009765625, 3.959197998046875, 4.0657958984375, 4.172393798828125, 4.27899169921875, 4.385589599609375, 4.4921875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 16.0, 25.0, 30.0, 99.0, 1660.0, 2048.0, 107.0, 53.0, 17.0, 9.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5224609375, -0.4976043701171875, -0.472747802734375, -0.4478912353515625, -0.42303466796875, -0.3981781005859375, -0.373321533203125, -0.3484649658203125, -0.3236083984375, -0.2987518310546875, -0.273895263671875, -0.2490386962890625, -0.22418212890625, -0.1993255615234375, -0.174468994140625, -0.1496124267578125, -0.124755859375, -0.0998992919921875, -0.075042724609375, -0.0501861572265625, -0.02532958984375, -0.0004730224609375, 0.024383544921875, 0.0492401123046875, 0.0740966796875, 0.0989532470703125, 0.123809814453125, 0.1486663818359375, 0.17352294921875, 0.1983795166015625, 0.223236083984375, 0.2480926513671875, 0.27294921875, 0.2978057861328125, 0.322662353515625, 0.3475189208984375, 0.37237548828125, 0.3972320556640625, 0.422088623046875, 0.4469451904296875, 0.4718017578125, 0.4966583251953125, 0.521514892578125, 0.5463714599609375, 0.57122802734375, 0.5960845947265625, 0.620941162109375, 0.6457977294921875, 0.670654296875, 0.6955108642578125, 0.720367431640625, 0.7452239990234375, 0.77008056640625, 0.7949371337890625, 0.819793701171875, 0.8446502685546875, 0.8695068359375, 0.8943634033203125, 0.919219970703125, 0.9440765380859375, 0.96893310546875, 0.9937896728515625, 1.018646240234375, 1.0435028076171875, 1.068359375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 19.0, 60.0, 235.0, 463.0, 145.0, 52.0, 8.0, 10.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.52065372467041, -6.373555660247803, -6.226457595825195, -6.079359531402588, -5.9322614669799805, -5.785163879394531, -5.638065814971924, -5.490967750549316, -5.343869686126709, -5.196771621704102, -5.049673557281494, -4.902575492858887, -4.7554779052734375, -4.60837984085083, -4.461281776428223, -4.314183712005615, -4.167085647583008, -4.0199875831604, -3.872889518737793, -3.7257916927337646, -3.5786936283111572, -3.43159556388855, -3.2844977378845215, -3.137399673461914, -2.9903016090393066, -2.843203544616699, -2.696105480194092, -2.5490076541900635, -2.401909589767456, -2.2548115253448486, -2.1077136993408203, -1.960615634918213, -1.8135180473327637, -1.6664199829101562, -1.5193220376968384, -1.3722240924835205, -1.225126028060913, -1.0780279636383057, -0.9309300184249878, -0.7838320732116699, -0.6367340087890625, -0.48963600397109985, -0.3425379991531372, -0.19543999433517456, -0.048341989517211914, 0.09875601530075073, 0.24585402011871338, 0.39295196533203125, 0.5400500297546387, 0.6871480345726013, 0.834246039390564, 0.9813440442085266, 1.1284420490264893, 1.2755401134490967, 1.4226380586624146, 1.5697360038757324, 1.7168340682983398, 1.8639321327209473, 2.0110301971435547, 2.158128023147583, 2.3052260875701904, 2.452324151992798, 2.599421977996826, 2.7465200424194336, 2.893618106842041]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 6.0, 11.0, 19.0, 26.0, 33.0, 50.0, 71.0, 96.0, 103.0, 113.0, 90.0, 92.0, 79.0, 76.0, 48.0, 28.0, 24.0, 14.0, 9.0, 9.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7571296691894531, -1.6938321590423584, -1.6305346488952637, -1.567237138748169, -1.5039396286010742, -1.4406421184539795, -1.3773447275161743, -1.3140472173690796, -1.2507497072219849, -1.1874521970748901, -1.1241546869277954, -1.0608571767807007, -0.9975597262382507, -0.934262216091156, -0.870964765548706, -0.8076672554016113, -0.7443697452545166, -0.6810722351074219, -0.6177747249603271, -0.5544772744178772, -0.49117976427078247, -0.42788225412368774, -0.3645847737789154, -0.30128729343414307, -0.23798978328704834, -0.1746922880411148, -0.11139479279518127, -0.04809729754924774, 0.015200197696685791, 0.07849770784378052, 0.14179518818855286, 0.2050926685333252, 0.2683901786804199, 0.33168768882751465, 0.394985169172287, 0.4582826495170593, 0.521580159664154, 0.5848776698112488, 0.6481751203536987, 0.7114726305007935, 0.7747701406478882, 0.8380676507949829, 0.9013651609420776, 0.9646626114845276, 1.0279600620269775, 1.0912575721740723, 1.154555082321167, 1.2178525924682617, 1.2811501026153564, 1.3444476127624512, 1.407745122909546, 1.4710426330566406, 1.5343401432037354, 1.59763765335083, 1.6609350442886353, 1.72423255443573, 1.7875300645828247, 1.8508275747299194, 1.9141250848770142, 1.9774225950241089, 2.040719985961914, 2.104017496109009, 2.1673150062561035, 2.2306125164031982, 2.293910026550293]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 8.0, 7.0, 10.0, 20.0, 23.0, 42.0, 59.0, 86.0, 182.0, 242.0, 435.0, 845.0, 1920.0, 5179.0, 19603.0, 150139.0, 743585.0, 102610.0, 15699.0, 4275.0, 1751.0, 746.0, 411.0, 258.0, 142.0, 113.0, 46.0, 25.0, 27.0, 18.0, 12.0, 11.0, 2.0, 2.0, 4.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.78369140625, -0.7570571899414062, -0.7304229736328125, -0.7037887573242188, -0.677154541015625, -0.6505203247070312, -0.6238861083984375, -0.5972518920898438, -0.57061767578125, -0.5439834594726562, -0.5173492431640625, -0.49071502685546875, -0.464080810546875, -0.43744659423828125, -0.4108123779296875, -0.38417816162109375, -0.3575439453125, -0.33090972900390625, -0.3042755126953125, -0.27764129638671875, -0.251007080078125, -0.22437286376953125, -0.1977386474609375, -0.17110443115234375, -0.14447021484375, -0.11783599853515625, -0.0912017822265625, -0.06456756591796875, -0.037933349609375, -0.01129913330078125, 0.0153350830078125, 0.04196929931640625, 0.068603515625, 0.09523773193359375, 0.1218719482421875, 0.14850616455078125, 0.175140380859375, 0.20177459716796875, 0.2284088134765625, 0.25504302978515625, 0.28167724609375, 0.30831146240234375, 0.3349456787109375, 0.36157989501953125, 0.388214111328125, 0.41484832763671875, 0.4414825439453125, 0.46811676025390625, 0.4947509765625, 0.5213851928710938, 0.5480194091796875, 0.5746536254882812, 0.601287841796875, 0.6279220581054688, 0.6545562744140625, 0.6811904907226562, 0.70782470703125, 0.7344589233398438, 0.7610931396484375, 0.7877273559570312, 0.814361572265625, 0.8409957885742188, 0.8676300048828125, 0.8942642211914062, 0.9208984375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 5.0, 10.0, 11.0, 17.0, 18.0, 18.0, 33.0, 42.0, 44.0, 58.0, 52.0, 61.0, 53.0, 57.0, 55.0, 68.0, 51.0, 42.0, 41.0, 50.0, 30.0, 43.0, 22.0, 19.0, 20.0, 12.0, 11.0, 10.0, 4.0, 5.0, 5.0, 3.0, 4.0, 6.0, 2.0, 0.0, 1.0, 5.0], "bins": [-0.1470947265625, -0.1434154510498047, -0.13973617553710938, -0.13605690002441406, -0.13237762451171875, -0.12869834899902344, -0.12501907348632812, -0.12133979797363281, -0.1176605224609375, -0.11398124694824219, -0.11030197143554688, -0.10662269592285156, -0.10294342041015625, -0.09926414489746094, -0.09558486938476562, -0.09190559387207031, -0.088226318359375, -0.08454704284667969, -0.08086776733398438, -0.07718849182128906, -0.07350921630859375, -0.06982994079589844, -0.06615066528320312, -0.06247138977050781, -0.0587921142578125, -0.05511283874511719, -0.051433563232421875, -0.04775428771972656, -0.04407501220703125, -0.04039573669433594, -0.036716461181640625, -0.03303718566894531, -0.02935791015625, -0.025678634643554688, -0.021999359130859375, -0.018320083618164062, -0.01464080810546875, -0.010961532592773438, -0.007282257080078125, -0.0036029815673828125, 7.62939453125e-05, 0.0037555694580078125, 0.007434844970703125, 0.011114120483398438, 0.01479339599609375, 0.018472671508789062, 0.022151947021484375, 0.025831222534179688, 0.029510498046875, 0.03318977355957031, 0.036869049072265625, 0.04054832458496094, 0.04422760009765625, 0.04790687561035156, 0.051586151123046875, 0.05526542663574219, 0.0589447021484375, 0.06262397766113281, 0.06630325317382812, 0.06998252868652344, 0.07366180419921875, 0.07734107971191406, 0.08102035522460938, 0.08469963073730469, 0.08837890625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 6.0, 6.0, 15.0, 21.0, 18.0, 43.0, 54.0, 97.0, 160.0, 293.0, 625.0, 1668.0, 5080.0, 20011.0, 139923.0, 710948.0, 141235.0, 20306.0, 5017.0, 1643.0, 628.0, 297.0, 170.0, 94.0, 69.0, 29.0, 13.0, 13.0, 20.0, 8.0, 8.0, 9.0, 5.0, 2.0, 8.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.525390625, -0.5087127685546875, -0.492034912109375, -0.4753570556640625, -0.45867919921875, -0.4420013427734375, -0.425323486328125, -0.4086456298828125, -0.3919677734375, -0.3752899169921875, -0.358612060546875, -0.3419342041015625, -0.32525634765625, -0.3085784912109375, -0.291900634765625, -0.2752227783203125, -0.258544921875, -0.2418670654296875, -0.225189208984375, -0.2085113525390625, -0.19183349609375, -0.1751556396484375, -0.158477783203125, -0.1417999267578125, -0.1251220703125, -0.1084442138671875, -0.091766357421875, -0.0750885009765625, -0.05841064453125, -0.0417327880859375, -0.025054931640625, -0.0083770751953125, 0.00830078125, 0.0249786376953125, 0.041656494140625, 0.0583343505859375, 0.07501220703125, 0.0916900634765625, 0.108367919921875, 0.1250457763671875, 0.1417236328125, 0.1584014892578125, 0.175079345703125, 0.1917572021484375, 0.20843505859375, 0.2251129150390625, 0.241790771484375, 0.2584686279296875, 0.275146484375, 0.2918243408203125, 0.308502197265625, 0.3251800537109375, 0.34185791015625, 0.3585357666015625, 0.375213623046875, 0.3918914794921875, 0.4085693359375, 0.4252471923828125, 0.441925048828125, 0.4586029052734375, 0.47528076171875, 0.4919586181640625, 0.508636474609375, 0.5253143310546875, 0.5419921875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 5.0, 8.0, 15.0, 16.0, 14.0, 14.0, 19.0, 20.0, 24.0, 27.0, 31.0, 38.0, 36.0, 40.0, 44.0, 51.0, 54.0, 61.0, 39.0, 49.0, 51.0, 36.0, 36.0, 39.0, 36.0, 28.0, 32.0, 16.0, 23.0, 23.0, 17.0, 10.0, 9.0, 9.0, 7.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3583984375, -0.34630584716796875, -0.3342132568359375, -0.32212066650390625, -0.310028076171875, -0.29793548583984375, -0.2858428955078125, -0.27375030517578125, -0.26165771484375, -0.24956512451171875, -0.2374725341796875, -0.22537994384765625, -0.213287353515625, -0.20119476318359375, -0.1891021728515625, -0.17700958251953125, -0.1649169921875, -0.15282440185546875, -0.1407318115234375, -0.12863922119140625, -0.116546630859375, -0.10445404052734375, -0.0923614501953125, -0.08026885986328125, -0.06817626953125, -0.05608367919921875, -0.0439910888671875, -0.03189849853515625, -0.019805908203125, -0.00771331787109375, 0.0043792724609375, 0.01647186279296875, 0.028564453125, 0.04065704345703125, 0.0527496337890625, 0.06484222412109375, 0.076934814453125, 0.08902740478515625, 0.1011199951171875, 0.11321258544921875, 0.12530517578125, 0.13739776611328125, 0.1494903564453125, 0.16158294677734375, 0.173675537109375, 0.18576812744140625, 0.1978607177734375, 0.20995330810546875, 0.2220458984375, 0.23413848876953125, 0.2462310791015625, 0.25832366943359375, 0.270416259765625, 0.28250885009765625, 0.2946014404296875, 0.30669403076171875, 0.31878662109375, 0.33087921142578125, 0.3429718017578125, 0.35506439208984375, 0.367156982421875, 0.37924957275390625, 0.3913421630859375, 0.40343475341796875, 0.41552734375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 7.0, 9.0, 5.0, 12.0, 19.0, 24.0, 29.0, 60.0, 83.0, 164.0, 254.0, 479.0, 1073.0, 2888.0, 10464.0, 61322.0, 593243.0, 333653.0, 33931.0, 6971.0, 2072.0, 843.0, 392.0, 203.0, 108.0, 83.0, 50.0, 37.0, 25.0, 13.0, 8.0, 7.0, 6.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1461181640625, -0.14067649841308594, -0.13523483276367188, -0.1297931671142578, -0.12435150146484375, -0.11890983581542969, -0.11346817016601562, -0.10802650451660156, -0.1025848388671875, -0.09714317321777344, -0.09170150756835938, -0.08625984191894531, -0.08081817626953125, -0.07537651062011719, -0.06993484497070312, -0.06449317932128906, -0.059051513671875, -0.05360984802246094, -0.048168182373046875, -0.04272651672363281, -0.03728485107421875, -0.03184318542480469, -0.026401519775390625, -0.020959854125976562, -0.0155181884765625, -0.010076522827148438, -0.004634857177734375, 0.0008068084716796875, 0.00624847412109375, 0.011690139770507812, 0.017131805419921875, 0.022573471069335938, 0.02801513671875, 0.03345680236816406, 0.038898468017578125, 0.04434013366699219, 0.04978179931640625, 0.05522346496582031, 0.060665130615234375, 0.06610679626464844, 0.0715484619140625, 0.07699012756347656, 0.08243179321289062, 0.08787345886230469, 0.09331512451171875, 0.09875679016113281, 0.10419845581054688, 0.10964012145996094, 0.115081787109375, 0.12052345275878906, 0.12596511840820312, 0.1314067840576172, 0.13684844970703125, 0.1422901153564453, 0.14773178100585938, 0.15317344665527344, 0.1586151123046875, 0.16405677795410156, 0.16949844360351562, 0.1749401092529297, 0.18038177490234375, 0.1858234405517578, 0.19126510620117188, 0.19670677185058594, 0.2021484375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 7.0, 3.0, 4.0, 10.0, 17.0, 15.0, 25.0, 25.0, 43.0, 70.0, 81.0, 138.0, 145.0, 111.0, 84.0, 57.0, 35.0, 25.0, 28.0, 20.0, 10.0, 7.0, 12.0, 6.0, 4.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.647804260253906e-05, -3.5313889384269714e-05, -3.4149736166000366e-05, -3.298558294773102e-05, -3.182142972946167e-05, -3.065727651119232e-05, -2.9493123292922974e-05, -2.8328970074653625e-05, -2.7164816856384277e-05, -2.600066363811493e-05, -2.483651041984558e-05, -2.3672357201576233e-05, -2.2508203983306885e-05, -2.1344050765037537e-05, -2.017989754676819e-05, -1.901574432849884e-05, -1.7851591110229492e-05, -1.6687437891960144e-05, -1.5523284673690796e-05, -1.4359131455421448e-05, -1.31949782371521e-05, -1.2030825018882751e-05, -1.0866671800613403e-05, -9.702518582344055e-06, -8.538365364074707e-06, -7.374212145805359e-06, -6.210058927536011e-06, -5.045905709266663e-06, -3.8817524909973145e-06, -2.7175992727279663e-06, -1.5534460544586182e-06, -3.8929283618927e-07, 7.748603820800781e-07, 1.9390136003494263e-06, 3.1031668186187744e-06, 4.2673200368881226e-06, 5.431473255157471e-06, 6.595626473426819e-06, 7.759779691696167e-06, 8.923932909965515e-06, 1.0088086128234863e-05, 1.1252239346504211e-05, 1.241639256477356e-05, 1.3580545783042908e-05, 1.4744699001312256e-05, 1.5908852219581604e-05, 1.7073005437850952e-05, 1.82371586561203e-05, 1.940131187438965e-05, 2.0565465092658997e-05, 2.1729618310928345e-05, 2.2893771529197693e-05, 2.405792474746704e-05, 2.522207796573639e-05, 2.6386231184005737e-05, 2.7550384402275085e-05, 2.8714537620544434e-05, 2.9878690838813782e-05, 3.104284405708313e-05, 3.220699727535248e-05, 3.3371150493621826e-05, 3.4535303711891174e-05, 3.569945693016052e-05, 3.686361014842987e-05, 3.802776336669922e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 15.0, 17.0, 23.0, 44.0, 94.0, 203.0, 398.0, 1141.0, 3965.0, 20100.0, 264550.0, 706593.0, 41988.0, 6629.0, 1714.0, 559.0, 265.0, 108.0, 49.0, 28.0, 21.0, 10.0, 13.0, 2.0, 2.0, 5.0, 8.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.32861328125, -0.3206329345703125, -0.312652587890625, -0.3046722412109375, -0.29669189453125, -0.2887115478515625, -0.280731201171875, -0.2727508544921875, -0.2647705078125, -0.2567901611328125, -0.248809814453125, -0.2408294677734375, -0.23284912109375, -0.2248687744140625, -0.216888427734375, -0.2089080810546875, -0.200927734375, -0.1929473876953125, -0.184967041015625, -0.1769866943359375, -0.16900634765625, -0.1610260009765625, -0.153045654296875, -0.1450653076171875, -0.1370849609375, -0.1291046142578125, -0.121124267578125, -0.1131439208984375, -0.10516357421875, -0.0971832275390625, -0.089202880859375, -0.0812225341796875, -0.0732421875, -0.0652618408203125, -0.057281494140625, -0.0493011474609375, -0.04132080078125, -0.0333404541015625, -0.025360107421875, -0.0173797607421875, -0.0093994140625, -0.0014190673828125, 0.006561279296875, 0.0145416259765625, 0.02252197265625, 0.0305023193359375, 0.038482666015625, 0.0464630126953125, 0.054443359375, 0.0624237060546875, 0.070404052734375, 0.0783843994140625, 0.08636474609375, 0.0943450927734375, 0.102325439453125, 0.1103057861328125, 0.1182861328125, 0.1262664794921875, 0.134246826171875, 0.1422271728515625, 0.15020751953125, 0.1581878662109375, 0.166168212890625, 0.1741485595703125, 0.18212890625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 6.0, 7.0, 15.0, 4.0, 22.0, 3.0, 23.0, 37.0, 58.0, 80.0, 97.0, 142.0, 107.0, 113.0, 75.0, 61.0, 49.0, 24.0, 19.0, 13.0, 10.0, 8.0, 9.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1724853515625, -0.1674365997314453, -0.16238784790039062, -0.15733909606933594, -0.15229034423828125, -0.14724159240722656, -0.14219284057617188, -0.1371440887451172, -0.1320953369140625, -0.1270465850830078, -0.12199783325195312, -0.11694908142089844, -0.11190032958984375, -0.10685157775878906, -0.10180282592773438, -0.09675407409667969, -0.091705322265625, -0.08665657043457031, -0.08160781860351562, -0.07655906677246094, -0.07151031494140625, -0.06646156311035156, -0.061412811279296875, -0.05636405944824219, -0.0513153076171875, -0.04626655578613281, -0.041217803955078125, -0.03616905212402344, -0.03112030029296875, -0.026071548461914062, -0.021022796630859375, -0.015974044799804688, -0.01092529296875, -0.0058765411376953125, -0.000827789306640625, 0.0042209625244140625, 0.00926971435546875, 0.014318466186523438, 0.019367218017578125, 0.024415969848632812, 0.0294647216796875, 0.03451347351074219, 0.039562225341796875, 0.04461097717285156, 0.04965972900390625, 0.05470848083496094, 0.059757232666015625, 0.06480598449707031, 0.069854736328125, 0.07490348815917969, 0.07995223999023438, 0.08500099182128906, 0.09004974365234375, 0.09509849548339844, 0.10014724731445312, 0.10519599914550781, 0.1102447509765625, 0.11529350280761719, 0.12034225463867188, 0.12539100646972656, 0.13043975830078125, 0.13548851013183594, 0.14053726196289062, 0.1455860137939453, 0.150634765625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 7.0, 24.0, 196.0, 561.0, 186.0, 38.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.596883773803711, -14.302331924438477, -14.007779121398926, -13.713227272033691, -13.41867446899414, -13.124122619628906, -12.829569816589355, -12.535017967224121, -12.24046516418457, -11.945913314819336, -11.651360511779785, -11.35680866241455, -11.062255859375, -10.767704010009766, -10.473151206970215, -10.17859935760498, -9.884047508239746, -9.589495658874512, -9.294942855834961, -9.000391006469727, -8.705838203430176, -8.411286354064941, -8.11673355102539, -7.822181701660156, -7.527629375457764, -7.233077049255371, -6.9385247230529785, -6.643972396850586, -6.349420547485352, -6.054867744445801, -5.760315895080566, -5.465763568878174, -5.171210289001465, -4.876657962799072, -4.58210563659668, -4.287553310394287, -3.9930012226104736, -3.698448896408081, -3.4038968086242676, -3.109344482421875, -2.8147921562194824, -2.52023983001709, -2.2256875038146973, -1.9311354160308838, -1.6365830898284912, -1.3420307636260986, -1.0474785566329956, -0.7529263496398926, -0.4583740234375, -0.1638217568397522, 0.1307305097579956, 0.4252827763557434, 0.7198350429534912, 1.0143873691558838, 1.3089395761489868, 1.6034917831420898, 1.8980441093444824, 2.192596435546875, 2.4871487617492676, 2.781700849533081, 3.0762531757354736, 3.370805501937866, 3.6653575897216797, 3.9599099159240723, 4.254462242126465]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 6.0, 5.0, 7.0, 9.0, 15.0, 12.0, 26.0, 21.0, 14.0, 23.0, 30.0, 32.0, 33.0, 44.0, 46.0, 33.0, 47.0, 36.0, 35.0, 49.0, 39.0, 49.0, 38.0, 53.0, 49.0, 30.0, 22.0, 32.0, 24.0, 24.0, 14.0, 10.0, 15.0, 14.0, 10.0, 20.0, 8.0, 8.0, 8.0, 4.0, 2.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7205265760421753, -1.66422438621521, -1.6079221963882446, -1.5516200065612793, -1.495317816734314, -1.4390156269073486, -1.3827133178710938, -1.326411247253418, -1.270108938217163, -1.2138067483901978, -1.1575045585632324, -1.101202368736267, -1.0449001789093018, -0.9885979890823364, -0.9322957396507263, -0.875993549823761, -0.8196914196014404, -0.7633892297744751, -0.7070870399475098, -0.6507848501205444, -0.5944826602935791, -0.5381804704666138, -0.48187822103500366, -0.42557603120803833, -0.369273841381073, -0.31297165155410767, -0.25666946172714233, -0.20036724209785461, -0.14406505227088928, -0.08776286244392395, -0.03146064281463623, 0.0248415470123291, 0.08114361763000488, 0.13744580745697021, 0.19374801218509674, 0.25005021691322327, 0.3063524067401886, 0.36265459656715393, 0.41895681619644165, 0.475259006023407, 0.5315611958503723, 0.5878633856773376, 0.644165575504303, 0.7004678249359131, 0.7567700147628784, 0.8130722045898438, 0.8693743944168091, 0.9256765842437744, 0.9819787740707397, 1.038280963897705, 1.0945831537246704, 1.1508853435516357, 1.207187533378601, 1.2634897232055664, 1.3197920322418213, 1.376094102859497, 1.432396411895752, 1.4886986017227173, 1.5450007915496826, 1.601302981376648, 1.6576051712036133, 1.7139073610305786, 1.770209550857544, 1.8265118598937988, 1.8828139305114746]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 6.0, 2.0, 7.0, 7.0, 8.0, 5.0, 5.0, 12.0, 17.0, 24.0, 28.0, 64.0, 106.0, 135.0, 268.0, 502.0, 876.0, 2649.0, 19050.0, 4152345.0, 14031.0, 2317.0, 836.0, 401.0, 224.0, 130.0, 84.0, 34.0, 31.0, 19.0, 12.0, 8.0, 8.0, 5.0, 10.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.5390625, -2.460784912109375, -2.38250732421875, -2.304229736328125, -2.2259521484375, -2.147674560546875, -2.06939697265625, -1.991119384765625, -1.912841796875, -1.834564208984375, -1.75628662109375, -1.678009033203125, -1.5997314453125, -1.521453857421875, -1.44317626953125, -1.364898681640625, -1.28662109375, -1.208343505859375, -1.13006591796875, -1.051788330078125, -0.9735107421875, -0.895233154296875, -0.81695556640625, -0.738677978515625, -0.660400390625, -0.582122802734375, -0.50384521484375, -0.425567626953125, -0.3472900390625, -0.269012451171875, -0.19073486328125, -0.112457275390625, -0.0341796875, 0.044097900390625, 0.12237548828125, 0.200653076171875, 0.2789306640625, 0.357208251953125, 0.43548583984375, 0.513763427734375, 0.592041015625, 0.670318603515625, 0.74859619140625, 0.826873779296875, 0.9051513671875, 0.983428955078125, 1.06170654296875, 1.139984130859375, 1.21826171875, 1.296539306640625, 1.37481689453125, 1.453094482421875, 1.5313720703125, 1.609649658203125, 1.68792724609375, 1.766204833984375, 1.844482421875, 1.922760009765625, 2.00103759765625, 2.079315185546875, 2.1575927734375, 2.235870361328125, 2.31414794921875, 2.392425537109375, 2.470703125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 7.0, 4.0, 10.0, 15.0, 14.0, 12.0, 26.0, 29.0, 33.0, 48.0, 51.0, 46.0, 68.0, 60.0, 53.0, 59.0, 60.0, 55.0, 50.0, 44.0, 44.0, 30.0, 31.0, 27.0, 25.0, 20.0, 15.0, 18.0, 9.0, 5.0, 8.0, 4.0, 1.0, 6.0, 3.0, 4.0, 6.0, 1.0, 1.0], "bins": [-0.150146484375, -0.14642906188964844, -0.14271163940429688, -0.1389942169189453, -0.13527679443359375, -0.1315593719482422, -0.12784194946289062, -0.12412452697753906, -0.1204071044921875, -0.11668968200683594, -0.11297225952148438, -0.10925483703613281, -0.10553741455078125, -0.10181999206542969, -0.09810256958007812, -0.09438514709472656, -0.090667724609375, -0.08695030212402344, -0.08323287963867188, -0.07951545715332031, -0.07579803466796875, -0.07208061218261719, -0.06836318969726562, -0.06464576721191406, -0.0609283447265625, -0.05721092224121094, -0.053493499755859375, -0.04977607727050781, -0.04605865478515625, -0.04234123229980469, -0.038623809814453125, -0.03490638732910156, -0.03118896484375, -0.027471542358398438, -0.023754119873046875, -0.020036697387695312, -0.01631927490234375, -0.012601852416992188, -0.008884429931640625, -0.0051670074462890625, -0.0014495849609375, 0.0022678375244140625, 0.005985260009765625, 0.009702682495117188, 0.01342010498046875, 0.017137527465820312, 0.020854949951171875, 0.024572372436523438, 0.028289794921875, 0.03200721740722656, 0.035724639892578125, 0.03944206237792969, 0.04315948486328125, 0.04687690734863281, 0.050594329833984375, 0.05431175231933594, 0.0580291748046875, 0.06174659729003906, 0.06546401977539062, 0.06918144226074219, 0.07289886474609375, 0.07661628723144531, 0.08033370971679688, 0.08405113220214844, 0.0877685546875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 9.0, 7.0, 5.0, 15.0, 13.0, 24.0, 33.0, 43.0, 58.0, 80.0, 163.0, 458.0, 3053.0, 4183549.0, 5697.0, 577.0, 170.0, 99.0, 61.0, 48.0, 40.0, 24.0, 22.0, 16.0, 9.0, 7.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.375, -4.1395263671875, -3.904052734375, -3.6685791015625, -3.43310546875, -3.1976318359375, -2.962158203125, -2.7266845703125, -2.4912109375, -2.2557373046875, -2.020263671875, -1.7847900390625, -1.54931640625, -1.3138427734375, -1.078369140625, -0.8428955078125, -0.607421875, -0.3719482421875, -0.136474609375, 0.0989990234375, 0.33447265625, 0.5699462890625, 0.805419921875, 1.0408935546875, 1.2763671875, 1.5118408203125, 1.747314453125, 1.9827880859375, 2.21826171875, 2.4537353515625, 2.689208984375, 2.9246826171875, 3.16015625, 3.3956298828125, 3.631103515625, 3.8665771484375, 4.10205078125, 4.3375244140625, 4.572998046875, 4.8084716796875, 5.0439453125, 5.2794189453125, 5.514892578125, 5.7503662109375, 5.98583984375, 6.2213134765625, 6.456787109375, 6.6922607421875, 6.927734375, 7.1632080078125, 7.398681640625, 7.6341552734375, 7.86962890625, 8.1051025390625, 8.340576171875, 8.5760498046875, 8.8115234375, 9.0469970703125, 9.282470703125, 9.5179443359375, 9.75341796875, 9.9888916015625, 10.224365234375, 10.4598388671875, 10.6953125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 9.0, 24.0, 127.0, 3803.0, 87.0, 25.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75634765625, -0.7039718627929688, -0.6515960693359375, -0.5992202758789062, -0.546844482421875, -0.49446868896484375, -0.4420928955078125, -0.38971710205078125, -0.33734130859375, -0.28496551513671875, -0.2325897216796875, -0.18021392822265625, -0.127838134765625, -0.07546234130859375, -0.0230865478515625, 0.02928924560546875, 0.0816650390625, 0.13404083251953125, 0.1864166259765625, 0.23879241943359375, 0.291168212890625, 0.34354400634765625, 0.3959197998046875, 0.44829559326171875, 0.50067138671875, 0.5530471801757812, 0.6054229736328125, 0.6577987670898438, 0.710174560546875, 0.7625503540039062, 0.8149261474609375, 0.8673019409179688, 0.919677734375, 0.9720535278320312, 1.0244293212890625, 1.0768051147460938, 1.129180908203125, 1.1815567016601562, 1.2339324951171875, 1.2863082885742188, 1.33868408203125, 1.3910598754882812, 1.4434356689453125, 1.4958114624023438, 1.548187255859375, 1.6005630493164062, 1.6529388427734375, 1.7053146362304688, 1.7576904296875, 1.8100662231445312, 1.8624420166015625, 1.9148178100585938, 1.967193603515625, 2.0195693969726562, 2.0719451904296875, 2.1243209838867188, 2.17669677734375, 2.2290725708007812, 2.2814483642578125, 2.3338241577148438, 2.386199951171875, 2.4385757446289062, 2.4909515380859375, 2.5433273315429688, 2.595703125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 8.0, 12.0, 24.0, 79.0, 446.0, 324.0, 68.0, 28.0, 15.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.499883651733398, -6.258271217346191, -6.016658782958984, -5.775046348571777, -5.53343391418457, -5.291821479797363, -5.050209045410156, -4.808596611022949, -4.566984176635742, -4.325371742248535, -4.083759307861328, -3.842146873474121, -3.600534439086914, -3.358922004699707, -3.117309808731079, -2.875697374343872, -2.634085178375244, -2.392472743988037, -2.15086030960083, -1.9092479944229126, -1.6676355600357056, -1.4260231256484985, -1.184410810470581, -0.942798376083374, -0.701185941696167, -0.45957353711128235, -0.2179611325263977, 0.02365124225616455, 0.2652636766433716, 0.5068761110305786, 0.7484884262084961, 0.9901008605957031, 1.2317132949829102, 1.4733257293701172, 1.7149381637573242, 1.9565504789352417, 2.1981630325317383, 2.4397754669189453, 2.6813876628875732, 2.9230000972747803, 3.1646125316619873, 3.4062249660491943, 3.6478374004364014, 3.8894495964050293, 4.131062030792236, 4.372674465179443, 4.61428689956665, 4.855899333953857, 5.0975117683410645, 5.3391242027282715, 5.5807366371154785, 5.8223490715026855, 6.063961505889893, 6.3055739402771, 6.547185897827148, 6.7887983322143555, 7.0304107666015625, 7.2720232009887695, 7.513635635375977, 7.755248069763184, 7.996860504150391, 8.238472938537598, 8.480085372924805, 8.721697807312012, 8.963310241699219]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 3.0, 11.0, 22.0, 35.0, 82.0, 122.0, 167.0, 148.0, 146.0, 126.0, 62.0, 35.0, 10.0, 16.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.834344863891602, -4.701873302459717, -4.569401741027832, -4.436930179595947, -4.3044586181640625, -4.171987056732178, -4.039515495300293, -3.907043933868408, -3.7745723724365234, -3.6421008110046387, -3.509629249572754, -3.377157688140869, -3.2446861267089844, -3.1122145652770996, -2.979743003845215, -2.84727144241333, -2.7148001194000244, -2.5823285579681396, -2.449856996536255, -2.31738543510437, -2.1849138736724854, -2.0524423122406006, -1.9199708700180054, -1.7874993085861206, -1.6550277471542358, -1.522556185722351, -1.3900846242904663, -1.257613182067871, -1.1251416206359863, -0.9926699995994568, -0.8601984977722168, -0.727726936340332, -0.5952553749084473, -0.4627838134765625, -0.3303122818470001, -0.19784075021743774, -0.06536918878555298, 0.06710237264633179, 0.19957387447357178, 0.33204543590545654, 0.4645169973373413, 0.5969885587692261, 0.7294601202011108, 0.8619316220283508, 0.9944031834602356, 1.1268746852874756, 1.2593462467193604, 1.3918178081512451, 1.5242893695831299, 1.6567609310150146, 1.7892324924468994, 1.9217040538787842, 2.054175615310669, 2.1866471767425537, 2.3191184997558594, 2.451590061187744, 2.584061622619629, 2.7165331840515137, 2.8490047454833984, 2.981476306915283, 3.113947868347168, 3.2464194297790527, 3.3788909912109375, 3.5113625526428223, 3.643834114074707]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 4.0, 10.0, 15.0, 21.0, 29.0, 34.0, 42.0, 70.0, 94.0, 136.0, 218.0, 313.0, 552.0, 985.0, 1825.0, 4039.0, 10507.0, 37414.0, 233058.0, 628491.0, 96637.0, 20911.0, 6906.0, 2843.0, 1386.0, 735.0, 453.0, 248.0, 179.0, 113.0, 81.0, 60.0, 38.0, 32.0, 16.0, 15.0, 11.0, 7.0, 6.0, 3.0, 5.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.71826171875, -0.6953048706054688, -0.6723480224609375, -0.6493911743164062, -0.626434326171875, -0.6034774780273438, -0.5805206298828125, -0.5575637817382812, -0.53460693359375, -0.5116500854492188, -0.4886932373046875, -0.46573638916015625, -0.442779541015625, -0.41982269287109375, -0.3968658447265625, -0.37390899658203125, -0.3509521484375, -0.32799530029296875, -0.3050384521484375, -0.28208160400390625, -0.259124755859375, -0.23616790771484375, -0.2132110595703125, -0.19025421142578125, -0.16729736328125, -0.14434051513671875, -0.1213836669921875, -0.09842681884765625, -0.075469970703125, -0.05251312255859375, -0.0295562744140625, -0.00659942626953125, 0.016357421875, 0.03931427001953125, 0.0622711181640625, 0.08522796630859375, 0.108184814453125, 0.13114166259765625, 0.1540985107421875, 0.17705535888671875, 0.20001220703125, 0.22296905517578125, 0.2459259033203125, 0.26888275146484375, 0.291839599609375, 0.31479644775390625, 0.3377532958984375, 0.36071014404296875, 0.3836669921875, 0.40662384033203125, 0.4295806884765625, 0.45253753662109375, 0.475494384765625, 0.49845123291015625, 0.5214080810546875, 0.5443649291992188, 0.56732177734375, 0.5902786254882812, 0.6132354736328125, 0.6361923217773438, 0.659149169921875, 0.6821060180664062, 0.7050628662109375, 0.7280197143554688, 0.7509765625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 3.0, 3.0, 7.0, 0.0, 7.0, 13.0, 13.0, 22.0, 38.0, 41.0, 60.0, 74.0, 72.0, 78.0, 98.0, 69.0, 84.0, 75.0, 63.0, 48.0, 41.0, 23.0, 27.0, 13.0, 8.0, 8.0, 6.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255126953125, -0.24779129028320312, -0.24045562744140625, -0.23311996459960938, -0.2257843017578125, -0.21844863891601562, -0.21111297607421875, -0.20377731323242188, -0.196441650390625, -0.18910598754882812, -0.18177032470703125, -0.17443466186523438, -0.1670989990234375, -0.15976333618164062, -0.15242767333984375, -0.14509201049804688, -0.13775634765625, -0.13042068481445312, -0.12308502197265625, -0.11574935913085938, -0.1084136962890625, -0.10107803344726562, -0.09374237060546875, -0.08640670776367188, -0.079071044921875, -0.07173538208007812, -0.06439971923828125, -0.057064056396484375, -0.0497283935546875, -0.042392730712890625, -0.03505706787109375, -0.027721405029296875, -0.0203857421875, -0.013050079345703125, -0.00571441650390625, 0.001621246337890625, 0.0089569091796875, 0.016292572021484375, 0.02362823486328125, 0.030963897705078125, 0.038299560546875, 0.045635223388671875, 0.05297088623046875, 0.060306549072265625, 0.0676422119140625, 0.07497787475585938, 0.08231353759765625, 0.08964920043945312, 0.09698486328125, 0.10432052612304688, 0.11165618896484375, 0.11899185180664062, 0.1263275146484375, 0.13366317749023438, 0.14099884033203125, 0.14833450317382812, 0.155670166015625, 0.16300582885742188, 0.17034149169921875, 0.17767715454101562, 0.1850128173828125, 0.19234848022460938, 0.19968414306640625, 0.20701980590820312, 0.21435546875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 0.0, 4.0, 6.0, 9.0, 11.0, 19.0, 23.0, 26.0, 36.0, 55.0, 112.0, 232.0, 477.0, 1105.0, 3053.0, 11389.0, 61851.0, 479376.0, 421674.0, 54080.0, 10238.0, 2782.0, 1057.0, 420.0, 214.0, 100.0, 67.0, 32.0, 29.0, 14.0, 13.0, 12.0, 9.0, 8.0, 3.0, 1.0, 3.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4775390625, -0.46105194091796875, -0.4445648193359375, -0.42807769775390625, -0.411590576171875, -0.39510345458984375, -0.3786163330078125, -0.36212921142578125, -0.34564208984375, -0.32915496826171875, -0.3126678466796875, -0.29618072509765625, -0.279693603515625, -0.26320648193359375, -0.2467193603515625, -0.23023223876953125, -0.2137451171875, -0.19725799560546875, -0.1807708740234375, -0.16428375244140625, -0.147796630859375, -0.13130950927734375, -0.1148223876953125, -0.09833526611328125, -0.08184814453125, -0.06536102294921875, -0.0488739013671875, -0.03238677978515625, -0.015899658203125, 0.00058746337890625, 0.0170745849609375, 0.03356170654296875, 0.050048828125, 0.06653594970703125, 0.0830230712890625, 0.09951019287109375, 0.115997314453125, 0.13248443603515625, 0.1489715576171875, 0.16545867919921875, 0.18194580078125, 0.19843292236328125, 0.2149200439453125, 0.23140716552734375, 0.247894287109375, 0.26438140869140625, 0.2808685302734375, 0.29735565185546875, 0.3138427734375, 0.33032989501953125, 0.3468170166015625, 0.36330413818359375, 0.379791259765625, 0.39627838134765625, 0.4127655029296875, 0.42925262451171875, 0.44573974609375, 0.46222686767578125, 0.4787139892578125, 0.49520111083984375, 0.511688232421875, 0.5281753540039062, 0.5446624755859375, 0.5611495971679688, 0.57763671875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 8.0, 7.0, 14.0, 10.0, 13.0, 19.0, 14.0, 18.0, 26.0, 27.0, 37.0, 45.0, 40.0, 42.0, 36.0, 36.0, 44.0, 54.0, 47.0, 28.0, 34.0, 41.0, 40.0, 38.0, 34.0, 33.0, 29.0, 29.0, 22.0, 16.0, 19.0, 16.0, 17.0, 19.0, 8.0, 7.0, 4.0, 3.0, 6.0, 8.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.389892578125, -0.3774566650390625, -0.365020751953125, -0.3525848388671875, -0.34014892578125, -0.3277130126953125, -0.315277099609375, -0.3028411865234375, -0.2904052734375, -0.2779693603515625, -0.265533447265625, -0.2530975341796875, -0.24066162109375, -0.2282257080078125, -0.215789794921875, -0.2033538818359375, -0.19091796875, -0.1784820556640625, -0.166046142578125, -0.1536102294921875, -0.14117431640625, -0.1287384033203125, -0.116302490234375, -0.1038665771484375, -0.0914306640625, -0.0789947509765625, -0.066558837890625, -0.0541229248046875, -0.04168701171875, -0.0292510986328125, -0.016815185546875, -0.0043792724609375, 0.008056640625, 0.0204925537109375, 0.032928466796875, 0.0453643798828125, 0.05780029296875, 0.0702362060546875, 0.082672119140625, 0.0951080322265625, 0.1075439453125, 0.1199798583984375, 0.132415771484375, 0.1448516845703125, 0.15728759765625, 0.1697235107421875, 0.182159423828125, 0.1945953369140625, 0.20703125, 0.2194671630859375, 0.231903076171875, 0.2443389892578125, 0.25677490234375, 0.2692108154296875, 0.281646728515625, 0.2940826416015625, 0.3065185546875, 0.3189544677734375, 0.331390380859375, 0.3438262939453125, 0.35626220703125, 0.3686981201171875, 0.381134033203125, 0.3935699462890625, 0.406005859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 18.0, 18.0, 38.0, 51.0, 83.0, 130.0, 252.0, 383.0, 668.0, 1316.0, 2941.0, 8656.0, 52742.0, 791991.0, 165794.0, 15466.0, 4220.0, 1741.0, 878.0, 472.0, 255.0, 178.0, 103.0, 56.0, 47.0, 27.0, 11.0, 9.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35205078125, -0.3416023254394531, -0.33115386962890625, -0.3207054138183594, -0.3102569580078125, -0.2998085021972656, -0.28936004638671875, -0.2789115905761719, -0.268463134765625, -0.2580146789550781, -0.24756622314453125, -0.23711776733398438, -0.2266693115234375, -0.21622085571289062, -0.20577239990234375, -0.19532394409179688, -0.18487548828125, -0.17442703247070312, -0.16397857666015625, -0.15353012084960938, -0.1430816650390625, -0.13263320922851562, -0.12218475341796875, -0.11173629760742188, -0.101287841796875, -0.09083938598632812, -0.08039093017578125, -0.06994247436523438, -0.0594940185546875, -0.049045562744140625, -0.03859710693359375, -0.028148651123046875, -0.0177001953125, -0.007251739501953125, 0.00319671630859375, 0.013645172119140625, 0.0240936279296875, 0.034542083740234375, 0.04499053955078125, 0.055438995361328125, 0.065887451171875, 0.07633590698242188, 0.08678436279296875, 0.09723281860351562, 0.1076812744140625, 0.11812973022460938, 0.12857818603515625, 0.13902664184570312, 0.14947509765625, 0.15992355346679688, 0.17037200927734375, 0.18082046508789062, 0.1912689208984375, 0.20171737670898438, 0.21216583251953125, 0.22261428833007812, 0.233062744140625, 0.24351119995117188, 0.25395965576171875, 0.2644081115722656, 0.2748565673828125, 0.2853050231933594, 0.29575347900390625, 0.3062019348144531, 0.316650390625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 7.0, 8.0, 12.0, 15.0, 36.0, 48.0, 96.0, 176.0, 232.0, 170.0, 81.0, 45.0, 26.0, 15.0, 7.0, 5.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.285045623779297e-05, -8.064322173595428e-05, -7.84359872341156e-05, -7.622875273227692e-05, -7.402151823043823e-05, -7.181428372859955e-05, -6.960704922676086e-05, -6.739981472492218e-05, -6.51925802230835e-05, -6.298534572124481e-05, -6.077811121940613e-05, -5.8570876717567444e-05, -5.636364221572876e-05, -5.4156407713890076e-05, -5.194917321205139e-05, -4.974193871021271e-05, -4.7534704208374023e-05, -4.532746970653534e-05, -4.3120235204696655e-05, -4.091300070285797e-05, -3.870576620101929e-05, -3.64985316991806e-05, -3.429129719734192e-05, -3.2084062695503235e-05, -2.987682819366455e-05, -2.7669593691825867e-05, -2.5462359189987183e-05, -2.32551246881485e-05, -2.1047890186309814e-05, -1.884065568447113e-05, -1.6633421182632446e-05, -1.4426186680793762e-05, -1.2218952178955078e-05, -1.0011717677116394e-05, -7.80448317527771e-06, -5.597248673439026e-06, -3.390014171600342e-06, -1.1827796697616577e-06, 1.0244548320770264e-06, 3.2316893339157104e-06, 5.4389238357543945e-06, 7.646158337593079e-06, 9.853392839431763e-06, 1.2060627341270447e-05, 1.4267861843109131e-05, 1.6475096344947815e-05, 1.86823308467865e-05, 2.0889565348625183e-05, 2.3096799850463867e-05, 2.530403435230255e-05, 2.7511268854141235e-05, 2.971850335597992e-05, 3.1925737857818604e-05, 3.413297235965729e-05, 3.634020686149597e-05, 3.8547441363334656e-05, 4.075467586517334e-05, 4.2961910367012024e-05, 4.516914486885071e-05, 4.737637937068939e-05, 4.9583613872528076e-05, 5.179084837436676e-05, 5.3998082876205444e-05, 5.620531737804413e-05, 5.841255187988281e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 8.0, 3.0, 6.0, 21.0, 29.0, 49.0, 89.0, 196.0, 496.0, 1551.0, 6150.0, 38308.0, 758732.0, 221433.0, 16595.0, 3367.0, 969.0, 302.0, 121.0, 52.0, 26.0, 16.0, 19.0, 10.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.232177734375, -0.22044754028320312, -0.20871734619140625, -0.19698715209960938, -0.1852569580078125, -0.17352676391601562, -0.16179656982421875, -0.15006637573242188, -0.138336181640625, -0.12660598754882812, -0.11487579345703125, -0.10314559936523438, -0.0914154052734375, -0.07968521118164062, -0.06795501708984375, -0.056224822998046875, -0.04449462890625, -0.032764434814453125, -0.02103424072265625, -0.009304046630859375, 0.0024261474609375, 0.014156341552734375, 0.02588653564453125, 0.037616729736328125, 0.049346923828125, 0.061077117919921875, 0.07280731201171875, 0.08453750610351562, 0.0962677001953125, 0.10799789428710938, 0.11972808837890625, 0.13145828247070312, 0.1431884765625, 0.15491867065429688, 0.16664886474609375, 0.17837905883789062, 0.1901092529296875, 0.20183944702148438, 0.21356964111328125, 0.22529983520507812, 0.237030029296875, 0.24876022338867188, 0.26049041748046875, 0.2722206115722656, 0.2839508056640625, 0.2956809997558594, 0.30741119384765625, 0.3191413879394531, 0.33087158203125, 0.3426017761230469, 0.35433197021484375, 0.3660621643066406, 0.3777923583984375, 0.3895225524902344, 0.40125274658203125, 0.4129829406738281, 0.424713134765625, 0.4364433288574219, 0.44817352294921875, 0.4599037170410156, 0.4716339111328125, 0.4833641052246094, 0.49509429931640625, 0.5068244934082031, 0.5185546875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 6.0, 12.0, 9.0, 9.0, 12.0, 22.0, 26.0, 40.0, 59.0, 101.0, 113.0, 131.0, 127.0, 106.0, 78.0, 48.0, 29.0, 15.0, 25.0, 10.0, 7.0, 5.0, 5.0, 5.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1019287109375, -0.09494972229003906, -0.08797073364257812, -0.08099174499511719, -0.07401275634765625, -0.06703376770019531, -0.060054779052734375, -0.05307579040527344, -0.0460968017578125, -0.03911781311035156, -0.032138824462890625, -0.025159835815429688, -0.01818084716796875, -0.011201858520507812, -0.004222869873046875, 0.0027561187744140625, 0.009735107421875, 0.016714096069335938, 0.023693084716796875, 0.030672073364257812, 0.03765106201171875, 0.04463005065917969, 0.051609039306640625, 0.05858802795410156, 0.0655670166015625, 0.07254600524902344, 0.07952499389648438, 0.08650398254394531, 0.09348297119140625, 0.10046195983886719, 0.10744094848632812, 0.11441993713378906, 0.12139892578125, 0.12837791442871094, 0.13535690307617188, 0.1423358917236328, 0.14931488037109375, 0.1562938690185547, 0.16327285766601562, 0.17025184631347656, 0.1772308349609375, 0.18420982360839844, 0.19118881225585938, 0.1981678009033203, 0.20514678955078125, 0.2121257781982422, 0.21910476684570312, 0.22608375549316406, 0.233062744140625, 0.24004173278808594, 0.24702072143554688, 0.2539997100830078, 0.26097869873046875, 0.2679576873779297, 0.2749366760253906, 0.28191566467285156, 0.2888946533203125, 0.29587364196777344, 0.3028526306152344, 0.3098316192626953, 0.31681060791015625, 0.3237895965576172, 0.3307685852050781, 0.33774757385253906, 0.3447265625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 16.0, 68.0, 343.0, 439.0, 120.0, 20.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.581859588623047, -17.262699127197266, -16.94353675842285, -16.62437629699707, -16.305213928222656, -15.986052513122559, -15.666891098022461, -15.347729682922363, -15.028568267822266, -14.709406852722168, -14.39024543762207, -14.071084022521973, -13.751922607421875, -13.432761192321777, -13.11359977722168, -12.794438362121582, -12.475276947021484, -12.156115531921387, -11.836954116821289, -11.517792701721191, -11.198631286621094, -10.879469871520996, -10.560308456420898, -10.2411470413208, -9.92198657989502, -9.602825164794922, -9.283663749694824, -8.964502334594727, -8.645340919494629, -8.326179504394531, -8.007018089294434, -7.687856674194336, -7.3686957359313965, -7.049534320831299, -6.730372905731201, -6.4112114906311035, -6.092050075531006, -5.772888660430908, -5.453727722167969, -5.134566307067871, -4.815404891967773, -4.496243476867676, -4.177082061767578, -3.8579206466674805, -3.538759231567383, -3.219597816467285, -2.9004366397857666, -2.581275224685669, -2.262113571166992, -1.9429521560668945, -1.6237907409667969, -1.3046294450759888, -0.9854680299758911, -0.6663066148757935, -0.34714531898498535, -0.027983903884887695, 0.29117751121520996, 0.6103389263153076, 0.9295002818107605, 1.2486616373062134, 1.567823052406311, 1.8869844675064087, 2.206145763397217, 2.5253071784973145, 2.844468593597412]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 9.0, 9.0, 13.0, 14.0, 9.0, 15.0, 28.0, 27.0, 18.0, 30.0, 25.0, 29.0, 39.0, 45.0, 40.0, 31.0, 35.0, 44.0, 37.0, 32.0, 43.0, 26.0, 32.0, 42.0, 32.0, 34.0, 33.0, 32.0, 33.0, 28.0, 21.0, 18.0, 13.0, 15.0, 12.0, 10.0, 11.0, 4.0, 4.0, 3.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.8922216892242432, -1.8328442573547363, -1.773466944694519, -1.7140895128250122, -1.654712200164795, -1.595334768295288, -1.5359573364257812, -1.476580023765564, -1.4172025918960571, -1.3578251600265503, -1.298447847366333, -1.2390704154968262, -1.1796931028366089, -1.120315670967102, -1.0609383583068848, -1.001560926437378, -0.9421835541725159, -0.8828061819076538, -0.8234288096427917, -0.7640514373779297, -0.7046740055084229, -0.6452966332435608, -0.5859192609786987, -0.5265418291091919, -0.4671644866466522, -0.40778711438179016, -0.3484097123146057, -0.28903234004974365, -0.2296549528837204, -0.17027756571769714, -0.11090019345283508, -0.051522791385650635, 0.007854580879211426, 0.06723196804523468, 0.12660935521125793, 0.18598672747612, 0.24536411464214325, 0.3047415018081665, 0.36411887407302856, 0.423496276140213, 0.4828736484050751, 0.5422510504722595, 0.6016284227371216, 0.6610057950019836, 0.7203831672668457, 0.7797605991363525, 0.8391379117965698, 0.8985153436660767, 0.9578927159309387, 1.0172700881958008, 1.0766475200653076, 1.136024832725525, 1.1954022645950317, 1.254779577255249, 1.3141570091247559, 1.3735344409942627, 1.43291175365448, 1.4922891855239868, 1.551666498184204, 1.611043930053711, 1.6704212427139282, 1.729798674583435, 1.7891759872436523, 1.8485534191131592, 1.907930850982666]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 2.0, 7.0, 7.0, 6.0, 8.0, 8.0, 14.0, 22.0, 18.0, 27.0, 52.0, 63.0, 92.0, 150.0, 235.0, 407.0, 752.0, 1700.0, 4654.0, 27813.0, 4121201.0, 28650.0, 5023.0, 1626.0, 753.0, 414.0, 212.0, 98.0, 98.0, 43.0, 29.0, 27.0, 17.0, 16.0, 7.0, 7.0, 4.0, 5.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.65625, -2.5814208984375, -2.506591796875, -2.4317626953125, -2.35693359375, -2.2821044921875, -2.207275390625, -2.1324462890625, -2.0576171875, -1.9827880859375, -1.907958984375, -1.8331298828125, -1.75830078125, -1.6834716796875, -1.608642578125, -1.5338134765625, -1.458984375, -1.3841552734375, -1.309326171875, -1.2344970703125, -1.15966796875, -1.0848388671875, -1.010009765625, -0.9351806640625, -0.8603515625, -0.7855224609375, -0.710693359375, -0.6358642578125, -0.56103515625, -0.4862060546875, -0.411376953125, -0.3365478515625, -0.26171875, -0.1868896484375, -0.112060546875, -0.0372314453125, 0.03759765625, 0.1124267578125, 0.187255859375, 0.2620849609375, 0.3369140625, 0.4117431640625, 0.486572265625, 0.5614013671875, 0.63623046875, 0.7110595703125, 0.785888671875, 0.8607177734375, 0.935546875, 1.0103759765625, 1.085205078125, 1.1600341796875, 1.23486328125, 1.3096923828125, 1.384521484375, 1.4593505859375, 1.5341796875, 1.6090087890625, 1.683837890625, 1.7586669921875, 1.83349609375, 1.9083251953125, 1.983154296875, 2.0579833984375, 2.1328125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 0.0, 3.0, 4.0, 1.0, 5.0, 15.0, 15.0, 21.0, 34.0, 30.0, 51.0, 54.0, 57.0, 73.0, 89.0, 94.0, 71.0, 64.0, 64.0, 77.0, 35.0, 42.0, 31.0, 17.0, 21.0, 11.0, 5.0, 3.0, 8.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24072265625, -0.23375511169433594, -0.22678756713867188, -0.2198200225830078, -0.21285247802734375, -0.2058849334716797, -0.19891738891601562, -0.19194984436035156, -0.1849822998046875, -0.17801475524902344, -0.17104721069335938, -0.1640796661376953, -0.15711212158203125, -0.1501445770263672, -0.14317703247070312, -0.13620948791503906, -0.129241943359375, -0.12227439880371094, -0.11530685424804688, -0.10833930969238281, -0.10137176513671875, -0.09440422058105469, -0.08743667602539062, -0.08046913146972656, -0.0735015869140625, -0.06653404235839844, -0.059566497802734375, -0.05259895324707031, -0.04563140869140625, -0.03866386413574219, -0.031696319580078125, -0.024728775024414062, -0.01776123046875, -0.010793685913085938, -0.003826141357421875, 0.0031414031982421875, 0.01010894775390625, 0.017076492309570312, 0.024044036865234375, 0.031011581420898438, 0.0379791259765625, 0.04494667053222656, 0.051914215087890625, 0.05888175964355469, 0.06584930419921875, 0.07281684875488281, 0.07978439331054688, 0.08675193786621094, 0.093719482421875, 0.10068702697753906, 0.10765457153320312, 0.11462211608886719, 0.12158966064453125, 0.1285572052001953, 0.13552474975585938, 0.14249229431152344, 0.1494598388671875, 0.15642738342285156, 0.16339492797851562, 0.1703624725341797, 0.17733001708984375, 0.1842975616455078, 0.19126510620117188, 0.19823265075683594, 0.2052001953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 7.0, 6.0, 9.0, 15.0, 19.0, 36.0, 53.0, 86.0, 145.0, 199.0, 394.0, 777.0, 2202.0, 8923.0, 180407.0, 3983389.0, 12739.0, 2856.0, 985.0, 411.0, 226.0, 126.0, 85.0, 69.0, 39.0, 18.0, 15.0, 13.0, 11.0, 8.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-3.595703125, -3.5102996826171875, -3.424896240234375, -3.3394927978515625, -3.25408935546875, -3.1686859130859375, -3.083282470703125, -2.9978790283203125, -2.9124755859375, -2.8270721435546875, -2.741668701171875, -2.6562652587890625, -2.57086181640625, -2.4854583740234375, -2.400054931640625, -2.3146514892578125, -2.229248046875, -2.1438446044921875, -2.058441162109375, -1.9730377197265625, -1.88763427734375, -1.8022308349609375, -1.716827392578125, -1.6314239501953125, -1.5460205078125, -1.4606170654296875, -1.375213623046875, -1.2898101806640625, -1.20440673828125, -1.1190032958984375, -1.033599853515625, -0.9481964111328125, -0.86279296875, -0.7773895263671875, -0.691986083984375, -0.6065826416015625, -0.52117919921875, -0.4357757568359375, -0.350372314453125, -0.2649688720703125, -0.1795654296875, -0.0941619873046875, -0.008758544921875, 0.0766448974609375, 0.16204833984375, 0.2474517822265625, 0.332855224609375, 0.4182586669921875, 0.503662109375, 0.5890655517578125, 0.674468994140625, 0.7598724365234375, 0.84527587890625, 0.9306793212890625, 1.016082763671875, 1.1014862060546875, 1.1868896484375, 1.2722930908203125, 1.357696533203125, 1.4430999755859375, 1.52850341796875, 1.6139068603515625, 1.699310302734375, 1.7847137451171875, 1.8701171875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 2.0, 2.0, 9.0, 8.0, 14.0, 22.0, 40.0, 126.0, 3244.0, 456.0, 67.0, 24.0, 22.0, 16.0, 9.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.86962890625, -0.8488235473632812, -0.8280181884765625, -0.8072128295898438, -0.786407470703125, -0.7656021118164062, -0.7447967529296875, -0.7239913940429688, -0.70318603515625, -0.6823806762695312, -0.6615753173828125, -0.6407699584960938, -0.619964599609375, -0.5991592407226562, -0.5783538818359375, -0.5575485229492188, -0.5367431640625, -0.5159378051757812, -0.4951324462890625, -0.47432708740234375, -0.453521728515625, -0.43271636962890625, -0.4119110107421875, -0.39110565185546875, -0.37030029296875, -0.34949493408203125, -0.3286895751953125, -0.30788421630859375, -0.287078857421875, -0.26627349853515625, -0.2454681396484375, -0.22466278076171875, -0.203857421875, -0.18305206298828125, -0.1622467041015625, -0.14144134521484375, -0.120635986328125, -0.09983062744140625, -0.0790252685546875, -0.05821990966796875, -0.03741455078125, -0.01660919189453125, 0.0041961669921875, 0.02500152587890625, 0.045806884765625, 0.06661224365234375, 0.0874176025390625, 0.10822296142578125, 0.1290283203125, 0.14983367919921875, 0.1706390380859375, 0.19144439697265625, 0.212249755859375, 0.23305511474609375, 0.2538604736328125, 0.27466583251953125, 0.29547119140625, 0.31627655029296875, 0.3370819091796875, 0.35788726806640625, 0.378692626953125, 0.39949798583984375, 0.4203033447265625, 0.44110870361328125, 0.4619140625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 10.0, 13.0, 18.0, 56.0, 147.0, 363.0, 234.0, 83.0, 38.0, 20.0, 9.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0790014266967773, -2.968052864074707, -2.8571040630340576, -2.746155261993408, -2.635206699371338, -2.5242581367492676, -2.413309335708618, -2.3023605346679688, -2.1914119720458984, -2.080463409423828, -1.9695146083831787, -1.8585659265518188, -1.747617244720459, -1.6366685628890991, -1.5257198810577393, -1.4147711992263794, -1.3038225173950195, -1.1928738355636597, -1.0819251537322998, -0.9709764719009399, -0.8600277900695801, -0.7490791082382202, -0.6381304264068604, -0.5271817445755005, -0.4162330627441406, -0.30528438091278076, -0.1943356990814209, -0.08338701725006104, 0.027561664581298828, 0.1385103464126587, 0.24945902824401855, 0.3604077100753784, 0.4713563919067383, 0.5823050737380981, 0.693253755569458, 0.8042024374008179, 0.9151511192321777, 1.0260998010635376, 1.1370484828948975, 1.2479971647262573, 1.3589458465576172, 1.469894528388977, 1.580843210220337, 1.6917918920516968, 1.8027405738830566, 1.9136892557144165, 2.0246379375457764, 2.135586738586426, 2.246535301208496, 2.3574838638305664, 2.468432664871216, 2.5793814659118652, 2.6903300285339355, 2.801278591156006, 2.9122273921966553, 3.0231761932373047, 3.134124755859375, 3.2450733184814453, 3.3560221195220947, 3.466970920562744, 3.5779194831848145, 3.6888680458068848, 3.799816846847534, 3.9107656478881836, 4.021714210510254]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 14.0, 20.0, 31.0, 46.0, 66.0, 77.0, 90.0, 116.0, 112.0, 105.0, 78.0, 73.0, 58.0, 33.0, 27.0, 20.0, 13.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9555420875549316, -1.8951339721679688, -1.8347258567810059, -1.774317741394043, -1.71390962600708, -1.6535015106201172, -1.5930933952331543, -1.5326852798461914, -1.4722771644592285, -1.4118690490722656, -1.3514609336853027, -1.2910528182983398, -1.230644702911377, -1.170236587524414, -1.1098284721374512, -1.0494203567504883, -0.9890123009681702, -0.9286041855812073, -0.8681960701942444, -0.8077879548072815, -0.7473798394203186, -0.6869717836380005, -0.6265636682510376, -0.5661555528640747, -0.5057474374771118, -0.4453393220901489, -0.38493120670318604, -0.32452309131622314, -0.26411497592926025, -0.20370689034461975, -0.14329877495765686, -0.08289065957069397, -0.02248251438140869, 0.0379255972802639, 0.09833370894193649, 0.1587418168783188, 0.21914993226528168, 0.2795580327510834, 0.33996614813804626, 0.40037426352500916, 0.46078237891197205, 0.5211904644966125, 0.5815985798835754, 0.6420066952705383, 0.7024148106575012, 0.7628229260444641, 0.823231041431427, 0.8836391568183899, 0.9440472722053528, 1.004455327987671, 1.0648634433746338, 1.1252715587615967, 1.1856796741485596, 1.2460877895355225, 1.3064959049224854, 1.3669040203094482, 1.4273121356964111, 1.487720251083374, 1.548128366470337, 1.6085364818572998, 1.6689445972442627, 1.7293527126312256, 1.7897608280181885, 1.8501689434051514, 1.9105770587921143]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 8.0, 8.0, 9.0, 14.0, 16.0, 18.0, 19.0, 30.0, 38.0, 74.0, 86.0, 125.0, 157.0, 275.0, 399.0, 709.0, 1206.0, 2303.0, 5093.0, 13277.0, 44668.0, 257357.0, 585929.0, 97785.0, 23399.0, 7991.0, 3401.0, 1673.0, 877.0, 510.0, 313.0, 228.0, 160.0, 99.0, 79.0, 44.0, 38.0, 36.0, 22.0, 19.0, 12.0, 13.0, 7.0, 4.0, 3.0, 5.0, 1.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.798828125, -0.7748031616210938, -0.7507781982421875, -0.7267532348632812, -0.702728271484375, -0.6787033081054688, -0.6546783447265625, -0.6306533813476562, -0.60662841796875, -0.5826034545898438, -0.5585784912109375, -0.5345535278320312, -0.510528564453125, -0.48650360107421875, -0.4624786376953125, -0.43845367431640625, -0.4144287109375, -0.39040374755859375, -0.3663787841796875, -0.34235382080078125, -0.318328857421875, -0.29430389404296875, -0.2702789306640625, -0.24625396728515625, -0.22222900390625, -0.19820404052734375, -0.1741790771484375, -0.15015411376953125, -0.126129150390625, -0.10210418701171875, -0.0780792236328125, -0.05405426025390625, -0.030029296875, -0.00600433349609375, 0.0180206298828125, 0.04204559326171875, 0.066070556640625, 0.09009552001953125, 0.1141204833984375, 0.13814544677734375, 0.16217041015625, 0.18619537353515625, 0.2102203369140625, 0.23424530029296875, 0.258270263671875, 0.28229522705078125, 0.3063201904296875, 0.33034515380859375, 0.3543701171875, 0.37839508056640625, 0.4024200439453125, 0.42644500732421875, 0.450469970703125, 0.47449493408203125, 0.4985198974609375, 0.5225448608398438, 0.54656982421875, 0.5705947875976562, 0.5946197509765625, 0.6186447143554688, 0.642669677734375, 0.6666946411132812, 0.6907196044921875, 0.7147445678710938, 0.73876953125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 2.0, 10.0, 17.0, 25.0, 29.0, 39.0, 48.0, 65.0, 67.0, 91.0, 80.0, 85.0, 69.0, 76.0, 66.0, 56.0, 41.0, 29.0, 32.0, 18.0, 17.0, 8.0, 9.0, 6.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.284423828125, -0.2765789031982422, -0.2687339782714844, -0.26088905334472656, -0.25304412841796875, -0.24519920349121094, -0.23735427856445312, -0.2295093536376953, -0.2216644287109375, -0.2138195037841797, -0.20597457885742188, -0.19812965393066406, -0.19028472900390625, -0.18243980407714844, -0.17459487915039062, -0.1667499542236328, -0.158905029296875, -0.1510601043701172, -0.14321517944335938, -0.13537025451660156, -0.12752532958984375, -0.11968040466308594, -0.11183547973632812, -0.10399055480957031, -0.0961456298828125, -0.08830070495605469, -0.08045578002929688, -0.07261085510253906, -0.06476593017578125, -0.05692100524902344, -0.049076080322265625, -0.04123115539550781, -0.03338623046875, -0.025541305541992188, -0.017696380615234375, -0.009851455688476562, -0.00200653076171875, 0.0058383941650390625, 0.013683319091796875, 0.021528244018554688, 0.0293731689453125, 0.03721809387207031, 0.045063018798828125, 0.05290794372558594, 0.06075286865234375, 0.06859779357910156, 0.07644271850585938, 0.08428764343261719, 0.092132568359375, 0.09997749328613281, 0.10782241821289062, 0.11566734313964844, 0.12351226806640625, 0.13135719299316406, 0.13920211791992188, 0.1470470428466797, 0.1548919677734375, 0.1627368927001953, 0.17058181762695312, 0.17842674255371094, 0.18627166748046875, 0.19411659240722656, 0.20196151733398438, 0.2098064422607422, 0.2176513671875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 7.0, 5.0, 1.0, 9.0, 14.0, 17.0, 27.0, 38.0, 58.0, 86.0, 170.0, 290.0, 639.0, 1452.0, 4381.0, 15688.0, 82079.0, 617582.0, 275672.0, 36922.0, 8630.0, 2739.0, 1006.0, 440.0, 238.0, 144.0, 81.0, 42.0, 28.0, 23.0, 10.0, 14.0, 7.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.59375, -0.5750656127929688, -0.5563812255859375, -0.5376968383789062, -0.519012451171875, -0.5003280639648438, -0.4816436767578125, -0.46295928955078125, -0.44427490234375, -0.42559051513671875, -0.4069061279296875, -0.38822174072265625, -0.369537353515625, -0.35085296630859375, -0.3321685791015625, -0.31348419189453125, -0.2947998046875, -0.27611541748046875, -0.2574310302734375, -0.23874664306640625, -0.220062255859375, -0.20137786865234375, -0.1826934814453125, -0.16400909423828125, -0.14532470703125, -0.12664031982421875, -0.1079559326171875, -0.08927154541015625, -0.070587158203125, -0.05190277099609375, -0.0332183837890625, -0.01453399658203125, 0.004150390625, 0.02283477783203125, 0.0415191650390625, 0.06020355224609375, 0.078887939453125, 0.09757232666015625, 0.1162567138671875, 0.13494110107421875, 0.15362548828125, 0.17230987548828125, 0.1909942626953125, 0.20967864990234375, 0.228363037109375, 0.24704742431640625, 0.2657318115234375, 0.28441619873046875, 0.3031005859375, 0.32178497314453125, 0.3404693603515625, 0.35915374755859375, 0.377838134765625, 0.39652252197265625, 0.4152069091796875, 0.43389129638671875, 0.45257568359375, 0.47126007080078125, 0.4899444580078125, 0.5086288452148438, 0.527313232421875, 0.5459976196289062, 0.5646820068359375, 0.5833663940429688, 0.60205078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 5.0, 5.0, 13.0, 10.0, 16.0, 16.0, 20.0, 20.0, 21.0, 21.0, 29.0, 31.0, 28.0, 31.0, 46.0, 32.0, 46.0, 49.0, 34.0, 39.0, 52.0, 41.0, 50.0, 28.0, 40.0, 23.0, 34.0, 36.0, 30.0, 31.0, 23.0, 15.0, 14.0, 7.0, 10.0, 10.0, 9.0, 7.0, 2.0, 6.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.493896484375, -0.4783287048339844, -0.46276092529296875, -0.4471931457519531, -0.4316253662109375, -0.4160575866699219, -0.40048980712890625, -0.3849220275878906, -0.369354248046875, -0.3537864685058594, -0.33821868896484375, -0.3226509094238281, -0.3070831298828125, -0.2915153503417969, -0.27594757080078125, -0.2603797912597656, -0.24481201171875, -0.22924423217773438, -0.21367645263671875, -0.19810867309570312, -0.1825408935546875, -0.16697311401367188, -0.15140533447265625, -0.13583755493164062, -0.120269775390625, -0.10470199584960938, -0.08913421630859375, -0.07356643676757812, -0.0579986572265625, -0.042430877685546875, -0.02686309814453125, -0.011295318603515625, 0.0042724609375, 0.019840240478515625, 0.03540802001953125, 0.050975799560546875, 0.0665435791015625, 0.08211135864257812, 0.09767913818359375, 0.11324691772460938, 0.128814697265625, 0.14438247680664062, 0.15995025634765625, 0.17551803588867188, 0.1910858154296875, 0.20665359497070312, 0.22222137451171875, 0.23778915405273438, 0.25335693359375, 0.2689247131347656, 0.28449249267578125, 0.3000602722167969, 0.3156280517578125, 0.3311958312988281, 0.34676361083984375, 0.3623313903808594, 0.377899169921875, 0.3934669494628906, 0.40903472900390625, 0.4246025085449219, 0.4401702880859375, 0.4557380676269531, 0.47130584716796875, 0.4868736267089844, 0.50244140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 4.0, 8.0, 5.0, 20.0, 26.0, 53.0, 96.0, 188.0, 353.0, 902.0, 3289.0, 21723.0, 298388.0, 669272.0, 46018.0, 5937.0, 1325.0, 437.0, 234.0, 109.0, 79.0, 38.0, 23.0, 11.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.275146484375, -0.26421356201171875, -0.2532806396484375, -0.24234771728515625, -0.231414794921875, -0.22048187255859375, -0.2095489501953125, -0.19861602783203125, -0.18768310546875, -0.17675018310546875, -0.1658172607421875, -0.15488433837890625, -0.143951416015625, -0.13301849365234375, -0.1220855712890625, -0.11115264892578125, -0.1002197265625, -0.08928680419921875, -0.0783538818359375, -0.06742095947265625, -0.056488037109375, -0.04555511474609375, -0.0346221923828125, -0.02368927001953125, -0.01275634765625, -0.00182342529296875, 0.0091094970703125, 0.02004241943359375, 0.030975341796875, 0.04190826416015625, 0.0528411865234375, 0.06377410888671875, 0.07470703125, 0.08563995361328125, 0.0965728759765625, 0.10750579833984375, 0.118438720703125, 0.12937164306640625, 0.1403045654296875, 0.15123748779296875, 0.16217041015625, 0.17310333251953125, 0.1840362548828125, 0.19496917724609375, 0.205902099609375, 0.21683502197265625, 0.2277679443359375, 0.23870086669921875, 0.2496337890625, 0.26056671142578125, 0.2714996337890625, 0.28243255615234375, 0.293365478515625, 0.30429840087890625, 0.3152313232421875, 0.32616424560546875, 0.33709716796875, 0.34803009033203125, 0.3589630126953125, 0.36989593505859375, 0.380828857421875, 0.39176177978515625, 0.4026947021484375, 0.41362762451171875, 0.424560546875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 12.0, 6.0, 7.0, 18.0, 24.0, 51.0, 77.0, 117.0, 170.0, 176.0, 128.0, 74.0, 46.0, 37.0, 25.0, 13.0, 5.0, 6.0, 8.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.470348358154297e-05, -4.233699291944504e-05, -3.997050225734711e-05, -3.7604011595249176e-05, -3.5237520933151245e-05, -3.2871030271053314e-05, -3.0504539608955383e-05, -2.8138048946857452e-05, -2.577155828475952e-05, -2.340506762266159e-05, -2.103857696056366e-05, -1.867208629846573e-05, -1.6305595636367798e-05, -1.3939104974269867e-05, -1.1572614312171936e-05, -9.206123650074005e-06, -6.839632987976074e-06, -4.473142325878143e-06, -2.1066516637802124e-06, 2.598389983177185e-07, 2.6263296604156494e-06, 4.99282032251358e-06, 7.359310984611511e-06, 9.725801646709442e-06, 1.2092292308807373e-05, 1.4458782970905304e-05, 1.6825273633003235e-05, 1.9191764295101166e-05, 2.1558254957199097e-05, 2.3924745619297028e-05, 2.629123628139496e-05, 2.865772694349289e-05, 3.102421760559082e-05, 3.339070826768875e-05, 3.575719892978668e-05, 3.812368959188461e-05, 4.0490180253982544e-05, 4.2856670916080475e-05, 4.5223161578178406e-05, 4.758965224027634e-05, 4.995614290237427e-05, 5.23226335644722e-05, 5.468912422657013e-05, 5.705561488866806e-05, 5.942210555076599e-05, 6.178859621286392e-05, 6.415508687496185e-05, 6.652157753705978e-05, 6.888806819915771e-05, 7.125455886125565e-05, 7.362104952335358e-05, 7.598754018545151e-05, 7.835403084754944e-05, 8.072052150964737e-05, 8.30870121717453e-05, 8.545350283384323e-05, 8.781999349594116e-05, 9.018648415803909e-05, 9.255297482013702e-05, 9.491946548223495e-05, 9.728595614433289e-05, 9.965244680643082e-05, 0.00010201893746852875, 0.00010438542813062668, 0.00010675191879272461]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 8.0, 15.0, 12.0, 17.0, 42.0, 56.0, 106.0, 229.0, 423.0, 1086.0, 2659.0, 7535.0, 23250.0, 91196.0, 430330.0, 380465.0, 79722.0, 20715.0, 6406.0, 2359.0, 954.0, 444.0, 222.0, 110.0, 68.0, 49.0, 26.0, 12.0, 10.0, 8.0, 3.0, 8.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.252197265625, -0.2449817657470703, -0.23776626586914062, -0.23055076599121094, -0.22333526611328125, -0.21611976623535156, -0.20890426635742188, -0.2016887664794922, -0.1944732666015625, -0.1872577667236328, -0.18004226684570312, -0.17282676696777344, -0.16561126708984375, -0.15839576721191406, -0.15118026733398438, -0.1439647674560547, -0.136749267578125, -0.1295337677001953, -0.12231826782226562, -0.11510276794433594, -0.10788726806640625, -0.10067176818847656, -0.09345626831054688, -0.08624076843261719, -0.0790252685546875, -0.07180976867675781, -0.06459426879882812, -0.05737876892089844, -0.05016326904296875, -0.04294776916503906, -0.035732269287109375, -0.028516769409179688, -0.02130126953125, -0.014085769653320312, -0.006870269775390625, 0.0003452301025390625, 0.00756072998046875, 0.014776229858398438, 0.021991729736328125, 0.029207229614257812, 0.0364227294921875, 0.04363822937011719, 0.050853729248046875, 0.05806922912597656, 0.06528472900390625, 0.07250022888183594, 0.07971572875976562, 0.08693122863769531, 0.094146728515625, 0.10136222839355469, 0.10857772827148438, 0.11579322814941406, 0.12300872802734375, 0.13022422790527344, 0.13743972778320312, 0.1446552276611328, 0.1518707275390625, 0.1590862274169922, 0.16630172729492188, 0.17351722717285156, 0.18073272705078125, 0.18794822692871094, 0.19516372680664062, 0.2023792266845703, 0.2095947265625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 3.0, 10.0, 7.0, 15.0, 15.0, 11.0, 25.0, 33.0, 30.0, 35.0, 56.0, 61.0, 47.0, 54.0, 53.0, 85.0, 77.0, 61.0, 41.0, 48.0, 41.0, 33.0, 30.0, 21.0, 30.0, 18.0, 11.0, 12.0, 10.0, 7.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1517333984375, -0.14715003967285156, -0.14256668090820312, -0.1379833221435547, -0.13339996337890625, -0.1288166046142578, -0.12423324584960938, -0.11964988708496094, -0.1150665283203125, -0.11048316955566406, -0.10589981079101562, -0.10131645202636719, -0.09673309326171875, -0.09214973449707031, -0.08756637573242188, -0.08298301696777344, -0.078399658203125, -0.07381629943847656, -0.06923294067382812, -0.06464958190917969, -0.06006622314453125, -0.05548286437988281, -0.050899505615234375, -0.04631614685058594, -0.0417327880859375, -0.03714942932128906, -0.032566070556640625, -0.027982711791992188, -0.02339935302734375, -0.018815994262695312, -0.014232635498046875, -0.009649276733398438, -0.00506591796875, -0.0004825592041015625, 0.004100799560546875, 0.008684158325195312, 0.01326751708984375, 0.017850875854492188, 0.022434234619140625, 0.027017593383789062, 0.0316009521484375, 0.03618431091308594, 0.040767669677734375, 0.04535102844238281, 0.04993438720703125, 0.05451774597167969, 0.059101104736328125, 0.06368446350097656, 0.068267822265625, 0.07285118103027344, 0.07743453979492188, 0.08201789855957031, 0.08660125732421875, 0.09118461608886719, 0.09576797485351562, 0.10035133361816406, 0.1049346923828125, 0.10951805114746094, 0.11410140991210938, 0.11868476867675781, 0.12326812744140625, 0.1278514862060547, 0.13243484497070312, 0.13701820373535156, 0.1416015625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 13.0, 16.0, 31.0, 79.0, 155.0, 207.0, 233.0, 137.0, 84.0, 28.0, 11.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.218921661376953, -9.038656234741211, -8.858390808105469, -8.678125381469727, -8.497859001159668, -8.317593574523926, -8.137328147888184, -7.957062721252441, -7.776797294616699, -7.596531867980957, -7.416265964508057, -7.2360005378723145, -7.055735111236572, -6.875469207763672, -6.69520378112793, -6.5149383544921875, -6.334672451019287, -6.154407024383545, -5.9741411209106445, -5.793875694274902, -5.61361026763916, -5.433344841003418, -5.253078937530518, -5.072813510894775, -4.892547607421875, -4.712282180786133, -4.532016277313232, -4.35175085067749, -4.171485424041748, -3.9912197589874268, -3.8109540939331055, -3.6306886672973633, -3.450423002243042, -3.2701573371887207, -3.0898919105529785, -2.9096262454986572, -2.729360580444336, -2.5490951538085938, -2.3688294887542725, -2.188563823699951, -2.008298397064209, -1.8280328512191772, -1.6477673053741455, -1.4675016403198242, -1.2872360944747925, -1.1069705486297607, -0.9267048835754395, -0.7464393377304077, -0.566173791885376, -0.38590821623802185, -0.20564264059066772, -0.02537703514099121, 0.15488851070404053, 0.33515405654907227, 0.5154197216033936, 0.6956852674484253, 0.875950813293457, 1.0562163591384888, 1.2364819049835205, 1.4167475700378418, 1.5970131158828735, 1.7772786617279053, 1.9575443267822266, 2.1378097534179688, 2.31807541847229]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 4.0, 3.0, 7.0, 13.0, 10.0, 8.0, 16.0, 21.0, 21.0, 13.0, 14.0, 31.0, 24.0, 34.0, 48.0, 44.0, 39.0, 36.0, 46.0, 41.0, 32.0, 43.0, 40.0, 41.0, 41.0, 40.0, 25.0, 34.0, 30.0, 31.0, 27.0, 24.0, 19.0, 19.0, 12.0, 11.0, 15.0, 12.0, 3.0, 5.0, 8.0, 9.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2936625480651855, -2.2171123027801514, -2.140562057495117, -2.064011573791504, -1.9874613285064697, -1.9109110832214355, -1.8343608379364014, -1.7578105926513672, -1.6812602281570435, -1.6047099828720093, -1.5281596183776855, -1.4516093730926514, -1.3750591278076172, -1.2985087633132935, -1.2219585180282593, -1.1454081535339355, -1.0688579082489014, -0.9923076033592224, -0.9157572984695435, -0.8392070531845093, -0.7626567482948303, -0.6861064434051514, -0.6095561981201172, -0.5330058932304382, -0.4564555883407593, -0.3799052834510803, -0.30335500836372375, -0.226804718375206, -0.15025442838668823, -0.07370412349700928, 0.00284615159034729, 0.07939642667770386, 0.1559467315673828, 0.23249702155590057, 0.30904731154441833, 0.3855975866317749, 0.46214789152145386, 0.5386981964111328, 0.615248441696167, 0.691798746585846, 0.7683490514755249, 0.8448993563652039, 0.9214496612548828, 0.997999906539917, 1.0745501518249512, 1.151100516319275, 1.227650761604309, 1.3042011260986328, 1.380751371383667, 1.4573016166687012, 1.533851981163025, 1.610402226448059, 1.6869525909423828, 1.763502836227417, 1.8400530815124512, 1.9166033267974854, 1.993153691291809, 2.069704055786133, 2.146254301071167, 2.222804546356201, 2.2993547916412354, 2.3759050369262695, 2.452455520629883, 2.529005765914917, 2.605556011199951]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 3.0, 9.0, 13.0, 9.0, 16.0, 25.0, 30.0, 49.0, 58.0, 107.0, 165.0, 220.0, 465.0, 893.0, 2296.0, 8157.0, 118049.0, 4043248.0, 14496.0, 3432.0, 1251.0, 577.0, 294.0, 151.0, 89.0, 60.0, 35.0, 23.0, 14.0, 14.0, 8.0, 4.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.5, -2.4308624267578125, -2.361724853515625, -2.2925872802734375, -2.22344970703125, -2.1543121337890625, -2.085174560546875, -2.0160369873046875, -1.9468994140625, -1.8777618408203125, -1.808624267578125, -1.7394866943359375, -1.67034912109375, -1.6012115478515625, -1.532073974609375, -1.4629364013671875, -1.393798828125, -1.3246612548828125, -1.255523681640625, -1.1863861083984375, -1.11724853515625, -1.0481109619140625, -0.978973388671875, -0.9098358154296875, -0.8406982421875, -0.7715606689453125, -0.702423095703125, -0.6332855224609375, -0.56414794921875, -0.4950103759765625, -0.425872802734375, -0.3567352294921875, -0.28759765625, -0.2184600830078125, -0.149322509765625, -0.0801849365234375, -0.01104736328125, 0.0580902099609375, 0.127227783203125, 0.1963653564453125, 0.2655029296875, 0.3346405029296875, 0.403778076171875, 0.4729156494140625, 0.54205322265625, 0.6111907958984375, 0.680328369140625, 0.7494659423828125, 0.818603515625, 0.8877410888671875, 0.956878662109375, 1.0260162353515625, 1.09515380859375, 1.1642913818359375, 1.233428955078125, 1.3025665283203125, 1.3717041015625, 1.4408416748046875, 1.509979248046875, 1.5791168212890625, 1.64825439453125, 1.7173919677734375, 1.786529541015625, 1.8556671142578125, 1.9248046875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 3.0, 7.0, 8.0, 18.0, 27.0, 31.0, 35.0, 63.0, 49.0, 63.0, 83.0, 108.0, 82.0, 83.0, 71.0, 57.0, 64.0, 34.0, 32.0, 26.0, 21.0, 9.0, 11.0, 12.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.283447265625, -0.2753753662109375, -0.267303466796875, -0.2592315673828125, -0.25115966796875, -0.2430877685546875, -0.235015869140625, -0.2269439697265625, -0.2188720703125, -0.2108001708984375, -0.202728271484375, -0.1946563720703125, -0.18658447265625, -0.1785125732421875, -0.170440673828125, -0.1623687744140625, -0.154296875, -0.1462249755859375, -0.138153076171875, -0.1300811767578125, -0.12200927734375, -0.1139373779296875, -0.105865478515625, -0.0977935791015625, -0.0897216796875, -0.0816497802734375, -0.073577880859375, -0.0655059814453125, -0.05743408203125, -0.0493621826171875, -0.041290283203125, -0.0332183837890625, -0.025146484375, -0.0170745849609375, -0.009002685546875, -0.0009307861328125, 0.00714111328125, 0.0152130126953125, 0.023284912109375, 0.0313568115234375, 0.0394287109375, 0.0475006103515625, 0.055572509765625, 0.0636444091796875, 0.07171630859375, 0.0797882080078125, 0.087860107421875, 0.0959320068359375, 0.10400390625, 0.1120758056640625, 0.120147705078125, 0.1282196044921875, 0.13629150390625, 0.1443634033203125, 0.152435302734375, 0.1605072021484375, 0.1685791015625, 0.1766510009765625, 0.184722900390625, 0.1927947998046875, 0.20086669921875, 0.2089385986328125, 0.217010498046875, 0.2250823974609375, 0.233154296875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 9.0, 13.0, 15.0, 26.0, 50.0, 46.0, 72.0, 143.0, 227.0, 337.0, 640.0, 1148.0, 2489.0, 6286.0, 22470.0, 3946624.0, 190844.0, 13975.0, 4655.0, 1922.0, 946.0, 505.0, 283.0, 189.0, 129.0, 81.0, 54.0, 32.0, 28.0, 11.0, 8.0, 8.0, 4.0, 8.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5947265625, -1.5353240966796875, -1.475921630859375, -1.4165191650390625, -1.35711669921875, -1.2977142333984375, -1.238311767578125, -1.1789093017578125, -1.1195068359375, -1.0601043701171875, -1.000701904296875, -0.9412994384765625, -0.88189697265625, -0.8224945068359375, -0.763092041015625, -0.7036895751953125, -0.644287109375, -0.5848846435546875, -0.525482177734375, -0.4660797119140625, -0.40667724609375, -0.3472747802734375, -0.287872314453125, -0.2284698486328125, -0.1690673828125, -0.1096649169921875, -0.050262451171875, 0.0091400146484375, 0.06854248046875, 0.1279449462890625, 0.187347412109375, 0.2467498779296875, 0.30615234375, 0.3655548095703125, 0.424957275390625, 0.4843597412109375, 0.54376220703125, 0.6031646728515625, 0.662567138671875, 0.7219696044921875, 0.7813720703125, 0.8407745361328125, 0.900177001953125, 0.9595794677734375, 1.01898193359375, 1.0783843994140625, 1.137786865234375, 1.1971893310546875, 1.256591796875, 1.3159942626953125, 1.375396728515625, 1.4347991943359375, 1.49420166015625, 1.5536041259765625, 1.613006591796875, 1.6724090576171875, 1.7318115234375, 1.7912139892578125, 1.850616455078125, 1.9100189208984375, 1.96942138671875, 2.0288238525390625, 2.088226318359375, 2.1476287841796875, 2.20703125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 5.0, 3.0, 2.0, 6.0, 7.0, 12.0, 7.0, 13.0, 19.0, 68.0, 176.0, 3184.0, 383.0, 91.0, 45.0, 18.0, 7.0, 9.0, 7.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60302734375, -0.5804290771484375, -0.557830810546875, -0.5352325439453125, -0.51263427734375, -0.4900360107421875, -0.467437744140625, -0.4448394775390625, -0.4222412109375, -0.3996429443359375, -0.377044677734375, -0.3544464111328125, -0.33184814453125, -0.3092498779296875, -0.286651611328125, -0.2640533447265625, -0.241455078125, -0.2188568115234375, -0.196258544921875, -0.1736602783203125, -0.15106201171875, -0.1284637451171875, -0.105865478515625, -0.0832672119140625, -0.0606689453125, -0.0380706787109375, -0.015472412109375, 0.0071258544921875, 0.02972412109375, 0.0523223876953125, 0.074920654296875, 0.0975189208984375, 0.1201171875, 0.1427154541015625, 0.165313720703125, 0.1879119873046875, 0.21051025390625, 0.2331085205078125, 0.255706787109375, 0.2783050537109375, 0.3009033203125, 0.3235015869140625, 0.346099853515625, 0.3686981201171875, 0.39129638671875, 0.4138946533203125, 0.436492919921875, 0.4590911865234375, 0.481689453125, 0.5042877197265625, 0.526885986328125, 0.5494842529296875, 0.57208251953125, 0.5946807861328125, 0.617279052734375, 0.6398773193359375, 0.6624755859375, 0.6850738525390625, 0.707672119140625, 0.7302703857421875, 0.75286865234375, 0.7754669189453125, 0.798065185546875, 0.8206634521484375, 0.84326171875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 9.0, 21.0, 77.0, 388.0, 414.0, 63.0, 25.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.38399887084961, -11.125666618347168, -10.86733341217041, -10.609001159667969, -10.350668907165527, -10.092336654663086, -9.834003448486328, -9.575671195983887, -9.317338943481445, -9.059006690979004, -8.800673484802246, -8.542341232299805, -8.284008979797363, -8.025676727294922, -7.767343521118164, -7.509011268615723, -7.250678062438965, -6.992345333099365, -6.734013080596924, -6.475680351257324, -6.217348098754883, -5.959015369415283, -5.700682640075684, -5.442350387573242, -5.184017658233643, -4.925684928894043, -4.667352676391602, -4.409019947052002, -4.150687217712402, -3.892354965209961, -3.6340222358703613, -3.375689744949341, -3.117356300354004, -2.8590238094329834, -2.600691318511963, -2.3423585891723633, -2.0840260982513428, -1.8256936073303223, -1.5673609972000122, -1.3090283870697021, -1.0506958961486816, -0.7923633456230164, -0.5340307950973511, -0.2756982445716858, -0.017365694046020508, 0.240966796875, 0.49929940700531006, 0.7576320171356201, 1.0159645080566406, 1.2742969989776611, 1.5326296091079712, 1.7909622192382812, 2.0492947101593018, 2.3076272010803223, 2.565959930419922, 2.8242924213409424, 3.082624912261963, 3.3409574031829834, 3.599289894104004, 3.8576226234436035, 4.115955352783203, 4.3742876052856445, 4.632620334625244, 4.890953063964844, 5.149285316467285]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 6.0, 9.0, 25.0, 29.0, 46.0, 54.0, 67.0, 101.0, 94.0, 112.0, 102.0, 102.0, 88.0, 69.0, 40.0, 21.0, 16.0, 9.0, 7.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1993274688720703, -3.115741491317749, -3.0321555137634277, -2.9485695362091064, -2.864983558654785, -2.781397819519043, -2.6978116035461426, -2.6142258644104004, -2.530639886856079, -2.447053909301758, -2.3634679317474365, -2.2798819541931152, -2.196295976638794, -2.1127099990844727, -2.0291242599487305, -1.9455382823944092, -1.8619521856307983, -1.778366208076477, -1.6947802305221558, -1.611194372177124, -1.5276083946228027, -1.4440224170684814, -1.3604364395141602, -1.2768504619598389, -1.1932644844055176, -1.1096785068511963, -1.026092529296875, -0.9425066113471985, -0.858920693397522, -0.7753347158432007, -0.6917487382888794, -0.6081628203392029, -0.5245769023895264, -0.44099095463752747, -0.35740500688552856, -0.2738190293312073, -0.19023308157920837, -0.10664713382720947, -0.023061156272888184, 0.06052476167678833, 0.14411073923110962, 0.22769668698310852, 0.3112826347351074, 0.3948686122894287, 0.4784545600414276, 0.5620405077934265, 0.6456264853477478, 0.7292124032974243, 0.8127983808517456, 0.8963843584060669, 0.9799702763557434, 1.06355619430542, 1.1471421718597412, 1.2307281494140625, 1.3143141269683838, 1.397900104522705, 1.4814860820770264, 1.5650720596313477, 1.648658037185669, 1.7322440147399902, 1.815829873085022, 1.8994158506393433, 1.9830018281936646, 2.0665876865386963, 2.1501736640930176]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 5.0, 3.0, 3.0, 4.0, 4.0, 10.0, 18.0, 20.0, 16.0, 28.0, 37.0, 71.0, 88.0, 133.0, 226.0, 344.0, 610.0, 1104.0, 2405.0, 5647.0, 19052.0, 96586.0, 666151.0, 209208.0, 31882.0, 8447.0, 3077.0, 1394.0, 724.0, 445.0, 240.0, 174.0, 125.0, 71.0, 54.0, 37.0, 38.0, 21.0, 10.0, 4.0, 14.0, 13.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.0302734375, -1.0005645751953125, -0.970855712890625, -0.9411468505859375, -0.91143798828125, -0.8817291259765625, -0.852020263671875, -0.8223114013671875, -0.7926025390625, -0.7628936767578125, -0.733184814453125, -0.7034759521484375, -0.67376708984375, -0.6440582275390625, -0.614349365234375, -0.5846405029296875, -0.554931640625, -0.5252227783203125, -0.495513916015625, -0.4658050537109375, -0.43609619140625, -0.4063873291015625, -0.376678466796875, -0.3469696044921875, -0.3172607421875, -0.2875518798828125, -0.257843017578125, -0.2281341552734375, -0.19842529296875, -0.1687164306640625, -0.139007568359375, -0.1092987060546875, -0.07958984375, -0.0498809814453125, -0.020172119140625, 0.0095367431640625, 0.03924560546875, 0.0689544677734375, 0.098663330078125, 0.1283721923828125, 0.1580810546875, 0.1877899169921875, 0.217498779296875, 0.2472076416015625, 0.27691650390625, 0.3066253662109375, 0.336334228515625, 0.3660430908203125, 0.395751953125, 0.4254608154296875, 0.455169677734375, 0.4848785400390625, 0.51458740234375, 0.5442962646484375, 0.574005126953125, 0.6037139892578125, 0.6334228515625, 0.6631317138671875, 0.692840576171875, 0.7225494384765625, 0.75225830078125, 0.7819671630859375, 0.811676025390625, 0.8413848876953125, 0.87109375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 4.0, 9.0, 8.0, 16.0, 21.0, 29.0, 43.0, 37.0, 62.0, 71.0, 76.0, 116.0, 67.0, 84.0, 66.0, 74.0, 46.0, 45.0, 28.0, 33.0, 22.0, 18.0, 13.0, 10.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302001953125, -0.2931938171386719, -0.28438568115234375, -0.2755775451660156, -0.2667694091796875, -0.2579612731933594, -0.24915313720703125, -0.24034500122070312, -0.231536865234375, -0.22272872924804688, -0.21392059326171875, -0.20511245727539062, -0.1963043212890625, -0.18749618530273438, -0.17868804931640625, -0.16987991333007812, -0.16107177734375, -0.15226364135742188, -0.14345550537109375, -0.13464736938476562, -0.1258392333984375, -0.11703109741210938, -0.10822296142578125, -0.09941482543945312, -0.090606689453125, -0.08179855346679688, -0.07299041748046875, -0.06418228149414062, -0.0553741455078125, -0.046566009521484375, -0.03775787353515625, -0.028949737548828125, -0.0201416015625, -0.011333465576171875, -0.00252532958984375, 0.006282806396484375, 0.0150909423828125, 0.023899078369140625, 0.03270721435546875, 0.041515350341796875, 0.050323486328125, 0.059131622314453125, 0.06793975830078125, 0.07674789428710938, 0.0855560302734375, 0.09436416625976562, 0.10317230224609375, 0.11198043823242188, 0.12078857421875, 0.12959671020507812, 0.13840484619140625, 0.14721298217773438, 0.1560211181640625, 0.16482925415039062, 0.17363739013671875, 0.18244552612304688, 0.191253662109375, 0.20006179809570312, 0.20886993408203125, 0.21767807006835938, 0.2264862060546875, 0.23529434204101562, 0.24410247802734375, 0.2529106140136719, 0.26171875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 7.0, 9.0, 16.0, 13.0, 20.0, 35.0, 50.0, 70.0, 99.0, 156.0, 305.0, 512.0, 975.0, 2129.0, 5923.0, 18402.0, 76256.0, 468128.0, 386369.0, 63851.0, 15856.0, 5212.0, 2047.0, 896.0, 461.0, 272.0, 149.0, 100.0, 62.0, 48.0, 43.0, 23.0, 14.0, 16.0, 6.0, 3.0, 7.0, 7.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.580078125, -0.562469482421875, -0.54486083984375, -0.527252197265625, -0.5096435546875, -0.492034912109375, -0.47442626953125, -0.456817626953125, -0.439208984375, -0.421600341796875, -0.40399169921875, -0.386383056640625, -0.3687744140625, -0.351165771484375, -0.33355712890625, -0.315948486328125, -0.29833984375, -0.280731201171875, -0.26312255859375, -0.245513916015625, -0.2279052734375, -0.210296630859375, -0.19268798828125, -0.175079345703125, -0.157470703125, -0.139862060546875, -0.12225341796875, -0.104644775390625, -0.0870361328125, -0.069427490234375, -0.05181884765625, -0.034210205078125, -0.0166015625, 0.001007080078125, 0.01861572265625, 0.036224365234375, 0.0538330078125, 0.071441650390625, 0.08905029296875, 0.106658935546875, 0.124267578125, 0.141876220703125, 0.15948486328125, 0.177093505859375, 0.1947021484375, 0.212310791015625, 0.22991943359375, 0.247528076171875, 0.26513671875, 0.282745361328125, 0.30035400390625, 0.317962646484375, 0.3355712890625, 0.353179931640625, 0.37078857421875, 0.388397216796875, 0.406005859375, 0.423614501953125, 0.44122314453125, 0.458831787109375, 0.4764404296875, 0.494049072265625, 0.51165771484375, 0.529266357421875, 0.546875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 5.0, 6.0, 10.0, 12.0, 12.0, 15.0, 18.0, 19.0, 31.0, 23.0, 30.0, 36.0, 43.0, 43.0, 42.0, 46.0, 43.0, 39.0, 34.0, 47.0, 46.0, 35.0, 47.0, 42.0, 34.0, 42.0, 31.0, 27.0, 26.0, 23.0, 20.0, 16.0, 15.0, 11.0, 5.0, 8.0, 10.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6689453125, -0.649139404296875, -0.62933349609375, -0.609527587890625, -0.5897216796875, -0.569915771484375, -0.55010986328125, -0.530303955078125, -0.510498046875, -0.490692138671875, -0.47088623046875, -0.451080322265625, -0.4312744140625, -0.411468505859375, -0.39166259765625, -0.371856689453125, -0.35205078125, -0.332244873046875, -0.31243896484375, -0.292633056640625, -0.2728271484375, -0.253021240234375, -0.23321533203125, -0.213409423828125, -0.193603515625, -0.173797607421875, -0.15399169921875, -0.134185791015625, -0.1143798828125, -0.094573974609375, -0.07476806640625, -0.054962158203125, -0.03515625, -0.015350341796875, 0.00445556640625, 0.024261474609375, 0.0440673828125, 0.063873291015625, 0.08367919921875, 0.103485107421875, 0.123291015625, 0.143096923828125, 0.16290283203125, 0.182708740234375, 0.2025146484375, 0.222320556640625, 0.24212646484375, 0.261932373046875, 0.28173828125, 0.301544189453125, 0.32135009765625, 0.341156005859375, 0.3609619140625, 0.380767822265625, 0.40057373046875, 0.420379638671875, 0.440185546875, 0.459991455078125, 0.47979736328125, 0.499603271484375, 0.5194091796875, 0.539215087890625, 0.55902099609375, 0.578826904296875, 0.5986328125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 7.0, 3.0, 10.0, 23.0, 22.0, 44.0, 78.0, 151.0, 262.0, 532.0, 1014.0, 2393.0, 6419.0, 24129.0, 211515.0, 712925.0, 69224.0, 12630.0, 3945.0, 1609.0, 748.0, 395.0, 194.0, 119.0, 68.0, 33.0, 33.0, 10.0, 5.0, 12.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.361083984375, -0.35189056396484375, -0.3426971435546875, -0.33350372314453125, -0.324310302734375, -0.31511688232421875, -0.3059234619140625, -0.29673004150390625, -0.28753662109375, -0.27834320068359375, -0.2691497802734375, -0.25995635986328125, -0.250762939453125, -0.24156951904296875, -0.2323760986328125, -0.22318267822265625, -0.2139892578125, -0.20479583740234375, -0.1956024169921875, -0.18640899658203125, -0.177215576171875, -0.16802215576171875, -0.1588287353515625, -0.14963531494140625, -0.14044189453125, -0.13124847412109375, -0.1220550537109375, -0.11286163330078125, -0.103668212890625, -0.09447479248046875, -0.0852813720703125, -0.07608795166015625, -0.06689453125, -0.05770111083984375, -0.0485076904296875, -0.03931427001953125, -0.030120849609375, -0.02092742919921875, -0.0117340087890625, -0.00254058837890625, 0.00665283203125, 0.01584625244140625, 0.0250396728515625, 0.03423309326171875, 0.043426513671875, 0.05261993408203125, 0.0618133544921875, 0.07100677490234375, 0.0802001953125, 0.08939361572265625, 0.0985870361328125, 0.10778045654296875, 0.116973876953125, 0.12616729736328125, 0.1353607177734375, 0.14455413818359375, 0.15374755859375, 0.16294097900390625, 0.1721343994140625, 0.18132781982421875, 0.190521240234375, 0.19971466064453125, 0.2089080810546875, 0.21810150146484375, 0.227294921875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 8.0, 14.0, 9.0, 38.0, 52.0, 74.0, 128.0, 196.0, 181.0, 109.0, 83.0, 42.0, 24.0, 11.0, 4.0, 4.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.204843521118164e-05, -5.9645622968673706e-05, -5.724281072616577e-05, -5.483999848365784e-05, -5.24371862411499e-05, -5.003437399864197e-05, -4.763156175613403e-05, -4.52287495136261e-05, -4.2825937271118164e-05, -4.042312502861023e-05, -3.8020312786102295e-05, -3.561750054359436e-05, -3.3214688301086426e-05, -3.081187605857849e-05, -2.8409063816070557e-05, -2.6006251573562622e-05, -2.3603439331054688e-05, -2.1200627088546753e-05, -1.879781484603882e-05, -1.6395002603530884e-05, -1.399219036102295e-05, -1.1589378118515015e-05, -9.18656587600708e-06, -6.7837536334991455e-06, -4.380941390991211e-06, -1.9781291484832764e-06, 4.246830940246582e-07, 2.8274953365325928e-06, 5.230307579040527e-06, 7.633119821548462e-06, 1.0035932064056396e-05, 1.2438744306564331e-05, 1.4841556549072266e-05, 1.72443687915802e-05, 1.9647181034088135e-05, 2.204999327659607e-05, 2.4452805519104004e-05, 2.685561776161194e-05, 2.9258430004119873e-05, 3.166124224662781e-05, 3.406405448913574e-05, 3.646686673164368e-05, 3.886967897415161e-05, 4.1272491216659546e-05, 4.367530345916748e-05, 4.6078115701675415e-05, 4.848092794418335e-05, 5.0883740186691284e-05, 5.328655242919922e-05, 5.568936467170715e-05, 5.809217691421509e-05, 6.049498915672302e-05, 6.289780139923096e-05, 6.530061364173889e-05, 6.770342588424683e-05, 7.010623812675476e-05, 7.25090503692627e-05, 7.491186261177063e-05, 7.731467485427856e-05, 7.97174870967865e-05, 8.212029933929443e-05, 8.452311158180237e-05, 8.69259238243103e-05, 8.932873606681824e-05, 9.173154830932617e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 8.0, 11.0, 16.0, 18.0, 39.0, 51.0, 88.0, 110.0, 199.0, 332.0, 622.0, 1207.0, 2348.0, 5606.0, 17403.0, 93781.0, 708789.0, 178970.0, 25393.0, 7351.0, 3029.0, 1385.0, 738.0, 403.0, 218.0, 160.0, 99.0, 62.0, 39.0, 24.0, 19.0, 17.0, 1.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.28515625, -0.275848388671875, -0.26654052734375, -0.257232666015625, -0.2479248046875, -0.238616943359375, -0.22930908203125, -0.220001220703125, -0.210693359375, -0.201385498046875, -0.19207763671875, -0.182769775390625, -0.1734619140625, -0.164154052734375, -0.15484619140625, -0.145538330078125, -0.13623046875, -0.126922607421875, -0.11761474609375, -0.108306884765625, -0.0989990234375, -0.089691162109375, -0.08038330078125, -0.071075439453125, -0.061767578125, -0.052459716796875, -0.04315185546875, -0.033843994140625, -0.0245361328125, -0.015228271484375, -0.00592041015625, 0.003387451171875, 0.0126953125, 0.022003173828125, 0.03131103515625, 0.040618896484375, 0.0499267578125, 0.059234619140625, 0.06854248046875, 0.077850341796875, 0.087158203125, 0.096466064453125, 0.10577392578125, 0.115081787109375, 0.1243896484375, 0.133697509765625, 0.14300537109375, 0.152313232421875, 0.16162109375, 0.170928955078125, 0.18023681640625, 0.189544677734375, 0.1988525390625, 0.208160400390625, 0.21746826171875, 0.226776123046875, 0.236083984375, 0.245391845703125, 0.25469970703125, 0.264007568359375, 0.2733154296875, 0.282623291015625, 0.29193115234375, 0.301239013671875, 0.310546875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 8.0, 5.0, 16.0, 14.0, 21.0, 27.0, 36.0, 43.0, 78.0, 80.0, 107.0, 90.0, 102.0, 87.0, 71.0, 51.0, 44.0, 28.0, 20.0, 13.0, 8.0, 13.0, 8.0, 4.0, 7.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2091064453125, -0.2022686004638672, -0.19543075561523438, -0.18859291076660156, -0.18175506591796875, -0.17491722106933594, -0.16807937622070312, -0.1612415313720703, -0.1544036865234375, -0.1475658416748047, -0.14072799682617188, -0.13389015197753906, -0.12705230712890625, -0.12021446228027344, -0.11337661743164062, -0.10653877258300781, -0.099700927734375, -0.09286308288574219, -0.08602523803710938, -0.07918739318847656, -0.07234954833984375, -0.06551170349121094, -0.058673858642578125, -0.05183601379394531, -0.0449981689453125, -0.03816032409667969, -0.031322479248046875, -0.024484634399414062, -0.01764678955078125, -0.010808944702148438, -0.003971099853515625, 0.0028667449951171875, 0.00970458984375, 0.016542434692382812, 0.023380279541015625, 0.030218124389648438, 0.03705596923828125, 0.04389381408691406, 0.050731658935546875, 0.05756950378417969, 0.0644073486328125, 0.07124519348144531, 0.07808303833007812, 0.08492088317871094, 0.09175872802734375, 0.09859657287597656, 0.10543441772460938, 0.11227226257324219, 0.119110107421875, 0.1259479522705078, 0.13278579711914062, 0.13962364196777344, 0.14646148681640625, 0.15329933166503906, 0.16013717651367188, 0.1669750213623047, 0.1738128662109375, 0.1806507110595703, 0.18748855590820312, 0.19432640075683594, 0.20116424560546875, 0.20800209045410156, 0.21483993530273438, 0.2216777801513672, 0.228515625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 20.0, 107.0, 475.0, 323.0, 72.0, 11.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.858182907104492, -4.408928394317627, -3.9596736431121826, -3.5104188919067383, -3.061164379119873, -2.6119096279144287, -2.1626548767089844, -1.7134003639221191, -1.2641456127166748, -0.81489098072052, -0.36563628911972046, 0.0836184024810791, 0.5328730344772339, 0.9821276664733887, 1.431382417678833, 1.8806369304656982, 2.3298916816711426, 2.779146432876587, 3.228400945663452, 3.6776556968688965, 4.126910209655762, 4.576165199279785, 5.02541971206665, 5.474674224853516, 5.923929214477539, 6.373183727264404, 6.822438716888428, 7.271693229675293, 7.720947742462158, 8.170202255249023, 8.619457244873047, 9.06871223449707, 9.517966270446777, 9.9672212600708, 10.416475296020508, 10.865730285644531, 11.314985275268555, 11.764239311218262, 12.213494300842285, 12.662748336791992, 13.112003326416016, 13.561258316040039, 14.010512351989746, 14.45976734161377, 14.909022331237793, 15.3582763671875, 15.807531356811523, 16.256786346435547, 16.70604133605957, 17.155296325683594, 17.604551315307617, 18.05380630493164, 18.50305938720703, 18.952314376831055, 19.401569366455078, 19.8508243560791, 20.300077438354492, 20.749332427978516, 21.19858741760254, 21.647842407226562, 22.097095489501953, 22.546350479125977, 22.99560546875, 23.444860458374023, 23.894115447998047]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 4.0, 3.0, 5.0, 10.0, 9.0, 6.0, 11.0, 17.0, 15.0, 19.0, 20.0, 14.0, 32.0, 29.0, 40.0, 30.0, 45.0, 51.0, 56.0, 38.0, 45.0, 60.0, 50.0, 38.0, 51.0, 37.0, 34.0, 40.0, 26.0, 29.0, 16.0, 21.0, 18.0, 11.0, 10.0, 10.0, 9.0, 6.0, 5.0, 5.0, 3.0, 10.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.0028162002563477, -2.9053938388824463, -2.807971477508545, -2.7105491161346436, -2.613126754760742, -2.5157041549682617, -2.4182817935943604, -2.320859432220459, -2.2234370708465576, -2.1260147094726562, -2.028592348098755, -1.931169867515564, -1.8337475061416626, -1.7363251447677612, -1.6389026641845703, -1.541480302810669, -1.4440579414367676, -1.3466355800628662, -1.2492132186889648, -1.151790738105774, -1.0543683767318726, -0.9569460153579712, -0.859523594379425, -0.7621011734008789, -0.6646788120269775, -0.5672564506530762, -0.46983402967453003, -0.3724116384983063, -0.2749892473220825, -0.17756685614585876, -0.08014446496963501, 0.017277956008911133, 0.1147000789642334, 0.21212247014045715, 0.3095448613166809, 0.40696725249290466, 0.5043896436691284, 0.6018120050430298, 0.6992344260215759, 0.7966568470001221, 0.8940792083740234, 0.9915015697479248, 1.0889239311218262, 1.186346411705017, 1.2837687730789185, 1.3811911344528198, 1.4786136150360107, 1.576035976409912, 1.6734583377838135, 1.7708806991577148, 1.8683030605316162, 1.9657255411148071, 2.063148021697998, 2.1605703830718994, 2.257992744445801, 2.355415105819702, 2.4528374671936035, 2.550259828567505, 2.6476821899414062, 2.7451045513153076, 2.842526912689209, 2.9399495124816895, 3.037371873855591, 3.134794235229492, 3.2322165966033936]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 4.0, 6.0, 11.0, 7.0, 17.0, 43.0, 41.0, 86.0, 101.0, 233.0, 693.0, 6357.0, 4184468.0, 1452.0, 362.0, 146.0, 95.0, 42.0, 43.0, 19.0, 19.0, 11.0, 2.0, 6.0, 6.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.609375, -7.386962890625, -7.16455078125, -6.942138671875, -6.7197265625, -6.497314453125, -6.27490234375, -6.052490234375, -5.830078125, -5.607666015625, -5.38525390625, -5.162841796875, -4.9404296875, -4.718017578125, -4.49560546875, -4.273193359375, -4.05078125, -3.828369140625, -3.60595703125, -3.383544921875, -3.1611328125, -2.938720703125, -2.71630859375, -2.493896484375, -2.271484375, -2.049072265625, -1.82666015625, -1.604248046875, -1.3818359375, -1.159423828125, -0.93701171875, -0.714599609375, -0.4921875, -0.269775390625, -0.04736328125, 0.175048828125, 0.3974609375, 0.619873046875, 0.84228515625, 1.064697265625, 1.287109375, 1.509521484375, 1.73193359375, 1.954345703125, 2.1767578125, 2.399169921875, 2.62158203125, 2.843994140625, 3.06640625, 3.288818359375, 3.51123046875, 3.733642578125, 3.9560546875, 4.178466796875, 4.40087890625, 4.623291015625, 4.845703125, 5.068115234375, 5.29052734375, 5.512939453125, 5.7353515625, 5.957763671875, 6.18017578125, 6.402587890625, 6.625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 7.0, 14.0, 10.0, 30.0, 28.0, 37.0, 54.0, 62.0, 76.0, 84.0, 97.0, 90.0, 77.0, 57.0, 66.0, 45.0, 35.0, 44.0, 22.0, 10.0, 20.0, 19.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3046875, -0.29571533203125, -0.2867431640625, -0.27777099609375, -0.268798828125, -0.25982666015625, -0.2508544921875, -0.24188232421875, -0.23291015625, -0.22393798828125, -0.2149658203125, -0.20599365234375, -0.197021484375, -0.18804931640625, -0.1790771484375, -0.17010498046875, -0.1611328125, -0.15216064453125, -0.1431884765625, -0.13421630859375, -0.125244140625, -0.11627197265625, -0.1072998046875, -0.09832763671875, -0.08935546875, -0.08038330078125, -0.0714111328125, -0.06243896484375, -0.053466796875, -0.04449462890625, -0.0355224609375, -0.02655029296875, -0.017578125, -0.00860595703125, 0.0003662109375, 0.00933837890625, 0.018310546875, 0.02728271484375, 0.0362548828125, 0.04522705078125, 0.05419921875, 0.06317138671875, 0.0721435546875, 0.08111572265625, 0.090087890625, 0.09906005859375, 0.1080322265625, 0.11700439453125, 0.1259765625, 0.13494873046875, 0.1439208984375, 0.15289306640625, 0.161865234375, 0.17083740234375, 0.1798095703125, 0.18878173828125, 0.19775390625, 0.20672607421875, 0.2156982421875, 0.22467041015625, 0.233642578125, 0.24261474609375, 0.2515869140625, 0.26055908203125, 0.26953125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 2.0, 6.0, 7.0, 11.0, 8.0, 13.0, 22.0, 25.0, 29.0, 33.0, 51.0, 71.0, 131.0, 248.0, 434.0, 919.0, 2477.0, 19109.0, 4162955.0, 4982.0, 1341.0, 570.0, 289.0, 165.0, 117.0, 62.0, 43.0, 37.0, 26.0, 21.0, 14.0, 15.0, 8.0, 14.0, 5.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.134765625, -3.048248291015625, -2.96173095703125, -2.875213623046875, -2.7886962890625, -2.702178955078125, -2.61566162109375, -2.529144287109375, -2.442626953125, -2.356109619140625, -2.26959228515625, -2.183074951171875, -2.0965576171875, -2.010040283203125, -1.92352294921875, -1.837005615234375, -1.75048828125, -1.663970947265625, -1.57745361328125, -1.490936279296875, -1.4044189453125, -1.317901611328125, -1.23138427734375, -1.144866943359375, -1.058349609375, -0.971832275390625, -0.88531494140625, -0.798797607421875, -0.7122802734375, -0.625762939453125, -0.53924560546875, -0.452728271484375, -0.3662109375, -0.279693603515625, -0.19317626953125, -0.106658935546875, -0.0201416015625, 0.066375732421875, 0.15289306640625, 0.239410400390625, 0.325927734375, 0.412445068359375, 0.49896240234375, 0.585479736328125, 0.6719970703125, 0.758514404296875, 0.84503173828125, 0.931549072265625, 1.01806640625, 1.104583740234375, 1.19110107421875, 1.277618408203125, 1.3641357421875, 1.450653076171875, 1.53717041015625, 1.623687744140625, 1.710205078125, 1.796722412109375, 1.88323974609375, 1.969757080078125, 2.0562744140625, 2.142791748046875, 2.22930908203125, 2.315826416015625, 2.40234375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 9.0, 36.0, 3967.0, 38.0, 7.0, 6.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26611328125, -0.25247955322265625, -0.2388458251953125, -0.22521209716796875, -0.211578369140625, -0.19794464111328125, -0.1843109130859375, -0.17067718505859375, -0.15704345703125, -0.14340972900390625, -0.1297760009765625, -0.11614227294921875, -0.102508544921875, -0.08887481689453125, -0.0752410888671875, -0.06160736083984375, -0.0479736328125, -0.03433990478515625, -0.0207061767578125, -0.00707244873046875, 0.006561279296875, 0.02019500732421875, 0.0338287353515625, 0.04746246337890625, 0.06109619140625, 0.07472991943359375, 0.0883636474609375, 0.10199737548828125, 0.115631103515625, 0.12926483154296875, 0.1428985595703125, 0.15653228759765625, 0.170166015625, 0.18379974365234375, 0.1974334716796875, 0.21106719970703125, 0.224700927734375, 0.23833465576171875, 0.2519683837890625, 0.26560211181640625, 0.27923583984375, 0.29286956787109375, 0.3065032958984375, 0.32013702392578125, 0.333770751953125, 0.34740447998046875, 0.3610382080078125, 0.37467193603515625, 0.3883056640625, 0.40193939208984375, 0.4155731201171875, 0.42920684814453125, 0.442840576171875, 0.45647430419921875, 0.4701080322265625, 0.48374176025390625, 0.49737548828125, 0.5110092163085938, 0.5246429443359375, 0.5382766723632812, 0.551910400390625, 0.5655441284179688, 0.5791778564453125, 0.5928115844726562, 0.6064453125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 7.0, 16.0, 35.0, 49.0, 79.0, 213.0, 326.0, 151.0, 63.0, 27.0, 15.0, 10.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9659733772277832, -1.9196730852127075, -1.8733729124069214, -1.8270726203918457, -1.7807724475860596, -1.7344721555709839, -1.6881719827651978, -1.641871690750122, -1.595571517944336, -1.5492712259292603, -1.5029710531234741, -1.4566707611083984, -1.4103705883026123, -1.3640702962875366, -1.3177701234817505, -1.2714698314666748, -1.2251696586608887, -1.178869366645813, -1.1325691938400269, -1.0862689018249512, -1.039968729019165, -0.9936684966087341, -0.9473682641983032, -0.9010679721832275, -0.8547676801681519, -0.808467447757721, -0.76216721534729, -0.7158669829368591, -0.6695667505264282, -0.6232665181159973, -0.5769662857055664, -0.5306659936904907, -0.4843657612800598, -0.4380655288696289, -0.391765296459198, -0.3454650640487671, -0.2991648316383362, -0.2528645992279053, -0.20656433701515198, -0.16026410460472107, -0.11396387219429016, -0.06766363978385925, -0.021363399922847748, 0.024936839938163757, 0.07123707234859467, 0.11753730475902557, 0.16383755207061768, 0.21013778448104858, 0.2564380168914795, 0.3027382493019104, 0.3490384817123413, 0.3953387141227722, 0.4416389465332031, 0.48793917894363403, 0.5342394113540649, 0.5805397033691406, 0.6268398761749268, 0.6731401085853577, 0.7194403409957886, 0.7657405734062195, 0.8120408058166504, 0.8583410382270813, 0.9046412706375122, 0.9509415626525879, 0.9972417950630188]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 4.0, 7.0, 11.0, 11.0, 11.0, 13.0, 13.0, 17.0, 19.0, 16.0, 20.0, 23.0, 34.0, 38.0, 37.0, 39.0, 44.0, 55.0, 30.0, 39.0, 50.0, 43.0, 55.0, 40.0, 33.0, 36.0, 31.0, 35.0, 34.0, 28.0, 17.0, 25.0, 22.0, 11.0, 8.0, 7.0, 12.0, 7.0, 8.0, 7.0, 7.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.4631257653236389, -0.450195848941803, -0.43726593255996704, -0.4243360161781311, -0.41140609979629517, -0.39847618341445923, -0.3855462968349457, -0.37261638045310974, -0.3596864640712738, -0.34675654768943787, -0.33382663130760193, -0.320896714925766, -0.30796682834625244, -0.2950369119644165, -0.28210699558258057, -0.26917707920074463, -0.2562471628189087, -0.24331724643707275, -0.23038733005523682, -0.21745742857456207, -0.20452751219272614, -0.1915975958108902, -0.17866769433021545, -0.16573777794837952, -0.15280786156654358, -0.13987794518470764, -0.1269480288028717, -0.11401812732219696, -0.10108821094036102, -0.08815829455852509, -0.07522838562726974, -0.062298476696014404, -0.04936856031417847, -0.03643864765763283, -0.02350873500108719, -0.01057882234454155, 0.0023510903120040894, 0.015281006693840027, 0.028210915625095367, 0.04114082455635071, 0.054070740938186646, 0.06700065732002258, 0.07993056625127792, 0.09286047518253326, 0.1057903915643692, 0.11872030794620514, 0.13165020942687988, 0.14458012580871582, 0.15751004219055176, 0.1704399585723877, 0.18336987495422363, 0.19629977643489838, 0.20922969281673431, 0.22215960919857025, 0.235089510679245, 0.24801942706108093, 0.26094934344291687, 0.2738792598247528, 0.28680917620658875, 0.2997390925884247, 0.31266897916793823, 0.32559889554977417, 0.3385288119316101, 0.35145872831344604, 0.364388644695282]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 6.0, 9.0, 11.0, 12.0, 16.0, 27.0, 41.0, 55.0, 62.0, 85.0, 113.0, 157.0, 226.0, 337.0, 612.0, 1019.0, 1816.0, 3728.0, 7962.0, 20061.0, 59765.0, 227062.0, 485840.0, 164617.0, 45458.0, 15677.0, 6542.0, 3070.0, 1631.0, 890.0, 523.0, 333.0, 201.0, 155.0, 97.0, 80.0, 68.0, 43.0, 38.0, 27.0, 19.0, 19.0, 12.0, 8.0, 4.0, 6.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.479736328125, -0.4639472961425781, -0.44815826416015625, -0.4323692321777344, -0.4165802001953125, -0.4007911682128906, -0.38500213623046875, -0.3692131042480469, -0.353424072265625, -0.3376350402832031, -0.32184600830078125, -0.3060569763183594, -0.2902679443359375, -0.2744789123535156, -0.25868988037109375, -0.24290084838867188, -0.22711181640625, -0.21132278442382812, -0.19553375244140625, -0.17974472045898438, -0.1639556884765625, -0.14816665649414062, -0.13237762451171875, -0.11658859252929688, -0.100799560546875, -0.08501052856445312, -0.06922149658203125, -0.053432464599609375, -0.0376434326171875, -0.021854400634765625, -0.00606536865234375, 0.009723663330078125, 0.0255126953125, 0.041301727294921875, 0.05709075927734375, 0.07287979125976562, 0.0886688232421875, 0.10445785522460938, 0.12024688720703125, 0.13603591918945312, 0.151824951171875, 0.16761398315429688, 0.18340301513671875, 0.19919204711914062, 0.2149810791015625, 0.23077011108398438, 0.24655914306640625, 0.2623481750488281, 0.27813720703125, 0.2939262390136719, 0.30971527099609375, 0.3255043029785156, 0.3412933349609375, 0.3570823669433594, 0.37287139892578125, 0.3886604309082031, 0.404449462890625, 0.4202384948730469, 0.43602752685546875, 0.4518165588378906, 0.4676055908203125, 0.4833946228027344, 0.49918365478515625, 0.5149726867675781, 0.53076171875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 7.0, 13.0, 25.0, 29.0, 40.0, 48.0, 50.0, 62.0, 71.0, 75.0, 83.0, 63.0, 78.0, 71.0, 49.0, 43.0, 50.0, 38.0, 26.0, 22.0, 17.0, 8.0, 8.0, 8.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302490234375, -0.2935600280761719, -0.28462982177734375, -0.2756996154785156, -0.2667694091796875, -0.2578392028808594, -0.24890899658203125, -0.23997879028320312, -0.231048583984375, -0.22211837768554688, -0.21318817138671875, -0.20425796508789062, -0.1953277587890625, -0.18639755249023438, -0.17746734619140625, -0.16853713989257812, -0.15960693359375, -0.15067672729492188, -0.14174652099609375, -0.13281631469726562, -0.1238861083984375, -0.11495590209960938, -0.10602569580078125, -0.09709548950195312, -0.088165283203125, -0.07923507690429688, -0.07030487060546875, -0.061374664306640625, -0.0524444580078125, -0.043514251708984375, -0.03458404541015625, -0.025653839111328125, -0.0167236328125, -0.007793426513671875, 0.00113677978515625, 0.010066986083984375, 0.0189971923828125, 0.027927398681640625, 0.03685760498046875, 0.045787811279296875, 0.054718017578125, 0.06364822387695312, 0.07257843017578125, 0.08150863647460938, 0.0904388427734375, 0.09936904907226562, 0.10829925537109375, 0.11722946166992188, 0.12615966796875, 0.13508987426757812, 0.14402008056640625, 0.15295028686523438, 0.1618804931640625, 0.17081069946289062, 0.17974090576171875, 0.18867111206054688, 0.197601318359375, 0.20653152465820312, 0.21546173095703125, 0.22439193725585938, 0.2333221435546875, 0.24225234985351562, 0.25118255615234375, 0.2601127624511719, 0.26904296875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 6.0, 7.0, 6.0, 7.0, 8.0, 21.0, 26.0, 33.0, 45.0, 88.0, 176.0, 322.0, 598.0, 1172.0, 2931.0, 7485.0, 24501.0, 118728.0, 657310.0, 185615.0, 33379.0, 9634.0, 3467.0, 1456.0, 663.0, 346.0, 167.0, 129.0, 65.0, 44.0, 32.0, 27.0, 17.0, 8.0, 10.0, 9.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5693359375, -0.55010986328125, -0.5308837890625, -0.51165771484375, -0.492431640625, -0.47320556640625, -0.4539794921875, -0.43475341796875, -0.41552734375, -0.39630126953125, -0.3770751953125, -0.35784912109375, -0.338623046875, -0.31939697265625, -0.3001708984375, -0.28094482421875, -0.26171875, -0.24249267578125, -0.2232666015625, -0.20404052734375, -0.184814453125, -0.16558837890625, -0.1463623046875, -0.12713623046875, -0.10791015625, -0.08868408203125, -0.0694580078125, -0.05023193359375, -0.031005859375, -0.01177978515625, 0.0074462890625, 0.02667236328125, 0.0458984375, 0.06512451171875, 0.0843505859375, 0.10357666015625, 0.122802734375, 0.14202880859375, 0.1612548828125, 0.18048095703125, 0.19970703125, 0.21893310546875, 0.2381591796875, 0.25738525390625, 0.276611328125, 0.29583740234375, 0.3150634765625, 0.33428955078125, 0.353515625, 0.37274169921875, 0.3919677734375, 0.41119384765625, 0.430419921875, 0.44964599609375, 0.4688720703125, 0.48809814453125, 0.50732421875, 0.52655029296875, 0.5457763671875, 0.56500244140625, 0.584228515625, 0.60345458984375, 0.6226806640625, 0.64190673828125, 0.6611328125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 10.0, 6.0, 3.0, 9.0, 8.0, 15.0, 9.0, 23.0, 20.0, 16.0, 14.0, 26.0, 20.0, 20.0, 31.0, 36.0, 33.0, 27.0, 46.0, 41.0, 46.0, 42.0, 41.0, 37.0, 38.0, 34.0, 23.0, 24.0, 24.0, 26.0, 36.0, 25.0, 27.0, 20.0, 23.0, 21.0, 18.0, 10.0, 14.0, 14.0, 9.0, 7.0, 4.0, 4.0, 9.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0], "bins": [-0.65478515625, -0.6360092163085938, -0.6172332763671875, -0.5984573364257812, -0.579681396484375, -0.5609054565429688, -0.5421295166015625, -0.5233535766601562, -0.50457763671875, -0.48580169677734375, -0.4670257568359375, -0.44824981689453125, -0.429473876953125, -0.41069793701171875, -0.3919219970703125, -0.37314605712890625, -0.3543701171875, -0.33559417724609375, -0.3168182373046875, -0.29804229736328125, -0.279266357421875, -0.26049041748046875, -0.2417144775390625, -0.22293853759765625, -0.20416259765625, -0.18538665771484375, -0.1666107177734375, -0.14783477783203125, -0.129058837890625, -0.11028289794921875, -0.0915069580078125, -0.07273101806640625, -0.053955078125, -0.03517913818359375, -0.0164031982421875, 0.00237274169921875, 0.021148681640625, 0.03992462158203125, 0.0587005615234375, 0.07747650146484375, 0.09625244140625, 0.11502838134765625, 0.1338043212890625, 0.15258026123046875, 0.171356201171875, 0.19013214111328125, 0.2089080810546875, 0.22768402099609375, 0.2464599609375, 0.26523590087890625, 0.2840118408203125, 0.30278778076171875, 0.321563720703125, 0.34033966064453125, 0.3591156005859375, 0.37789154052734375, 0.39666748046875, 0.41544342041015625, 0.4342193603515625, 0.45299530029296875, 0.471771240234375, 0.49054718017578125, 0.5093231201171875, 0.5280990600585938, 0.546875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 5.0, 6.0, 9.0, 13.0, 25.0, 25.0, 67.0, 76.0, 95.0, 189.0, 329.0, 687.0, 1661.0, 4793.0, 20600.0, 164650.0, 734100.0, 99894.0, 14825.0, 3780.0, 1369.0, 565.0, 302.0, 183.0, 104.0, 65.0, 43.0, 28.0, 19.0, 18.0, 5.0, 9.0, 4.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25830078125, -0.25032806396484375, -0.2423553466796875, -0.23438262939453125, -0.226409912109375, -0.21843719482421875, -0.2104644775390625, -0.20249176025390625, -0.19451904296875, -0.18654632568359375, -0.1785736083984375, -0.17060089111328125, -0.162628173828125, -0.15465545654296875, -0.1466827392578125, -0.13871002197265625, -0.1307373046875, -0.12276458740234375, -0.1147918701171875, -0.10681915283203125, -0.098846435546875, -0.09087371826171875, -0.0829010009765625, -0.07492828369140625, -0.06695556640625, -0.05898284912109375, -0.0510101318359375, -0.04303741455078125, -0.035064697265625, -0.02709197998046875, -0.0191192626953125, -0.01114654541015625, -0.003173828125, 0.00479888916015625, 0.0127716064453125, 0.02074432373046875, 0.028717041015625, 0.03668975830078125, 0.0446624755859375, 0.05263519287109375, 0.06060791015625, 0.06858062744140625, 0.0765533447265625, 0.08452606201171875, 0.092498779296875, 0.10047149658203125, 0.1084442138671875, 0.11641693115234375, 0.1243896484375, 0.13236236572265625, 0.1403350830078125, 0.14830780029296875, 0.156280517578125, 0.16425323486328125, 0.1722259521484375, 0.18019866943359375, 0.18817138671875, 0.19614410400390625, 0.2041168212890625, 0.21208953857421875, 0.220062255859375, 0.22803497314453125, 0.2360076904296875, 0.24398040771484375, 0.251953125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 3.0, 2.0, 2.0, 5.0, 3.0, 7.0, 7.0, 22.0, 8.0, 16.0, 25.0, 19.0, 45.0, 48.0, 57.0, 88.0, 96.0, 122.0, 96.0, 86.0, 72.0, 34.0, 34.0, 22.0, 15.0, 22.0, 12.0, 7.0, 8.0, 7.0, 3.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.70280647277832e-05, -4.565343260765076e-05, -4.427880048751831e-05, -4.2904168367385864e-05, -4.152953624725342e-05, -4.015490412712097e-05, -3.8780272006988525e-05, -3.740563988685608e-05, -3.603100776672363e-05, -3.4656375646591187e-05, -3.328174352645874e-05, -3.1907111406326294e-05, -3.053247928619385e-05, -2.91578471660614e-05, -2.7783215045928955e-05, -2.640858292579651e-05, -2.5033950805664062e-05, -2.3659318685531616e-05, -2.228468656539917e-05, -2.0910054445266724e-05, -1.9535422325134277e-05, -1.816079020500183e-05, -1.6786158084869385e-05, -1.541152596473694e-05, -1.4036893844604492e-05, -1.2662261724472046e-05, -1.12876296043396e-05, -9.912997484207153e-06, -8.538365364074707e-06, -7.163733243942261e-06, -5.7891011238098145e-06, -4.414469003677368e-06, -3.039836883544922e-06, -1.6652047634124756e-06, -2.905726432800293e-07, 1.084059476852417e-06, 2.4586915969848633e-06, 3.8333237171173096e-06, 5.207955837249756e-06, 6.582587957382202e-06, 7.957220077514648e-06, 9.331852197647095e-06, 1.0706484317779541e-05, 1.2081116437911987e-05, 1.3455748558044434e-05, 1.483038067817688e-05, 1.6205012798309326e-05, 1.7579644918441772e-05, 1.895427703857422e-05, 2.0328909158706665e-05, 2.170354127883911e-05, 2.3078173398971558e-05, 2.4452805519104004e-05, 2.582743763923645e-05, 2.7202069759368896e-05, 2.8576701879501343e-05, 2.995133399963379e-05, 3.1325966119766235e-05, 3.270059823989868e-05, 3.407523036003113e-05, 3.5449862480163574e-05, 3.682449460029602e-05, 3.819912672042847e-05, 3.957375884056091e-05, 4.094839096069336e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 5.0, 12.0, 15.0, 27.0, 39.0, 54.0, 92.0, 201.0, 372.0, 875.0, 2672.0, 12509.0, 126276.0, 809475.0, 82736.0, 9483.0, 2155.0, 747.0, 347.0, 202.0, 91.0, 54.0, 35.0, 29.0, 17.0, 9.0, 8.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.268798828125, -0.2577934265136719, -0.24678802490234375, -0.23578262329101562, -0.2247772216796875, -0.21377182006835938, -0.20276641845703125, -0.19176101684570312, -0.180755615234375, -0.16975021362304688, -0.15874481201171875, -0.14773941040039062, -0.1367340087890625, -0.12572860717773438, -0.11472320556640625, -0.10371780395507812, -0.09271240234375, -0.08170700073242188, -0.07070159912109375, -0.059696197509765625, -0.0486907958984375, -0.037685394287109375, -0.02667999267578125, -0.015674591064453125, -0.004669189453125, 0.006336212158203125, 0.01734161376953125, 0.028347015380859375, 0.0393524169921875, 0.050357818603515625, 0.06136322021484375, 0.07236862182617188, 0.0833740234375, 0.09437942504882812, 0.10538482666015625, 0.11639022827148438, 0.1273956298828125, 0.13840103149414062, 0.14940643310546875, 0.16041183471679688, 0.171417236328125, 0.18242263793945312, 0.19342803955078125, 0.20443344116210938, 0.2154388427734375, 0.22644424438476562, 0.23744964599609375, 0.24845504760742188, 0.25946044921875, 0.2704658508300781, 0.28147125244140625, 0.2924766540527344, 0.3034820556640625, 0.3144874572753906, 0.32549285888671875, 0.3364982604980469, 0.347503662109375, 0.3585090637207031, 0.36951446533203125, 0.3805198669433594, 0.3915252685546875, 0.4025306701660156, 0.41353607177734375, 0.4245414733886719, 0.435546875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 13.0, 10.0, 18.0, 30.0, 56.0, 84.0, 104.0, 130.0, 128.0, 124.0, 99.0, 62.0, 48.0, 38.0, 24.0, 13.0, 8.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2265625, -0.2168731689453125, -0.207183837890625, -0.1974945068359375, -0.18780517578125, -0.1781158447265625, -0.168426513671875, -0.1587371826171875, -0.1490478515625, -0.1393585205078125, -0.129669189453125, -0.1199798583984375, -0.11029052734375, -0.1006011962890625, -0.090911865234375, -0.0812225341796875, -0.071533203125, -0.0618438720703125, -0.052154541015625, -0.0424652099609375, -0.03277587890625, -0.0230865478515625, -0.013397216796875, -0.0037078857421875, 0.0059814453125, 0.0156707763671875, 0.025360107421875, 0.0350494384765625, 0.04473876953125, 0.0544281005859375, 0.064117431640625, 0.0738067626953125, 0.08349609375, 0.0931854248046875, 0.102874755859375, 0.1125640869140625, 0.12225341796875, 0.1319427490234375, 0.141632080078125, 0.1513214111328125, 0.1610107421875, 0.1707000732421875, 0.180389404296875, 0.1900787353515625, 0.19976806640625, 0.2094573974609375, 0.219146728515625, 0.2288360595703125, 0.238525390625, 0.2482147216796875, 0.257904052734375, 0.2675933837890625, 0.27728271484375, 0.2869720458984375, 0.296661376953125, 0.3063507080078125, 0.3160400390625, 0.3257293701171875, 0.335418701171875, 0.3451080322265625, 0.35479736328125, 0.3644866943359375, 0.374176025390625, 0.3838653564453125, 0.3935546875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 11.0, 43.0, 181.0, 408.0, 269.0, 72.0, 18.0, 3.0, 3.0, 1.0, 1.0], "bins": [-22.551422119140625, -22.15372657775879, -21.756031036376953, -21.358335494995117, -20.96063995361328, -20.562944412231445, -20.16524887084961, -19.76755142211914, -19.369855880737305, -18.97216033935547, -18.574464797973633, -18.176769256591797, -17.77907371520996, -17.381378173828125, -16.983680725097656, -16.585987091064453, -16.188291549682617, -15.790596008300781, -15.392900466918945, -14.99520492553711, -14.597508430480957, -14.199812889099121, -13.802117347717285, -13.40442180633545, -13.006725311279297, -12.609029769897461, -12.211334228515625, -11.813638687133789, -11.415942192077637, -11.0182466506958, -10.620551109313965, -10.222855567932129, -9.825160026550293, -9.427464485168457, -9.029768943786621, -8.632072448730469, -8.234376907348633, -7.836681365966797, -7.438985824584961, -7.041290283203125, -6.643594741821289, -6.245899200439453, -5.848203182220459, -5.450507640838623, -5.052812099456787, -4.655116081237793, -4.257420539855957, -3.859724998474121, -3.462028980255127, -3.064333200454712, -2.666637659072876, -2.268941879272461, -1.8712462186813354, -1.47355055809021, -1.075854778289795, -0.678159236907959, -0.28046345710754395, 0.11723223328590393, 0.5149279236793518, 0.9126236438751221, 1.3103193044662476, 1.708014965057373, 2.105710744857788, 2.503406286239624, 2.901102066040039]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 6.0, 11.0, 6.0, 12.0, 8.0, 12.0, 15.0, 15.0, 39.0, 24.0, 21.0, 31.0, 36.0, 36.0, 51.0, 60.0, 52.0, 48.0, 74.0, 55.0, 53.0, 32.0, 41.0, 35.0, 43.0, 34.0, 27.0, 23.0, 16.0, 19.0, 20.0, 15.0, 12.0, 4.0, 6.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.799252510070801, -3.672935724258423, -3.546618938446045, -3.420302152633667, -3.293985366821289, -3.167668581008911, -3.041351795196533, -2.9150350093841553, -2.7887182235717773, -2.6624014377593994, -2.5360846519470215, -2.4097678661346436, -2.2834510803222656, -2.1571342945098877, -2.0308175086975098, -1.9045007228851318, -1.778183937072754, -1.651867151260376, -1.525550365447998, -1.3992335796356201, -1.2729167938232422, -1.1466000080108643, -1.0202832221984863, -0.8939664363861084, -0.7676496505737305, -0.6413328647613525, -0.5150160789489746, -0.3886992931365967, -0.26238250732421875, -0.13606572151184082, -0.00974893569946289, 0.11656785011291504, 0.24288511276245117, 0.3692018985748291, 0.49551868438720703, 0.621835470199585, 0.7481522560119629, 0.8744690418243408, 1.0007858276367188, 1.1271026134490967, 1.2534193992614746, 1.3797361850738525, 1.5060529708862305, 1.6323697566986084, 1.7586865425109863, 1.8850033283233643, 2.011320114135742, 2.13763689994812, 2.263953685760498, 2.390270471572876, 2.516587257385254, 2.642904043197632, 2.7692208290100098, 2.8955376148223877, 3.0218544006347656, 3.1481711864471436, 3.2744879722595215, 3.4008047580718994, 3.5271215438842773, 3.6534383296966553, 3.779755115509033, 3.906071901321411, 4.032388687133789, 4.158705711364746, 4.285022258758545]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 4.0, 6.0, 7.0, 10.0, 11.0, 19.0, 29.0, 39.0, 62.0, 107.0, 179.0, 312.0, 643.0, 1690.0, 4166612.0, 21849.0, 1360.0, 548.0, 301.0, 194.0, 95.0, 68.0, 39.0, 30.0, 17.0, 10.0, 11.0, 5.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.25, -4.124664306640625, -3.99932861328125, -3.873992919921875, -3.7486572265625, -3.623321533203125, -3.49798583984375, -3.372650146484375, -3.247314453125, -3.121978759765625, -2.99664306640625, -2.871307373046875, -2.7459716796875, -2.620635986328125, -2.49530029296875, -2.369964599609375, -2.24462890625, -2.119293212890625, -1.99395751953125, -1.868621826171875, -1.7432861328125, -1.617950439453125, -1.49261474609375, -1.367279052734375, -1.241943359375, -1.116607666015625, -0.99127197265625, -0.865936279296875, -0.7406005859375, -0.615264892578125, -0.48992919921875, -0.364593505859375, -0.2392578125, -0.113922119140625, 0.01141357421875, 0.136749267578125, 0.2620849609375, 0.387420654296875, 0.51275634765625, 0.638092041015625, 0.763427734375, 0.888763427734375, 1.01409912109375, 1.139434814453125, 1.2647705078125, 1.390106201171875, 1.51544189453125, 1.640777587890625, 1.76611328125, 1.891448974609375, 2.01678466796875, 2.142120361328125, 2.2674560546875, 2.392791748046875, 2.51812744140625, 2.643463134765625, 2.768798828125, 2.894134521484375, 3.01947021484375, 3.144805908203125, 3.2701416015625, 3.395477294921875, 3.52081298828125, 3.646148681640625, 3.771484375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 7.0, 11.0, 14.0, 22.0, 18.0, 26.0, 30.0, 55.0, 52.0, 81.0, 61.0, 78.0, 72.0, 85.0, 78.0, 60.0, 59.0, 41.0, 39.0, 24.0, 25.0, 19.0, 15.0, 9.0, 6.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.310546875, -0.30152130126953125, -0.2924957275390625, -0.28347015380859375, -0.274444580078125, -0.26541900634765625, -0.2563934326171875, -0.24736785888671875, -0.23834228515625, -0.22931671142578125, -0.2202911376953125, -0.21126556396484375, -0.202239990234375, -0.19321441650390625, -0.1841888427734375, -0.17516326904296875, -0.1661376953125, -0.15711212158203125, -0.1480865478515625, -0.13906097412109375, -0.130035400390625, -0.12100982666015625, -0.1119842529296875, -0.10295867919921875, -0.09393310546875, -0.08490753173828125, -0.0758819580078125, -0.06685638427734375, -0.057830810546875, -0.04880523681640625, -0.0397796630859375, -0.03075408935546875, -0.021728515625, -0.01270294189453125, -0.0036773681640625, 0.00534820556640625, 0.014373779296875, 0.02339935302734375, 0.0324249267578125, 0.04145050048828125, 0.05047607421875, 0.05950164794921875, 0.0685272216796875, 0.07755279541015625, 0.086578369140625, 0.09560394287109375, 0.1046295166015625, 0.11365509033203125, 0.1226806640625, 0.13170623779296875, 0.1407318115234375, 0.14975738525390625, 0.158782958984375, 0.16780853271484375, 0.1768341064453125, 0.18585968017578125, 0.19488525390625, 0.20391082763671875, 0.2129364013671875, 0.22196197509765625, 0.230987548828125, 0.24001312255859375, 0.2490386962890625, 0.25806427001953125, 0.26708984375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 5.0, 12.0, 13.0, 20.0, 12.0, 21.0, 22.0, 56.0, 69.0, 100.0, 144.0, 184.0, 320.0, 579.0, 944.0, 1824.0, 5297.0, 60337.0, 4110736.0, 8345.0, 2402.0, 1042.0, 685.0, 393.0, 218.0, 136.0, 105.0, 90.0, 43.0, 31.0, 21.0, 15.0, 19.0, 15.0, 12.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.52734375, -1.48126220703125, -1.4351806640625, -1.38909912109375, -1.343017578125, -1.29693603515625, -1.2508544921875, -1.20477294921875, -1.15869140625, -1.11260986328125, -1.0665283203125, -1.02044677734375, -0.974365234375, -0.92828369140625, -0.8822021484375, -0.83612060546875, -0.7900390625, -0.74395751953125, -0.6978759765625, -0.65179443359375, -0.605712890625, -0.55963134765625, -0.5135498046875, -0.46746826171875, -0.42138671875, -0.37530517578125, -0.3292236328125, -0.28314208984375, -0.237060546875, -0.19097900390625, -0.1448974609375, -0.09881591796875, -0.052734375, -0.00665283203125, 0.0394287109375, 0.08551025390625, 0.131591796875, 0.17767333984375, 0.2237548828125, 0.26983642578125, 0.31591796875, 0.36199951171875, 0.4080810546875, 0.45416259765625, 0.500244140625, 0.54632568359375, 0.5924072265625, 0.63848876953125, 0.6845703125, 0.73065185546875, 0.7767333984375, 0.82281494140625, 0.868896484375, 0.91497802734375, 0.9610595703125, 1.00714111328125, 1.05322265625, 1.09930419921875, 1.1453857421875, 1.19146728515625, 1.237548828125, 1.28363037109375, 1.3297119140625, 1.37579345703125, 1.421875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 13.0, 12.0, 46.0, 3814.0, 127.0, 26.0, 10.0, 9.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3037109375, -0.29384613037109375, -0.2839813232421875, -0.27411651611328125, -0.264251708984375, -0.25438690185546875, -0.2445220947265625, -0.23465728759765625, -0.22479248046875, -0.21492767333984375, -0.2050628662109375, -0.19519805908203125, -0.185333251953125, -0.17546844482421875, -0.1656036376953125, -0.15573883056640625, -0.1458740234375, -0.13600921630859375, -0.1261444091796875, -0.11627960205078125, -0.106414794921875, -0.09654998779296875, -0.0866851806640625, -0.07682037353515625, -0.06695556640625, -0.05709075927734375, -0.0472259521484375, -0.03736114501953125, -0.027496337890625, -0.01763153076171875, -0.0077667236328125, 0.00209808349609375, 0.011962890625, 0.02182769775390625, 0.0316925048828125, 0.04155731201171875, 0.051422119140625, 0.06128692626953125, 0.0711517333984375, 0.08101654052734375, 0.09088134765625, 0.10074615478515625, 0.1106109619140625, 0.12047576904296875, 0.130340576171875, 0.14020538330078125, 0.1500701904296875, 0.15993499755859375, 0.1697998046875, 0.17966461181640625, 0.1895294189453125, 0.19939422607421875, 0.209259033203125, 0.21912384033203125, 0.2289886474609375, 0.23885345458984375, 0.24871826171875, 0.25858306884765625, 0.2684478759765625, 0.27831268310546875, 0.288177490234375, 0.29804229736328125, 0.3079071044921875, 0.31777191162109375, 0.32763671875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 6.0, 7.0, 8.0, 18.0, 23.0, 50.0, 63.0, 119.0, 180.0, 159.0, 131.0, 74.0, 59.0, 36.0, 28.0, 13.0, 8.0, 7.0, 10.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4852113723754883, -0.45683056116104126, -0.42844974994659424, -0.4000689387321472, -0.3716881275177002, -0.3433073163032532, -0.31492650508880615, -0.28654569387435913, -0.2581648826599121, -0.2297840714454651, -0.20140326023101807, -0.17302244901657104, -0.14464163780212402, -0.116260826587677, -0.08788001537322998, -0.05949920415878296, -0.031118392944335938, -0.002737581729888916, 0.025643229484558105, 0.05402404069900513, 0.08240485191345215, 0.11078566312789917, 0.1391664743423462, 0.1675472855567932, 0.19592809677124023, 0.22430890798568726, 0.2526897192001343, 0.2810705304145813, 0.3094513416290283, 0.33783215284347534, 0.36621296405792236, 0.3945937752723694, 0.4229745864868164, 0.4513553977012634, 0.47973620891571045, 0.5081170201301575, 0.5364978313446045, 0.5648786425590515, 0.5932594537734985, 0.6216402649879456, 0.6500210762023926, 0.6784018874168396, 0.7067826986312866, 0.7351635098457336, 0.7635443210601807, 0.7919251322746277, 0.8203059434890747, 0.8486867547035217, 0.8770675659179688, 0.9054483771324158, 0.9338291883468628, 0.9622099995613098, 0.9905908107757568, 1.0189716815948486, 1.0473524332046509, 1.0757331848144531, 1.104114055633545, 1.1324949264526367, 1.160875678062439, 1.1892564296722412, 1.217637300491333, 1.2460181713104248, 1.274398922920227, 1.3027796745300293, 1.331160545349121]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 8.0, 4.0, 8.0, 7.0, 6.0, 15.0, 12.0, 7.0, 19.0, 15.0, 21.0, 22.0, 30.0, 26.0, 28.0, 39.0, 37.0, 34.0, 42.0, 35.0, 40.0, 42.0, 40.0, 33.0, 30.0, 30.0, 34.0, 38.0, 25.0, 30.0, 30.0, 27.0, 24.0, 20.0, 22.0, 16.0, 15.0, 19.0, 11.0, 10.0, 7.0, 13.0, 5.0, 3.0, 3.0, 7.0, 1.0, 4.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.34016501903533936, -0.33031991124153137, -0.320474773645401, -0.310629665851593, -0.30078455805778503, -0.29093945026397705, -0.2810943126678467, -0.2712492048740387, -0.2614040970802307, -0.25155898928642273, -0.24171386659145355, -0.23186874389648438, -0.2220236361026764, -0.21217851340770721, -0.20233339071273804, -0.19248828291893005, -0.18264314532279968, -0.1727980226278305, -0.16295291483402252, -0.15310779213905334, -0.14326268434524536, -0.13341756165027618, -0.123572438955307, -0.11372732371091843, -0.10388220846652985, -0.09403709322214127, -0.08419197797775269, -0.07434685528278351, -0.06450174003839493, -0.05465662479400635, -0.04481150582432747, -0.03496638685464859, -0.02512127161026001, -0.01527615450322628, -0.005431037396192551, 0.004414079710841179, 0.014259196817874908, 0.02410431206226349, 0.03394943103194237, 0.043794550001621246, 0.05363966524600983, 0.06348478049039841, 0.07332989573478699, 0.08317501842975616, 0.09302013367414474, 0.10286524891853333, 0.1127103716135025, 0.12255548685789108, 0.13240060210227966, 0.14224572479724884, 0.15209083259105682, 0.161935955286026, 0.17178106307983398, 0.18162618577480316, 0.19147130846977234, 0.20131641626358032, 0.2111615389585495, 0.22100666165351868, 0.23085176944732666, 0.24069689214229584, 0.250542014837265, 0.260387122631073, 0.270232230424881, 0.28007736802101135, 0.28992247581481934]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 5.0, 14.0, 21.0, 24.0, 61.0, 68.0, 115.0, 155.0, 248.0, 427.0, 816.0, 1759.0, 4511.0, 14534.0, 61365.0, 421278.0, 452784.0, 66588.0, 15277.0, 4665.0, 1802.0, 855.0, 421.0, 283.0, 144.0, 115.0, 69.0, 41.0, 35.0, 22.0, 10.0, 13.0, 4.0, 1.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.78076171875, -0.7578125, -0.73486328125, -0.7119140625, -0.68896484375, -0.666015625, -0.64306640625, -0.6201171875, -0.59716796875, -0.57421875, -0.55126953125, -0.5283203125, -0.50537109375, -0.482421875, -0.45947265625, -0.4365234375, -0.41357421875, -0.390625, -0.36767578125, -0.3447265625, -0.32177734375, -0.298828125, -0.27587890625, -0.2529296875, -0.22998046875, -0.20703125, -0.18408203125, -0.1611328125, -0.13818359375, -0.115234375, -0.09228515625, -0.0693359375, -0.04638671875, -0.0234375, -0.00048828125, 0.0224609375, 0.04541015625, 0.068359375, 0.09130859375, 0.1142578125, 0.13720703125, 0.16015625, 0.18310546875, 0.2060546875, 0.22900390625, 0.251953125, 0.27490234375, 0.2978515625, 0.32080078125, 0.34375, 0.36669921875, 0.3896484375, 0.41259765625, 0.435546875, 0.45849609375, 0.4814453125, 0.50439453125, 0.52734375, 0.55029296875, 0.5732421875, 0.59619140625, 0.619140625, 0.64208984375, 0.6650390625, 0.68798828125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 10.0, 10.0, 12.0, 22.0, 24.0, 20.0, 42.0, 42.0, 50.0, 70.0, 63.0, 66.0, 82.0, 67.0, 79.0, 74.0, 65.0, 41.0, 40.0, 16.0, 21.0, 26.0, 20.0, 12.0, 12.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.307861328125, -0.2989768981933594, -0.29009246826171875, -0.2812080383300781, -0.2723236083984375, -0.2634391784667969, -0.25455474853515625, -0.24567031860351562, -0.236785888671875, -0.22790145874023438, -0.21901702880859375, -0.21013259887695312, -0.2012481689453125, -0.19236373901367188, -0.18347930908203125, -0.17459487915039062, -0.16571044921875, -0.15682601928710938, -0.14794158935546875, -0.13905715942382812, -0.1301727294921875, -0.12128829956054688, -0.11240386962890625, -0.10351943969726562, -0.094635009765625, -0.08575057983398438, -0.07686614990234375, -0.06798171997070312, -0.0590972900390625, -0.050212860107421875, -0.04132843017578125, -0.032444000244140625, -0.0235595703125, -0.014675140380859375, -0.00579071044921875, 0.003093719482421875, 0.0119781494140625, 0.020862579345703125, 0.02974700927734375, 0.038631439208984375, 0.047515869140625, 0.056400299072265625, 0.06528472900390625, 0.07416915893554688, 0.0830535888671875, 0.09193801879882812, 0.10082244873046875, 0.10970687866210938, 0.11859130859375, 0.12747573852539062, 0.13636016845703125, 0.14524459838867188, 0.1541290283203125, 0.16301345825195312, 0.17189788818359375, 0.18078231811523438, 0.189666748046875, 0.19855117797851562, 0.20743560791015625, 0.21632003784179688, 0.2252044677734375, 0.23408889770507812, 0.24297332763671875, 0.2518577575683594, 0.2607421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 9.0, 3.0, 11.0, 3.0, 17.0, 20.0, 34.0, 39.0, 63.0, 94.0, 134.0, 223.0, 422.0, 854.0, 1890.0, 4965.0, 16378.0, 77947.0, 573480.0, 310119.0, 44370.0, 11010.0, 3480.0, 1433.0, 667.0, 327.0, 192.0, 115.0, 73.0, 50.0, 35.0, 26.0, 15.0, 18.0, 15.0, 5.0, 5.0, 1.0, 3.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.491943359375, -0.4742698669433594, -0.45659637451171875, -0.4389228820800781, -0.4212493896484375, -0.4035758972167969, -0.38590240478515625, -0.3682289123535156, -0.350555419921875, -0.3328819274902344, -0.31520843505859375, -0.2975349426269531, -0.2798614501953125, -0.2621879577636719, -0.24451446533203125, -0.22684097290039062, -0.20916748046875, -0.19149398803710938, -0.17382049560546875, -0.15614700317382812, -0.1384735107421875, -0.12080001831054688, -0.10312652587890625, -0.08545303344726562, -0.067779541015625, -0.050106048583984375, -0.03243255615234375, -0.014759063720703125, 0.0029144287109375, 0.020587921142578125, 0.03826141357421875, 0.055934906005859375, 0.0736083984375, 0.09128189086914062, 0.10895538330078125, 0.12662887573242188, 0.1443023681640625, 0.16197586059570312, 0.17964935302734375, 0.19732284545898438, 0.214996337890625, 0.23266983032226562, 0.25034332275390625, 0.2680168151855469, 0.2856903076171875, 0.3033638000488281, 0.32103729248046875, 0.3387107849121094, 0.35638427734375, 0.3740577697753906, 0.39173126220703125, 0.4094047546386719, 0.4270782470703125, 0.4447517395019531, 0.46242523193359375, 0.4800987243652344, 0.497772216796875, 0.5154457092285156, 0.5331192016601562, 0.5507926940917969, 0.5684661865234375, 0.5861396789550781, 0.6038131713867188, 0.6214866638183594, 0.63916015625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 9.0, 9.0, 13.0, 13.0, 23.0, 27.0, 26.0, 38.0, 38.0, 41.0, 40.0, 56.0, 44.0, 58.0, 67.0, 60.0, 42.0, 60.0, 48.0, 52.0, 36.0, 43.0, 20.0, 30.0, 33.0, 24.0, 13.0, 13.0, 7.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.662109375, -0.634796142578125, -0.60748291015625, -0.580169677734375, -0.5528564453125, -0.525543212890625, -0.49822998046875, -0.470916748046875, -0.443603515625, -0.416290283203125, -0.38897705078125, -0.361663818359375, -0.3343505859375, -0.307037353515625, -0.27972412109375, -0.252410888671875, -0.22509765625, -0.197784423828125, -0.17047119140625, -0.143157958984375, -0.1158447265625, -0.088531494140625, -0.06121826171875, -0.033905029296875, -0.006591796875, 0.020721435546875, 0.04803466796875, 0.075347900390625, 0.1026611328125, 0.129974365234375, 0.15728759765625, 0.184600830078125, 0.2119140625, 0.239227294921875, 0.26654052734375, 0.293853759765625, 0.3211669921875, 0.348480224609375, 0.37579345703125, 0.403106689453125, 0.430419921875, 0.457733154296875, 0.48504638671875, 0.512359619140625, 0.5396728515625, 0.566986083984375, 0.59429931640625, 0.621612548828125, 0.64892578125, 0.676239013671875, 0.70355224609375, 0.730865478515625, 0.7581787109375, 0.785491943359375, 0.81280517578125, 0.840118408203125, 0.867431640625, 0.894744873046875, 0.92205810546875, 0.949371337890625, 0.9766845703125, 1.003997802734375, 1.03131103515625, 1.058624267578125, 1.0859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 1.0, 7.0, 6.0, 9.0, 11.0, 17.0, 20.0, 28.0, 31.0, 51.0, 79.0, 126.0, 234.0, 434.0, 757.0, 1763.0, 4769.0, 16224.0, 78688.0, 558484.0, 322939.0, 46316.0, 10959.0, 3538.0, 1462.0, 674.0, 366.0, 184.0, 121.0, 78.0, 52.0, 41.0, 27.0, 17.0, 11.0, 9.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1673583984375, -0.16112518310546875, -0.1548919677734375, -0.14865875244140625, -0.142425537109375, -0.13619232177734375, -0.1299591064453125, -0.12372589111328125, -0.11749267578125, -0.11125946044921875, -0.1050262451171875, -0.09879302978515625, -0.092559814453125, -0.08632659912109375, -0.0800933837890625, -0.07386016845703125, -0.067626953125, -0.06139373779296875, -0.0551605224609375, -0.04892730712890625, -0.042694091796875, -0.03646087646484375, -0.0302276611328125, -0.02399444580078125, -0.01776123046875, -0.01152801513671875, -0.0052947998046875, 0.00093841552734375, 0.007171630859375, 0.01340484619140625, 0.0196380615234375, 0.02587127685546875, 0.0321044921875, 0.03833770751953125, 0.0445709228515625, 0.05080413818359375, 0.057037353515625, 0.06327056884765625, 0.0695037841796875, 0.07573699951171875, 0.08197021484375, 0.08820343017578125, 0.0944366455078125, 0.10066986083984375, 0.106903076171875, 0.11313629150390625, 0.1193695068359375, 0.12560272216796875, 0.1318359375, 0.13806915283203125, 0.1443023681640625, 0.15053558349609375, 0.156768798828125, 0.16300201416015625, 0.1692352294921875, 0.17546844482421875, 0.18170166015625, 0.18793487548828125, 0.1941680908203125, 0.20040130615234375, 0.206634521484375, 0.21286773681640625, 0.2191009521484375, 0.22533416748046875, 0.2315673828125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 13.0, 2.0, 5.0, 8.0, 3.0, 6.0, 13.0, 10.0, 18.0, 29.0, 32.0, 38.0, 58.0, 66.0, 81.0, 82.0, 94.0, 92.0, 70.0, 57.0, 54.0, 28.0, 25.0, 31.0, 29.0, 10.0, 10.0, 8.0, 5.0, 8.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-4.6193599700927734e-05, -4.501082003116608e-05, -4.382804036140442e-05, -4.264526069164276e-05, -4.1462481021881104e-05, -4.0279701352119446e-05, -3.909692168235779e-05, -3.791414201259613e-05, -3.673136234283447e-05, -3.5548582673072815e-05, -3.436580300331116e-05, -3.31830233335495e-05, -3.200024366378784e-05, -3.0817463994026184e-05, -2.9634684324264526e-05, -2.845190465450287e-05, -2.726912498474121e-05, -2.6086345314979553e-05, -2.4903565645217896e-05, -2.3720785975456238e-05, -2.253800630569458e-05, -2.1355226635932922e-05, -2.0172446966171265e-05, -1.8989667296409607e-05, -1.780688762664795e-05, -1.662410795688629e-05, -1.5441328287124634e-05, -1.4258548617362976e-05, -1.3075768947601318e-05, -1.189298927783966e-05, -1.0710209608078003e-05, -9.527429938316345e-06, -8.344650268554688e-06, -7.16187059879303e-06, -5.979090929031372e-06, -4.796311259269714e-06, -3.6135315895080566e-06, -2.430751919746399e-06, -1.2479722499847412e-06, -6.51925802230835e-08, 1.1175870895385742e-06, 2.300366759300232e-06, 3.4831464290618896e-06, 4.665926098823547e-06, 5.848705768585205e-06, 7.031485438346863e-06, 8.21426510810852e-06, 9.397044777870178e-06, 1.0579824447631836e-05, 1.1762604117393494e-05, 1.2945383787155151e-05, 1.4128163456916809e-05, 1.5310943126678467e-05, 1.6493722796440125e-05, 1.7676502466201782e-05, 1.885928213596344e-05, 2.0042061805725098e-05, 2.1224841475486755e-05, 2.2407621145248413e-05, 2.359040081501007e-05, 2.477318048477173e-05, 2.5955960154533386e-05, 2.7138739824295044e-05, 2.83215194940567e-05, 2.950429916381836e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 5.0, 7.0, 5.0, 7.0, 14.0, 21.0, 31.0, 43.0, 71.0, 91.0, 161.0, 271.0, 483.0, 905.0, 1818.0, 4266.0, 11965.0, 46413.0, 272185.0, 569473.0, 105691.0, 22309.0, 6855.0, 2630.0, 1235.0, 655.0, 364.0, 212.0, 121.0, 81.0, 66.0, 32.0, 23.0, 13.0, 13.0, 9.0, 5.0, 5.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18017578125, -0.17401504516601562, -0.16785430908203125, -0.16169357299804688, -0.1555328369140625, -0.14937210083007812, -0.14321136474609375, -0.13705062866210938, -0.130889892578125, -0.12472915649414062, -0.11856842041015625, -0.11240768432617188, -0.1062469482421875, -0.10008621215820312, -0.09392547607421875, -0.08776473999023438, -0.08160400390625, -0.07544326782226562, -0.06928253173828125, -0.06312179565429688, -0.0569610595703125, -0.050800323486328125, -0.04463958740234375, -0.038478851318359375, -0.032318115234375, -0.026157379150390625, -0.01999664306640625, -0.013835906982421875, -0.0076751708984375, -0.001514434814453125, 0.00464630126953125, 0.010807037353515625, 0.0169677734375, 0.023128509521484375, 0.02928924560546875, 0.035449981689453125, 0.0416107177734375, 0.047771453857421875, 0.05393218994140625, 0.060092926025390625, 0.066253662109375, 0.07241439819335938, 0.07857513427734375, 0.08473587036132812, 0.0908966064453125, 0.09705734252929688, 0.10321807861328125, 0.10937881469726562, 0.11553955078125, 0.12170028686523438, 0.12786102294921875, 0.13402175903320312, 0.1401824951171875, 0.14634323120117188, 0.15250396728515625, 0.15866470336914062, 0.164825439453125, 0.17098617553710938, 0.17714691162109375, 0.18330764770507812, 0.1894683837890625, 0.19562911987304688, 0.20178985595703125, 0.20795059204101562, 0.214111328125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 4.0, 9.0, 5.0, 9.0, 11.0, 20.0, 18.0, 23.0, 36.0, 42.0, 57.0, 69.0, 82.0, 86.0, 82.0, 86.0, 91.0, 50.0, 47.0, 45.0, 46.0, 16.0, 18.0, 16.0, 8.0, 7.0, 6.0, 6.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2374267578125, -0.23070144653320312, -0.22397613525390625, -0.21725082397460938, -0.2105255126953125, -0.20380020141601562, -0.19707489013671875, -0.19034957885742188, -0.183624267578125, -0.17689895629882812, -0.17017364501953125, -0.16344833374023438, -0.1567230224609375, -0.14999771118164062, -0.14327239990234375, -0.13654708862304688, -0.12982177734375, -0.12309646606445312, -0.11637115478515625, -0.10964584350585938, -0.1029205322265625, -0.09619522094726562, -0.08946990966796875, -0.08274459838867188, -0.076019287109375, -0.06929397583007812, -0.06256866455078125, -0.055843353271484375, -0.0491180419921875, -0.042392730712890625, -0.03566741943359375, -0.028942108154296875, -0.022216796875, -0.015491485595703125, -0.00876617431640625, -0.002040863037109375, 0.0046844482421875, 0.011409759521484375, 0.01813507080078125, 0.024860382080078125, 0.031585693359375, 0.038311004638671875, 0.04503631591796875, 0.051761627197265625, 0.0584869384765625, 0.06521224975585938, 0.07193756103515625, 0.07866287231445312, 0.08538818359375, 0.09211349487304688, 0.09883880615234375, 0.10556411743164062, 0.1122894287109375, 0.11901473999023438, 0.12574005126953125, 0.13246536254882812, 0.139190673828125, 0.14591598510742188, 0.15264129638671875, 0.15936660766601562, 0.1660919189453125, 0.17281723022460938, 0.17954254150390625, 0.18626785278320312, 0.1929931640625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 7.0, 11.0, 10.0, 10.0, 19.0, 29.0, 47.0, 73.0, 112.0, 130.0, 133.0, 128.0, 97.0, 68.0, 48.0, 31.0, 16.0, 7.0, 12.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.7198100090026855, -4.608731746673584, -4.497653484344482, -4.386575222015381, -4.275496959686279, -4.1644182205200195, -4.053339958190918, -3.9422619342803955, -3.831183433532715, -3.7201051712036133, -3.6090269088745117, -3.49794864654541, -3.3868701457977295, -3.275791883468628, -3.1647136211395264, -3.053635358810425, -2.9425570964813232, -2.8314788341522217, -2.72040057182312, -2.6093220710754395, -2.498243808746338, -2.3871655464172363, -2.2760872840881348, -2.165009021759033, -2.0539307594299316, -1.94285249710083, -1.831774115562439, -1.7206958532333374, -1.6096174716949463, -1.4985392093658447, -1.3874609470367432, -1.2763826847076416, -1.1653039455413818, -1.0542256832122803, -0.9431473016738892, -0.8320690393447876, -0.7209907174110413, -0.6099123954772949, -0.49883413314819336, -0.387755811214447, -0.2766774892807007, -0.16559918224811554, -0.054520875215530396, 0.056557416915893555, 0.1676357388496399, 0.27871406078338623, 0.3897923231124878, 0.5008706450462341, 0.6119489669799805, 0.7230272889137268, 0.8341056108474731, 0.9451838731765747, 1.0562622547149658, 1.1673405170440674, 1.278418779373169, 1.3894970417022705, 1.5005754232406616, 1.6116536855697632, 1.7227320671081543, 1.8338103294372559, 1.9448885917663574, 2.055966854095459, 2.1670451164245605, 2.278123617172241, 2.3892018795013428]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 2.0, 9.0, 6.0, 10.0, 17.0, 21.0, 16.0, 18.0, 18.0, 20.0, 38.0, 42.0, 41.0, 32.0, 42.0, 44.0, 60.0, 43.0, 55.0, 34.0, 41.0, 51.0, 36.0, 45.0, 43.0, 28.0, 28.0, 26.0, 20.0, 27.0, 16.0, 19.0, 9.0, 13.0, 6.0, 6.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.1822519302368164, -3.0799543857574463, -2.977656841278076, -2.875359296798706, -2.773061752319336, -2.670764446258545, -2.568466901779175, -2.4661693572998047, -2.3638718128204346, -2.2615742683410645, -2.1592767238616943, -2.056979179382324, -1.9546817541122437, -1.8523842096328735, -1.750086784362793, -1.6477892398834229, -1.5454916954040527, -1.4431941509246826, -1.3408966064453125, -1.238599181175232, -1.1363016366958618, -1.0340040922164917, -0.9317066073417664, -0.829409122467041, -0.7271115779876709, -0.6248140335083008, -0.5225165486335754, -0.4202190339565277, -0.31792151927948, -0.21562397480010986, -0.11332648992538452, -0.01102900505065918, 0.09126853942871094, 0.19356605410575867, 0.2958635687828064, 0.3981610834598541, 0.5004585981369019, 0.602756142616272, 0.7050536274909973, 0.8073511123657227, 0.9096486568450928, 1.011946201324463, 1.114243745803833, 1.2165411710739136, 1.3188387155532837, 1.4211362600326538, 1.5234336853027344, 1.6257312297821045, 1.7280287742614746, 1.8303263187408447, 1.9326238632202148, 2.034921407699585, 2.137218952178955, 2.239516258239746, 2.341813802719116, 2.4441113471984863, 2.5464088916778564, 2.6487064361572266, 2.7510039806365967, 2.853301525115967, 2.955598831176758, 3.057896614074707, 3.160193920135498, 3.262491464614868, 3.3647890090942383]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 5.0, 16.0, 12.0, 14.0, 22.0, 29.0, 37.0, 94.0, 143.0, 232.0, 656.0, 4187857.0, 4163.0, 458.0, 204.0, 103.0, 75.0, 55.0, 34.0, 24.0, 18.0, 3.0, 7.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8203125, -8.5596923828125, -8.299072265625, -8.0384521484375, -7.77783203125, -7.5172119140625, -7.256591796875, -6.9959716796875, -6.7353515625, -6.4747314453125, -6.214111328125, -5.9534912109375, -5.69287109375, -5.4322509765625, -5.171630859375, -4.9110107421875, -4.650390625, -4.3897705078125, -4.129150390625, -3.8685302734375, -3.60791015625, -3.3472900390625, -3.086669921875, -2.8260498046875, -2.5654296875, -2.3048095703125, -2.044189453125, -1.7835693359375, -1.52294921875, -1.2623291015625, -1.001708984375, -0.7410888671875, -0.48046875, -0.2198486328125, 0.040771484375, 0.3013916015625, 0.56201171875, 0.8226318359375, 1.083251953125, 1.3438720703125, 1.6044921875, 1.8651123046875, 2.125732421875, 2.3863525390625, 2.64697265625, 2.9075927734375, 3.168212890625, 3.4288330078125, 3.689453125, 3.9500732421875, 4.210693359375, 4.4713134765625, 4.73193359375, 4.9925537109375, 5.253173828125, 5.5137939453125, 5.7744140625, 6.0350341796875, 6.295654296875, 6.5562744140625, 6.81689453125, 7.0775146484375, 7.338134765625, 7.5987548828125, 7.859375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 1.0, 8.0, 11.0, 10.0, 20.0, 24.0, 31.0, 38.0, 44.0, 41.0, 66.0, 65.0, 54.0, 95.0, 71.0, 71.0, 67.0, 50.0, 65.0, 38.0, 33.0, 28.0, 23.0, 14.0, 10.0, 10.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.31005859375, -0.3011207580566406, -0.29218292236328125, -0.2832450866699219, -0.2743072509765625, -0.2653694152832031, -0.25643157958984375, -0.24749374389648438, -0.238555908203125, -0.22961807250976562, -0.22068023681640625, -0.21174240112304688, -0.2028045654296875, -0.19386672973632812, -0.18492889404296875, -0.17599105834960938, -0.16705322265625, -0.15811538696289062, -0.14917755126953125, -0.14023971557617188, -0.1313018798828125, -0.12236404418945312, -0.11342620849609375, -0.10448837280273438, -0.095550537109375, -0.08661270141601562, -0.07767486572265625, -0.06873703002929688, -0.0597991943359375, -0.050861358642578125, -0.04192352294921875, -0.032985687255859375, -0.0240478515625, -0.015110015869140625, -0.00617218017578125, 0.002765655517578125, 0.0117034912109375, 0.020641326904296875, 0.02957916259765625, 0.038516998291015625, 0.047454833984375, 0.056392669677734375, 0.06533050537109375, 0.07426834106445312, 0.0832061767578125, 0.09214401245117188, 0.10108184814453125, 0.11001968383789062, 0.11895751953125, 0.12789535522460938, 0.13683319091796875, 0.14577102661132812, 0.1547088623046875, 0.16364669799804688, 0.17258453369140625, 0.18152236938476562, 0.190460205078125, 0.19939804077148438, 0.20833587646484375, 0.21727371215820312, 0.2262115478515625, 0.23514938354492188, 0.24408721923828125, 0.2530250549316406, 0.261962890625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 8.0, 4.0, 6.0, 16.0, 16.0, 15.0, 34.0, 28.0, 60.0, 76.0, 107.0, 160.0, 239.0, 337.0, 490.0, 803.0, 2036.0, 30649.0, 4153439.0, 3016.0, 968.0, 584.0, 387.0, 246.0, 161.0, 105.0, 81.0, 60.0, 41.0, 29.0, 26.0, 14.0, 14.0, 11.0, 2.0, 9.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.814453125, -2.736541748046875, -2.65863037109375, -2.580718994140625, -2.5028076171875, -2.424896240234375, -2.34698486328125, -2.269073486328125, -2.191162109375, -2.113250732421875, -2.03533935546875, -1.957427978515625, -1.8795166015625, -1.801605224609375, -1.72369384765625, -1.645782470703125, -1.56787109375, -1.489959716796875, -1.41204833984375, -1.334136962890625, -1.2562255859375, -1.178314208984375, -1.10040283203125, -1.022491455078125, -0.944580078125, -0.866668701171875, -0.78875732421875, -0.710845947265625, -0.6329345703125, -0.555023193359375, -0.47711181640625, -0.399200439453125, -0.3212890625, -0.243377685546875, -0.16546630859375, -0.087554931640625, -0.0096435546875, 0.068267822265625, 0.14617919921875, 0.224090576171875, 0.302001953125, 0.379913330078125, 0.45782470703125, 0.535736083984375, 0.6136474609375, 0.691558837890625, 0.76947021484375, 0.847381591796875, 0.92529296875, 1.003204345703125, 1.08111572265625, 1.159027099609375, 1.2369384765625, 1.314849853515625, 1.39276123046875, 1.470672607421875, 1.548583984375, 1.626495361328125, 1.70440673828125, 1.782318115234375, 1.8602294921875, 1.938140869140625, 2.01605224609375, 2.093963623046875, 2.171875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 12.0, 17.0, 3940.0, 88.0, 10.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.459228515625, -0.4427452087402344, -0.42626190185546875, -0.4097785949707031, -0.3932952880859375, -0.3768119812011719, -0.36032867431640625, -0.3438453674316406, -0.327362060546875, -0.3108787536621094, -0.29439544677734375, -0.2779121398925781, -0.2614288330078125, -0.24494552612304688, -0.22846221923828125, -0.21197891235351562, -0.19549560546875, -0.17901229858398438, -0.16252899169921875, -0.14604568481445312, -0.1295623779296875, -0.11307907104492188, -0.09659576416015625, -0.08011245727539062, -0.063629150390625, -0.047145843505859375, -0.03066253662109375, -0.014179229736328125, 0.0023040771484375, 0.018787384033203125, 0.03527069091796875, 0.051753997802734375, 0.0682373046875, 0.08472061157226562, 0.10120391845703125, 0.11768722534179688, 0.1341705322265625, 0.15065383911132812, 0.16713714599609375, 0.18362045288085938, 0.200103759765625, 0.21658706665039062, 0.23307037353515625, 0.24955368041992188, 0.2660369873046875, 0.2825202941894531, 0.29900360107421875, 0.3154869079589844, 0.33197021484375, 0.3484535217285156, 0.36493682861328125, 0.3814201354980469, 0.3979034423828125, 0.4143867492675781, 0.43087005615234375, 0.4473533630371094, 0.463836669921875, 0.4803199768066406, 0.49680328369140625, 0.5132865905761719, 0.5297698974609375, 0.5462532043457031, 0.5627365112304688, 0.5792198181152344, 0.595703125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 8.0, 13.0, 11.0, 13.0, 15.0, 34.0, 38.0, 79.0, 123.0, 190.0, 155.0, 111.0, 63.0, 31.0, 32.0, 21.0, 15.0, 14.0, 12.0, 4.0, 3.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9294941425323486, -0.9010617733001709, -0.8726294040679932, -0.8441969752311707, -0.8157646059989929, -0.7873322367668152, -0.7588998675346375, -0.7304674386978149, -0.7020350694656372, -0.6736027002334595, -0.6451703310012817, -0.6167379021644592, -0.5883055329322815, -0.5598731637001038, -0.531440794467926, -0.5030083656311035, -0.47457602620124817, -0.44614365696907043, -0.4177112579345703, -0.3892788887023926, -0.36084648966789246, -0.3324141204357147, -0.3039817214012146, -0.27554935216903687, -0.24711696803569794, -0.218684583902359, -0.19025219976902008, -0.16181981563568115, -0.13338744640350342, -0.10495506227016449, -0.07652267813682556, -0.04809029400348663, -0.019657909870147705, 0.008774472400546074, 0.03720685467123985, 0.06563923507928848, 0.09407161921262741, 0.12250399589538574, 0.15093638002872467, 0.1793687641620636, 0.20780114829540253, 0.23623353242874146, 0.2646659016609192, 0.2930983006954193, 0.32153066992759705, 0.34996306896209717, 0.3783954381942749, 0.40682780742645264, 0.43526020646095276, 0.4636925756931305, 0.4921249747276306, 0.5205573439598083, 0.5489897131919861, 0.5774221420288086, 0.6058545112609863, 0.6342868804931641, 0.6627192497253418, 0.6911516189575195, 0.7195839881896973, 0.7480164170265198, 0.7764487862586975, 0.8048811554908752, 0.833313524723053, 0.8617459535598755, 0.8901783227920532]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 11.0, 12.0, 15.0, 12.0, 21.0, 24.0, 24.0, 32.0, 41.0, 30.0, 47.0, 35.0, 41.0, 42.0, 50.0, 64.0, 47.0, 43.0, 65.0, 48.0, 39.0, 35.0, 29.0, 32.0, 23.0, 26.0, 24.0, 17.0, 11.0, 12.0, 8.0, 9.0, 3.0, 4.0, 6.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5416792631149292, -0.5253645181655884, -0.5090497732162476, -0.49273499846458435, -0.47642025351524353, -0.4601054787635803, -0.4437907338142395, -0.4274759888648987, -0.41116124391555786, -0.39484649896621704, -0.37853172421455383, -0.362216979265213, -0.3459022343158722, -0.329587459564209, -0.31327271461486816, -0.29695796966552734, -0.28064319491386414, -0.2643284499645233, -0.2480136901140213, -0.2316989302635193, -0.21538418531417847, -0.19906942546367645, -0.18275466561317444, -0.16643992066383362, -0.1501251608133316, -0.1338104009628296, -0.11749565601348877, -0.10118089616298676, -0.08486614376306534, -0.06855139136314392, -0.05223663151264191, -0.03592187911272049, -0.019607126712799072, -0.003292372450232506, 0.01302238181233406, 0.029337137937545776, 0.045651890337467194, 0.06196664273738861, 0.07828140258789062, 0.09459615498781204, 0.11091090738773346, 0.12722566723823547, 0.1435404121875763, 0.1598551720380783, 0.17616993188858032, 0.19248467683792114, 0.20879943668842316, 0.22511419653892517, 0.241428941488266, 0.2577436864376068, 0.27405846118927, 0.29037320613861084, 0.30668795108795166, 0.3230026960372925, 0.3393174707889557, 0.3556322157382965, 0.3719469904899597, 0.38826173543930054, 0.40457651019096375, 0.42089125514030457, 0.4372060000896454, 0.4535207748413086, 0.4698355197906494, 0.48615026473999023, 0.502465009689331]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 7.0, 7.0, 15.0, 12.0, 25.0, 38.0, 53.0, 84.0, 143.0, 236.0, 360.0, 727.0, 1124.0, 2335.0, 5030.0, 15738.0, 124055.0, 777386.0, 97649.0, 13963.0, 4780.0, 2142.0, 1093.0, 597.0, 361.0, 202.0, 120.0, 105.0, 46.0, 40.0, 16.0, 15.0, 11.0, 14.0, 3.0, 5.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.86181640625, -0.8335189819335938, -0.8052215576171875, -0.7769241333007812, -0.748626708984375, -0.7203292846679688, -0.6920318603515625, -0.6637344360351562, -0.63543701171875, -0.6071395874023438, -0.5788421630859375, -0.5505447387695312, -0.522247314453125, -0.49394989013671875, -0.4656524658203125, -0.43735504150390625, -0.4090576171875, -0.38076019287109375, -0.3524627685546875, -0.32416534423828125, -0.295867919921875, -0.26757049560546875, -0.2392730712890625, -0.21097564697265625, -0.18267822265625, -0.15438079833984375, -0.1260833740234375, -0.09778594970703125, -0.069488525390625, -0.04119110107421875, -0.0128936767578125, 0.01540374755859375, 0.043701171875, 0.07199859619140625, 0.1002960205078125, 0.12859344482421875, 0.156890869140625, 0.18518829345703125, 0.2134857177734375, 0.24178314208984375, 0.27008056640625, 0.29837799072265625, 0.3266754150390625, 0.35497283935546875, 0.383270263671875, 0.41156768798828125, 0.4398651123046875, 0.46816253662109375, 0.4964599609375, 0.5247573852539062, 0.5530548095703125, 0.5813522338867188, 0.609649658203125, 0.6379470825195312, 0.6662445068359375, 0.6945419311523438, 0.72283935546875, 0.7511367797851562, 0.7794342041015625, 0.8077316284179688, 0.836029052734375, 0.8643264770507812, 0.8926239013671875, 0.9209213256835938, 0.94921875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 7.0, 9.0, 16.0, 21.0, 26.0, 28.0, 37.0, 47.0, 32.0, 65.0, 60.0, 63.0, 57.0, 67.0, 75.0, 64.0, 49.0, 49.0, 49.0, 43.0, 28.0, 27.0, 29.0, 11.0, 12.0, 7.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.303466796875, -0.29479217529296875, -0.2861175537109375, -0.27744293212890625, -0.268768310546875, -0.26009368896484375, -0.2514190673828125, -0.24274444580078125, -0.23406982421875, -0.22539520263671875, -0.2167205810546875, -0.20804595947265625, -0.199371337890625, -0.19069671630859375, -0.1820220947265625, -0.17334747314453125, -0.1646728515625, -0.15599822998046875, -0.1473236083984375, -0.13864898681640625, -0.129974365234375, -0.12129974365234375, -0.1126251220703125, -0.10395050048828125, -0.09527587890625, -0.08660125732421875, -0.0779266357421875, -0.06925201416015625, -0.060577392578125, -0.05190277099609375, -0.0432281494140625, -0.03455352783203125, -0.02587890625, -0.01720428466796875, -0.0085296630859375, 0.00014495849609375, 0.008819580078125, 0.01749420166015625, 0.0261688232421875, 0.03484344482421875, 0.04351806640625, 0.05219268798828125, 0.0608673095703125, 0.06954193115234375, 0.078216552734375, 0.08689117431640625, 0.0955657958984375, 0.10424041748046875, 0.1129150390625, 0.12158966064453125, 0.1302642822265625, 0.13893890380859375, 0.147613525390625, 0.15628814697265625, 0.1649627685546875, 0.17363739013671875, 0.18231201171875, 0.19098663330078125, 0.1996612548828125, 0.20833587646484375, 0.217010498046875, 0.22568511962890625, 0.2343597412109375, 0.24303436279296875, 0.251708984375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 2.0, 6.0, 9.0, 14.0, 30.0, 34.0, 35.0, 58.0, 69.0, 163.0, 298.0, 475.0, 975.0, 2329.0, 6839.0, 34427.0, 477630.0, 479825.0, 34053.0, 6821.0, 2244.0, 998.0, 490.0, 270.0, 167.0, 93.0, 63.0, 44.0, 24.0, 16.0, 8.0, 20.0, 4.0, 7.0, 4.0, 3.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63916015625, -0.6191864013671875, -0.599212646484375, -0.5792388916015625, -0.55926513671875, -0.5392913818359375, -0.519317626953125, -0.4993438720703125, -0.4793701171875, -0.4593963623046875, -0.439422607421875, -0.4194488525390625, -0.39947509765625, -0.3795013427734375, -0.359527587890625, -0.3395538330078125, -0.319580078125, -0.2996063232421875, -0.279632568359375, -0.2596588134765625, -0.23968505859375, -0.2197113037109375, -0.199737548828125, -0.1797637939453125, -0.1597900390625, -0.1398162841796875, -0.119842529296875, -0.0998687744140625, -0.07989501953125, -0.0599212646484375, -0.039947509765625, -0.0199737548828125, 0.0, 0.0199737548828125, 0.039947509765625, 0.0599212646484375, 0.07989501953125, 0.0998687744140625, 0.119842529296875, 0.1398162841796875, 0.1597900390625, 0.1797637939453125, 0.199737548828125, 0.2197113037109375, 0.23968505859375, 0.2596588134765625, 0.279632568359375, 0.2996063232421875, 0.319580078125, 0.3395538330078125, 0.359527587890625, 0.3795013427734375, 0.39947509765625, 0.4194488525390625, 0.439422607421875, 0.4593963623046875, 0.4793701171875, 0.4993438720703125, 0.519317626953125, 0.5392913818359375, 0.55926513671875, 0.5792388916015625, 0.599212646484375, 0.6191864013671875, 0.63916015625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 9.0, 11.0, 12.0, 17.0, 17.0, 18.0, 26.0, 32.0, 35.0, 30.0, 34.0, 34.0, 35.0, 47.0, 40.0, 45.0, 48.0, 51.0, 60.0, 44.0, 36.0, 29.0, 33.0, 31.0, 30.0, 28.0, 34.0, 24.0, 22.0, 20.0, 15.0, 14.0, 10.0, 8.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83642578125, -0.8123626708984375, -0.788299560546875, -0.7642364501953125, -0.74017333984375, -0.7161102294921875, -0.692047119140625, -0.6679840087890625, -0.6439208984375, -0.6198577880859375, -0.595794677734375, -0.5717315673828125, -0.54766845703125, -0.5236053466796875, -0.499542236328125, -0.4754791259765625, -0.451416015625, -0.4273529052734375, -0.403289794921875, -0.3792266845703125, -0.35516357421875, -0.3311004638671875, -0.307037353515625, -0.2829742431640625, -0.2589111328125, -0.2348480224609375, -0.210784912109375, -0.1867218017578125, -0.16265869140625, -0.1385955810546875, -0.114532470703125, -0.0904693603515625, -0.06640625, -0.0423431396484375, -0.018280029296875, 0.0057830810546875, 0.02984619140625, 0.0539093017578125, 0.077972412109375, 0.1020355224609375, 0.1260986328125, 0.1501617431640625, 0.174224853515625, 0.1982879638671875, 0.22235107421875, 0.2464141845703125, 0.270477294921875, 0.2945404052734375, 0.318603515625, 0.3426666259765625, 0.366729736328125, 0.3907928466796875, 0.41485595703125, 0.4389190673828125, 0.462982177734375, 0.4870452880859375, 0.5111083984375, 0.5351715087890625, 0.559234619140625, 0.5832977294921875, 0.60736083984375, 0.6314239501953125, 0.655487060546875, 0.6795501708984375, 0.70361328125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 4.0, 8.0, 9.0, 6.0, 8.0, 16.0, 31.0, 42.0, 110.0, 240.0, 528.0, 1741.0, 8147.0, 107670.0, 882273.0, 40842.0, 4893.0, 1193.0, 399.0, 165.0, 86.0, 54.0, 20.0, 11.0, 15.0, 12.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3017578125, -0.29111480712890625, -0.2804718017578125, -0.26982879638671875, -0.259185791015625, -0.24854278564453125, -0.2378997802734375, -0.22725677490234375, -0.21661376953125, -0.20597076416015625, -0.1953277587890625, -0.18468475341796875, -0.174041748046875, -0.16339874267578125, -0.1527557373046875, -0.14211273193359375, -0.1314697265625, -0.12082672119140625, -0.1101837158203125, -0.09954071044921875, -0.088897705078125, -0.07825469970703125, -0.0676116943359375, -0.05696868896484375, -0.04632568359375, -0.03568267822265625, -0.0250396728515625, -0.01439666748046875, -0.003753662109375, 0.00688934326171875, 0.0175323486328125, 0.02817535400390625, 0.038818359375, 0.04946136474609375, 0.0601043701171875, 0.07074737548828125, 0.081390380859375, 0.09203338623046875, 0.1026763916015625, 0.11331939697265625, 0.12396240234375, 0.13460540771484375, 0.1452484130859375, 0.15589141845703125, 0.166534423828125, 0.17717742919921875, 0.1878204345703125, 0.19846343994140625, 0.2091064453125, 0.21974945068359375, 0.2303924560546875, 0.24103546142578125, 0.251678466796875, 0.26232147216796875, 0.2729644775390625, 0.28360748291015625, 0.29425048828125, 0.30489349365234375, 0.3155364990234375, 0.32617950439453125, 0.336822509765625, 0.34746551513671875, 0.3581085205078125, 0.36875152587890625, 0.37939453125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 5.0, 8.0, 11.0, 9.0, 19.0, 27.0, 27.0, 41.0, 79.0, 89.0, 121.0, 133.0, 121.0, 82.0, 62.0, 31.0, 41.0, 22.0, 19.0, 14.0, 8.0, 4.0, 2.0, 4.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.398822784423828e-05, -4.2389146983623505e-05, -4.079006612300873e-05, -3.919098526239395e-05, -3.7591904401779175e-05, -3.59928235411644e-05, -3.439374268054962e-05, -3.2794661819934845e-05, -3.119558095932007e-05, -2.9596500098705292e-05, -2.7997419238090515e-05, -2.639833837747574e-05, -2.4799257516860962e-05, -2.3200176656246185e-05, -2.160109579563141e-05, -2.0002014935016632e-05, -1.8402934074401855e-05, -1.680385321378708e-05, -1.5204772353172302e-05, -1.3605691492557526e-05, -1.2006610631942749e-05, -1.0407529771327972e-05, -8.808448910713196e-06, -7.209368050098419e-06, -5.610287189483643e-06, -4.011206328868866e-06, -2.4121254682540894e-06, -8.130446076393127e-07, 7.860362529754639e-07, 2.3851171135902405e-06, 3.984197974205017e-06, 5.583278834819794e-06, 7.18235969543457e-06, 8.781440556049347e-06, 1.0380521416664124e-05, 1.19796022772789e-05, 1.3578683137893677e-05, 1.5177763998508453e-05, 1.677684485912323e-05, 1.8375925719738007e-05, 1.9975006580352783e-05, 2.157408744096756e-05, 2.3173168301582336e-05, 2.4772249162197113e-05, 2.637133002281189e-05, 2.7970410883426666e-05, 2.9569491744041443e-05, 3.116857260465622e-05, 3.2767653465270996e-05, 3.436673432588577e-05, 3.596581518650055e-05, 3.7564896047115326e-05, 3.91639769077301e-05, 4.076305776834488e-05, 4.2362138628959656e-05, 4.396121948957443e-05, 4.556030035018921e-05, 4.7159381210803986e-05, 4.875846207141876e-05, 5.035754293203354e-05, 5.1956623792648315e-05, 5.355570465326309e-05, 5.515478551387787e-05, 5.6753866374492645e-05, 5.835294723510742e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 8.0, 14.0, 25.0, 26.0, 49.0, 71.0, 152.0, 343.0, 901.0, 3333.0, 19528.0, 626234.0, 377821.0, 15650.0, 2937.0, 796.0, 335.0, 140.0, 71.0, 48.0, 22.0, 16.0, 14.0, 4.0, 4.0, 4.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.333251953125, -0.3204078674316406, -0.30756378173828125, -0.2947196960449219, -0.2818756103515625, -0.2690315246582031, -0.25618743896484375, -0.24334335327148438, -0.230499267578125, -0.21765518188476562, -0.20481109619140625, -0.19196701049804688, -0.1791229248046875, -0.16627883911132812, -0.15343475341796875, -0.14059066772460938, -0.12774658203125, -0.11490249633789062, -0.10205841064453125, -0.08921432495117188, -0.0763702392578125, -0.06352615356445312, -0.05068206787109375, -0.037837982177734375, -0.024993896484375, -0.012149810791015625, 0.00069427490234375, 0.013538360595703125, 0.0263824462890625, 0.039226531982421875, 0.05207061767578125, 0.06491470336914062, 0.0777587890625, 0.09060287475585938, 0.10344696044921875, 0.11629104614257812, 0.1291351318359375, 0.14197921752929688, 0.15482330322265625, 0.16766738891601562, 0.180511474609375, 0.19335556030273438, 0.20619964599609375, 0.21904373168945312, 0.2318878173828125, 0.24473190307617188, 0.25757598876953125, 0.2704200744628906, 0.28326416015625, 0.2961082458496094, 0.30895233154296875, 0.3217964172363281, 0.3346405029296875, 0.3474845886230469, 0.36032867431640625, 0.3731727600097656, 0.386016845703125, 0.3988609313964844, 0.41170501708984375, 0.4245491027832031, 0.4373931884765625, 0.4502372741699219, 0.46308135986328125, 0.4759254455566406, 0.48876953125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 7.0, 14.0, 15.0, 16.0, 23.0, 30.0, 65.0, 95.0, 112.0, 119.0, 118.0, 112.0, 88.0, 59.0, 31.0, 27.0, 23.0, 15.0, 11.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.23193359375, -0.223663330078125, -0.21539306640625, -0.207122802734375, -0.1988525390625, -0.190582275390625, -0.18231201171875, -0.174041748046875, -0.165771484375, -0.157501220703125, -0.14923095703125, -0.140960693359375, -0.1326904296875, -0.124420166015625, -0.11614990234375, -0.107879638671875, -0.099609375, -0.091339111328125, -0.08306884765625, -0.074798583984375, -0.0665283203125, -0.058258056640625, -0.04998779296875, -0.041717529296875, -0.033447265625, -0.025177001953125, -0.01690673828125, -0.008636474609375, -0.0003662109375, 0.007904052734375, 0.01617431640625, 0.024444580078125, 0.03271484375, 0.040985107421875, 0.04925537109375, 0.057525634765625, 0.0657958984375, 0.074066162109375, 0.08233642578125, 0.090606689453125, 0.098876953125, 0.107147216796875, 0.11541748046875, 0.123687744140625, 0.1319580078125, 0.140228271484375, 0.14849853515625, 0.156768798828125, 0.1650390625, 0.173309326171875, 0.18157958984375, 0.189849853515625, 0.1981201171875, 0.206390380859375, 0.21466064453125, 0.222930908203125, 0.231201171875, 0.239471435546875, 0.24774169921875, 0.256011962890625, 0.2642822265625, 0.272552490234375, 0.28082275390625, 0.289093017578125, 0.29736328125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 13.0, 16.0, 21.0, 54.0, 55.0, 77.0, 124.0, 130.0, 116.0, 108.0, 74.0, 56.0, 52.0, 36.0, 10.0, 10.0, 7.0, 4.0, 10.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4914488792419434, -3.399714708328247, -3.30798077583313, -3.2162466049194336, -3.1245126724243164, -3.03277850151062, -2.941044330596924, -2.8493103981018066, -2.7575762271881104, -2.665842056274414, -2.574108123779297, -2.4823739528656006, -2.3906397819519043, -2.298905849456787, -2.207171678543091, -2.1154375076293945, -2.0237035751342773, -1.9319695234298706, -1.8402354717254639, -1.7485013008117676, -1.6567672491073608, -1.565033197402954, -1.4732990264892578, -1.381564974784851, -1.2898309230804443, -1.1980968713760376, -1.1063628196716309, -1.0146286487579346, -0.9228945970535278, -0.8311605453491211, -0.7394264340400696, -0.6476923227310181, -0.5559585094451904, -0.4642244279384613, -0.3724903464317322, -0.28075626492500305, -0.18902218341827393, -0.0972881019115448, -0.005554020404815674, 0.08618009090423584, 0.17791414260864258, 0.2696482241153717, 0.36138230562210083, 0.45311638712882996, 0.5448504686355591, 0.6365845203399658, 0.7283186316490173, 0.8200527429580688, 0.9117867946624756, 1.0035208463668823, 1.095254898071289, 1.1869890689849854, 1.278723120689392, 1.3704571723937988, 1.4621913433074951, 1.5539253950119019, 1.6456594467163086, 1.7373934984207153, 1.829127550125122, 1.9208617210388184, 2.0125956535339355, 2.104329824447632, 2.196063995361328, 2.2877979278564453, 2.3795320987701416]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 3.0, 7.0, 7.0, 6.0, 5.0, 12.0, 13.0, 11.0, 18.0, 22.0, 26.0, 34.0, 50.0, 47.0, 52.0, 44.0, 59.0, 70.0, 59.0, 57.0, 61.0, 53.0, 35.0, 36.0, 31.0, 37.0, 32.0, 20.0, 20.0, 22.0, 14.0, 13.0, 7.0, 11.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9098610877990723, -2.780362367630005, -2.6508636474609375, -2.521364688873291, -2.3918659687042236, -2.2623672485351562, -2.132868528366089, -2.0033698081970215, -1.8738709688186646, -1.7443722486495972, -1.6148734092712402, -1.4853746891021729, -1.3558759689331055, -1.2263771295547485, -1.0968784093856812, -0.967379629611969, -0.8378808498382568, -0.7083820700645447, -0.5788832902908325, -0.44938457012176514, -0.319885790348053, -0.19038701057434082, -0.06088829040527344, 0.06861048936843872, 0.19810926914215088, 0.32760804891586304, 0.4571067988872528, 0.5866055488586426, 0.7161043286323547, 0.8456031084060669, 0.9751018285751343, 1.1046006679534912, 1.2340993881225586, 1.363598108291626, 1.493096947669983, 1.6225956678390503, 1.7520945072174072, 1.8815932273864746, 2.011091947555542, 2.1405906677246094, 2.270089626312256, 2.3995883464813232, 2.5290870666503906, 2.658586025238037, 2.7880847454071045, 2.917583465576172, 3.0470821857452393, 3.1765809059143066, 3.306079626083374, 3.4355783462524414, 3.565077066421509, 3.694575786590576, 3.8240747451782227, 3.95357346534729, 4.083072185516357, 4.212571144104004, 4.342069625854492, 4.471568584442139, 4.601067066192627, 4.730566024780273, 4.860064506530762, 4.989563465118408, 5.119062423706055, 5.248560905456543, 5.3780598640441895]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 12.0, 16.0, 14.0, 28.0, 41.0, 70.0, 82.0, 122.0, 366.0, 1524.0, 4188615.0, 2452.0, 465.0, 165.0, 97.0, 57.0, 40.0, 30.0, 26.0, 15.0, 8.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.47265625, -7.25018310546875, -7.0277099609375, -6.80523681640625, -6.582763671875, -6.36029052734375, -6.1378173828125, -5.91534423828125, -5.69287109375, -5.47039794921875, -5.2479248046875, -5.02545166015625, -4.802978515625, -4.58050537109375, -4.3580322265625, -4.13555908203125, -3.9130859375, -3.69061279296875, -3.4681396484375, -3.24566650390625, -3.023193359375, -2.80072021484375, -2.5782470703125, -2.35577392578125, -2.13330078125, -1.91082763671875, -1.6883544921875, -1.46588134765625, -1.243408203125, -1.02093505859375, -0.7984619140625, -0.57598876953125, -0.353515625, -0.13104248046875, 0.0914306640625, 0.31390380859375, 0.536376953125, 0.75885009765625, 0.9813232421875, 1.20379638671875, 1.42626953125, 1.64874267578125, 1.8712158203125, 2.09368896484375, 2.316162109375, 2.53863525390625, 2.7611083984375, 2.98358154296875, 3.2060546875, 3.42852783203125, 3.6510009765625, 3.87347412109375, 4.095947265625, 4.31842041015625, 4.5408935546875, 4.76336669921875, 4.98583984375, 5.20831298828125, 5.4307861328125, 5.65325927734375, 5.875732421875, 6.09820556640625, 6.3206787109375, 6.54315185546875, 6.765625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 11.0, 15.0, 11.0, 26.0, 26.0, 45.0, 55.0, 45.0, 84.0, 70.0, 69.0, 79.0, 93.0, 77.0, 56.0, 61.0, 37.0, 43.0, 31.0, 20.0, 12.0, 15.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.348876953125, -0.3389701843261719, -0.32906341552734375, -0.3191566467285156, -0.3092498779296875, -0.2993431091308594, -0.28943634033203125, -0.2795295715332031, -0.269622802734375, -0.2597160339355469, -0.24980926513671875, -0.23990249633789062, -0.2299957275390625, -0.22008895874023438, -0.21018218994140625, -0.20027542114257812, -0.19036865234375, -0.18046188354492188, -0.17055511474609375, -0.16064834594726562, -0.1507415771484375, -0.14083480834960938, -0.13092803955078125, -0.12102127075195312, -0.111114501953125, -0.10120773315429688, -0.09130096435546875, -0.08139419555664062, -0.0714874267578125, -0.061580657958984375, -0.05167388916015625, -0.041767120361328125, -0.0318603515625, -0.021953582763671875, -0.01204681396484375, -0.002140045166015625, 0.0077667236328125, 0.017673492431640625, 0.02758026123046875, 0.037487030029296875, 0.047393798828125, 0.057300567626953125, 0.06720733642578125, 0.07711410522460938, 0.0870208740234375, 0.09692764282226562, 0.10683441162109375, 0.11674118041992188, 0.12664794921875, 0.13655471801757812, 0.14646148681640625, 0.15636825561523438, 0.1662750244140625, 0.17618179321289062, 0.18608856201171875, 0.19599533081054688, 0.205902099609375, 0.21580886840820312, 0.22571563720703125, 0.23562240600585938, 0.2455291748046875, 0.2554359436035156, 0.26534271240234375, 0.2752494812011719, 0.28515625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 5.0, 3.0, 4.0, 8.0, 4.0, 7.0, 9.0, 10.0, 16.0, 19.0, 32.0, 48.0, 43.0, 71.0, 92.0, 132.0, 167.0, 261.0, 410.0, 716.0, 1273.0, 3110.0, 15251.0, 4143973.0, 21646.0, 3384.0, 1509.0, 724.0, 406.0, 275.0, 170.0, 119.0, 85.0, 58.0, 55.0, 41.0, 32.0, 29.0, 14.0, 19.0, 12.0, 11.0, 5.0, 7.0, 7.0, 0.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.2685546875, -1.22705078125, -1.185546875, -1.14404296875, -1.1025390625, -1.06103515625, -1.01953125, -0.97802734375, -0.9365234375, -0.89501953125, -0.853515625, -0.81201171875, -0.7705078125, -0.72900390625, -0.6875, -0.64599609375, -0.6044921875, -0.56298828125, -0.521484375, -0.47998046875, -0.4384765625, -0.39697265625, -0.35546875, -0.31396484375, -0.2724609375, -0.23095703125, -0.189453125, -0.14794921875, -0.1064453125, -0.06494140625, -0.0234375, 0.01806640625, 0.0595703125, 0.10107421875, 0.142578125, 0.18408203125, 0.2255859375, 0.26708984375, 0.30859375, 0.35009765625, 0.3916015625, 0.43310546875, 0.474609375, 0.51611328125, 0.5576171875, 0.59912109375, 0.640625, 0.68212890625, 0.7236328125, 0.76513671875, 0.806640625, 0.84814453125, 0.8896484375, 0.93115234375, 0.97265625, 1.01416015625, 1.0556640625, 1.09716796875, 1.138671875, 1.18017578125, 1.2216796875, 1.26318359375, 1.3046875, 1.34619140625, 1.3876953125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 14.0, 14.0, 68.0, 3707.0, 215.0, 25.0, 9.0, 6.0, 7.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.348388671875, -0.3308219909667969, -0.31325531005859375, -0.2956886291503906, -0.2781219482421875, -0.2605552673339844, -0.24298858642578125, -0.22542190551757812, -0.207855224609375, -0.19028854370117188, -0.17272186279296875, -0.15515518188476562, -0.1375885009765625, -0.12002182006835938, -0.10245513916015625, -0.08488845825195312, -0.06732177734375, -0.049755096435546875, -0.03218841552734375, -0.014621734619140625, 0.0029449462890625, 0.020511627197265625, 0.03807830810546875, 0.055644989013671875, 0.073211669921875, 0.09077835083007812, 0.10834503173828125, 0.12591171264648438, 0.1434783935546875, 0.16104507446289062, 0.17861175537109375, 0.19617843627929688, 0.2137451171875, 0.23131179809570312, 0.24887847900390625, 0.2664451599121094, 0.2840118408203125, 0.3015785217285156, 0.31914520263671875, 0.3367118835449219, 0.354278564453125, 0.3718452453613281, 0.38941192626953125, 0.4069786071777344, 0.4245452880859375, 0.4421119689941406, 0.45967864990234375, 0.4772453308105469, 0.49481201171875, 0.5123786926269531, 0.5299453735351562, 0.5475120544433594, 0.5650787353515625, 0.5826454162597656, 0.6002120971679688, 0.6177787780761719, 0.635345458984375, 0.6529121398925781, 0.6704788208007812, 0.6880455017089844, 0.7056121826171875, 0.7231788635253906, 0.7407455444335938, 0.7583122253417969, 0.77587890625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 7.0, 17.0, 36.0, 69.0, 152.0, 265.0, 229.0, 97.0, 46.0, 34.0, 20.0, 12.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0], "bins": [-3.4105446338653564, -3.3435423374176025, -3.2765402793884277, -3.209537982940674, -3.14253568649292, -3.075533390045166, -3.008531332015991, -2.9415290355682373, -2.8745269775390625, -2.8075246810913086, -2.740522623062134, -2.67352032661438, -2.606518030166626, -2.539515972137451, -2.4725136756896973, -2.4055113792419434, -2.3385090827941895, -2.2715067863464355, -2.2045047283172607, -2.137502431869507, -2.070500135421753, -2.003498077392578, -1.9364957809448242, -1.8694934844970703, -1.802491307258606, -1.7354891300201416, -1.6684868335723877, -1.6014846563339233, -1.534482479095459, -1.467480182647705, -1.4004780054092407, -1.3334758281707764, -1.2664732933044434, -1.199471116065979, -1.132468819618225, -1.0654666423797607, -0.9984644055366516, -0.9314621686935425, -0.8644599914550781, -0.797457754611969, -0.7304555773735046, -0.6634533405303955, -0.5964511632919312, -0.529448926448822, -0.4624466896057129, -0.39544445276260376, -0.328442245721817, -0.2614400386810303, -0.19443780183792114, -0.1274355798959732, -0.06043335795402527, 0.0065688639879226685, 0.0735710859298706, 0.14057332277297974, 0.20757552981376648, 0.2745777368545532, 0.34157997369766235, 0.4085822105407715, 0.4755844175815582, 0.542586624622345, 0.6095888614654541, 0.6765910983085632, 0.7435933351516724, 0.8105955123901367, 0.8775977492332458]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 7.0, 9.0, 10.0, 9.0, 14.0, 20.0, 12.0, 23.0, 30.0, 22.0, 39.0, 37.0, 34.0, 51.0, 50.0, 49.0, 49.0, 39.0, 52.0, 60.0, 52.0, 57.0, 54.0, 43.0, 28.0, 24.0, 19.0, 27.0, 18.0, 21.0, 14.0, 5.0, 8.0, 5.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8186982870101929, -0.7940117716789246, -0.769325315952301, -0.7446388006210327, -0.7199522852897644, -0.6952658295631409, -0.6705793142318726, -0.645892858505249, -0.6212063431739807, -0.5965198278427124, -0.5718333721160889, -0.5471468567848206, -0.5224603414535522, -0.4977738857269287, -0.4730873703956604, -0.4484008848667145, -0.42371436953544617, -0.39902788400650024, -0.37434136867523193, -0.349654883146286, -0.3249683976173401, -0.3002818822860718, -0.27559539675712585, -0.25090891122817993, -0.22622241079807281, -0.2015359103679657, -0.17684942483901978, -0.15216292440891266, -0.12747642397880554, -0.10278993844985962, -0.0781034380197525, -0.05341695249080658, -0.028730452060699463, -0.004043957218527794, 0.020642537623643875, 0.04532903432846069, 0.07001552730798721, 0.09470202028751373, 0.11938852071762085, 0.14407500624656677, 0.1687615066766739, 0.193448007106781, 0.21813449263572693, 0.24282099306583405, 0.26750749349594116, 0.2921939790248871, 0.316880464553833, 0.3415669798851013, 0.36625346541404724, 0.39093995094299316, 0.4156264662742615, 0.4403129518032074, 0.4649994373321533, 0.48968595266342163, 0.5143724679946899, 0.5390589237213135, 0.5637454390525818, 0.5884319543838501, 0.6131184101104736, 0.6378049254417419, 0.6624914407730103, 0.6871778964996338, 0.7118644118309021, 0.7365509271621704, 0.761237382888794]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 5.0, 9.0, 8.0, 5.0, 23.0, 14.0, 18.0, 27.0, 38.0, 44.0, 78.0, 106.0, 149.0, 224.0, 357.0, 608.0, 1107.0, 1952.0, 4059.0, 8820.0, 23217.0, 71617.0, 257381.0, 444464.0, 158660.0, 45984.0, 16048.0, 6534.0, 3011.0, 1601.0, 844.0, 514.0, 316.0, 226.0, 133.0, 103.0, 66.0, 47.0, 36.0, 19.0, 17.0, 15.0, 11.0, 7.0, 6.0, 7.0, 6.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.40869140625, -0.39642333984375, -0.3841552734375, -0.37188720703125, -0.359619140625, -0.34735107421875, -0.3350830078125, -0.32281494140625, -0.310546875, -0.29827880859375, -0.2860107421875, -0.27374267578125, -0.261474609375, -0.24920654296875, -0.2369384765625, -0.22467041015625, -0.21240234375, -0.20013427734375, -0.1878662109375, -0.17559814453125, -0.163330078125, -0.15106201171875, -0.1387939453125, -0.12652587890625, -0.1142578125, -0.10198974609375, -0.0897216796875, -0.07745361328125, -0.065185546875, -0.05291748046875, -0.0406494140625, -0.02838134765625, -0.01611328125, -0.00384521484375, 0.0084228515625, 0.02069091796875, 0.032958984375, 0.04522705078125, 0.0574951171875, 0.06976318359375, 0.08203125, 0.09429931640625, 0.1065673828125, 0.11883544921875, 0.131103515625, 0.14337158203125, 0.1556396484375, 0.16790771484375, 0.18017578125, 0.19244384765625, 0.2047119140625, 0.21697998046875, 0.229248046875, 0.24151611328125, 0.2537841796875, 0.26605224609375, 0.2783203125, 0.29058837890625, 0.3028564453125, 0.31512451171875, 0.327392578125, 0.33966064453125, 0.3519287109375, 0.36419677734375, 0.37646484375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 7.0, 7.0, 12.0, 15.0, 20.0, 32.0, 23.0, 31.0, 55.0, 65.0, 52.0, 77.0, 74.0, 78.0, 65.0, 69.0, 67.0, 59.0, 45.0, 43.0, 35.0, 25.0, 12.0, 14.0, 12.0, 8.0, 0.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.362548828125, -0.3525733947753906, -0.34259796142578125, -0.3326225280761719, -0.3226470947265625, -0.3126716613769531, -0.30269622802734375, -0.2927207946777344, -0.282745361328125, -0.2727699279785156, -0.26279449462890625, -0.2528190612792969, -0.2428436279296875, -0.23286819458007812, -0.22289276123046875, -0.21291732788085938, -0.20294189453125, -0.19296646118164062, -0.18299102783203125, -0.17301559448242188, -0.1630401611328125, -0.15306472778320312, -0.14308929443359375, -0.13311386108398438, -0.123138427734375, -0.11316299438476562, -0.10318756103515625, -0.09321212768554688, -0.0832366943359375, -0.07326126098632812, -0.06328582763671875, -0.053310394287109375, -0.0433349609375, -0.033359527587890625, -0.02338409423828125, -0.013408660888671875, -0.0034332275390625, 0.006542205810546875, 0.01651763916015625, 0.026493072509765625, 0.036468505859375, 0.046443939208984375, 0.05641937255859375, 0.06639480590820312, 0.0763702392578125, 0.08634567260742188, 0.09632110595703125, 0.10629653930664062, 0.11627197265625, 0.12624740600585938, 0.13622283935546875, 0.14619827270507812, 0.1561737060546875, 0.16614913940429688, 0.17612457275390625, 0.18610000610351562, 0.196075439453125, 0.20605087280273438, 0.21602630615234375, 0.22600173950195312, 0.2359771728515625, 0.24595260620117188, 0.25592803955078125, 0.2659034729003906, 0.27587890625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 6.0, 5.0, 13.0, 14.0, 19.0, 22.0, 51.0, 55.0, 71.0, 89.0, 131.0, 252.0, 432.0, 780.0, 1728.0, 4913.0, 19051.0, 147190.0, 732631.0, 117118.0, 16375.0, 4215.0, 1636.0, 666.0, 368.0, 250.0, 150.0, 94.0, 70.0, 45.0, 36.0, 16.0, 20.0, 13.0, 9.0, 4.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.513671875, -0.49680328369140625, -0.4799346923828125, -0.46306610107421875, -0.446197509765625, -0.42932891845703125, -0.4124603271484375, -0.39559173583984375, -0.37872314453125, -0.36185455322265625, -0.3449859619140625, -0.32811737060546875, -0.311248779296875, -0.29438018798828125, -0.2775115966796875, -0.26064300537109375, -0.2437744140625, -0.22690582275390625, -0.2100372314453125, -0.19316864013671875, -0.176300048828125, -0.15943145751953125, -0.1425628662109375, -0.12569427490234375, -0.10882568359375, -0.09195709228515625, -0.0750885009765625, -0.05821990966796875, -0.041351318359375, -0.02448272705078125, -0.0076141357421875, 0.00925445556640625, 0.026123046875, 0.04299163818359375, 0.0598602294921875, 0.07672882080078125, 0.093597412109375, 0.11046600341796875, 0.1273345947265625, 0.14420318603515625, 0.16107177734375, 0.17794036865234375, 0.1948089599609375, 0.21167755126953125, 0.228546142578125, 0.24541473388671875, 0.2622833251953125, 0.27915191650390625, 0.2960205078125, 0.31288909912109375, 0.3297576904296875, 0.34662628173828125, 0.363494873046875, 0.38036346435546875, 0.3972320556640625, 0.41410064697265625, 0.43096923828125, 0.44783782958984375, 0.4647064208984375, 0.48157501220703125, 0.498443603515625, 0.5153121948242188, 0.5321807861328125, 0.5490493774414062, 0.56591796875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 9.0, 7.0, 8.0, 12.0, 15.0, 15.0, 21.0, 32.0, 23.0, 25.0, 29.0, 38.0, 36.0, 37.0, 37.0, 53.0, 33.0, 40.0, 60.0, 48.0, 39.0, 55.0, 42.0, 33.0, 34.0, 30.0, 34.0, 19.0, 24.0, 20.0, 17.0, 14.0, 11.0, 8.0, 10.0, 4.0, 7.0, 9.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.64697265625, -0.6252517700195312, -0.6035308837890625, -0.5818099975585938, -0.560089111328125, -0.5383682250976562, -0.5166473388671875, -0.49492645263671875, -0.47320556640625, -0.45148468017578125, -0.4297637939453125, -0.40804290771484375, -0.386322021484375, -0.36460113525390625, -0.3428802490234375, -0.32115936279296875, -0.2994384765625, -0.27771759033203125, -0.2559967041015625, -0.23427581787109375, -0.212554931640625, -0.19083404541015625, -0.1691131591796875, -0.14739227294921875, -0.12567138671875, -0.10395050048828125, -0.0822296142578125, -0.06050872802734375, -0.038787841796875, -0.01706695556640625, 0.0046539306640625, 0.02637481689453125, 0.048095703125, 0.06981658935546875, 0.0915374755859375, 0.11325836181640625, 0.134979248046875, 0.15670013427734375, 0.1784210205078125, 0.20014190673828125, 0.22186279296875, 0.24358367919921875, 0.2653045654296875, 0.28702545166015625, 0.308746337890625, 0.33046722412109375, 0.3521881103515625, 0.37390899658203125, 0.3956298828125, 0.41735076904296875, 0.4390716552734375, 0.46079254150390625, 0.482513427734375, 0.5042343139648438, 0.5259552001953125, 0.5476760864257812, 0.56939697265625, 0.5911178588867188, 0.6128387451171875, 0.6345596313476562, 0.656280517578125, 0.6780014038085938, 0.6997222900390625, 0.7214431762695312, 0.7431640625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 4.0, 9.0, 9.0, 8.0, 10.0, 20.0, 20.0, 27.0, 42.0, 78.0, 98.0, 162.0, 274.0, 478.0, 931.0, 1944.0, 4784.0, 14552.0, 74693.0, 652046.0, 252257.0, 31720.0, 8246.0, 3110.0, 1327.0, 709.0, 365.0, 210.0, 146.0, 69.0, 57.0, 35.0, 28.0, 20.0, 11.0, 8.0, 7.0, 8.0, 9.0, 4.0, 3.0, 1.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.140625, -0.13590049743652344, -0.13117599487304688, -0.1264514923095703, -0.12172698974609375, -0.11700248718261719, -0.11227798461914062, -0.10755348205566406, -0.1028289794921875, -0.09810447692871094, -0.09337997436523438, -0.08865547180175781, -0.08393096923828125, -0.07920646667480469, -0.07448196411132812, -0.06975746154785156, -0.065032958984375, -0.06030845642089844, -0.055583953857421875, -0.05085945129394531, -0.04613494873046875, -0.04141044616699219, -0.036685943603515625, -0.03196144104003906, -0.0272369384765625, -0.022512435913085938, -0.017787933349609375, -0.013063430786132812, -0.00833892822265625, -0.0036144256591796875, 0.001110076904296875, 0.0058345794677734375, 0.01055908203125, 0.015283584594726562, 0.020008087158203125, 0.024732589721679688, 0.02945709228515625, 0.03418159484863281, 0.038906097412109375, 0.04363059997558594, 0.0483551025390625, 0.05307960510253906, 0.057804107666015625, 0.06252861022949219, 0.06725311279296875, 0.07197761535644531, 0.07670211791992188, 0.08142662048339844, 0.086151123046875, 0.09087562561035156, 0.09560012817382812, 0.10032463073730469, 0.10504913330078125, 0.10977363586425781, 0.11449813842773438, 0.11922264099121094, 0.1239471435546875, 0.12867164611816406, 0.13339614868164062, 0.1381206512451172, 0.14284515380859375, 0.1475696563720703, 0.15229415893554688, 0.15701866149902344, 0.1617431640625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 8.0, 4.0, 11.0, 21.0, 18.0, 24.0, 59.0, 73.0, 124.0, 156.0, 152.0, 136.0, 67.0, 50.0, 27.0, 20.0, 10.0, 13.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.4955482482910156e-05, -5.311984568834305e-05, -5.128420889377594e-05, -4.944857209920883e-05, -4.7612935304641724e-05, -4.5777298510074615e-05, -4.394166171550751e-05, -4.21060249209404e-05, -4.027038812637329e-05, -3.843475133180618e-05, -3.6599114537239075e-05, -3.4763477742671967e-05, -3.292784094810486e-05, -3.109220415353775e-05, -2.9256567358970642e-05, -2.7420930564403534e-05, -2.5585293769836426e-05, -2.3749656975269318e-05, -2.191402018070221e-05, -2.00783833861351e-05, -1.8242746591567993e-05, -1.6407109797000885e-05, -1.4571473002433777e-05, -1.2735836207866669e-05, -1.090019941329956e-05, -9.064562618732452e-06, -7.228925824165344e-06, -5.393289029598236e-06, -3.557652235031128e-06, -1.7220154404640198e-06, 1.1362135410308838e-07, 1.9492581486701965e-06, 3.7848949432373047e-06, 5.620531737804413e-06, 7.456168532371521e-06, 9.291805326938629e-06, 1.1127442121505737e-05, 1.2963078916072845e-05, 1.4798715710639954e-05, 1.6634352505207062e-05, 1.846998929977417e-05, 2.0305626094341278e-05, 2.2141262888908386e-05, 2.3976899683475494e-05, 2.5812536478042603e-05, 2.764817327260971e-05, 2.948381006717682e-05, 3.131944686174393e-05, 3.3155083656311035e-05, 3.499072045087814e-05, 3.682635724544525e-05, 3.866199404001236e-05, 4.049763083457947e-05, 4.2333267629146576e-05, 4.4168904423713684e-05, 4.600454121828079e-05, 4.78401780128479e-05, 4.967581480741501e-05, 5.151145160198212e-05, 5.3347088396549225e-05, 5.518272519111633e-05, 5.701836198568344e-05, 5.885399878025055e-05, 6.068963557481766e-05, 6.252527236938477e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 7.0, 10.0, 11.0, 11.0, 16.0, 18.0, 29.0, 35.0, 70.0, 110.0, 170.0, 354.0, 585.0, 1234.0, 3032.0, 8678.0, 36643.0, 431503.0, 510318.0, 40478.0, 9305.0, 3157.0, 1317.0, 660.0, 310.0, 191.0, 102.0, 71.0, 48.0, 21.0, 21.0, 17.0, 5.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2213134765625, -0.21480941772460938, -0.20830535888671875, -0.20180130004882812, -0.1952972412109375, -0.18879318237304688, -0.18228912353515625, -0.17578506469726562, -0.169281005859375, -0.16277694702148438, -0.15627288818359375, -0.14976882934570312, -0.1432647705078125, -0.13676071166992188, -0.13025665283203125, -0.12375259399414062, -0.11724853515625, -0.11074447631835938, -0.10424041748046875, -0.09773635864257812, -0.0912322998046875, -0.08472824096679688, -0.07822418212890625, -0.07172012329101562, -0.065216064453125, -0.058712005615234375, -0.05220794677734375, -0.045703887939453125, -0.0391998291015625, -0.032695770263671875, -0.02619171142578125, -0.019687652587890625, -0.01318359375, -0.006679534912109375, -0.00017547607421875, 0.006328582763671875, 0.0128326416015625, 0.019336700439453125, 0.02584075927734375, 0.032344818115234375, 0.038848876953125, 0.045352935791015625, 0.05185699462890625, 0.058361053466796875, 0.0648651123046875, 0.07136917114257812, 0.07787322998046875, 0.08437728881835938, 0.09088134765625, 0.09738540649414062, 0.10388946533203125, 0.11039352416992188, 0.1168975830078125, 0.12340164184570312, 0.12990570068359375, 0.13640975952148438, 0.142913818359375, 0.14941787719726562, 0.15592193603515625, 0.16242599487304688, 0.1689300537109375, 0.17543411254882812, 0.18193817138671875, 0.18844223022460938, 0.1949462890625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 3.0, 5.0, 8.0, 11.0, 11.0, 9.0, 6.0, 20.0, 29.0, 36.0, 55.0, 57.0, 68.0, 99.0, 107.0, 113.0, 76.0, 62.0, 54.0, 44.0, 25.0, 23.0, 19.0, 22.0, 10.0, 7.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2054443359375, -0.19953536987304688, -0.19362640380859375, -0.18771743774414062, -0.1818084716796875, -0.17589950561523438, -0.16999053955078125, -0.16408157348632812, -0.158172607421875, -0.15226364135742188, -0.14635467529296875, -0.14044570922851562, -0.1345367431640625, -0.12862777709960938, -0.12271881103515625, -0.11680984497070312, -0.11090087890625, -0.10499191284179688, -0.09908294677734375, -0.09317398071289062, -0.0872650146484375, -0.08135604858398438, -0.07544708251953125, -0.06953811645507812, -0.063629150390625, -0.057720184326171875, -0.05181121826171875, -0.045902252197265625, -0.0399932861328125, -0.034084320068359375, -0.02817535400390625, -0.022266387939453125, -0.016357421875, -0.010448455810546875, -0.00453948974609375, 0.001369476318359375, 0.0072784423828125, 0.013187408447265625, 0.01909637451171875, 0.025005340576171875, 0.030914306640625, 0.036823272705078125, 0.04273223876953125, 0.048641204833984375, 0.0545501708984375, 0.060459136962890625, 0.06636810302734375, 0.07227706909179688, 0.07818603515625, 0.08409500122070312, 0.09000396728515625, 0.09591293334960938, 0.1018218994140625, 0.10773086547851562, 0.11363983154296875, 0.11954879760742188, 0.125457763671875, 0.13136672973632812, 0.13727569580078125, 0.14318466186523438, 0.1490936279296875, 0.15500259399414062, 0.16091156005859375, 0.16682052612304688, 0.1727294921875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 14.0, 27.0, 81.0, 234.0, 344.0, 206.0, 64.0, 17.0, 20.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.736486434936523, -8.489704132080078, -8.242920875549316, -7.996138572692871, -7.749356269836426, -7.502573490142822, -7.255790710449219, -7.009008407592773, -6.762226104736328, -6.515443325042725, -6.268661022186279, -6.021878242492676, -5.7750959396362305, -5.528313159942627, -5.281530380249023, -5.034748077392578, -4.787965297698975, -4.541182518005371, -4.294400215148926, -4.047617435455322, -3.800835132598877, -3.5540523529052734, -3.307269811630249, -3.0604872703552246, -2.8137047290802, -2.566922187805176, -2.3201396465301514, -2.073357105255127, -1.826574444770813, -1.5797919034957886, -1.3330092430114746, -1.0862267017364502, -0.8394441604614258, -0.5926616191864014, -0.3458790183067322, -0.09909641742706299, 0.14768612384796143, 0.39446866512298584, 0.6412513256072998, 0.8880338668823242, 1.1348164081573486, 1.381598949432373, 1.6283814907073975, 1.8751641511917114, 2.1219468116760254, 2.3687291145324707, 2.615511894226074, 2.8622944355010986, 3.109076976776123, 3.3558595180511475, 3.602642059326172, 3.8494248390197754, 4.096207141876221, 4.342989921569824, 4.5897722244262695, 4.836555004119873, 5.083337783813477, 5.33012056350708, 5.576902866363525, 5.823685646057129, 6.070467948913574, 6.317250728607178, 6.564033508300781, 6.810815811157227, 7.057598114013672]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 2.0, 9.0, 9.0, 8.0, 17.0, 20.0, 24.0, 22.0, 18.0, 15.0, 32.0, 33.0, 40.0, 45.0, 45.0, 39.0, 50.0, 54.0, 58.0, 47.0, 38.0, 47.0, 41.0, 38.0, 37.0, 27.0, 29.0, 26.0, 17.0, 19.0, 17.0, 7.0, 16.0, 8.0, 11.0, 7.0, 9.0, 5.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.983551025390625, -2.8853437900543213, -2.7871365547180176, -2.688929319381714, -2.59072208404541, -2.4925146102905273, -2.3943073749542236, -2.29610013961792, -2.197892904281616, -2.0996856689453125, -2.001478433609009, -1.9032710790634155, -1.8050638437271118, -1.706856608390808, -1.6086492538452148, -1.5104420185089111, -1.4122347831726074, -1.3140275478363037, -1.2158203125, -1.1176129579544067, -1.019405722618103, -0.9211984872817993, -0.8229911923408508, -0.7247838973999023, -0.6265766620635986, -0.5283694267272949, -0.43016213178634644, -0.33195486664772034, -0.23374760150909424, -0.13554033637046814, -0.03733307123184204, 0.060874223709106445, 0.15908169746398926, 0.25728896260261536, 0.35549622774124146, 0.45370349287986755, 0.5519107580184937, 0.6501179933547974, 0.7483252882957458, 0.8465325832366943, 0.944739818572998, 1.0429470539093018, 1.1411542892456055, 1.2393616437911987, 1.3375688791275024, 1.4357761144638062, 1.5339834690093994, 1.6321907043457031, 1.7303979396820068, 1.8286051750183105, 1.9268124103546143, 2.025019645690918, 2.123227119445801, 2.2214343547821045, 2.319641590118408, 2.417848825454712, 2.5160560607910156, 2.6142632961273193, 2.712470531463623, 2.8106777667999268, 2.9088850021362305, 3.0070924758911133, 3.105299711227417, 3.2035069465637207, 3.3017141819000244]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 11.0, 11.0, 20.0, 18.0, 13.0, 20.0, 24.0, 35.0, 50.0, 57.0, 101.0, 116.0, 204.0, 348.0, 568.0, 986.0, 1907.0, 4048.0, 12191.0, 124223.0, 3987806.0, 45466.0, 8902.0, 3380.0, 1593.0, 910.0, 507.0, 278.0, 168.0, 113.0, 66.0, 40.0, 24.0, 19.0, 9.0, 9.0, 8.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.2802734375, -1.2429962158203125, -1.205718994140625, -1.1684417724609375, -1.13116455078125, -1.0938873291015625, -1.056610107421875, -1.0193328857421875, -0.9820556640625, -0.9447784423828125, -0.907501220703125, -0.8702239990234375, -0.83294677734375, -0.7956695556640625, -0.758392333984375, -0.7211151123046875, -0.683837890625, -0.6465606689453125, -0.609283447265625, -0.5720062255859375, -0.53472900390625, -0.4974517822265625, -0.460174560546875, -0.4228973388671875, -0.3856201171875, -0.3483428955078125, -0.311065673828125, -0.2737884521484375, -0.23651123046875, -0.1992340087890625, -0.161956787109375, -0.1246795654296875, -0.08740234375, -0.0501251220703125, -0.012847900390625, 0.0244293212890625, 0.06170654296875, 0.0989837646484375, 0.136260986328125, 0.1735382080078125, 0.2108154296875, 0.2480926513671875, 0.285369873046875, 0.3226470947265625, 0.35992431640625, 0.3972015380859375, 0.434478759765625, 0.4717559814453125, 0.509033203125, 0.5463104248046875, 0.583587646484375, 0.6208648681640625, 0.65814208984375, 0.6954193115234375, 0.732696533203125, 0.7699737548828125, 0.8072509765625, 0.8445281982421875, 0.881805419921875, 0.9190826416015625, 0.95635986328125, 0.9936370849609375, 1.030914306640625, 1.0681915283203125, 1.10546875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 5.0, 4.0, 5.0, 11.0, 9.0, 33.0, 32.0, 33.0, 38.0, 56.0, 80.0, 75.0, 81.0, 93.0, 70.0, 80.0, 76.0, 64.0, 42.0, 31.0, 26.0, 17.0, 17.0, 14.0, 9.0, 0.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.37060546875, -0.36067962646484375, -0.3507537841796875, -0.34082794189453125, -0.330902099609375, -0.32097625732421875, -0.3110504150390625, -0.30112457275390625, -0.29119873046875, -0.28127288818359375, -0.2713470458984375, -0.26142120361328125, -0.251495361328125, -0.24156951904296875, -0.2316436767578125, -0.22171783447265625, -0.2117919921875, -0.20186614990234375, -0.1919403076171875, -0.18201446533203125, -0.172088623046875, -0.16216278076171875, -0.1522369384765625, -0.14231109619140625, -0.13238525390625, -0.12245941162109375, -0.1125335693359375, -0.10260772705078125, -0.092681884765625, -0.08275604248046875, -0.0728302001953125, -0.06290435791015625, -0.052978515625, -0.04305267333984375, -0.0331268310546875, -0.02320098876953125, -0.013275146484375, -0.00334930419921875, 0.0065765380859375, 0.01650238037109375, 0.02642822265625, 0.03635406494140625, 0.0462799072265625, 0.05620574951171875, 0.066131591796875, 0.07605743408203125, 0.0859832763671875, 0.09590911865234375, 0.1058349609375, 0.11576080322265625, 0.1256866455078125, 0.13561248779296875, 0.145538330078125, 0.15546417236328125, 0.1653900146484375, 0.17531585693359375, 0.18524169921875, 0.19516754150390625, 0.2050933837890625, 0.21501922607421875, 0.224945068359375, 0.23487091064453125, 0.2447967529296875, 0.25472259521484375, 0.2646484375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 7.0, 9.0, 13.0, 23.0, 52.0, 122.0, 209.0, 693.0, 2581.0, 17549.0, 4061628.0, 103184.0, 6210.0, 1270.0, 403.0, 169.0, 72.0, 38.0, 22.0, 8.0, 13.0, 4.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8310546875, -1.7673797607421875, -1.703704833984375, -1.6400299072265625, -1.57635498046875, -1.5126800537109375, -1.449005126953125, -1.3853302001953125, -1.3216552734375, -1.2579803466796875, -1.194305419921875, -1.1306304931640625, -1.06695556640625, -1.0032806396484375, -0.939605712890625, -0.8759307861328125, -0.812255859375, -0.7485809326171875, -0.684906005859375, -0.6212310791015625, -0.55755615234375, -0.4938812255859375, -0.430206298828125, -0.3665313720703125, -0.3028564453125, -0.2391815185546875, -0.175506591796875, -0.1118316650390625, -0.04815673828125, 0.0155181884765625, 0.079193115234375, 0.1428680419921875, 0.20654296875, 0.2702178955078125, 0.333892822265625, 0.3975677490234375, 0.46124267578125, 0.5249176025390625, 0.588592529296875, 0.6522674560546875, 0.7159423828125, 0.7796173095703125, 0.843292236328125, 0.9069671630859375, 0.97064208984375, 1.0343170166015625, 1.097991943359375, 1.1616668701171875, 1.225341796875, 1.2890167236328125, 1.352691650390625, 1.4163665771484375, 1.48004150390625, 1.5437164306640625, 1.607391357421875, 1.6710662841796875, 1.7347412109375, 1.7984161376953125, 1.862091064453125, 1.9257659912109375, 1.98944091796875, 2.0531158447265625, 2.116790771484375, 2.1804656982421875, 2.244140625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 7.0, 10.0, 9.0, 15.0, 15.0, 22.0, 23.0, 56.0, 191.0, 1070.0, 2035.0, 358.0, 116.0, 49.0, 26.0, 13.0, 22.0, 11.0, 8.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5849609375, -0.5560302734375, -0.527099609375, -0.4981689453125, -0.46923828125, -0.4403076171875, -0.411376953125, -0.3824462890625, -0.353515625, -0.3245849609375, -0.295654296875, -0.2667236328125, -0.23779296875, -0.2088623046875, -0.179931640625, -0.1510009765625, -0.1220703125, -0.0931396484375, -0.064208984375, -0.0352783203125, -0.00634765625, 0.0225830078125, 0.051513671875, 0.0804443359375, 0.109375, 0.1383056640625, 0.167236328125, 0.1961669921875, 0.22509765625, 0.2540283203125, 0.282958984375, 0.3118896484375, 0.3408203125, 0.3697509765625, 0.398681640625, 0.4276123046875, 0.45654296875, 0.4854736328125, 0.514404296875, 0.5433349609375, 0.572265625, 0.6011962890625, 0.630126953125, 0.6590576171875, 0.68798828125, 0.7169189453125, 0.745849609375, 0.7747802734375, 0.8037109375, 0.8326416015625, 0.861572265625, 0.8905029296875, 0.91943359375, 0.9483642578125, 0.977294921875, 1.0062255859375, 1.03515625, 1.0640869140625, 1.093017578125, 1.1219482421875, 1.15087890625, 1.1798095703125, 1.208740234375, 1.2376708984375, 1.2666015625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 4.0, 5.0, 9.0, 17.0, 31.0, 51.0, 48.0, 106.0, 152.0, 177.0, 156.0, 80.0, 57.0, 25.0, 23.0, 10.0, 12.0, 13.0, 6.0, 4.0, 3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.085221767425537, -5.921083450317383, -5.7569451332092285, -5.592806816101074, -5.428668975830078, -5.264530658721924, -5.1003923416137695, -4.936254024505615, -4.772115707397461, -4.607977390289307, -4.443839073181152, -4.279700756072998, -4.115562438964844, -3.9514243602752686, -3.7872862815856934, -3.623147964477539, -3.4590096473693848, -3.2948713302612305, -3.130733013153076, -2.966594934463501, -2.8024566173553467, -2.6383183002471924, -2.474180221557617, -2.310041904449463, -2.1459035873413086, -1.9817652702331543, -1.8176270723342896, -1.6534888744354248, -1.4893505573272705, -1.3252122402191162, -1.1610740423202515, -0.9969358444213867, -0.8327970504760742, -0.6686587929725647, -0.5045205354690552, -0.34038227796554565, -0.17624402046203613, -0.012105762958526611, 0.1520324945449829, 0.31617069244384766, 0.48030900955200195, 0.6444472670555115, 0.808585524559021, 0.9727237820625305, 1.13686203956604, 1.3010003566741943, 1.465138554573059, 1.6292767524719238, 1.7934150695800781, 1.9575533866882324, 2.1216917037963867, 2.285829782485962, 2.449968099594116, 2.6141064167022705, 2.7782444953918457, 2.9423828125, 3.1065211296081543, 3.2706594467163086, 3.434797763824463, 3.598935842514038, 3.7630741596221924, 3.9272124767303467, 4.091350555419922, 4.255488872528076, 4.4196271896362305]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 1.0, 6.0, 5.0, 14.0, 10.0, 2.0, 13.0, 24.0, 22.0, 25.0, 34.0, 32.0, 30.0, 29.0, 49.0, 37.0, 57.0, 50.0, 52.0, 53.0, 40.0, 44.0, 36.0, 42.0, 45.0, 40.0, 38.0, 25.0, 29.0, 29.0, 12.0, 22.0, 9.0, 15.0, 3.0, 6.0, 5.0, 2.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.839420795440674, -2.7610788345336914, -2.682737112045288, -2.6043951511383057, -2.5260531902313232, -2.44771146774292, -2.3693695068359375, -2.291027545928955, -2.2126855850219727, -2.1343436241149902, -2.056001901626587, -1.9776599407196045, -1.899317979812622, -1.8209761381149292, -1.7426342964172363, -1.664292335510254, -1.5859506130218506, -1.5076087713241577, -1.4292668104171753, -1.3509249687194824, -1.2725830078125, -1.1942411661148071, -1.1158993244171143, -1.0375573635101318, -0.959215521812439, -0.8808736205101013, -0.8025317192077637, -0.7241898775100708, -0.6458479762077332, -0.5675060749053955, -0.48916420340538025, -0.410822331905365, -0.33248043060302734, -0.2541385293006897, -0.17579665780067444, -0.09745477139949799, -0.019112884998321533, 0.05922901630401611, 0.13757088780403137, 0.21591275930404663, 0.2942546606063843, 0.3725965619087219, 0.4509384334087372, 0.5292803049087524, 0.6076222062110901, 0.6859641075134277, 0.7643059492111206, 0.8426478505134583, 0.9209897518157959, 0.9993316531181335, 1.0776735544204712, 1.156015396118164, 1.2343573570251465, 1.3126991987228394, 1.3910410404205322, 1.4693830013275146, 1.5477248430252075, 1.6260666847229004, 1.7044086456298828, 1.7827504873275757, 1.8610923290252686, 1.939434289932251, 2.0177762508392334, 2.0961179733276367, 2.174459934234619]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 4.0, 7.0, 11.0, 9.0, 11.0, 11.0, 24.0, 43.0, 55.0, 73.0, 147.0, 181.0, 320.0, 591.0, 1080.0, 2228.0, 5402.0, 16695.0, 79457.0, 595013.0, 289882.0, 39534.0, 10389.0, 3722.0, 1631.0, 793.0, 450.0, 254.0, 175.0, 100.0, 63.0, 55.0, 40.0, 25.0, 18.0, 17.0, 9.0, 13.0, 6.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.9521484375, -0.9255523681640625, -0.898956298828125, -0.8723602294921875, -0.84576416015625, -0.8191680908203125, -0.792572021484375, -0.7659759521484375, -0.7393798828125, -0.7127838134765625, -0.686187744140625, -0.6595916748046875, -0.63299560546875, -0.6063995361328125, -0.579803466796875, -0.5532073974609375, -0.526611328125, -0.5000152587890625, -0.473419189453125, -0.4468231201171875, -0.42022705078125, -0.3936309814453125, -0.367034912109375, -0.3404388427734375, -0.3138427734375, -0.2872467041015625, -0.260650634765625, -0.2340545654296875, -0.20745849609375, -0.1808624267578125, -0.154266357421875, -0.1276702880859375, -0.10107421875, -0.0744781494140625, -0.047882080078125, -0.0212860107421875, 0.00531005859375, 0.0319061279296875, 0.058502197265625, 0.0850982666015625, 0.1116943359375, 0.1382904052734375, 0.164886474609375, 0.1914825439453125, 0.21807861328125, 0.2446746826171875, 0.271270751953125, 0.2978668212890625, 0.324462890625, 0.3510589599609375, 0.377655029296875, 0.4042510986328125, 0.43084716796875, 0.4574432373046875, 0.484039306640625, 0.5106353759765625, 0.5372314453125, 0.5638275146484375, 0.590423583984375, 0.6170196533203125, 0.64361572265625, 0.6702117919921875, 0.696807861328125, 0.7234039306640625, 0.75]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 6.0, 5.0, 13.0, 17.0, 38.0, 42.0, 42.0, 52.0, 50.0, 64.0, 67.0, 89.0, 78.0, 90.0, 77.0, 54.0, 53.0, 41.0, 38.0, 19.0, 26.0, 18.0, 11.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35595703125, -0.346038818359375, -0.33612060546875, -0.326202392578125, -0.3162841796875, -0.306365966796875, -0.29644775390625, -0.286529541015625, -0.276611328125, -0.266693115234375, -0.25677490234375, -0.246856689453125, -0.2369384765625, -0.227020263671875, -0.21710205078125, -0.207183837890625, -0.197265625, -0.187347412109375, -0.17742919921875, -0.167510986328125, -0.1575927734375, -0.147674560546875, -0.13775634765625, -0.127838134765625, -0.117919921875, -0.108001708984375, -0.09808349609375, -0.088165283203125, -0.0782470703125, -0.068328857421875, -0.05841064453125, -0.048492431640625, -0.03857421875, -0.028656005859375, -0.01873779296875, -0.008819580078125, 0.0010986328125, 0.011016845703125, 0.02093505859375, 0.030853271484375, 0.040771484375, 0.050689697265625, 0.06060791015625, 0.070526123046875, 0.0804443359375, 0.090362548828125, 0.10028076171875, 0.110198974609375, 0.1201171875, 0.130035400390625, 0.13995361328125, 0.149871826171875, 0.1597900390625, 0.169708251953125, 0.17962646484375, 0.189544677734375, 0.199462890625, 0.209381103515625, 0.21929931640625, 0.229217529296875, 0.2391357421875, 0.249053955078125, 0.25897216796875, 0.268890380859375, 0.27880859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 5.0, 5.0, 3.0, 5.0, 3.0, 9.0, 5.0, 22.0, 27.0, 27.0, 36.0, 57.0, 93.0, 112.0, 201.0, 336.0, 595.0, 1090.0, 2671.0, 8108.0, 42630.0, 729433.0, 233765.0, 20244.0, 5083.0, 1921.0, 825.0, 455.0, 273.0, 166.0, 104.0, 65.0, 53.0, 37.0, 28.0, 12.0, 15.0, 10.0, 7.0, 4.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.81396484375, -0.7875442504882812, -0.7611236572265625, -0.7347030639648438, -0.708282470703125, -0.6818618774414062, -0.6554412841796875, -0.6290206909179688, -0.60260009765625, -0.5761795043945312, -0.5497589111328125, -0.5233383178710938, -0.496917724609375, -0.47049713134765625, -0.4440765380859375, -0.41765594482421875, -0.3912353515625, -0.36481475830078125, -0.3383941650390625, -0.31197357177734375, -0.285552978515625, -0.25913238525390625, -0.2327117919921875, -0.20629119873046875, -0.17987060546875, -0.15345001220703125, -0.1270294189453125, -0.10060882568359375, -0.074188232421875, -0.04776763916015625, -0.0213470458984375, 0.00507354736328125, 0.031494140625, 0.05791473388671875, 0.0843353271484375, 0.11075592041015625, 0.137176513671875, 0.16359710693359375, 0.1900177001953125, 0.21643829345703125, 0.24285888671875, 0.26927947998046875, 0.2957000732421875, 0.32212066650390625, 0.348541259765625, 0.37496185302734375, 0.4013824462890625, 0.42780303955078125, 0.4542236328125, 0.48064422607421875, 0.5070648193359375, 0.5334854125976562, 0.559906005859375, 0.5863265991210938, 0.6127471923828125, 0.6391677856445312, 0.66558837890625, 0.6920089721679688, 0.7184295654296875, 0.7448501586914062, 0.771270751953125, 0.7976913452148438, 0.8241119384765625, 0.8505325317382812, 0.876953125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 1.0, 7.0, 4.0, 3.0, 5.0, 9.0, 9.0, 10.0, 11.0, 20.0, 18.0, 22.0, 30.0, 20.0, 33.0, 38.0, 58.0, 44.0, 46.0, 61.0, 43.0, 39.0, 54.0, 50.0, 41.0, 37.0, 24.0, 38.0, 34.0, 35.0, 23.0, 17.0, 30.0, 14.0, 15.0, 14.0, 13.0, 12.0, 7.0, 3.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6953125, -0.6734085083007812, -0.6515045166015625, -0.6296005249023438, -0.607696533203125, -0.5857925415039062, -0.5638885498046875, -0.5419845581054688, -0.52008056640625, -0.49817657470703125, -0.4762725830078125, -0.45436859130859375, -0.432464599609375, -0.41056060791015625, -0.3886566162109375, -0.36675262451171875, -0.3448486328125, -0.32294464111328125, -0.3010406494140625, -0.27913665771484375, -0.257232666015625, -0.23532867431640625, -0.2134246826171875, -0.19152069091796875, -0.16961669921875, -0.14771270751953125, -0.1258087158203125, -0.10390472412109375, -0.082000732421875, -0.06009674072265625, -0.0381927490234375, -0.01628875732421875, 0.005615234375, 0.02751922607421875, 0.0494232177734375, 0.07132720947265625, 0.093231201171875, 0.11513519287109375, 0.1370391845703125, 0.15894317626953125, 0.18084716796875, 0.20275115966796875, 0.2246551513671875, 0.24655914306640625, 0.268463134765625, 0.29036712646484375, 0.3122711181640625, 0.33417510986328125, 0.3560791015625, 0.37798309326171875, 0.3998870849609375, 0.42179107666015625, 0.443695068359375, 0.46559906005859375, 0.4875030517578125, 0.5094070434570312, 0.53131103515625, 0.5532150268554688, 0.5751190185546875, 0.5970230102539062, 0.618927001953125, 0.6408309936523438, 0.6627349853515625, 0.6846389770507812, 0.70654296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 10.0, 4.0, 6.0, 2.0, 11.0, 12.0, 9.0, 20.0, 29.0, 49.0, 74.0, 114.0, 125.0, 255.0, 467.0, 951.0, 2266.0, 6983.0, 40735.0, 845826.0, 131922.0, 12458.0, 3397.0, 1284.0, 590.0, 346.0, 202.0, 109.0, 86.0, 47.0, 40.0, 27.0, 24.0, 19.0, 14.0, 8.0, 10.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.36962890625, -0.3575897216796875, -0.345550537109375, -0.3335113525390625, -0.32147216796875, -0.3094329833984375, -0.297393798828125, -0.2853546142578125, -0.2733154296875, -0.2612762451171875, -0.249237060546875, -0.2371978759765625, -0.22515869140625, -0.2131195068359375, -0.201080322265625, -0.1890411376953125, -0.177001953125, -0.1649627685546875, -0.152923583984375, -0.1408843994140625, -0.12884521484375, -0.1168060302734375, -0.104766845703125, -0.0927276611328125, -0.0806884765625, -0.0686492919921875, -0.056610107421875, -0.0445709228515625, -0.03253173828125, -0.0204925537109375, -0.008453369140625, 0.0035858154296875, 0.015625, 0.0276641845703125, 0.039703369140625, 0.0517425537109375, 0.06378173828125, 0.0758209228515625, 0.087860107421875, 0.0998992919921875, 0.1119384765625, 0.1239776611328125, 0.136016845703125, 0.1480560302734375, 0.16009521484375, 0.1721343994140625, 0.184173583984375, 0.1962127685546875, 0.208251953125, 0.2202911376953125, 0.232330322265625, 0.2443695068359375, 0.25640869140625, 0.2684478759765625, 0.280487060546875, 0.2925262451171875, 0.3045654296875, 0.3166046142578125, 0.328643798828125, 0.3406829833984375, 0.35272216796875, 0.3647613525390625, 0.376800537109375, 0.3888397216796875, 0.40087890625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 9.0, 8.0, 12.0, 7.0, 14.0, 32.0, 51.0, 118.0, 273.0, 228.0, 121.0, 49.0, 20.0, 24.0, 12.0, 6.0, 7.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.894371032714844e-05, -9.481608867645264e-05, -9.068846702575684e-05, -8.656084537506104e-05, -8.243322372436523e-05, -7.830560207366943e-05, -7.417798042297363e-05, -7.005035877227783e-05, -6.592273712158203e-05, -6.179511547088623e-05, -5.766749382019043e-05, -5.353987216949463e-05, -4.941225051879883e-05, -4.528462886810303e-05, -4.1157007217407227e-05, -3.7029385566711426e-05, -3.2901763916015625e-05, -2.8774142265319824e-05, -2.4646520614624023e-05, -2.0518898963928223e-05, -1.6391277313232422e-05, -1.2263655662536621e-05, -8.13603401184082e-06, -4.0084123611450195e-06, 1.1920928955078125e-07, 4.246830940246582e-06, 8.374452590942383e-06, 1.2502074241638184e-05, 1.6629695892333984e-05, 2.0757317543029785e-05, 2.4884939193725586e-05, 2.9012560844421387e-05, 3.314018249511719e-05, 3.726780414581299e-05, 4.139542579650879e-05, 4.552304744720459e-05, 4.965066909790039e-05, 5.377829074859619e-05, 5.790591239929199e-05, 6.203353404998779e-05, 6.61611557006836e-05, 7.02887773513794e-05, 7.44163990020752e-05, 7.8544020652771e-05, 8.26716423034668e-05, 8.67992639541626e-05, 9.09268856048584e-05, 9.50545072555542e-05, 9.918212890625e-05, 0.0001033097505569458, 0.0001074373722076416, 0.0001115649938583374, 0.0001156926155090332, 0.000119820237159729, 0.0001239478588104248, 0.0001280754804611206, 0.0001322031021118164, 0.0001363307237625122, 0.000140458345413208, 0.0001445859670639038, 0.0001487135887145996, 0.0001528412103652954, 0.0001569688320159912, 0.000161096453666687, 0.0001652240753173828]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 12.0, 12.0, 32.0, 30.0, 45.0, 80.0, 101.0, 163.0, 291.0, 414.0, 794.0, 1483.0, 3193.0, 7703.0, 23175.0, 115486.0, 740753.0, 117027.0, 23256.0, 7718.0, 3245.0, 1544.0, 804.0, 436.0, 278.0, 146.0, 95.0, 68.0, 43.0, 38.0, 23.0, 21.0, 7.0, 6.0, 4.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.278076171875, -0.26924896240234375, -0.2604217529296875, -0.25159454345703125, -0.242767333984375, -0.23394012451171875, -0.2251129150390625, -0.21628570556640625, -0.20745849609375, -0.19863128662109375, -0.1898040771484375, -0.18097686767578125, -0.172149658203125, -0.16332244873046875, -0.1544952392578125, -0.14566802978515625, -0.1368408203125, -0.12801361083984375, -0.1191864013671875, -0.11035919189453125, -0.101531982421875, -0.09270477294921875, -0.0838775634765625, -0.07505035400390625, -0.06622314453125, -0.05739593505859375, -0.0485687255859375, -0.03974151611328125, -0.030914306640625, -0.02208709716796875, -0.0132598876953125, -0.00443267822265625, 0.00439453125, 0.01322174072265625, 0.0220489501953125, 0.03087615966796875, 0.039703369140625, 0.04853057861328125, 0.0573577880859375, 0.06618499755859375, 0.07501220703125, 0.08383941650390625, 0.0926666259765625, 0.10149383544921875, 0.110321044921875, 0.11914825439453125, 0.1279754638671875, 0.13680267333984375, 0.1456298828125, 0.15445709228515625, 0.1632843017578125, 0.17211151123046875, 0.180938720703125, 0.18976593017578125, 0.1985931396484375, 0.20742034912109375, 0.21624755859375, 0.22507476806640625, 0.2339019775390625, 0.24272918701171875, 0.251556396484375, 0.26038360595703125, 0.2692108154296875, 0.27803802490234375, 0.286865234375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 5.0, 5.0, 7.0, 10.0, 13.0, 14.0, 22.0, 31.0, 35.0, 55.0, 69.0, 93.0, 103.0, 111.0, 111.0, 80.0, 63.0, 46.0, 27.0, 18.0, 15.0, 12.0, 12.0, 12.0, 4.0, 7.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2205810546875, -0.2125225067138672, -0.20446395874023438, -0.19640541076660156, -0.18834686279296875, -0.18028831481933594, -0.17222976684570312, -0.1641712188720703, -0.1561126708984375, -0.1480541229248047, -0.13999557495117188, -0.13193702697753906, -0.12387847900390625, -0.11581993103027344, -0.10776138305664062, -0.09970283508300781, -0.091644287109375, -0.08358573913574219, -0.07552719116210938, -0.06746864318847656, -0.05941009521484375, -0.05135154724121094, -0.043292999267578125, -0.03523445129394531, -0.0271759033203125, -0.019117355346679688, -0.011058807373046875, -0.0030002593994140625, 0.00505828857421875, 0.013116836547851562, 0.021175384521484375, 0.029233932495117188, 0.03729248046875, 0.04535102844238281, 0.053409576416015625, 0.06146812438964844, 0.06952667236328125, 0.07758522033691406, 0.08564376831054688, 0.09370231628417969, 0.1017608642578125, 0.10981941223144531, 0.11787796020507812, 0.12593650817871094, 0.13399505615234375, 0.14205360412597656, 0.15011215209960938, 0.1581707000732422, 0.166229248046875, 0.1742877960205078, 0.18234634399414062, 0.19040489196777344, 0.19846343994140625, 0.20652198791503906, 0.21458053588867188, 0.2226390838623047, 0.2306976318359375, 0.2387561798095703, 0.24681472778320312, 0.25487327575683594, 0.26293182373046875, 0.27099037170410156, 0.2790489196777344, 0.2871074676513672, 0.295166015625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 21.0, 50.0, 113.0, 226.0, 229.0, 156.0, 77.0, 51.0, 29.0, 13.0, 11.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.145428657531738, -7.930696487426758, -7.715964317321777, -7.501232147216797, -7.286499977111816, -7.071767807006836, -6.8570356369018555, -6.642303466796875, -6.4275712966918945, -6.212839126586914, -5.998106956481934, -5.783374786376953, -5.568642616271973, -5.353910446166992, -5.139178276062012, -4.924446105957031, -4.709713935852051, -4.49498176574707, -4.28024959564209, -4.065517425537109, -3.850785255432129, -3.6360530853271484, -3.421320915222168, -3.2065887451171875, -2.991856575012207, -2.7771244049072266, -2.562392234802246, -2.3476600646972656, -2.132927894592285, -1.9181957244873047, -1.7034635543823242, -1.4887313842773438, -1.2739992141723633, -1.0592670440673828, -0.8445348739624023, -0.6298027038574219, -0.4150705337524414, -0.20033836364746094, 0.014393806457519531, 0.2291259765625, 0.44385814666748047, 0.6585903167724609, 0.8733224868774414, 1.0880546569824219, 1.3027868270874023, 1.5175189971923828, 1.7322511672973633, 1.9469833374023438, 2.161715507507324, 2.3764476776123047, 2.591179847717285, 2.8059120178222656, 3.020644187927246, 3.2353763580322266, 3.450108528137207, 3.6648406982421875, 3.879572868347168, 4.094305038452148, 4.309037208557129, 4.523769378662109, 4.73850154876709, 4.95323371887207, 5.167965888977051, 5.382698059082031, 5.597430229187012]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 3.0, 12.0, 13.0, 15.0, 16.0, 14.0, 27.0, 23.0, 27.0, 33.0, 27.0, 43.0, 45.0, 48.0, 40.0, 71.0, 66.0, 55.0, 46.0, 52.0, 31.0, 57.0, 43.0, 32.0, 33.0, 22.0, 26.0, 13.0, 11.0, 14.0, 10.0, 3.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9072117805480957, -2.81426739692688, -2.721323013305664, -2.6283786296844482, -2.5354342460632324, -2.4424898624420166, -2.349545478820801, -2.256601095199585, -2.163656711578369, -2.0707123279571533, -1.9777679443359375, -1.8848235607147217, -1.7918791770935059, -1.69893479347229, -1.6059904098510742, -1.5130460262298584, -1.4201016426086426, -1.3271572589874268, -1.234212875366211, -1.1412684917449951, -1.0483241081237793, -0.9553797245025635, -0.8624353408813477, -0.7694909572601318, -0.676546573638916, -0.5836021900177002, -0.4906578063964844, -0.39771342277526855, -0.30476903915405273, -0.21182465553283691, -0.1188802719116211, -0.025935888290405273, 0.06700849533081055, 0.15995287895202637, 0.2528972625732422, 0.345841646194458, 0.43878602981567383, 0.5317304134368896, 0.6246747970581055, 0.7176191806793213, 0.8105635643005371, 0.9035079479217529, 0.9964523315429688, 1.0893967151641846, 1.1823410987854004, 1.2752854824066162, 1.368229866027832, 1.4611742496490479, 1.5541186332702637, 1.6470630168914795, 1.7400074005126953, 1.8329517841339111, 1.925896167755127, 2.0188405513763428, 2.1117849349975586, 2.2047293186187744, 2.2976737022399902, 2.390618085861206, 2.483562469482422, 2.5765068531036377, 2.6694512367248535, 2.7623956203460693, 2.855340003967285, 2.948284387588501, 3.041228771209717]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 7.0, 2.0, 0.0, 5.0, 7.0, 8.0, 15.0, 17.0, 17.0, 26.0, 27.0, 41.0, 50.0, 93.0, 125.0, 213.0, 346.0, 696.0, 1418.0, 2919.0, 7946.0, 81814.0, 4040667.0, 45718.0, 6812.0, 2547.0, 1240.0, 667.0, 350.0, 204.0, 101.0, 67.0, 40.0, 28.0, 17.0, 16.0, 5.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.0216217041015625, -0.979766845703125, -0.9379119873046875, -0.89605712890625, -0.8542022705078125, -0.812347412109375, -0.7704925537109375, -0.7286376953125, -0.6867828369140625, -0.644927978515625, -0.6030731201171875, -0.56121826171875, -0.5193634033203125, -0.477508544921875, -0.4356536865234375, -0.393798828125, -0.3519439697265625, -0.310089111328125, -0.2682342529296875, -0.22637939453125, -0.1845245361328125, -0.142669677734375, -0.1008148193359375, -0.0589599609375, -0.0171051025390625, 0.024749755859375, 0.0666046142578125, 0.10845947265625, 0.1503143310546875, 0.192169189453125, 0.2340240478515625, 0.27587890625, 0.3177337646484375, 0.359588623046875, 0.4014434814453125, 0.44329833984375, 0.4851531982421875, 0.527008056640625, 0.5688629150390625, 0.6107177734375, 0.6525726318359375, 0.694427490234375, 0.7362823486328125, 0.77813720703125, 0.8199920654296875, 0.861846923828125, 0.9037017822265625, 0.945556640625, 0.9874114990234375, 1.029266357421875, 1.0711212158203125, 1.11297607421875, 1.1548309326171875, 1.196685791015625, 1.2385406494140625, 1.2803955078125, 1.3222503662109375, 1.364105224609375, 1.4059600830078125, 1.44781494140625, 1.4896697998046875, 1.531524658203125, 1.5733795166015625, 1.615234375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 10.0, 22.0, 31.0, 42.0, 48.0, 63.0, 74.0, 67.0, 73.0, 107.0, 93.0, 95.0, 50.0, 51.0, 52.0, 36.0, 26.0, 19.0, 14.0, 9.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4296875, -0.41900634765625, -0.4083251953125, -0.39764404296875, -0.386962890625, -0.37628173828125, -0.3656005859375, -0.35491943359375, -0.34423828125, -0.33355712890625, -0.3228759765625, -0.31219482421875, -0.301513671875, -0.29083251953125, -0.2801513671875, -0.26947021484375, -0.2587890625, -0.24810791015625, -0.2374267578125, -0.22674560546875, -0.216064453125, -0.20538330078125, -0.1947021484375, -0.18402099609375, -0.17333984375, -0.16265869140625, -0.1519775390625, -0.14129638671875, -0.130615234375, -0.11993408203125, -0.1092529296875, -0.09857177734375, -0.087890625, -0.07720947265625, -0.0665283203125, -0.05584716796875, -0.045166015625, -0.03448486328125, -0.0238037109375, -0.01312255859375, -0.00244140625, 0.00823974609375, 0.0189208984375, 0.02960205078125, 0.040283203125, 0.05096435546875, 0.0616455078125, 0.07232666015625, 0.0830078125, 0.09368896484375, 0.1043701171875, 0.11505126953125, 0.125732421875, 0.13641357421875, 0.1470947265625, 0.15777587890625, 0.16845703125, 0.17913818359375, 0.1898193359375, 0.20050048828125, 0.211181640625, 0.22186279296875, 0.2325439453125, 0.24322509765625, 0.25390625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 6.0, 7.0, 8.0, 14.0, 21.0, 28.0, 56.0, 54.0, 91.0, 125.0, 188.0, 389.0, 1004.0, 5264.0, 4022220.0, 159977.0, 2964.0, 737.0, 382.0, 220.0, 124.0, 104.0, 70.0, 56.0, 60.0, 38.0, 16.0, 17.0, 15.0, 5.0, 4.0, 4.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.005859375, -2.89801025390625, -2.7901611328125, -2.68231201171875, -2.574462890625, -2.46661376953125, -2.3587646484375, -2.25091552734375, -2.14306640625, -2.03521728515625, -1.9273681640625, -1.81951904296875, -1.711669921875, -1.60382080078125, -1.4959716796875, -1.38812255859375, -1.2802734375, -1.17242431640625, -1.0645751953125, -0.95672607421875, -0.848876953125, -0.74102783203125, -0.6331787109375, -0.52532958984375, -0.41748046875, -0.30963134765625, -0.2017822265625, -0.09393310546875, 0.013916015625, 0.12176513671875, 0.2296142578125, 0.33746337890625, 0.4453125, 0.55316162109375, 0.6610107421875, 0.76885986328125, 0.876708984375, 0.98455810546875, 1.0924072265625, 1.20025634765625, 1.30810546875, 1.41595458984375, 1.5238037109375, 1.63165283203125, 1.739501953125, 1.84735107421875, 1.9552001953125, 2.06304931640625, 2.1708984375, 2.27874755859375, 2.3865966796875, 2.49444580078125, 2.602294921875, 2.71014404296875, 2.8179931640625, 2.92584228515625, 3.03369140625, 3.14154052734375, 3.2493896484375, 3.35723876953125, 3.465087890625, 3.57293701171875, 3.6807861328125, 3.78863525390625, 3.896484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 10.0, 43.0, 63.0, 312.0, 3159.0, 359.0, 76.0, 29.0, 13.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91796875, -0.85003662109375, -0.7821044921875, -0.71417236328125, -0.646240234375, -0.57830810546875, -0.5103759765625, -0.44244384765625, -0.37451171875, -0.30657958984375, -0.2386474609375, -0.17071533203125, -0.102783203125, -0.03485107421875, 0.0330810546875, 0.10101318359375, 0.1689453125, 0.23687744140625, 0.3048095703125, 0.37274169921875, 0.440673828125, 0.50860595703125, 0.5765380859375, 0.64447021484375, 0.71240234375, 0.78033447265625, 0.8482666015625, 0.91619873046875, 0.984130859375, 1.05206298828125, 1.1199951171875, 1.18792724609375, 1.255859375, 1.32379150390625, 1.3917236328125, 1.45965576171875, 1.527587890625, 1.59552001953125, 1.6634521484375, 1.73138427734375, 1.79931640625, 1.86724853515625, 1.9351806640625, 2.00311279296875, 2.071044921875, 2.13897705078125, 2.2069091796875, 2.27484130859375, 2.3427734375, 2.41070556640625, 2.4786376953125, 2.54656982421875, 2.614501953125, 2.68243408203125, 2.7503662109375, 2.81829833984375, 2.88623046875, 2.95416259765625, 3.0220947265625, 3.09002685546875, 3.157958984375, 3.22589111328125, 3.2938232421875, 3.36175537109375, 3.4296875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 9.0, 29.0, 132.0, 551.0, 200.0, 35.0, 21.0, 7.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.79609489440918, -27.07457733154297, -26.353057861328125, -25.631540298461914, -24.910022735595703, -24.18850326538086, -23.46698570251465, -22.745468139648438, -22.023948669433594, -21.302431106567383, -20.58091163635254, -19.859394073486328, -19.137874603271484, -18.416357040405273, -17.694839477539062, -16.97332000732422, -16.251802444458008, -15.53028392791748, -14.808765411376953, -14.087247848510742, -13.365729331970215, -12.644210815429688, -11.922693252563477, -11.20117473602295, -10.479656219482422, -9.758137702941895, -9.036619186401367, -8.315101623535156, -7.593583106994629, -6.872064590454102, -6.150546550750732, -5.429028511047363, -4.707508087158203, -3.985989809036255, -3.2644715309143066, -2.5429532527923584, -1.8214349746704102, -1.099916696548462, -0.37839841842651367, 0.34311962127685547, 1.0646381378173828, 1.786156415939331, 2.5076746940612793, 3.2291929721832275, 3.950711250305176, 4.672229766845703, 5.393747806549072, 6.115265846252441, 6.836784362792969, 7.558302879333496, 8.279821395874023, 9.001338958740234, 9.722857475280762, 10.444375991821289, 11.1658935546875, 11.887412071228027, 12.608930587768555, 13.330449104309082, 14.05196762084961, 14.77348518371582, 15.495003700256348, 16.216522216796875, 16.938039779663086, 17.659557342529297, 18.38107681274414]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 5.0, 13.0, 25.0, 22.0, 16.0, 46.0, 54.0, 61.0, 72.0, 74.0, 90.0, 85.0, 83.0, 87.0, 73.0, 50.0, 37.0, 32.0, 23.0, 12.0, 8.0, 9.0, 5.0, 9.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.369791030883789, -8.162999153137207, -7.956207752227783, -7.749415874481201, -7.542623996734619, -7.335832595825195, -7.129040718078613, -6.922248840332031, -6.715456962585449, -6.508665084838867, -6.301873683929443, -6.095081806182861, -5.888289928436279, -5.6814985275268555, -5.474706649780273, -5.267914772033691, -5.061122894287109, -4.854331016540527, -4.6475396156311035, -4.4407477378845215, -4.2339558601379395, -4.027164459228516, -3.8203725814819336, -3.6135807037353516, -3.4067893028259277, -3.199997663497925, -2.9932057857513428, -2.78641414642334, -2.579622268676758, -2.372830629348755, -2.166038990020752, -1.95924711227417, -1.752455234527588, -1.5456634759902954, -1.338871717453003, -1.132080078125, -0.9252882599830627, -0.718496561050415, -0.5117048025131226, -0.3049130439758301, -0.0981212854385376, 0.10867045819759369, 0.315462201833725, 0.5222539305686951, 0.7290456891059875, 0.9358373880386353, 1.1426291465759277, 1.3494209051132202, 1.5562126636505127, 1.7630044221878052, 1.9697961807250977, 2.1765878200531006, 2.3833796977996826, 2.5901713371276855, 2.7969632148742676, 3.0037548542022705, 3.2105464935302734, 3.4173381328582764, 3.6241300106048584, 3.8309216499328613, 4.037713527679443, 4.244504928588867, 4.451296806335449, 4.658088684082031, 4.864880561828613]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 6.0, 11.0, 15.0, 11.0, 26.0, 40.0, 59.0, 61.0, 122.0, 181.0, 348.0, 583.0, 1140.0, 2395.0, 6110.0, 17792.0, 71389.0, 446748.0, 408442.0, 65688.0, 16684.0, 5777.0, 2420.0, 1093.0, 590.0, 315.0, 163.0, 94.0, 80.0, 50.0, 27.0, 27.0, 18.0, 13.0, 4.0, 9.0, 4.0, 6.0, 3.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.8515625, -0.8257369995117188, -0.7999114990234375, -0.7740859985351562, -0.748260498046875, -0.7224349975585938, -0.6966094970703125, -0.6707839965820312, -0.64495849609375, -0.6191329956054688, -0.5933074951171875, -0.5674819946289062, -0.541656494140625, -0.5158309936523438, -0.4900054931640625, -0.46417999267578125, -0.4383544921875, -0.41252899169921875, -0.3867034912109375, -0.36087799072265625, -0.335052490234375, -0.30922698974609375, -0.2834014892578125, -0.25757598876953125, -0.23175048828125, -0.20592498779296875, -0.1800994873046875, -0.15427398681640625, -0.128448486328125, -0.10262298583984375, -0.0767974853515625, -0.05097198486328125, -0.025146484375, 0.00067901611328125, 0.0265045166015625, 0.05233001708984375, 0.078155517578125, 0.10398101806640625, 0.1298065185546875, 0.15563201904296875, 0.18145751953125, 0.20728302001953125, 0.2331085205078125, 0.25893402099609375, 0.284759521484375, 0.31058502197265625, 0.3364105224609375, 0.36223602294921875, 0.3880615234375, 0.41388702392578125, 0.4397125244140625, 0.46553802490234375, 0.491363525390625, 0.5171890258789062, 0.5430145263671875, 0.5688400268554688, 0.59466552734375, 0.6204910278320312, 0.6463165283203125, 0.6721420288085938, 0.697967529296875, 0.7237930297851562, 0.7496185302734375, 0.7754440307617188, 0.80126953125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 9.0, 16.0, 20.0, 30.0, 22.0, 43.0, 49.0, 53.0, 71.0, 102.0, 93.0, 91.0, 70.0, 78.0, 68.0, 45.0, 35.0, 30.0, 28.0, 19.0, 12.0, 9.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57666015625, -0.5625267028808594, -0.5483932495117188, -0.5342597961425781, -0.5201263427734375, -0.5059928894042969, -0.49185943603515625, -0.4777259826660156, -0.463592529296875, -0.4494590759277344, -0.43532562255859375, -0.4211921691894531, -0.4070587158203125, -0.3929252624511719, -0.37879180908203125, -0.3646583557128906, -0.35052490234375, -0.3363914489746094, -0.32225799560546875, -0.3081245422363281, -0.2939910888671875, -0.2798576354980469, -0.26572418212890625, -0.2515907287597656, -0.237457275390625, -0.22332382202148438, -0.20919036865234375, -0.19505691528320312, -0.1809234619140625, -0.16679000854492188, -0.15265655517578125, -0.13852310180664062, -0.1243896484375, -0.11025619506835938, -0.09612274169921875, -0.08198928833007812, -0.0678558349609375, -0.053722381591796875, -0.03958892822265625, -0.025455474853515625, -0.011322021484375, 0.002811431884765625, 0.01694488525390625, 0.031078338623046875, 0.0452117919921875, 0.059345245361328125, 0.07347869873046875, 0.08761215209960938, 0.10174560546875, 0.11587905883789062, 0.13001251220703125, 0.14414596557617188, 0.1582794189453125, 0.17241287231445312, 0.18654632568359375, 0.20067977905273438, 0.214813232421875, 0.22894668579101562, 0.24308013916015625, 0.2572135925292969, 0.2713470458984375, 0.2854804992675781, 0.29961395263671875, 0.3137474060058594, 0.327880859375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 8.0, 5.0, 11.0, 16.0, 19.0, 36.0, 28.0, 46.0, 54.0, 79.0, 121.0, 201.0, 313.0, 554.0, 946.0, 1967.0, 5095.0, 16519.0, 87968.0, 682940.0, 208665.0, 29518.0, 7611.0, 2718.0, 1314.0, 707.0, 354.0, 225.0, 137.0, 108.0, 69.0, 43.0, 42.0, 24.0, 17.0, 21.0, 11.0, 12.0, 8.0, 5.0, 6.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.7509765625, -0.7286911010742188, -0.7064056396484375, -0.6841201782226562, -0.661834716796875, -0.6395492553710938, -0.6172637939453125, -0.5949783325195312, -0.57269287109375, -0.5504074096679688, -0.5281219482421875, -0.5058364868164062, -0.483551025390625, -0.46126556396484375, -0.4389801025390625, -0.41669464111328125, -0.3944091796875, -0.37212371826171875, -0.3498382568359375, -0.32755279541015625, -0.305267333984375, -0.28298187255859375, -0.2606964111328125, -0.23841094970703125, -0.21612548828125, -0.19384002685546875, -0.1715545654296875, -0.14926910400390625, -0.126983642578125, -0.10469818115234375, -0.0824127197265625, -0.06012725830078125, -0.037841796875, -0.01555633544921875, 0.0067291259765625, 0.02901458740234375, 0.051300048828125, 0.07358551025390625, 0.0958709716796875, 0.11815643310546875, 0.14044189453125, 0.16272735595703125, 0.1850128173828125, 0.20729827880859375, 0.229583740234375, 0.25186920166015625, 0.2741546630859375, 0.29644012451171875, 0.3187255859375, 0.34101104736328125, 0.3632965087890625, 0.38558197021484375, 0.407867431640625, 0.43015289306640625, 0.4524383544921875, 0.47472381591796875, 0.49700927734375, 0.5192947387695312, 0.5415802001953125, 0.5638656616210938, 0.586151123046875, 0.6084365844726562, 0.6307220458984375, 0.6530075073242188, 0.67529296875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 0.0, 6.0, 9.0, 9.0, 2.0, 10.0, 6.0, 12.0, 16.0, 19.0, 22.0, 18.0, 18.0, 25.0, 21.0, 36.0, 41.0, 26.0, 36.0, 42.0, 51.0, 45.0, 51.0, 32.0, 48.0, 37.0, 32.0, 35.0, 28.0, 39.0, 34.0, 32.0, 20.0, 14.0, 26.0, 18.0, 11.0, 10.0, 11.0, 11.0, 8.0, 7.0, 4.0, 4.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.72265625, -0.7006912231445312, -0.6787261962890625, -0.6567611694335938, -0.634796142578125, -0.6128311157226562, -0.5908660888671875, -0.5689010620117188, -0.54693603515625, -0.5249710083007812, -0.5030059814453125, -0.48104095458984375, -0.459075927734375, -0.43711090087890625, -0.4151458740234375, -0.39318084716796875, -0.3712158203125, -0.34925079345703125, -0.3272857666015625, -0.30532073974609375, -0.283355712890625, -0.26139068603515625, -0.2394256591796875, -0.21746063232421875, -0.19549560546875, -0.17353057861328125, -0.1515655517578125, -0.12960052490234375, -0.107635498046875, -0.08567047119140625, -0.0637054443359375, -0.04174041748046875, -0.019775390625, 0.00218963623046875, 0.0241546630859375, 0.04611968994140625, 0.068084716796875, 0.09004974365234375, 0.1120147705078125, 0.13397979736328125, 0.15594482421875, 0.17790985107421875, 0.1998748779296875, 0.22183990478515625, 0.243804931640625, 0.26576995849609375, 0.2877349853515625, 0.30970001220703125, 0.3316650390625, 0.35363006591796875, 0.3755950927734375, 0.39756011962890625, 0.419525146484375, 0.44149017333984375, 0.4634552001953125, 0.48542022705078125, 0.50738525390625, 0.5293502807617188, 0.5513153076171875, 0.5732803344726562, 0.595245361328125, 0.6172103881835938, 0.6391754150390625, 0.6611404418945312, 0.68310546875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 11.0, 16.0, 26.0, 58.0, 109.0, 208.0, 458.0, 1478.0, 7197.0, 92810.0, 908046.0, 32391.0, 4089.0, 979.0, 341.0, 155.0, 75.0, 38.0, 25.0, 12.0, 5.0, 11.0, 2.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64990234375, -0.62847900390625, -0.6070556640625, -0.58563232421875, -0.564208984375, -0.54278564453125, -0.5213623046875, -0.49993896484375, -0.478515625, -0.45709228515625, -0.4356689453125, -0.41424560546875, -0.392822265625, -0.37139892578125, -0.3499755859375, -0.32855224609375, -0.30712890625, -0.28570556640625, -0.2642822265625, -0.24285888671875, -0.221435546875, -0.20001220703125, -0.1785888671875, -0.15716552734375, -0.1357421875, -0.11431884765625, -0.0928955078125, -0.07147216796875, -0.050048828125, -0.02862548828125, -0.0072021484375, 0.01422119140625, 0.03564453125, 0.05706787109375, 0.0784912109375, 0.09991455078125, 0.121337890625, 0.14276123046875, 0.1641845703125, 0.18560791015625, 0.20703125, 0.22845458984375, 0.2498779296875, 0.27130126953125, 0.292724609375, 0.31414794921875, 0.3355712890625, 0.35699462890625, 0.37841796875, 0.39984130859375, 0.4212646484375, 0.44268798828125, 0.464111328125, 0.48553466796875, 0.5069580078125, 0.52838134765625, 0.5498046875, 0.57122802734375, 0.5926513671875, 0.61407470703125, 0.635498046875, 0.65692138671875, 0.6783447265625, 0.69976806640625, 0.72119140625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 4.0, 5.0, 10.0, 11.0, 18.0, 29.0, 45.0, 67.0, 101.0, 181.0, 213.0, 124.0, 78.0, 42.0, 20.0, 20.0, 8.0, 8.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010281801223754883, -9.903218597173691e-05, -9.524635970592499e-05, -9.146053344011307e-05, -8.767470717430115e-05, -8.388888090848923e-05, -8.010305464267731e-05, -7.631722837686539e-05, -7.253140211105347e-05, -6.874557584524155e-05, -6.495974957942963e-05, -6.11739233136177e-05, -5.7388097047805786e-05, -5.3602270781993866e-05, -4.9816444516181946e-05, -4.6030618250370026e-05, -4.2244791984558105e-05, -3.8458965718746185e-05, -3.4673139452934265e-05, -3.0887313187122345e-05, -2.7101486921310425e-05, -2.3315660655498505e-05, -1.9529834389686584e-05, -1.5744008123874664e-05, -1.1958181858062744e-05, -8.172355592250824e-06, -4.386529326438904e-06, -6.007030606269836e-07, 3.1851232051849365e-06, 6.970949470996857e-06, 1.0756775736808777e-05, 1.4542602002620697e-05, 1.8328428268432617e-05, 2.2114254534244537e-05, 2.5900080800056458e-05, 2.9685907065868378e-05, 3.34717333316803e-05, 3.725755959749222e-05, 4.104338586330414e-05, 4.482921212911606e-05, 4.861503839492798e-05, 5.24008646607399e-05, 5.618669092655182e-05, 5.997251719236374e-05, 6.375834345817566e-05, 6.754416972398758e-05, 7.13299959897995e-05, 7.511582225561142e-05, 7.890164852142334e-05, 8.268747478723526e-05, 8.647330105304718e-05, 9.02591273188591e-05, 9.404495358467102e-05, 9.783077985048294e-05, 0.00010161660611629486, 0.00010540243238210678, 0.0001091882586479187, 0.00011297408491373062, 0.00011675991117954254, 0.00012054573744535446, 0.00012433156371116638, 0.0001281173899769783, 0.00013190321624279022, 0.00013568904250860214, 0.00013947486877441406]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 15.0, 15.0, 15.0, 20.0, 36.0, 71.0, 90.0, 130.0, 189.0, 301.0, 515.0, 986.0, 1663.0, 3542.0, 8785.0, 27888.0, 160373.0, 710656.0, 98543.0, 20916.0, 7035.0, 3032.0, 1621.0, 851.0, 450.0, 267.0, 178.0, 109.0, 94.0, 48.0, 44.0, 20.0, 18.0, 8.0, 9.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32421875, -0.3135490417480469, -0.30287933349609375, -0.2922096252441406, -0.2815399169921875, -0.2708702087402344, -0.26020050048828125, -0.24953079223632812, -0.238861083984375, -0.22819137573242188, -0.21752166748046875, -0.20685195922851562, -0.1961822509765625, -0.18551254272460938, -0.17484283447265625, -0.16417312622070312, -0.15350341796875, -0.14283370971679688, -0.13216400146484375, -0.12149429321289062, -0.1108245849609375, -0.10015487670898438, -0.08948516845703125, -0.07881546020507812, -0.068145751953125, -0.057476043701171875, -0.04680633544921875, -0.036136627197265625, -0.0254669189453125, -0.014797210693359375, -0.00412750244140625, 0.006542205810546875, 0.0172119140625, 0.027881622314453125, 0.03855133056640625, 0.049221038818359375, 0.0598907470703125, 0.07056045532226562, 0.08123016357421875, 0.09189987182617188, 0.102569580078125, 0.11323928833007812, 0.12390899658203125, 0.13457870483398438, 0.1452484130859375, 0.15591812133789062, 0.16658782958984375, 0.17725753784179688, 0.18792724609375, 0.19859695434570312, 0.20926666259765625, 0.21993637084960938, 0.2306060791015625, 0.24127578735351562, 0.25194549560546875, 0.2626152038574219, 0.273284912109375, 0.2839546203613281, 0.29462432861328125, 0.3052940368652344, 0.3159637451171875, 0.3266334533691406, 0.33730316162109375, 0.3479728698730469, 0.358642578125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 4.0, 3.0, 9.0, 12.0, 11.0, 6.0, 21.0, 22.0, 22.0, 26.0, 47.0, 50.0, 61.0, 71.0, 86.0, 81.0, 81.0, 68.0, 58.0, 44.0, 34.0, 29.0, 30.0, 23.0, 14.0, 23.0, 15.0, 8.0, 9.0, 6.0, 5.0, 3.0, 3.0, 9.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.246337890625, -0.2389812469482422, -0.23162460327148438, -0.22426795959472656, -0.21691131591796875, -0.20955467224121094, -0.20219802856445312, -0.1948413848876953, -0.1874847412109375, -0.1801280975341797, -0.17277145385742188, -0.16541481018066406, -0.15805816650390625, -0.15070152282714844, -0.14334487915039062, -0.1359882354736328, -0.128631591796875, -0.12127494812011719, -0.11391830444335938, -0.10656166076660156, -0.09920501708984375, -0.09184837341308594, -0.08449172973632812, -0.07713508605957031, -0.0697784423828125, -0.06242179870605469, -0.055065155029296875, -0.04770851135253906, -0.04035186767578125, -0.03299522399902344, -0.025638580322265625, -0.018281936645507812, -0.01092529296875, -0.0035686492919921875, 0.003787994384765625, 0.011144638061523438, 0.01850128173828125, 0.025857925415039062, 0.033214569091796875, 0.04057121276855469, 0.0479278564453125, 0.05528450012207031, 0.06264114379882812, 0.06999778747558594, 0.07735443115234375, 0.08471107482910156, 0.09206771850585938, 0.09942436218261719, 0.106781005859375, 0.11413764953613281, 0.12149429321289062, 0.12885093688964844, 0.13620758056640625, 0.14356422424316406, 0.15092086791992188, 0.1582775115966797, 0.1656341552734375, 0.1729907989501953, 0.18034744262695312, 0.18770408630371094, 0.19506072998046875, 0.20241737365722656, 0.20977401733398438, 0.2171306610107422, 0.2244873046875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 14.0, 49.0, 107.0, 200.0, 292.0, 185.0, 79.0, 36.0, 17.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2016143798828125, -5.936796188354492, -5.671977519989014, -5.407158851623535, -5.142340660095215, -4.8775224685668945, -4.612703800201416, -4.3478851318359375, -4.083066940307617, -3.8182485103607178, -3.5534300804138184, -3.288611650466919, -3.0237932205200195, -2.75897479057312, -2.4941563606262207, -2.2293379306793213, -1.9645195007324219, -1.6997010707855225, -1.434882640838623, -1.1700642108917236, -0.9052457809448242, -0.6404273509979248, -0.3756089210510254, -0.11079049110412598, 0.15402793884277344, 0.41884636878967285, 0.6836647987365723, 0.9484832286834717, 1.213301658630371, 1.4781200885772705, 1.74293851852417, 2.0077569484710693, 2.2725744247436523, 2.5373928546905518, 2.802211284637451, 3.0670297145843506, 3.33184814453125, 3.5966665744781494, 3.861485004425049, 4.126303672790527, 4.391121864318848, 4.655940055847168, 4.9207587242126465, 5.185577392578125, 5.450395584106445, 5.715213775634766, 5.980032444000244, 6.244851112365723, 6.509669303894043, 6.774487495422363, 7.039306163787842, 7.30412483215332, 7.568943023681641, 7.833761215209961, 8.098579406738281, 8.363398551940918, 8.628216743469238, 8.893034934997559, 9.157854080200195, 9.422672271728516, 9.687490463256836, 9.952308654785156, 10.217126846313477, 10.481945991516113, 10.746764183044434]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 9.0, 8.0, 2.0, 15.0, 6.0, 11.0, 9.0, 15.0, 27.0, 28.0, 32.0, 36.0, 27.0, 60.0, 51.0, 43.0, 56.0, 53.0, 56.0, 72.0, 56.0, 34.0, 49.0, 32.0, 33.0, 24.0, 22.0, 20.0, 31.0, 16.0, 14.0, 13.0, 10.0, 6.0, 5.0, 9.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.831061840057373, -3.7147722244262695, -3.598482608795166, -3.4821929931640625, -3.365903615951538, -3.2496140003204346, -3.133324384689331, -3.0170347690582275, -2.900745391845703, -2.7844557762145996, -2.668166160583496, -2.5518765449523926, -2.435587167739868, -2.3192975521087646, -2.203007936477661, -2.0867183208465576, -1.970428705215454, -1.8541390895843506, -1.7378495931625366, -1.621559977531433, -1.5052704811096191, -1.3889808654785156, -1.272691249847412, -1.1564016342163086, -1.0401121377944946, -0.9238225817680359, -0.8075330257415771, -0.6912434101104736, -0.5749538540840149, -0.45866429805755615, -0.34237468242645264, -0.2260851263999939, -0.10979580879211426, 0.006493762135505676, 0.12278333306312561, 0.23907291889190674, 0.3553624749183655, 0.4716520309448242, 0.5879416465759277, 0.7042312026023865, 0.8205207586288452, 0.936810314655304, 1.0530998706817627, 1.1693894863128662, 1.2856791019439697, 1.4019685983657837, 1.5182582139968872, 1.6345477104187012, 1.7508373260498047, 1.8671269416809082, 1.9834164381027222, 2.0997061729431152, 2.2159955501556396, 2.332285165786743, 2.4485747814178467, 2.56486439704895, 2.6811537742614746, 2.797443389892578, 2.9137330055236816, 3.030022621154785, 3.1463119983673096, 3.262601613998413, 3.3788912296295166, 3.49518084526062, 3.6114704608917236]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 6.0, 7.0, 11.0, 17.0, 22.0, 18.0, 36.0, 43.0, 48.0, 65.0, 84.0, 128.0, 197.0, 320.0, 550.0, 1105.0, 2411.0, 6049.0, 17977.0, 213000.0, 3856355.0, 72142.0, 14755.0, 4823.0, 2102.0, 1004.0, 416.0, 254.0, 132.0, 75.0, 43.0, 38.0, 15.0, 9.0, 8.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6337890625, -1.5911865234375, -1.548583984375, -1.5059814453125, -1.46337890625, -1.4207763671875, -1.378173828125, -1.3355712890625, -1.29296875, -1.2503662109375, -1.207763671875, -1.1651611328125, -1.12255859375, -1.0799560546875, -1.037353515625, -0.9947509765625, -0.9521484375, -0.9095458984375, -0.866943359375, -0.8243408203125, -0.78173828125, -0.7391357421875, -0.696533203125, -0.6539306640625, -0.611328125, -0.5687255859375, -0.526123046875, -0.4835205078125, -0.44091796875, -0.3983154296875, -0.355712890625, -0.3131103515625, -0.2705078125, -0.2279052734375, -0.185302734375, -0.1427001953125, -0.10009765625, -0.0574951171875, -0.014892578125, 0.0277099609375, 0.0703125, 0.1129150390625, 0.155517578125, 0.1981201171875, 0.24072265625, 0.2833251953125, 0.325927734375, 0.3685302734375, 0.4111328125, 0.4537353515625, 0.496337890625, 0.5389404296875, 0.58154296875, 0.6241455078125, 0.666748046875, 0.7093505859375, 0.751953125, 0.7945556640625, 0.837158203125, 0.8797607421875, 0.92236328125, 0.9649658203125, 1.007568359375, 1.0501708984375, 1.0927734375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 11.0, 10.0, 20.0, 28.0, 24.0, 40.0, 53.0, 68.0, 62.0, 94.0, 90.0, 87.0, 87.0, 74.0, 66.0, 57.0, 37.0, 25.0, 30.0, 21.0, 8.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55322265625, -0.5396728515625, -0.526123046875, -0.5125732421875, -0.4990234375, -0.4854736328125, -0.471923828125, -0.4583740234375, -0.44482421875, -0.4312744140625, -0.417724609375, -0.4041748046875, -0.390625, -0.3770751953125, -0.363525390625, -0.3499755859375, -0.33642578125, -0.3228759765625, -0.309326171875, -0.2957763671875, -0.2822265625, -0.2686767578125, -0.255126953125, -0.2415771484375, -0.22802734375, -0.2144775390625, -0.200927734375, -0.1873779296875, -0.173828125, -0.1602783203125, -0.146728515625, -0.1331787109375, -0.11962890625, -0.1060791015625, -0.092529296875, -0.0789794921875, -0.0654296875, -0.0518798828125, -0.038330078125, -0.0247802734375, -0.01123046875, 0.0023193359375, 0.015869140625, 0.0294189453125, 0.04296875, 0.0565185546875, 0.070068359375, 0.0836181640625, 0.09716796875, 0.1107177734375, 0.124267578125, 0.1378173828125, 0.1513671875, 0.1649169921875, 0.178466796875, 0.1920166015625, 0.20556640625, 0.2191162109375, 0.232666015625, 0.2462158203125, 0.259765625, 0.2733154296875, 0.286865234375, 0.3004150390625, 0.31396484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 2.0, 5.0, 15.0, 16.0, 17.0, 38.0, 58.0, 100.0, 181.0, 497.0, 1812.0, 14568.0, 3967775.0, 200241.0, 6926.0, 1122.0, 339.0, 163.0, 110.0, 71.0, 66.0, 43.0, 34.0, 22.0, 23.0, 14.0, 12.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.22265625, -2.12939453125, -2.0361328125, -1.94287109375, -1.849609375, -1.75634765625, -1.6630859375, -1.56982421875, -1.4765625, -1.38330078125, -1.2900390625, -1.19677734375, -1.103515625, -1.01025390625, -0.9169921875, -0.82373046875, -0.73046875, -0.63720703125, -0.5439453125, -0.45068359375, -0.357421875, -0.26416015625, -0.1708984375, -0.07763671875, 0.015625, 0.10888671875, 0.2021484375, 0.29541015625, 0.388671875, 0.48193359375, 0.5751953125, 0.66845703125, 0.76171875, 0.85498046875, 0.9482421875, 1.04150390625, 1.134765625, 1.22802734375, 1.3212890625, 1.41455078125, 1.5078125, 1.60107421875, 1.6943359375, 1.78759765625, 1.880859375, 1.97412109375, 2.0673828125, 2.16064453125, 2.25390625, 2.34716796875, 2.4404296875, 2.53369140625, 2.626953125, 2.72021484375, 2.8134765625, 2.90673828125, 3.0, 3.09326171875, 3.1865234375, 3.27978515625, 3.373046875, 3.46630859375, 3.5595703125, 3.65283203125, 3.74609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 11.0, 13.0, 27.0, 53.0, 133.0, 673.0, 2426.0, 481.0, 118.0, 66.0, 33.0, 19.0, 12.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8447265625, -0.7819671630859375, -0.719207763671875, -0.6564483642578125, -0.59368896484375, -0.5309295654296875, -0.468170166015625, -0.4054107666015625, -0.3426513671875, -0.2798919677734375, -0.217132568359375, -0.1543731689453125, -0.09161376953125, -0.0288543701171875, 0.033905029296875, 0.0966644287109375, 0.159423828125, 0.2221832275390625, 0.284942626953125, 0.3477020263671875, 0.41046142578125, 0.4732208251953125, 0.535980224609375, 0.5987396240234375, 0.6614990234375, 0.7242584228515625, 0.787017822265625, 0.8497772216796875, 0.91253662109375, 0.9752960205078125, 1.038055419921875, 1.1008148193359375, 1.16357421875, 1.2263336181640625, 1.289093017578125, 1.3518524169921875, 1.41461181640625, 1.4773712158203125, 1.540130615234375, 1.6028900146484375, 1.6656494140625, 1.7284088134765625, 1.791168212890625, 1.8539276123046875, 1.91668701171875, 1.9794464111328125, 2.042205810546875, 2.1049652099609375, 2.167724609375, 2.2304840087890625, 2.293243408203125, 2.3560028076171875, 2.41876220703125, 2.4815216064453125, 2.544281005859375, 2.6070404052734375, 2.6697998046875, 2.7325592041015625, 2.795318603515625, 2.8580780029296875, 2.92083740234375, 2.9835968017578125, 3.046356201171875, 3.1091156005859375, 3.171875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 9.0, 17.0, 35.0, 54.0, 95.0, 226.0, 255.0, 138.0, 64.0, 32.0, 21.0, 15.0, 11.0, 7.0, 1.0, 2.0, 6.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7258501052856445, -7.362420558929443, -6.998991012573242, -6.635560989379883, -6.272131443023682, -5.9087018966674805, -5.545271873474121, -5.18184232711792, -4.818412780761719, -4.454983234405518, -4.091553688049316, -3.728123664855957, -3.364694118499756, -3.0012645721435547, -2.6378347873687744, -2.274405002593994, -1.910975456237793, -1.5475457906723022, -1.1841161251068115, -0.8206864595413208, -0.4572567939758301, -0.09382712841033936, 0.26960253715515137, 0.6330323219299316, 0.9964618682861328, 1.3598915338516235, 1.7233211994171143, 2.0867509841918945, 2.4501805305480957, 2.813610076904297, 3.177039861679077, 3.5404696464538574, 3.903900146484375, 4.267329692840576, 4.630759239196777, 4.994189262390137, 5.357618808746338, 5.721048355102539, 6.084478378295898, 6.4479079246521, 6.811337471008301, 7.174767017364502, 7.538196563720703, 7.9016265869140625, 8.265056610107422, 8.628485679626465, 8.991915702819824, 9.355344772338867, 9.718774795532227, 10.082204818725586, 10.445633888244629, 10.809063911437988, 11.172492980957031, 11.53592300415039, 11.89935302734375, 12.26278305053711, 12.626212120056152, 12.989642143249512, 13.353071212768555, 13.716501235961914, 14.079931259155273, 14.443360328674316, 14.806790351867676, 15.170219421386719, 15.533649444580078]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 1.0, 1.0, 6.0, 10.0, 12.0, 22.0, 18.0, 26.0, 28.0, 27.0, 50.0, 43.0, 45.0, 55.0, 71.0, 70.0, 62.0, 69.0, 69.0, 54.0, 40.0, 30.0, 39.0, 36.0, 36.0, 17.0, 20.0, 14.0, 10.0, 9.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.195430755615234, -4.047861576080322, -3.9002926349639893, -3.7527236938476562, -3.605154514312744, -3.457585573196411, -3.310016632080078, -3.162447452545166, -3.014878511428833, -2.8673095703125, -2.719740390777588, -2.572171449661255, -2.424602508544922, -2.2770333290100098, -2.1294643878936768, -1.9818953275680542, -1.8343262672424316, -1.686757206916809, -1.5391881465911865, -1.3916192054748535, -1.244050145149231, -1.0964810848236084, -0.9489120841026306, -0.8013430833816528, -0.6537740230560303, -0.5062049627304077, -0.35863596200942993, -0.21106693148612976, -0.06349790096282959, 0.08407115936279297, 0.23164016008377075, 0.37920916080474854, 0.5267786979675293, 0.6743477582931519, 0.8219167590141296, 0.9694857597351074, 1.11705482006073, 1.2646238803863525, 1.4121928215026855, 1.559761881828308, 1.7073309421539307, 1.8549000024795532, 2.002469062805176, 2.150038003921509, 2.297606945037842, 2.445176124572754, 2.592745065689087, 2.74031400680542, 2.887883186340332, 3.035452127456665, 3.183021306991577, 3.33059024810791, 3.4781594276428223, 3.6257283687591553, 3.7732973098754883, 3.9208664894104004, 4.0684356689453125, 4.216004848480225, 4.3635735511779785, 4.511142730712891, 4.658711910247803, 4.806281089782715, 4.953849792480469, 5.101418972015381, 5.248987674713135]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 15.0, 13.0, 5.0, 28.0, 34.0, 46.0, 75.0, 96.0, 207.0, 295.0, 543.0, 1127.0, 2528.0, 6605.0, 22451.0, 134162.0, 696438.0, 147758.0, 24014.0, 6862.0, 2597.0, 1189.0, 609.0, 307.0, 192.0, 114.0, 79.0, 50.0, 29.0, 20.0, 12.0, 10.0, 19.0, 8.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.0791015625, -1.0437469482421875, -1.008392333984375, -0.9730377197265625, -0.93768310546875, -0.9023284912109375, -0.866973876953125, -0.8316192626953125, -0.7962646484375, -0.7609100341796875, -0.725555419921875, -0.6902008056640625, -0.65484619140625, -0.6194915771484375, -0.584136962890625, -0.5487823486328125, -0.513427734375, -0.4780731201171875, -0.442718505859375, -0.4073638916015625, -0.37200927734375, -0.3366546630859375, -0.301300048828125, -0.2659454345703125, -0.2305908203125, -0.1952362060546875, -0.159881591796875, -0.1245269775390625, -0.08917236328125, -0.0538177490234375, -0.018463134765625, 0.0168914794921875, 0.05224609375, 0.0876007080078125, 0.122955322265625, 0.1583099365234375, 0.19366455078125, 0.2290191650390625, 0.264373779296875, 0.2997283935546875, 0.3350830078125, 0.3704376220703125, 0.405792236328125, 0.4411468505859375, 0.47650146484375, 0.5118560791015625, 0.547210693359375, 0.5825653076171875, 0.617919921875, 0.6532745361328125, 0.688629150390625, 0.7239837646484375, 0.75933837890625, 0.7946929931640625, 0.830047607421875, 0.8654022216796875, 0.9007568359375, 0.9361114501953125, 0.971466064453125, 1.0068206787109375, 1.04217529296875, 1.0775299072265625, 1.112884521484375, 1.1482391357421875, 1.18359375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 8.0, 8.0, 7.0, 19.0, 27.0, 31.0, 52.0, 48.0, 55.0, 57.0, 82.0, 88.0, 86.0, 82.0, 73.0, 62.0, 56.0, 52.0, 33.0, 24.0, 18.0, 8.0, 7.0, 5.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.61572265625, -0.6013717651367188, -0.5870208740234375, -0.5726699829101562, -0.558319091796875, -0.5439682006835938, -0.5296173095703125, -0.5152664184570312, -0.50091552734375, -0.48656463623046875, -0.4722137451171875, -0.45786285400390625, -0.443511962890625, -0.42916107177734375, -0.4148101806640625, -0.40045928955078125, -0.3861083984375, -0.37175750732421875, -0.3574066162109375, -0.34305572509765625, -0.328704833984375, -0.31435394287109375, -0.3000030517578125, -0.28565216064453125, -0.27130126953125, -0.25695037841796875, -0.2425994873046875, -0.22824859619140625, -0.213897705078125, -0.19954681396484375, -0.1851959228515625, -0.17084503173828125, -0.156494140625, -0.14214324951171875, -0.1277923583984375, -0.11344146728515625, -0.099090576171875, -0.08473968505859375, -0.0703887939453125, -0.05603790283203125, -0.04168701171875, -0.02733612060546875, -0.0129852294921875, 0.00136566162109375, 0.015716552734375, 0.03006744384765625, 0.0444183349609375, 0.05876922607421875, 0.0731201171875, 0.08747100830078125, 0.1018218994140625, 0.11617279052734375, 0.130523681640625, 0.14487457275390625, 0.1592254638671875, 0.17357635498046875, 0.18792724609375, 0.20227813720703125, 0.2166290283203125, 0.23097991943359375, 0.245330810546875, 0.25968170166015625, 0.2740325927734375, 0.28838348388671875, 0.302734375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 4.0, 9.0, 10.0, 12.0, 16.0, 16.0, 38.0, 53.0, 70.0, 118.0, 162.0, 235.0, 411.0, 696.0, 1440.0, 3220.0, 10951.0, 75998.0, 821737.0, 112050.0, 14000.0, 3809.0, 1548.0, 773.0, 413.0, 237.0, 157.0, 117.0, 65.0, 52.0, 34.0, 25.0, 20.0, 14.0, 11.0, 12.0, 4.0, 8.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.107421875, -1.069976806640625, -1.03253173828125, -0.995086669921875, -0.9576416015625, -0.920196533203125, -0.88275146484375, -0.845306396484375, -0.807861328125, -0.770416259765625, -0.73297119140625, -0.695526123046875, -0.6580810546875, -0.620635986328125, -0.58319091796875, -0.545745849609375, -0.50830078125, -0.470855712890625, -0.43341064453125, -0.395965576171875, -0.3585205078125, -0.321075439453125, -0.28363037109375, -0.246185302734375, -0.208740234375, -0.171295166015625, -0.13385009765625, -0.096405029296875, -0.0589599609375, -0.021514892578125, 0.01593017578125, 0.053375244140625, 0.0908203125, 0.128265380859375, 0.16571044921875, 0.203155517578125, 0.2406005859375, 0.278045654296875, 0.31549072265625, 0.352935791015625, 0.390380859375, 0.427825927734375, 0.46527099609375, 0.502716064453125, 0.5401611328125, 0.577606201171875, 0.61505126953125, 0.652496337890625, 0.68994140625, 0.727386474609375, 0.76483154296875, 0.802276611328125, 0.8397216796875, 0.877166748046875, 0.91461181640625, 0.952056884765625, 0.989501953125, 1.026947021484375, 1.06439208984375, 1.101837158203125, 1.1392822265625, 1.176727294921875, 1.21417236328125, 1.251617431640625, 1.2890625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 7.0, 8.0, 15.0, 17.0, 15.0, 25.0, 19.0, 27.0, 26.0, 34.0, 36.0, 45.0, 44.0, 50.0, 46.0, 52.0, 50.0, 36.0, 57.0, 37.0, 39.0, 43.0, 23.0, 32.0, 42.0, 30.0, 18.0, 19.0, 19.0, 21.0, 10.0, 8.0, 8.0, 7.0, 6.0, 2.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.0419921875, -1.0101547241210938, -0.9783172607421875, -0.9464797973632812, -0.914642333984375, -0.8828048706054688, -0.8509674072265625, -0.8191299438476562, -0.78729248046875, -0.7554550170898438, -0.7236175537109375, -0.6917800903320312, -0.659942626953125, -0.6281051635742188, -0.5962677001953125, -0.5644302368164062, -0.5325927734375, -0.5007553100585938, -0.4689178466796875, -0.43708038330078125, -0.405242919921875, -0.37340545654296875, -0.3415679931640625, -0.30973052978515625, -0.27789306640625, -0.24605560302734375, -0.2142181396484375, -0.18238067626953125, -0.150543212890625, -0.11870574951171875, -0.0868682861328125, -0.05503082275390625, -0.023193359375, 0.00864410400390625, 0.0404815673828125, 0.07231903076171875, 0.104156494140625, 0.13599395751953125, 0.1678314208984375, 0.19966888427734375, 0.23150634765625, 0.26334381103515625, 0.2951812744140625, 0.32701873779296875, 0.358856201171875, 0.39069366455078125, 0.4225311279296875, 0.45436859130859375, 0.4862060546875, 0.5180435180664062, 0.5498809814453125, 0.5817184448242188, 0.613555908203125, 0.6453933715820312, 0.6772308349609375, 0.7090682983398438, 0.74090576171875, 0.7727432250976562, 0.8045806884765625, 0.8364181518554688, 0.868255615234375, 0.9000930786132812, 0.9319305419921875, 0.9637680053710938, 0.99560546875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 5.0, 3.0, 4.0, 7.0, 19.0, 12.0, 24.0, 41.0, 48.0, 92.0, 129.0, 257.0, 418.0, 794.0, 1679.0, 3211.0, 7147.0, 18839.0, 88068.0, 831444.0, 66846.0, 16820.0, 6540.0, 2957.0, 1368.0, 731.0, 388.0, 245.0, 154.0, 81.0, 69.0, 42.0, 23.0, 8.0, 10.0, 5.0, 8.0, 6.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56201171875, -0.5452041625976562, -0.5283966064453125, -0.5115890502929688, -0.494781494140625, -0.47797393798828125, -0.4611663818359375, -0.44435882568359375, -0.42755126953125, -0.41074371337890625, -0.3939361572265625, -0.37712860107421875, -0.360321044921875, -0.34351348876953125, -0.3267059326171875, -0.30989837646484375, -0.2930908203125, -0.27628326416015625, -0.2594757080078125, -0.24266815185546875, -0.225860595703125, -0.20905303955078125, -0.1922454833984375, -0.17543792724609375, -0.15863037109375, -0.14182281494140625, -0.1250152587890625, -0.10820770263671875, -0.091400146484375, -0.07459259033203125, -0.0577850341796875, -0.04097747802734375, -0.024169921875, -0.00736236572265625, 0.0094451904296875, 0.02625274658203125, 0.043060302734375, 0.05986785888671875, 0.0766754150390625, 0.09348297119140625, 0.11029052734375, 0.12709808349609375, 0.1439056396484375, 0.16071319580078125, 0.177520751953125, 0.19432830810546875, 0.2111358642578125, 0.22794342041015625, 0.2447509765625, 0.26155853271484375, 0.2783660888671875, 0.29517364501953125, 0.311981201171875, 0.32878875732421875, 0.3455963134765625, 0.36240386962890625, 0.37921142578125, 0.39601898193359375, 0.4128265380859375, 0.42963409423828125, 0.446441650390625, 0.46324920654296875, 0.4800567626953125, 0.49686431884765625, 0.513671875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 6.0, 1.0, 3.0, 7.0, 11.0, 11.0, 15.0, 24.0, 31.0, 59.0, 117.0, 252.0, 216.0, 88.0, 45.0, 27.0, 14.0, 13.0, 13.0, 6.0, 6.0, 2.0, 4.0, 2.0, 4.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002143383026123047, -0.00020739808678627014, -0.0002004578709602356, -0.00019351765513420105, -0.0001865774393081665, -0.00017963722348213196, -0.0001726970076560974, -0.00016575679183006287, -0.00015881657600402832, -0.00015187636017799377, -0.00014493614435195923, -0.00013799592852592468, -0.00013105571269989014, -0.0001241154968738556, -0.00011717528104782104, -0.0001102350652217865, -0.00010329484939575195, -9.635463356971741e-05, -8.941441774368286e-05, -8.247420191764832e-05, -7.553398609161377e-05, -6.859377026557922e-05, -6.165355443954468e-05, -5.471333861351013e-05, -4.7773122787475586e-05, -4.083290696144104e-05, -3.3892691135406494e-05, -2.6952475309371948e-05, -2.0012259483337402e-05, -1.3072043657302856e-05, -6.1318278312683105e-06, 8.083879947662354e-07, 7.748603820800781e-06, 1.4688819646835327e-05, 2.1629035472869873e-05, 2.856925129890442e-05, 3.5509467124938965e-05, 4.244968295097351e-05, 4.938989877700806e-05, 5.63301146030426e-05, 6.327033042907715e-05, 7.02105462551117e-05, 7.715076208114624e-05, 8.409097790718079e-05, 9.103119373321533e-05, 9.797140955924988e-05, 0.00010491162538528442, 0.00011185184121131897, 0.00011879205703735352, 0.00012573227286338806, 0.0001326724886894226, 0.00013961270451545715, 0.0001465529203414917, 0.00015349313616752625, 0.0001604333519935608, 0.00016737356781959534, 0.00017431378364562988, 0.00018125399947166443, 0.00018819421529769897, 0.00019513443112373352, 0.00020207464694976807, 0.0002090148627758026, 0.00021595507860183716, 0.0002228952944278717, 0.00022983551025390625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 8.0, 9.0, 11.0, 21.0, 30.0, 40.0, 63.0, 129.0, 211.0, 529.0, 1219.0, 3145.0, 9224.0, 43423.0, 885788.0, 84416.0, 13485.0, 3954.0, 1496.0, 680.0, 288.0, 164.0, 83.0, 52.0, 21.0, 20.0, 17.0, 9.0, 8.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7646484375, -0.7412185668945312, -0.7177886962890625, -0.6943588256835938, -0.670928955078125, -0.6474990844726562, -0.6240692138671875, -0.6006393432617188, -0.57720947265625, -0.5537796020507812, -0.5303497314453125, -0.5069198608398438, -0.483489990234375, -0.46006011962890625, -0.4366302490234375, -0.41320037841796875, -0.3897705078125, -0.36634063720703125, -0.3429107666015625, -0.31948089599609375, -0.296051025390625, -0.27262115478515625, -0.2491912841796875, -0.22576141357421875, -0.20233154296875, -0.17890167236328125, -0.1554718017578125, -0.13204193115234375, -0.108612060546875, -0.08518218994140625, -0.0617523193359375, -0.03832244873046875, -0.014892578125, 0.00853729248046875, 0.0319671630859375, 0.05539703369140625, 0.078826904296875, 0.10225677490234375, 0.1256866455078125, 0.14911651611328125, 0.17254638671875, 0.19597625732421875, 0.2194061279296875, 0.24283599853515625, 0.266265869140625, 0.28969573974609375, 0.3131256103515625, 0.33655548095703125, 0.3599853515625, 0.38341522216796875, 0.4068450927734375, 0.43027496337890625, 0.453704833984375, 0.47713470458984375, 0.5005645751953125, 0.5239944458007812, 0.54742431640625, 0.5708541870117188, 0.5942840576171875, 0.6177139282226562, 0.641143798828125, 0.6645736694335938, 0.6880035400390625, 0.7114334106445312, 0.73486328125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 0.0, 4.0, 4.0, 0.0, 8.0, 7.0, 6.0, 15.0, 7.0, 7.0, 12.0, 17.0, 27.0, 41.0, 67.0, 87.0, 135.0, 158.0, 112.0, 71.0, 60.0, 32.0, 26.0, 16.0, 20.0, 13.0, 9.0, 7.0, 9.0, 9.0, 3.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42333984375, -0.4095458984375, -0.395751953125, -0.3819580078125, -0.3681640625, -0.3543701171875, -0.340576171875, -0.3267822265625, -0.31298828125, -0.2991943359375, -0.285400390625, -0.2716064453125, -0.2578125, -0.2440185546875, -0.230224609375, -0.2164306640625, -0.20263671875, -0.1888427734375, -0.175048828125, -0.1612548828125, -0.1474609375, -0.1336669921875, -0.119873046875, -0.1060791015625, -0.09228515625, -0.0784912109375, -0.064697265625, -0.0509033203125, -0.037109375, -0.0233154296875, -0.009521484375, 0.0042724609375, 0.01806640625, 0.0318603515625, 0.045654296875, 0.0594482421875, 0.0732421875, 0.0870361328125, 0.100830078125, 0.1146240234375, 0.12841796875, 0.1422119140625, 0.156005859375, 0.1697998046875, 0.18359375, 0.1973876953125, 0.211181640625, 0.2249755859375, 0.23876953125, 0.2525634765625, 0.266357421875, 0.2801513671875, 0.2939453125, 0.3077392578125, 0.321533203125, 0.3353271484375, 0.34912109375, 0.3629150390625, 0.376708984375, 0.3905029296875, 0.404296875, 0.4180908203125, 0.431884765625, 0.4456787109375, 0.45947265625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 4.0, 11.0, 29.0, 65.0, 208.0, 407.0, 179.0, 70.0, 20.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.929523468017578, -25.396299362182617, -24.863075256347656, -24.329849243164062, -23.7966251373291, -23.26340103149414, -22.73017692565918, -22.19695281982422, -21.663728713989258, -21.130504608154297, -20.597280502319336, -20.064056396484375, -19.53083038330078, -18.99760627746582, -18.46438217163086, -17.9311580657959, -17.397933959960938, -16.864709854125977, -16.331485748291016, -15.798260688781738, -15.265036582946777, -14.7318115234375, -14.198587417602539, -13.665363311767578, -13.132137298583984, -12.598913192749023, -12.065688133239746, -11.532464027404785, -10.999239921569824, -10.466014862060547, -9.932790756225586, -9.399566650390625, -8.866341590881348, -8.333117485046387, -7.799892902374268, -7.266668319702148, -6.7334442138671875, -6.200219631195068, -5.666995048522949, -5.133770942687988, -4.600546360015869, -4.06732177734375, -3.534097671508789, -3.00087308883667, -2.46764874458313, -1.9344244003295898, -1.4011998176574707, -0.8679754734039307, -0.3347511291503906, 0.1984732747077942, 0.731697678565979, 1.2649221420288086, 1.7981464862823486, 2.3313708305358887, 2.864595413208008, 3.397819757461548, 3.931044101715088, 4.464268684387207, 4.997492790222168, 5.530717372894287, 6.063941955566406, 6.597166061401367, 7.130390644073486, 7.6636152267456055, 8.196839332580566]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 5.0, 7.0, 13.0, 7.0, 12.0, 16.0, 28.0, 17.0, 24.0, 22.0, 23.0, 37.0, 27.0, 46.0, 44.0, 59.0, 80.0, 84.0, 78.0, 51.0, 44.0, 38.0, 36.0, 45.0, 19.0, 32.0, 22.0, 17.0, 13.0, 15.0, 11.0, 5.0, 5.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.990909576416016, -4.83718729019165, -4.683465480804443, -4.529743194580078, -4.376021385192871, -4.222299098968506, -4.068576812744141, -3.9148550033569336, -3.7611327171325684, -3.6074106693267822, -3.453688621520996, -3.299966335296631, -3.1462442874908447, -2.9925222396850586, -2.8388001918792725, -2.6850781440734863, -2.5313560962677, -2.377634048461914, -2.223912000656128, -2.070189952850342, -1.9164676666259766, -1.7627456188201904, -1.6090235710144043, -1.4553014039993286, -1.3015793561935425, -1.1478573083877563, -0.9941351413726807, -0.8404130935668945, -0.6866909861564636, -0.5329688787460327, -0.3792468309402466, -0.2255246639251709, -0.07180261611938477, 0.08191947638988495, 0.23564156889915466, 0.3893636465072632, 0.5430857539176941, 0.696807861328125, 0.8505299091339111, 1.0042520761489868, 1.157974123954773, 1.311696171760559, 1.4654183387756348, 1.619140386581421, 1.772862434387207, 1.9265846014022827, 2.0803065299987793, 2.2340288162231445, 2.3877508640289307, 2.541472911834717, 2.695194959640503, 2.848917007446289, 3.0026392936706543, 3.1563613414764404, 3.3100833892822266, 3.463805675506592, 3.617527484893799, 3.771249532699585, 3.924971580505371, 4.078693866729736, 4.232415676116943, 4.386137962341309, 4.539859771728516, 4.693582057952881, 4.847304344177246]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 7.0, 7.0, 3.0, 9.0, 16.0, 16.0, 24.0, 36.0, 48.0, 56.0, 89.0, 121.0, 186.0, 299.0, 522.0, 857.0, 1899.0, 4273.0, 14216.0, 234428.0, 3864308.0, 56304.0, 9919.0, 3397.0, 1455.0, 764.0, 383.0, 226.0, 122.0, 98.0, 61.0, 53.0, 29.0, 12.0, 5.0, 4.0, 3.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.111328125, -2.0589599609375, -2.006591796875, -1.9542236328125, -1.90185546875, -1.8494873046875, -1.797119140625, -1.7447509765625, -1.6923828125, -1.6400146484375, -1.587646484375, -1.5352783203125, -1.48291015625, -1.4305419921875, -1.378173828125, -1.3258056640625, -1.2734375, -1.2210693359375, -1.168701171875, -1.1163330078125, -1.06396484375, -1.0115966796875, -0.959228515625, -0.9068603515625, -0.8544921875, -0.8021240234375, -0.749755859375, -0.6973876953125, -0.64501953125, -0.5926513671875, -0.540283203125, -0.4879150390625, -0.435546875, -0.3831787109375, -0.330810546875, -0.2784423828125, -0.22607421875, -0.1737060546875, -0.121337890625, -0.0689697265625, -0.0166015625, 0.0357666015625, 0.088134765625, 0.1405029296875, 0.19287109375, 0.2452392578125, 0.297607421875, 0.3499755859375, 0.40234375, 0.4547119140625, 0.507080078125, 0.5594482421875, 0.61181640625, 0.6641845703125, 0.716552734375, 0.7689208984375, 0.8212890625, 0.8736572265625, 0.926025390625, 0.9783935546875, 1.03076171875, 1.0831298828125, 1.135498046875, 1.1878662109375, 1.240234375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 10.0, 12.0, 19.0, 42.0, 40.0, 62.0, 70.0, 90.0, 102.0, 113.0, 88.0, 90.0, 68.0, 64.0, 40.0, 33.0, 22.0, 14.0, 11.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53466796875, -0.51702880859375, -0.4993896484375, -0.48175048828125, -0.464111328125, -0.44647216796875, -0.4288330078125, -0.41119384765625, -0.3935546875, -0.37591552734375, -0.3582763671875, -0.34063720703125, -0.322998046875, -0.30535888671875, -0.2877197265625, -0.27008056640625, -0.25244140625, -0.23480224609375, -0.2171630859375, -0.19952392578125, -0.181884765625, -0.16424560546875, -0.1466064453125, -0.12896728515625, -0.111328125, -0.09368896484375, -0.0760498046875, -0.05841064453125, -0.040771484375, -0.02313232421875, -0.0054931640625, 0.01214599609375, 0.02978515625, 0.04742431640625, 0.0650634765625, 0.08270263671875, 0.100341796875, 0.11798095703125, 0.1356201171875, 0.15325927734375, 0.1708984375, 0.18853759765625, 0.2061767578125, 0.22381591796875, 0.241455078125, 0.25909423828125, 0.2767333984375, 0.29437255859375, 0.31201171875, 0.32965087890625, 0.3472900390625, 0.36492919921875, 0.382568359375, 0.40020751953125, 0.4178466796875, 0.43548583984375, 0.453125, 0.47076416015625, 0.4884033203125, 0.50604248046875, 0.523681640625, 0.54132080078125, 0.5589599609375, 0.57659912109375, 0.59423828125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 12.0, 14.0, 16.0, 34.0, 52.0, 89.0, 141.0, 205.0, 307.0, 496.0, 836.0, 1777.0, 5194.0, 23320.0, 684011.0, 3423800.0, 40647.0, 7872.0, 2557.0, 1140.0, 646.0, 382.0, 231.0, 198.0, 89.0, 64.0, 48.0, 32.0, 15.0, 9.0, 9.0, 9.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.82421875, -1.769134521484375, -1.71405029296875, -1.658966064453125, -1.6038818359375, -1.548797607421875, -1.49371337890625, -1.438629150390625, -1.383544921875, -1.328460693359375, -1.27337646484375, -1.218292236328125, -1.1632080078125, -1.108123779296875, -1.05303955078125, -0.997955322265625, -0.94287109375, -0.887786865234375, -0.83270263671875, -0.777618408203125, -0.7225341796875, -0.667449951171875, -0.61236572265625, -0.557281494140625, -0.502197265625, -0.447113037109375, -0.39202880859375, -0.336944580078125, -0.2818603515625, -0.226776123046875, -0.17169189453125, -0.116607666015625, -0.0615234375, -0.006439208984375, 0.04864501953125, 0.103729248046875, 0.1588134765625, 0.213897705078125, 0.26898193359375, 0.324066162109375, 0.379150390625, 0.434234619140625, 0.48931884765625, 0.544403076171875, 0.5994873046875, 0.654571533203125, 0.70965576171875, 0.764739990234375, 0.81982421875, 0.874908447265625, 0.92999267578125, 0.985076904296875, 1.0401611328125, 1.095245361328125, 1.15032958984375, 1.205413818359375, 1.260498046875, 1.315582275390625, 1.37066650390625, 1.425750732421875, 1.4808349609375, 1.535919189453125, 1.59100341796875, 1.646087646484375, 1.701171875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 8.0, 10.0, 15.0, 29.0, 34.0, 75.0, 205.0, 1052.0, 1820.0, 471.0, 151.0, 75.0, 49.0, 28.0, 17.0, 16.0, 9.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7451171875, -1.687530517578125, -1.62994384765625, -1.572357177734375, -1.5147705078125, -1.457183837890625, -1.39959716796875, -1.342010498046875, -1.284423828125, -1.226837158203125, -1.16925048828125, -1.111663818359375, -1.0540771484375, -0.996490478515625, -0.93890380859375, -0.881317138671875, -0.82373046875, -0.766143798828125, -0.70855712890625, -0.650970458984375, -0.5933837890625, -0.535797119140625, -0.47821044921875, -0.420623779296875, -0.363037109375, -0.305450439453125, -0.24786376953125, -0.190277099609375, -0.1326904296875, -0.075103759765625, -0.01751708984375, 0.040069580078125, 0.09765625, 0.155242919921875, 0.21282958984375, 0.270416259765625, 0.3280029296875, 0.385589599609375, 0.44317626953125, 0.500762939453125, 0.558349609375, 0.615936279296875, 0.67352294921875, 0.731109619140625, 0.7886962890625, 0.846282958984375, 0.90386962890625, 0.961456298828125, 1.01904296875, 1.076629638671875, 1.13421630859375, 1.191802978515625, 1.2493896484375, 1.306976318359375, 1.36456298828125, 1.422149658203125, 1.479736328125, 1.537322998046875, 1.59490966796875, 1.652496337890625, 1.7100830078125, 1.767669677734375, 1.82525634765625, 1.882843017578125, 1.9404296875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 7.0, 19.0, 38.0, 72.0, 162.0, 249.0, 214.0, 108.0, 56.0, 25.0, 17.0, 7.0, 8.0, 5.0, 1.0, 7.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.526615142822266, -10.020986557006836, -9.51535701751709, -9.009727478027344, -8.504098892211914, -7.998469829559326, -7.492840766906738, -6.98721170425415, -6.4815826416015625, -5.975953578948975, -5.470324516296387, -4.964695453643799, -4.459066390991211, -3.953437328338623, -3.447808265686035, -2.9421792030334473, -2.4365501403808594, -1.9309210777282715, -1.4252920150756836, -0.9196629524230957, -0.4140338897705078, 0.09159517288208008, 0.597224235534668, 1.1028532981872559, 1.6084823608398438, 2.1141114234924316, 2.6197404861450195, 3.1253695487976074, 3.6309986114501953, 4.136627674102783, 4.642256736755371, 5.147885799407959, 5.653514862060547, 6.159143924713135, 6.664772987365723, 7.1704020500183105, 7.676031112670898, 8.181659698486328, 8.687289237976074, 9.19291877746582, 9.69854736328125, 10.20417594909668, 10.709805488586426, 11.215435028076172, 11.721063613891602, 12.226692199707031, 12.732321739196777, 13.237951278686523, 13.743579864501953, 14.249208450317383, 14.754837989807129, 15.260467529296875, 15.766096115112305, 16.271724700927734, 16.777355194091797, 17.282983779907227, 17.788612365722656, 18.294240951538086, 18.799869537353516, 19.305500030517578, 19.811128616333008, 20.316757202148438, 20.8223876953125, 21.32801628112793, 21.83364486694336]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 5.0, 8.0, 6.0, 15.0, 23.0, 21.0, 23.0, 17.0, 28.0, 37.0, 31.0, 36.0, 36.0, 55.0, 44.0, 40.0, 56.0, 58.0, 40.0, 38.0, 42.0, 41.0, 37.0, 38.0, 31.0, 32.0, 19.0, 24.0, 19.0, 23.0, 13.0, 8.0, 13.0, 8.0, 7.0, 4.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.978796005249023, -4.825719833374023, -4.672643661499023, -4.519567489624023, -4.366491317749023, -4.213415145874023, -4.060338973999023, -3.9072625637054443, -3.7541863918304443, -3.6011102199554443, -3.4480340480804443, -3.2949578762054443, -3.1418814659118652, -2.9888052940368652, -2.8357291221618652, -2.6826529502868652, -2.5295767784118652, -2.3765006065368652, -2.2234244346618652, -2.0703482627868652, -1.9172719717025757, -1.7641957998275757, -1.6111195087432861, -1.4580433368682861, -1.3049671649932861, -1.1518909931182861, -0.9988147616386414, -0.8457385301589966, -0.6926623582839966, -0.5395861864089966, -0.3865099549293518, -0.23343372344970703, -0.08035802841186523, 0.07271817326545715, 0.22579437494277954, 0.37887057662010193, 0.5319467782974243, 0.6850229501724243, 0.8380991816520691, 0.9911754131317139, 1.1442515850067139, 1.2973277568817139, 1.4504039287567139, 1.6034802198410034, 1.7565563917160034, 1.9096325635910034, 2.062708854675293, 2.215785026550293, 2.368861198425293, 2.521937370300293, 2.675013542175293, 2.828089714050293, 2.981165885925293, 3.134242057800293, 3.287318468093872, 3.440394639968872, 3.593470811843872, 3.746546983718872, 3.899623155593872, 4.052699565887451, 4.205775737762451, 4.358851909637451, 4.511928081512451, 4.665004253387451, 4.818080425262451]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 11.0, 7.0, 12.0, 16.0, 20.0, 34.0, 32.0, 53.0, 101.0, 152.0, 203.0, 427.0, 928.0, 1956.0, 4974.0, 14466.0, 57231.0, 397565.0, 477623.0, 66548.0, 16591.0, 5382.0, 2098.0, 940.0, 479.0, 260.0, 151.0, 110.0, 57.0, 38.0, 32.0, 13.0, 11.0, 8.0, 4.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4775390625, -1.43414306640625, -1.3907470703125, -1.34735107421875, -1.303955078125, -1.26055908203125, -1.2171630859375, -1.17376708984375, -1.13037109375, -1.08697509765625, -1.0435791015625, -1.00018310546875, -0.956787109375, -0.91339111328125, -0.8699951171875, -0.82659912109375, -0.783203125, -0.73980712890625, -0.6964111328125, -0.65301513671875, -0.609619140625, -0.56622314453125, -0.5228271484375, -0.47943115234375, -0.43603515625, -0.39263916015625, -0.3492431640625, -0.30584716796875, -0.262451171875, -0.21905517578125, -0.1756591796875, -0.13226318359375, -0.0888671875, -0.04547119140625, -0.0020751953125, 0.04132080078125, 0.084716796875, 0.12811279296875, 0.1715087890625, 0.21490478515625, 0.25830078125, 0.30169677734375, 0.3450927734375, 0.38848876953125, 0.431884765625, 0.47528076171875, 0.5186767578125, 0.56207275390625, 0.60546875, 0.64886474609375, 0.6922607421875, 0.73565673828125, 0.779052734375, 0.82244873046875, 0.8658447265625, 0.90924072265625, 0.95263671875, 0.99603271484375, 1.0394287109375, 1.08282470703125, 1.126220703125, 1.16961669921875, 1.2130126953125, 1.25640869140625, 1.2998046875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 10.0, 12.0, 7.0, 12.0, 31.0, 36.0, 55.0, 55.0, 52.0, 60.0, 64.0, 69.0, 83.0, 81.0, 63.0, 56.0, 58.0, 42.0, 34.0, 24.0, 29.0, 17.0, 17.0, 13.0, 7.0, 4.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.642578125, -0.6265640258789062, -0.6105499267578125, -0.5945358276367188, -0.578521728515625, -0.5625076293945312, -0.5464935302734375, -0.5304794311523438, -0.51446533203125, -0.49845123291015625, -0.4824371337890625, -0.46642303466796875, -0.450408935546875, -0.43439483642578125, -0.4183807373046875, -0.40236663818359375, -0.3863525390625, -0.37033843994140625, -0.3543243408203125, -0.33831024169921875, -0.322296142578125, -0.30628204345703125, -0.2902679443359375, -0.27425384521484375, -0.25823974609375, -0.24222564697265625, -0.2262115478515625, -0.21019744873046875, -0.194183349609375, -0.17816925048828125, -0.1621551513671875, -0.14614105224609375, -0.130126953125, -0.11411285400390625, -0.0980987548828125, -0.08208465576171875, -0.066070556640625, -0.05005645751953125, -0.0340423583984375, -0.01802825927734375, -0.00201416015625, 0.01399993896484375, 0.0300140380859375, 0.04602813720703125, 0.062042236328125, 0.07805633544921875, 0.0940704345703125, 0.11008453369140625, 0.1260986328125, 0.14211273193359375, 0.1581268310546875, 0.17414093017578125, 0.190155029296875, 0.20616912841796875, 0.2221832275390625, 0.23819732666015625, 0.25421142578125, 0.27022552490234375, 0.2862396240234375, 0.30225372314453125, 0.318267822265625, 0.33428192138671875, 0.3502960205078125, 0.36631011962890625, 0.38232421875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 10.0, 14.0, 11.0, 16.0, 36.0, 29.0, 53.0, 64.0, 104.0, 173.0, 227.0, 319.0, 511.0, 896.0, 1583.0, 3257.0, 8172.0, 29125.0, 180690.0, 710863.0, 83629.0, 17286.0, 5774.0, 2455.0, 1230.0, 700.0, 441.0, 267.0, 195.0, 113.0, 96.0, 57.0, 41.0, 31.0, 20.0, 14.0, 9.0, 12.0, 11.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.365234375, -1.3229827880859375, -1.280731201171875, -1.2384796142578125, -1.19622802734375, -1.1539764404296875, -1.111724853515625, -1.0694732666015625, -1.0272216796875, -0.9849700927734375, -0.942718505859375, -0.9004669189453125, -0.85821533203125, -0.8159637451171875, -0.773712158203125, -0.7314605712890625, -0.689208984375, -0.6469573974609375, -0.604705810546875, -0.5624542236328125, -0.52020263671875, -0.4779510498046875, -0.435699462890625, -0.3934478759765625, -0.3511962890625, -0.3089447021484375, -0.266693115234375, -0.2244415283203125, -0.18218994140625, -0.1399383544921875, -0.097686767578125, -0.0554351806640625, -0.01318359375, 0.0290679931640625, 0.071319580078125, 0.1135711669921875, 0.15582275390625, 0.1980743408203125, 0.240325927734375, 0.2825775146484375, 0.3248291015625, 0.3670806884765625, 0.409332275390625, 0.4515838623046875, 0.49383544921875, 0.5360870361328125, 0.578338623046875, 0.6205902099609375, 0.662841796875, 0.7050933837890625, 0.747344970703125, 0.7895965576171875, 0.83184814453125, 0.8740997314453125, 0.916351318359375, 0.9586029052734375, 1.0008544921875, 1.0431060791015625, 1.085357666015625, 1.1276092529296875, 1.16986083984375, 1.2121124267578125, 1.254364013671875, 1.2966156005859375, 1.3388671875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 10.0, 7.0, 9.0, 14.0, 15.0, 14.0, 14.0, 24.0, 32.0, 27.0, 28.0, 40.0, 37.0, 37.0, 49.0, 40.0, 51.0, 67.0, 61.0, 59.0, 51.0, 45.0, 35.0, 46.0, 39.0, 22.0, 21.0, 23.0, 11.0, 15.0, 13.0, 8.0, 9.0, 4.0, 3.0, 8.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5517578125, -1.50665283203125, -1.4615478515625, -1.41644287109375, -1.371337890625, -1.32623291015625, -1.2811279296875, -1.23602294921875, -1.19091796875, -1.14581298828125, -1.1007080078125, -1.05560302734375, -1.010498046875, -0.96539306640625, -0.9202880859375, -0.87518310546875, -0.830078125, -0.78497314453125, -0.7398681640625, -0.69476318359375, -0.649658203125, -0.60455322265625, -0.5594482421875, -0.51434326171875, -0.46923828125, -0.42413330078125, -0.3790283203125, -0.33392333984375, -0.288818359375, -0.24371337890625, -0.1986083984375, -0.15350341796875, -0.1083984375, -0.06329345703125, -0.0181884765625, 0.02691650390625, 0.072021484375, 0.11712646484375, 0.1622314453125, 0.20733642578125, 0.25244140625, 0.29754638671875, 0.3426513671875, 0.38775634765625, 0.432861328125, 0.47796630859375, 0.5230712890625, 0.56817626953125, 0.61328125, 0.65838623046875, 0.7034912109375, 0.74859619140625, 0.793701171875, 0.83880615234375, 0.8839111328125, 0.92901611328125, 0.97412109375, 1.01922607421875, 1.0643310546875, 1.10943603515625, 1.154541015625, 1.19964599609375, 1.2447509765625, 1.28985595703125, 1.3349609375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 4.0, 4.0, 10.0, 19.0, 10.0, 31.0, 36.0, 88.0, 117.0, 239.0, 467.0, 974.0, 2257.0, 5605.0, 16768.0, 83533.0, 793557.0, 113665.0, 19964.0, 6389.0, 2575.0, 1083.0, 493.0, 284.0, 144.0, 99.0, 48.0, 29.0, 15.0, 12.0, 14.0, 6.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65966796875, -0.6387710571289062, -0.6178741455078125, -0.5969772338867188, -0.576080322265625, -0.5551834106445312, -0.5342864990234375, -0.5133895874023438, -0.49249267578125, -0.47159576416015625, -0.4506988525390625, -0.42980194091796875, -0.408905029296875, -0.38800811767578125, -0.3671112060546875, -0.34621429443359375, -0.3253173828125, -0.30442047119140625, -0.2835235595703125, -0.26262664794921875, -0.241729736328125, -0.22083282470703125, -0.1999359130859375, -0.17903900146484375, -0.15814208984375, -0.13724517822265625, -0.1163482666015625, -0.09545135498046875, -0.074554443359375, -0.05365753173828125, -0.0327606201171875, -0.01186370849609375, 0.009033203125, 0.02993011474609375, 0.0508270263671875, 0.07172393798828125, 0.092620849609375, 0.11351776123046875, 0.1344146728515625, 0.15531158447265625, 0.17620849609375, 0.19710540771484375, 0.2180023193359375, 0.23889923095703125, 0.259796142578125, 0.28069305419921875, 0.3015899658203125, 0.32248687744140625, 0.3433837890625, 0.36428070068359375, 0.3851776123046875, 0.40607452392578125, 0.426971435546875, 0.44786834716796875, 0.4687652587890625, 0.48966217041015625, 0.51055908203125, 0.5314559936523438, 0.5523529052734375, 0.5732498168945312, 0.594146728515625, 0.6150436401367188, 0.6359405517578125, 0.6568374633789062, 0.677734375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 10.0, 4.0, 6.0, 17.0, 17.0, 27.0, 51.0, 65.0, 156.0, 209.0, 155.0, 83.0, 59.0, 29.0, 17.0, 26.0, 8.0, 4.0, 9.0, 6.0, 4.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020360946655273438, -0.00019531697034835815, -0.00018702447414398193, -0.0001787319779396057, -0.0001704394817352295, -0.00016214698553085327, -0.00015385448932647705, -0.00014556199312210083, -0.0001372694969177246, -0.0001289770007133484, -0.00012068450450897217, -0.00011239200830459595, -0.00010409951210021973, -9.58070158958435e-05, -8.751451969146729e-05, -7.922202348709106e-05, -7.092952728271484e-05, -6.263703107833862e-05, -5.43445348739624e-05, -4.605203866958618e-05, -3.775954246520996e-05, -2.946704626083374e-05, -2.117455005645752e-05, -1.2882053852081299e-05, -4.589557647705078e-06, 3.7029385566711426e-06, 1.1995434761047363e-05, 2.0287930965423584e-05, 2.8580427169799805e-05, 3.6872923374176025e-05, 4.5165419578552246e-05, 5.345791578292847e-05, 6.175041198730469e-05, 7.004290819168091e-05, 7.833540439605713e-05, 8.662790060043335e-05, 9.492039680480957e-05, 0.00010321289300918579, 0.00011150538921356201, 0.00011979788541793823, 0.00012809038162231445, 0.00013638287782669067, 0.0001446753740310669, 0.00015296787023544312, 0.00016126036643981934, 0.00016955286264419556, 0.00017784535884857178, 0.000186137855052948, 0.00019443035125732422, 0.00020272284746170044, 0.00021101534366607666, 0.00021930783987045288, 0.0002276003360748291, 0.00023589283227920532, 0.00024418532848358154, 0.00025247782468795776, 0.000260770320892334, 0.0002690628170967102, 0.0002773553133010864, 0.00028564780950546265, 0.00029394030570983887, 0.0003022328019142151, 0.0003105252981185913, 0.00031881779432296753, 0.00032711029052734375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 6.0, 6.0, 11.0, 20.0, 35.0, 38.0, 77.0, 127.0, 257.0, 491.0, 915.0, 2176.0, 6055.0, 22128.0, 191263.0, 762552.0, 46467.0, 9992.0, 3204.0, 1357.0, 648.0, 285.0, 172.0, 109.0, 55.0, 35.0, 22.0, 23.0, 10.0, 8.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.009765625, -0.9846572875976562, -0.9595489501953125, -0.9344406127929688, -0.909332275390625, -0.8842239379882812, -0.8591156005859375, -0.8340072631835938, -0.80889892578125, -0.7837905883789062, -0.7586822509765625, -0.7335739135742188, -0.708465576171875, -0.6833572387695312, -0.6582489013671875, -0.6331405639648438, -0.6080322265625, -0.5829238891601562, -0.5578155517578125, -0.5327072143554688, -0.507598876953125, -0.48249053955078125, -0.4573822021484375, -0.43227386474609375, -0.40716552734375, -0.38205718994140625, -0.3569488525390625, -0.33184051513671875, -0.306732177734375, -0.28162384033203125, -0.2565155029296875, -0.23140716552734375, -0.206298828125, -0.18119049072265625, -0.1560821533203125, -0.13097381591796875, -0.105865478515625, -0.08075714111328125, -0.0556488037109375, -0.03054046630859375, -0.00543212890625, 0.01967620849609375, 0.0447845458984375, 0.06989288330078125, 0.095001220703125, 0.12010955810546875, 0.1452178955078125, 0.17032623291015625, 0.1954345703125, 0.22054290771484375, 0.2456512451171875, 0.27075958251953125, 0.295867919921875, 0.32097625732421875, 0.3460845947265625, 0.37119293212890625, 0.39630126953125, 0.42140960693359375, 0.4465179443359375, 0.47162628173828125, 0.496734619140625, 0.5218429565429688, 0.5469512939453125, 0.5720596313476562, 0.59716796875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 7.0, 0.0, 7.0, 6.0, 4.0, 8.0, 19.0, 8.0, 25.0, 42.0, 40.0, 49.0, 87.0, 115.0, 148.0, 109.0, 69.0, 68.0, 59.0, 35.0, 19.0, 10.0, 12.0, 10.0, 9.0, 8.0, 11.0, 3.0, 4.0, 0.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.471435546875, -0.4537773132324219, -0.43611907958984375, -0.4184608459472656, -0.4008026123046875, -0.3831443786621094, -0.36548614501953125, -0.3478279113769531, -0.330169677734375, -0.3125114440917969, -0.29485321044921875, -0.2771949768066406, -0.2595367431640625, -0.24187850952148438, -0.22422027587890625, -0.20656204223632812, -0.18890380859375, -0.17124557495117188, -0.15358734130859375, -0.13592910766601562, -0.1182708740234375, -0.10061264038085938, -0.08295440673828125, -0.06529617309570312, -0.047637939453125, -0.029979705810546875, -0.01232147216796875, 0.005336761474609375, 0.0229949951171875, 0.040653228759765625, 0.05831146240234375, 0.07596969604492188, 0.0936279296875, 0.11128616333007812, 0.12894439697265625, 0.14660263061523438, 0.1642608642578125, 0.18191909790039062, 0.19957733154296875, 0.21723556518554688, 0.234893798828125, 0.2525520324707031, 0.27021026611328125, 0.2878684997558594, 0.3055267333984375, 0.3231849670410156, 0.34084320068359375, 0.3585014343261719, 0.37615966796875, 0.3938179016113281, 0.41147613525390625, 0.4291343688964844, 0.4467926025390625, 0.4644508361816406, 0.48210906982421875, 0.4997673034667969, 0.517425537109375, 0.5350837707519531, 0.5527420043945312, 0.5704002380371094, 0.5880584716796875, 0.6057167053222656, 0.6233749389648438, 0.6410331726074219, 0.65869140625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 9.0, 13.0, 26.0, 58.0, 132.0, 317.0, 266.0, 113.0, 32.0, 24.0, 4.0, 7.0, 1.0, 0.0, 1.0, 1.0], "bins": [-29.480131149291992, -28.933151245117188, -28.386171340942383, -27.839191436767578, -27.292211532592773, -26.74523162841797, -26.198251724243164, -25.65127182006836, -25.104290008544922, -24.557310104370117, -24.010330200195312, -23.463350296020508, -22.916370391845703, -22.3693904876709, -21.822410583496094, -21.275428771972656, -20.728450775146484, -20.18147087097168, -19.634490966796875, -19.08751106262207, -18.540531158447266, -17.99355125427246, -17.446571350097656, -16.89958953857422, -16.352611541748047, -15.805631637573242, -15.258651733398438, -14.711671829223633, -14.164691925048828, -13.617712020874023, -13.070731163024902, -12.523751258850098, -11.976770401000977, -11.429790496826172, -10.882810592651367, -10.335830688476562, -9.788850784301758, -9.241870880126953, -8.694890022277832, -8.147910118103027, -7.600930690765381, -7.053950786590576, -6.506970405578613, -5.959990501403809, -5.413010597229004, -4.866030693054199, -4.3190507888793945, -3.7720704078674316, -3.225090503692627, -2.6781105995178223, -2.1311304569244385, -1.5841504335403442, -1.03717041015625, -0.4901905059814453, 0.05678963661193848, 0.6037697792053223, 1.150749683380127, 1.6977297067642212, 2.2447097301483154, 2.791689872741699, 3.338669776916504, 3.8856496810913086, 4.432629585266113, 4.979609966278076, 5.526589870452881]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 9.0, 4.0, 12.0, 3.0, 11.0, 15.0, 20.0, 18.0, 21.0, 29.0, 34.0, 39.0, 30.0, 39.0, 33.0, 41.0, 77.0, 78.0, 84.0, 65.0, 50.0, 53.0, 30.0, 27.0, 29.0, 28.0, 15.0, 20.0, 18.0, 15.0, 13.0, 8.0, 8.0, 10.0, 4.0, 4.0, 6.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.526603698730469, -6.309216499328613, -6.091829776763916, -5.874443054199219, -5.657055854797363, -5.439668655395508, -5.2222819328308105, -5.004895210266113, -4.787508010864258, -4.570120811462402, -4.352734088897705, -4.135347366333008, -3.9179601669311523, -3.700573205947876, -3.4831862449645996, -3.2657992839813232, -3.048412322998047, -2.8310253620147705, -2.613638401031494, -2.3962514400482178, -2.1788644790649414, -1.961477518081665, -1.7440905570983887, -1.5267035961151123, -1.309316635131836, -1.0919296741485596, -0.8745427131652832, -0.6571557521820068, -0.43976879119873047, -0.2223818302154541, -0.004994869232177734, 0.21239209175109863, 0.429779052734375, 0.6471660137176514, 0.8645529747009277, 1.081939935684204, 1.2993268966674805, 1.5167138576507568, 1.7341008186340332, 1.9514877796173096, 2.168874740600586, 2.3862617015838623, 2.6036486625671387, 2.821035623550415, 3.0384225845336914, 3.2558095455169678, 3.473196506500244, 3.6905834674835205, 3.907970428466797, 4.125357627868652, 4.34274435043335, 4.560131072998047, 4.777518272399902, 4.994905471801758, 5.212292194366455, 5.429678916931152, 5.647066116333008, 5.864453315734863, 6.0818400382995605, 6.299226760864258, 6.516613960266113, 6.734001159667969, 6.951387882232666, 7.168774604797363, 7.386161804199219]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 2.0, 8.0, 9.0, 9.0, 15.0, 25.0, 27.0, 39.0, 55.0, 90.0, 173.0, 320.0, 583.0, 1412.0, 4612.0, 47001.0, 4063892.0, 67461.0, 5641.0, 1528.0, 657.0, 319.0, 160.0, 100.0, 48.0, 30.0, 20.0, 16.0, 11.0, 8.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.216796875, -3.1374359130859375, -3.058074951171875, -2.9787139892578125, -2.89935302734375, -2.8199920654296875, -2.740631103515625, -2.6612701416015625, -2.5819091796875, -2.5025482177734375, -2.423187255859375, -2.3438262939453125, -2.26446533203125, -2.1851043701171875, -2.105743408203125, -2.0263824462890625, -1.947021484375, -1.8676605224609375, -1.788299560546875, -1.7089385986328125, -1.62957763671875, -1.5502166748046875, -1.470855712890625, -1.3914947509765625, -1.3121337890625, -1.2327728271484375, -1.153411865234375, -1.0740509033203125, -0.99468994140625, -0.9153289794921875, -0.835968017578125, -0.7566070556640625, -0.67724609375, -0.5978851318359375, -0.518524169921875, -0.4391632080078125, -0.35980224609375, -0.2804412841796875, -0.201080322265625, -0.1217193603515625, -0.0423583984375, 0.0370025634765625, 0.116363525390625, 0.1957244873046875, 0.27508544921875, 0.3544464111328125, 0.433807373046875, 0.5131683349609375, 0.592529296875, 0.6718902587890625, 0.751251220703125, 0.8306121826171875, 0.90997314453125, 0.9893341064453125, 1.068695068359375, 1.1480560302734375, 1.2274169921875, 1.3067779541015625, 1.386138916015625, 1.4654998779296875, 1.54486083984375, 1.6242218017578125, 1.703582763671875, 1.7829437255859375, 1.8623046875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 10.0, 15.0, 19.0, 18.0, 31.0, 30.0, 30.0, 42.0, 36.0, 41.0, 62.0, 53.0, 63.0, 52.0, 55.0, 53.0, 55.0, 66.0, 34.0, 41.0, 34.0, 31.0, 25.0, 20.0, 12.0, 16.0, 6.0, 7.0, 6.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.416259765625, -0.4051551818847656, -0.39405059814453125, -0.3829460144042969, -0.3718414306640625, -0.3607368469238281, -0.34963226318359375, -0.3385276794433594, -0.327423095703125, -0.3163185119628906, -0.30521392822265625, -0.2941093444824219, -0.2830047607421875, -0.2719001770019531, -0.26079559326171875, -0.24969100952148438, -0.23858642578125, -0.22748184204101562, -0.21637725830078125, -0.20527267456054688, -0.1941680908203125, -0.18306350708007812, -0.17195892333984375, -0.16085433959960938, -0.149749755859375, -0.13864517211914062, -0.12754058837890625, -0.11643600463867188, -0.1053314208984375, -0.09422683715820312, -0.08312225341796875, -0.07201766967773438, -0.0609130859375, -0.049808502197265625, -0.03870391845703125, -0.027599334716796875, -0.0164947509765625, -0.005390167236328125, 0.00571441650390625, 0.016819000244140625, 0.027923583984375, 0.039028167724609375, 0.05013275146484375, 0.061237335205078125, 0.0723419189453125, 0.08344650268554688, 0.09455108642578125, 0.10565567016601562, 0.11676025390625, 0.12786483764648438, 0.13896942138671875, 0.15007400512695312, 0.1611785888671875, 0.17228317260742188, 0.18338775634765625, 0.19449234008789062, 0.205596923828125, 0.21670150756835938, 0.22780609130859375, 0.23891067504882812, 0.2500152587890625, 0.2611198425292969, 0.27222442626953125, 0.2833290100097656, 0.29443359375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 3.0, 4.0, 7.0, 11.0, 18.0, 23.0, 42.0, 61.0, 107.0, 138.0, 245.0, 478.0, 1735.0, 21191.0, 4142755.0, 24600.0, 1818.0, 587.0, 206.0, 111.0, 68.0, 31.0, 21.0, 17.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5625, -4.40789794921875, -4.2532958984375, -4.09869384765625, -3.944091796875, -3.78948974609375, -3.6348876953125, -3.48028564453125, -3.32568359375, -3.17108154296875, -3.0164794921875, -2.86187744140625, -2.707275390625, -2.55267333984375, -2.3980712890625, -2.24346923828125, -2.0888671875, -1.93426513671875, -1.7796630859375, -1.62506103515625, -1.470458984375, -1.31585693359375, -1.1612548828125, -1.00665283203125, -0.85205078125, -0.69744873046875, -0.5428466796875, -0.38824462890625, -0.233642578125, -0.07904052734375, 0.0755615234375, 0.23016357421875, 0.384765625, 0.53936767578125, 0.6939697265625, 0.84857177734375, 1.003173828125, 1.15777587890625, 1.3123779296875, 1.46697998046875, 1.62158203125, 1.77618408203125, 1.9307861328125, 2.08538818359375, 2.239990234375, 2.39459228515625, 2.5491943359375, 2.70379638671875, 2.8583984375, 3.01300048828125, 3.1676025390625, 3.32220458984375, 3.476806640625, 3.63140869140625, 3.7860107421875, 3.94061279296875, 4.09521484375, 4.24981689453125, 4.4044189453125, 4.55902099609375, 4.713623046875, 4.86822509765625, 5.0228271484375, 5.17742919921875, 5.33203125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 16.0, 45.0, 154.0, 1932.0, 1670.0, 193.0, 40.0, 16.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.88671875, -6.748931884765625, -6.61114501953125, -6.473358154296875, -6.3355712890625, -6.197784423828125, -6.05999755859375, -5.922210693359375, -5.784423828125, -5.646636962890625, -5.50885009765625, -5.371063232421875, -5.2332763671875, -5.095489501953125, -4.95770263671875, -4.819915771484375, -4.68212890625, -4.544342041015625, -4.40655517578125, -4.268768310546875, -4.1309814453125, -3.993194580078125, -3.85540771484375, -3.717620849609375, -3.579833984375, -3.442047119140625, -3.30426025390625, -3.166473388671875, -3.0286865234375, -2.890899658203125, -2.75311279296875, -2.615325927734375, -2.4775390625, -2.339752197265625, -2.20196533203125, -2.064178466796875, -1.9263916015625, -1.788604736328125, -1.65081787109375, -1.513031005859375, -1.375244140625, -1.237457275390625, -1.09967041015625, -0.961883544921875, -0.8240966796875, -0.686309814453125, -0.54852294921875, -0.410736083984375, -0.27294921875, -0.135162353515625, 0.00262451171875, 0.140411376953125, 0.2781982421875, 0.415985107421875, 0.55377197265625, 0.691558837890625, 0.829345703125, 0.967132568359375, 1.10491943359375, 1.242706298828125, 1.3804931640625, 1.518280029296875, 1.65606689453125, 1.793853759765625, 1.931640625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 11.0, 34.0, 118.0, 361.0, 327.0, 96.0, 34.0, 16.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.317466735839844, -47.26463317871094, -46.21179962158203, -45.158966064453125, -44.10613250732422, -43.05329895019531, -42.000465393066406, -40.9476318359375, -39.894798278808594, -38.84196472167969, -37.78913116455078, -36.736297607421875, -35.68346405029297, -34.63063049316406, -33.577796936035156, -32.52496337890625, -31.472129821777344, -30.419296264648438, -29.36646270751953, -28.313629150390625, -27.26079559326172, -26.207962036132812, -25.155128479003906, -24.102294921875, -23.049461364746094, -21.996627807617188, -20.94379425048828, -19.890960693359375, -18.83812713623047, -17.785293579101562, -16.732460021972656, -15.67962646484375, -14.626789093017578, -13.573955535888672, -12.521121978759766, -11.46828842163086, -10.415454864501953, -9.362621307373047, -8.30978775024414, -7.256954193115234, -6.204120635986328, -5.151287078857422, -4.098453521728516, -3.0456199645996094, -1.9927864074707031, -0.9399528503417969, 0.11288070678710938, 1.1657142639160156, 2.218547821044922, 3.271381378173828, 4.324214935302734, 5.377048492431641, 6.429882049560547, 7.482715606689453, 8.53554916381836, 9.588382720947266, 10.641216278076172, 11.694049835205078, 12.746883392333984, 13.79971694946289, 14.852550506591797, 15.905384063720703, 16.95821762084961, 18.011051177978516, 19.063884735107422]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 3.0, 4.0, 8.0, 5.0, 14.0, 15.0, 22.0, 16.0, 23.0, 30.0, 29.0, 33.0, 33.0, 48.0, 47.0, 53.0, 44.0, 67.0, 46.0, 48.0, 59.0, 51.0, 45.0, 38.0, 40.0, 26.0, 25.0, 19.0, 16.0, 16.0, 15.0, 10.0, 11.0, 10.0, 5.0, 5.0, 7.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.96102237701416, -7.726656913757324, -7.492291450500488, -7.257925987243652, -7.023560523986816, -6.7891950607299805, -6.5548295974731445, -6.320464134216309, -6.086098670959473, -5.851733207702637, -5.617367744445801, -5.383002281188965, -5.148636817932129, -4.914271354675293, -4.679905891418457, -4.445540428161621, -4.211174488067627, -3.976809024810791, -3.742443561553955, -3.508078098297119, -3.273712635040283, -3.0393471717834473, -2.8049814701080322, -2.5706160068511963, -2.3362505435943604, -2.1018850803375244, -1.8675196170806885, -1.633154034614563, -1.398788571357727, -1.1644231081008911, -0.9300575256347656, -0.6956920623779297, -0.46132659912109375, -0.22696110606193542, 0.0074043869972229, 0.2417699098587036, 0.47613537311553955, 0.7105008363723755, 0.944866418838501, 1.179231882095337, 1.4135973453521729, 1.6479628086090088, 1.8823282718658447, 2.1166939735412598, 2.3510594367980957, 2.5854249000549316, 2.8197903633117676, 3.0541558265686035, 3.2885212898254395, 3.5228867530822754, 3.7572522163391113, 3.9916176795959473, 4.225983142852783, 4.460348606109619, 4.694714546203613, 4.929080009460449, 5.163445472717285, 5.397810935974121, 5.632176399230957, 5.866541862487793, 6.100907325744629, 6.335272789001465, 6.569638252258301, 6.804003715515137, 7.038369178771973]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 6.0, 5.0, 12.0, 15.0, 17.0, 30.0, 62.0, 105.0, 173.0, 346.0, 622.0, 1369.0, 3057.0, 7954.0, 23212.0, 82256.0, 334160.0, 430746.0, 116053.0, 31149.0, 10000.0, 3849.0, 1661.0, 762.0, 411.0, 205.0, 120.0, 79.0, 34.0, 29.0, 23.0, 10.0, 8.0, 4.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.84033203125, -0.8093490600585938, -0.7783660888671875, -0.7473831176757812, -0.716400146484375, -0.6854171752929688, -0.6544342041015625, -0.6234512329101562, -0.59246826171875, -0.5614852905273438, -0.5305023193359375, -0.49951934814453125, -0.468536376953125, -0.43755340576171875, -0.4065704345703125, -0.37558746337890625, -0.3446044921875, -0.31362152099609375, -0.2826385498046875, -0.25165557861328125, -0.220672607421875, -0.18968963623046875, -0.1587066650390625, -0.12772369384765625, -0.09674072265625, -0.06575775146484375, -0.0347747802734375, -0.00379180908203125, 0.027191162109375, 0.05817413330078125, 0.0891571044921875, 0.12014007568359375, 0.151123046875, 0.18210601806640625, 0.2130889892578125, 0.24407196044921875, 0.275054931640625, 0.30603790283203125, 0.3370208740234375, 0.36800384521484375, 0.39898681640625, 0.42996978759765625, 0.4609527587890625, 0.49193572998046875, 0.522918701171875, 0.5539016723632812, 0.5848846435546875, 0.6158676147460938, 0.6468505859375, 0.6778335571289062, 0.7088165283203125, 0.7397994995117188, 0.770782470703125, 0.8017654418945312, 0.8327484130859375, 0.8637313842773438, 0.89471435546875, 0.9256973266601562, 0.9566802978515625, 0.9876632690429688, 1.018646240234375, 1.0496292114257812, 1.0806121826171875, 1.1115951538085938, 1.142578125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 9.0, 5.0, 12.0, 19.0, 10.0, 18.0, 22.0, 29.0, 26.0, 25.0, 35.0, 48.0, 47.0, 42.0, 47.0, 47.0, 35.0, 47.0, 50.0, 46.0, 42.0, 36.0, 52.0, 31.0, 37.0, 29.0, 20.0, 24.0, 16.0, 18.0, 18.0, 8.0, 9.0, 10.0, 7.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.47705078125, -0.4634895324707031, -0.44992828369140625, -0.4363670349121094, -0.4228057861328125, -0.4092445373535156, -0.39568328857421875, -0.3821220397949219, -0.368560791015625, -0.3549995422363281, -0.34143829345703125, -0.3278770446777344, -0.3143157958984375, -0.3007545471191406, -0.28719329833984375, -0.2736320495605469, -0.26007080078125, -0.24650955200195312, -0.23294830322265625, -0.21938705444335938, -0.2058258056640625, -0.19226455688476562, -0.17870330810546875, -0.16514205932617188, -0.151580810546875, -0.13801956176757812, -0.12445831298828125, -0.11089706420898438, -0.0973358154296875, -0.08377456665039062, -0.07021331787109375, -0.056652069091796875, -0.0430908203125, -0.029529571533203125, -0.01596832275390625, -0.002407073974609375, 0.0111541748046875, 0.024715423583984375, 0.03827667236328125, 0.051837921142578125, 0.065399169921875, 0.07896041870117188, 0.09252166748046875, 0.10608291625976562, 0.1196441650390625, 0.13320541381835938, 0.14676666259765625, 0.16032791137695312, 0.17388916015625, 0.18745040893554688, 0.20101165771484375, 0.21457290649414062, 0.2281341552734375, 0.24169540405273438, 0.25525665283203125, 0.2688179016113281, 0.282379150390625, 0.2959403991699219, 0.30950164794921875, 0.3230628967285156, 0.3366241455078125, 0.3501853942871094, 0.36374664306640625, 0.3773078918457031, 0.390869140625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 15.0, 15.0, 20.0, 22.0, 32.0, 52.0, 79.0, 127.0, 233.0, 487.0, 1050.0, 2429.0, 8024.0, 35933.0, 261872.0, 652981.0, 66046.0, 12821.0, 3500.0, 1393.0, 625.0, 328.0, 195.0, 97.0, 58.0, 34.0, 30.0, 9.0, 14.0, 10.0, 10.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8369140625, -1.7846832275390625, -1.732452392578125, -1.6802215576171875, -1.62799072265625, -1.5757598876953125, -1.523529052734375, -1.4712982177734375, -1.4190673828125, -1.3668365478515625, -1.314605712890625, -1.2623748779296875, -1.21014404296875, -1.1579132080078125, -1.105682373046875, -1.0534515380859375, -1.001220703125, -0.9489898681640625, -0.896759033203125, -0.8445281982421875, -0.79229736328125, -0.7400665283203125, -0.687835693359375, -0.6356048583984375, -0.5833740234375, -0.5311431884765625, -0.478912353515625, -0.4266815185546875, -0.37445068359375, -0.3222198486328125, -0.269989013671875, -0.2177581787109375, -0.16552734375, -0.1132965087890625, -0.061065673828125, -0.0088348388671875, 0.04339599609375, 0.0956268310546875, 0.147857666015625, 0.2000885009765625, 0.2523193359375, 0.3045501708984375, 0.356781005859375, 0.4090118408203125, 0.46124267578125, 0.5134735107421875, 0.565704345703125, 0.6179351806640625, 0.670166015625, 0.7223968505859375, 0.774627685546875, 0.8268585205078125, 0.87908935546875, 0.9313201904296875, 0.983551025390625, 1.0357818603515625, 1.0880126953125, 1.1402435302734375, 1.192474365234375, 1.2447052001953125, 1.29693603515625, 1.3491668701171875, 1.401397705078125, 1.4536285400390625, 1.505859375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 9.0, 7.0, 10.0, 9.0, 20.0, 13.0, 12.0, 22.0, 23.0, 41.0, 39.0, 34.0, 32.0, 50.0, 49.0, 62.0, 61.0, 52.0, 47.0, 45.0, 39.0, 42.0, 46.0, 46.0, 42.0, 31.0, 22.0, 16.0, 25.0, 13.0, 6.0, 7.0, 11.0, 6.0, 3.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.84375, -1.781707763671875, -1.71966552734375, -1.657623291015625, -1.5955810546875, -1.533538818359375, -1.47149658203125, -1.409454345703125, -1.347412109375, -1.285369873046875, -1.22332763671875, -1.161285400390625, -1.0992431640625, -1.037200927734375, -0.97515869140625, -0.913116455078125, -0.85107421875, -0.789031982421875, -0.72698974609375, -0.664947509765625, -0.6029052734375, -0.540863037109375, -0.47882080078125, -0.416778564453125, -0.354736328125, -0.292694091796875, -0.23065185546875, -0.168609619140625, -0.1065673828125, -0.044525146484375, 0.01751708984375, 0.079559326171875, 0.1416015625, 0.203643798828125, 0.26568603515625, 0.327728271484375, 0.3897705078125, 0.451812744140625, 0.51385498046875, 0.575897216796875, 0.637939453125, 0.699981689453125, 0.76202392578125, 0.824066162109375, 0.8861083984375, 0.948150634765625, 1.01019287109375, 1.072235107421875, 1.13427734375, 1.196319580078125, 1.25836181640625, 1.320404052734375, 1.3824462890625, 1.444488525390625, 1.50653076171875, 1.568572998046875, 1.630615234375, 1.692657470703125, 1.75469970703125, 1.816741943359375, 1.8787841796875, 1.940826416015625, 2.00286865234375, 2.064910888671875, 2.126953125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 8.0, 9.0, 13.0, 30.0, 37.0, 55.0, 94.0, 201.0, 457.0, 1001.0, 2612.0, 8690.0, 42114.0, 667259.0, 285901.0, 29738.0, 6674.0, 2119.0, 785.0, 340.0, 171.0, 93.0, 58.0, 35.0, 21.0, 12.0, 5.0, 7.0, 7.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.123046875, -1.0889129638671875, -1.054779052734375, -1.0206451416015625, -0.98651123046875, -0.9523773193359375, -0.918243408203125, -0.8841094970703125, -0.8499755859375, -0.8158416748046875, -0.781707763671875, -0.7475738525390625, -0.71343994140625, -0.6793060302734375, -0.645172119140625, -0.6110382080078125, -0.576904296875, -0.5427703857421875, -0.508636474609375, -0.4745025634765625, -0.44036865234375, -0.4062347412109375, -0.372100830078125, -0.3379669189453125, -0.3038330078125, -0.2696990966796875, -0.235565185546875, -0.2014312744140625, -0.16729736328125, -0.1331634521484375, -0.099029541015625, -0.0648956298828125, -0.03076171875, 0.0033721923828125, 0.037506103515625, 0.0716400146484375, 0.10577392578125, 0.1399078369140625, 0.174041748046875, 0.2081756591796875, 0.2423095703125, 0.2764434814453125, 0.310577392578125, 0.3447113037109375, 0.37884521484375, 0.4129791259765625, 0.447113037109375, 0.4812469482421875, 0.515380859375, 0.5495147705078125, 0.583648681640625, 0.6177825927734375, 0.65191650390625, 0.6860504150390625, 0.720184326171875, 0.7543182373046875, 0.7884521484375, 0.8225860595703125, 0.856719970703125, 0.8908538818359375, 0.92498779296875, 0.9591217041015625, 0.993255615234375, 1.0273895263671875, 1.0615234375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 4.0, 3.0, 9.0, 16.0, 18.0, 22.0, 40.0, 43.0, 67.0, 81.0, 121.0, 162.0, 112.0, 73.0, 46.0, 36.0, 27.0, 29.0, 15.0, 19.0, 16.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00026535987854003906, -0.00025716423988342285, -0.00024896860122680664, -0.00024077296257019043, -0.00023257732391357422, -0.000224381685256958, -0.0002161860466003418, -0.00020799040794372559, -0.00019979476928710938, -0.00019159913063049316, -0.00018340349197387695, -0.00017520785331726074, -0.00016701221466064453, -0.00015881657600402832, -0.0001506209373474121, -0.0001424252986907959, -0.0001342296600341797, -0.00012603402137756348, -0.00011783838272094727, -0.00010964274406433105, -0.00010144710540771484, -9.325146675109863e-05, -8.505582809448242e-05, -7.686018943786621e-05, -6.866455078125e-05, -6.046891212463379e-05, -5.227327346801758e-05, -4.407763481140137e-05, -3.5881996154785156e-05, -2.7686357498168945e-05, -1.9490718841552734e-05, -1.1295080184936523e-05, -3.0994415283203125e-06, 5.0961971282958984e-06, 1.329183578491211e-05, 2.148747444152832e-05, 2.968311309814453e-05, 3.787875175476074e-05, 4.607439041137695e-05, 5.4270029067993164e-05, 6.246566772460938e-05, 7.066130638122559e-05, 7.88569450378418e-05, 8.705258369445801e-05, 9.524822235107422e-05, 0.00010344386100769043, 0.00011163949966430664, 0.00011983513832092285, 0.00012803077697753906, 0.00013622641563415527, 0.00014442205429077148, 0.0001526176929473877, 0.0001608133316040039, 0.00016900897026062012, 0.00017720460891723633, 0.00018540024757385254, 0.00019359588623046875, 0.00020179152488708496, 0.00020998716354370117, 0.00021818280220031738, 0.0002263784408569336, 0.0002345740795135498, 0.00024276971817016602, 0.0002509653568267822, 0.00025916099548339844]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 7.0, 17.0, 24.0, 31.0, 69.0, 91.0, 200.0, 416.0, 771.0, 1686.0, 4321.0, 13250.0, 53576.0, 493683.0, 406540.0, 53159.0, 13118.0, 4247.0, 1699.0, 757.0, 385.0, 203.0, 121.0, 57.0, 34.0, 18.0, 24.0, 11.0, 1.0, 4.0, 2.0, 2.0, 7.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63427734375, -0.6098785400390625, -0.585479736328125, -0.5610809326171875, -0.53668212890625, -0.5122833251953125, -0.487884521484375, -0.4634857177734375, -0.4390869140625, -0.4146881103515625, -0.390289306640625, -0.3658905029296875, -0.34149169921875, -0.3170928955078125, -0.292694091796875, -0.2682952880859375, -0.243896484375, -0.2194976806640625, -0.195098876953125, -0.1707000732421875, -0.14630126953125, -0.1219024658203125, -0.097503662109375, -0.0731048583984375, -0.0487060546875, -0.0243072509765625, 9.1552734375e-05, 0.0244903564453125, 0.04888916015625, 0.0732879638671875, 0.097686767578125, 0.1220855712890625, 0.146484375, 0.1708831787109375, 0.195281982421875, 0.2196807861328125, 0.24407958984375, 0.2684783935546875, 0.292877197265625, 0.3172760009765625, 0.3416748046875, 0.3660736083984375, 0.390472412109375, 0.4148712158203125, 0.43927001953125, 0.4636688232421875, 0.488067626953125, 0.5124664306640625, 0.536865234375, 0.5612640380859375, 0.585662841796875, 0.6100616455078125, 0.63446044921875, 0.6588592529296875, 0.683258056640625, 0.7076568603515625, 0.7320556640625, 0.7564544677734375, 0.780853271484375, 0.8052520751953125, 0.82965087890625, 0.8540496826171875, 0.878448486328125, 0.9028472900390625, 0.92724609375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 11.0, 5.0, 9.0, 10.0, 12.0, 13.0, 18.0, 21.0, 36.0, 57.0, 66.0, 81.0, 100.0, 124.0, 96.0, 86.0, 53.0, 59.0, 36.0, 22.0, 16.0, 16.0, 9.0, 6.0, 10.0, 7.0, 3.0, 0.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.67431640625, -0.6547927856445312, -0.6352691650390625, -0.6157455444335938, -0.596221923828125, -0.5766983032226562, -0.5571746826171875, -0.5376510620117188, -0.51812744140625, -0.49860382080078125, -0.4790802001953125, -0.45955657958984375, -0.440032958984375, -0.42050933837890625, -0.4009857177734375, -0.38146209716796875, -0.3619384765625, -0.34241485595703125, -0.3228912353515625, -0.30336761474609375, -0.283843994140625, -0.26432037353515625, -0.2447967529296875, -0.22527313232421875, -0.20574951171875, -0.18622589111328125, -0.1667022705078125, -0.14717864990234375, -0.127655029296875, -0.10813140869140625, -0.0886077880859375, -0.06908416748046875, -0.049560546875, -0.03003692626953125, -0.0105133056640625, 0.00901031494140625, 0.028533935546875, 0.04805755615234375, 0.0675811767578125, 0.08710479736328125, 0.10662841796875, 0.12615203857421875, 0.1456756591796875, 0.16519927978515625, 0.184722900390625, 0.20424652099609375, 0.2237701416015625, 0.24329376220703125, 0.2628173828125, 0.28234100341796875, 0.3018646240234375, 0.32138824462890625, 0.340911865234375, 0.36043548583984375, 0.3799591064453125, 0.39948272705078125, 0.41900634765625, 0.43852996826171875, 0.4580535888671875, 0.47757720947265625, 0.497100830078125, 0.5166244506835938, 0.5361480712890625, 0.5556716918945312, 0.5751953125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 7.0, 12.0, 13.0, 31.0, 78.0, 130.0, 258.0, 237.0, 119.0, 52.0, 27.0, 19.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.34766960144043, -14.835050582885742, -14.322432518005371, -13.809813499450684, -13.297195434570312, -12.784576416015625, -12.271957397460938, -11.75933837890625, -11.246720314025879, -10.734101295471191, -10.22148323059082, -9.708864212036133, -9.196245193481445, -8.683627128601074, -8.171008110046387, -7.658389568328857, -7.145771026611328, -6.633152484893799, -6.1205339431762695, -5.607914924621582, -5.095296382904053, -4.582677841186523, -4.070058822631836, -3.5574402809143066, -3.0448217391967773, -2.532203197479248, -2.0195844173431396, -1.5069657564163208, -0.994347095489502, -0.48172855377197266, 0.030890226364135742, 0.5435090065002441, 1.0561256408691406, 1.5687443017959595, 2.0813629627227783, 2.5939817428588867, 3.106600284576416, 3.6192188262939453, 4.131837844848633, 4.644456386566162, 5.157074928283691, 5.669693470001221, 6.18231201171875, 6.6949310302734375, 7.207549571990967, 7.720168113708496, 8.232787132263184, 8.745405197143555, 9.258024215698242, 9.77064323425293, 10.2832612991333, 10.795880317687988, 11.30849838256836, 11.821117401123047, 12.333736419677734, 12.846355438232422, 13.358973503112793, 13.87159252166748, 14.384210586547852, 14.896829605102539, 15.409448623657227, 15.922066688537598, 16.43468475341797, 16.947303771972656, 17.459922790527344]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 1.0, 3.0, 3.0, 3.0, 6.0, 11.0, 11.0, 15.0, 13.0, 16.0, 16.0, 25.0, 16.0, 31.0, 25.0, 40.0, 34.0, 33.0, 48.0, 64.0, 78.0, 71.0, 69.0, 51.0, 40.0, 37.0, 37.0, 22.0, 30.0, 12.0, 20.0, 20.0, 16.0, 15.0, 9.0, 9.0, 8.0, 12.0, 4.0, 8.0, 6.0, 3.0, 2.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-8.77496337890625, -8.524949073791504, -8.274934768676758, -8.024920463562012, -7.774906635284424, -7.524892330169678, -7.27487850189209, -7.024864196777344, -6.774849891662598, -6.524835586547852, -6.2748212814331055, -6.024807453155518, -5.7747931480407715, -5.524778842926025, -5.2747650146484375, -5.024750709533691, -4.774736404418945, -4.524722099304199, -4.274707794189453, -4.024693965911865, -3.774679660797119, -3.524665355682373, -3.274651288986206, -3.024637222290039, -2.774622917175293, -2.524608612060547, -2.27459454536438, -2.024580478668213, -1.7745661735534668, -1.5245519876480103, -1.2745378017425537, -1.0245236158370972, -0.7745099067687988, -0.5244957208633423, -0.27448153495788574, -0.0244673490524292, 0.22554683685302734, 0.4755610227584839, 0.7255752086639404, 0.975589394569397, 1.2256035804748535, 1.47561776638031, 1.7256319522857666, 1.9756461381912231, 2.2256603240966797, 2.475674629211426, 2.7256886959075928, 2.9757027626037598, 3.225717067718506, 3.475731372833252, 3.725745439529419, 3.975759506225586, 4.225773811340332, 4.475788116455078, 4.725802421569824, 4.975816249847412, 5.225830554962158, 5.475844860076904, 5.725858688354492, 5.975872993469238, 6.225887298583984, 6.4759016036987305, 6.725915908813477, 6.9759297370910645, 7.2259440422058105]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 4.0, 5.0, 5.0, 3.0, 9.0, 7.0, 16.0, 12.0, 20.0, 36.0, 41.0, 73.0, 106.0, 225.0, 329.0, 654.0, 1633.0, 5624.0, 50455.0, 3909323.0, 211631.0, 9709.0, 2385.0, 942.0, 447.0, 228.0, 129.0, 79.0, 52.0, 33.0, 23.0, 17.0, 15.0, 8.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.85546875, -2.78521728515625, -2.7149658203125, -2.64471435546875, -2.574462890625, -2.50421142578125, -2.4339599609375, -2.36370849609375, -2.29345703125, -2.22320556640625, -2.1529541015625, -2.08270263671875, -2.012451171875, -1.94219970703125, -1.8719482421875, -1.80169677734375, -1.7314453125, -1.66119384765625, -1.5909423828125, -1.52069091796875, -1.450439453125, -1.38018798828125, -1.3099365234375, -1.23968505859375, -1.16943359375, -1.09918212890625, -1.0289306640625, -0.95867919921875, -0.888427734375, -0.81817626953125, -0.7479248046875, -0.67767333984375, -0.607421875, -0.53717041015625, -0.4669189453125, -0.39666748046875, -0.326416015625, -0.25616455078125, -0.1859130859375, -0.11566162109375, -0.04541015625, 0.02484130859375, 0.0950927734375, 0.16534423828125, 0.235595703125, 0.30584716796875, 0.3760986328125, 0.44635009765625, 0.5166015625, 0.58685302734375, 0.6571044921875, 0.72735595703125, 0.797607421875, 0.86785888671875, 0.9381103515625, 1.00836181640625, 1.07861328125, 1.14886474609375, 1.2191162109375, 1.28936767578125, 1.359619140625, 1.42987060546875, 1.5001220703125, 1.57037353515625, 1.640625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 9.0, 9.0, 8.0, 15.0, 15.0, 22.0, 21.0, 25.0, 34.0, 37.0, 43.0, 50.0, 46.0, 65.0, 61.0, 69.0, 64.0, 50.0, 66.0, 45.0, 40.0, 39.0, 35.0, 26.0, 20.0, 19.0, 14.0, 11.0, 5.0, 10.0, 9.0, 9.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.6259765625, -0.6096229553222656, -0.5932693481445312, -0.5769157409667969, -0.5605621337890625, -0.5442085266113281, -0.5278549194335938, -0.5115013122558594, -0.495147705078125, -0.4787940979003906, -0.46244049072265625, -0.4460868835449219, -0.4297332763671875, -0.4133796691894531, -0.39702606201171875, -0.3806724548339844, -0.36431884765625, -0.3479652404785156, -0.33161163330078125, -0.3152580261230469, -0.2989044189453125, -0.2825508117675781, -0.26619720458984375, -0.24984359741210938, -0.233489990234375, -0.21713638305664062, -0.20078277587890625, -0.18442916870117188, -0.1680755615234375, -0.15172195434570312, -0.13536834716796875, -0.11901473999023438, -0.1026611328125, -0.08630752563476562, -0.06995391845703125, -0.053600311279296875, -0.0372467041015625, -0.020893096923828125, -0.00453948974609375, 0.011814117431640625, 0.028167724609375, 0.044521331787109375, 0.06087493896484375, 0.07722854614257812, 0.0935821533203125, 0.10993576049804688, 0.12628936767578125, 0.14264297485351562, 0.15899658203125, 0.17535018920898438, 0.19170379638671875, 0.20805740356445312, 0.2244110107421875, 0.24076461791992188, 0.25711822509765625, 0.2734718322753906, 0.289825439453125, 0.3061790466308594, 0.32253265380859375, 0.3388862609863281, 0.3552398681640625, 0.3715934753417969, 0.38794708251953125, 0.4043006896972656, 0.420654296875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 0.0, 4.0, 7.0, 9.0, 21.0, 29.0, 36.0, 64.0, 92.0, 171.0, 355.0, 866.0, 3130.0, 27713.0, 4080976.0, 74068.0, 4630.0, 1154.0, 415.0, 206.0, 143.0, 67.0, 48.0, 28.0, 21.0, 13.0, 7.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.26953125, -4.138671875, -4.0078125, -3.876953125, -3.74609375, -3.615234375, -3.484375, -3.353515625, -3.22265625, -3.091796875, -2.9609375, -2.830078125, -2.69921875, -2.568359375, -2.4375, -2.306640625, -2.17578125, -2.044921875, -1.9140625, -1.783203125, -1.65234375, -1.521484375, -1.390625, -1.259765625, -1.12890625, -0.998046875, -0.8671875, -0.736328125, -0.60546875, -0.474609375, -0.34375, -0.212890625, -0.08203125, 0.048828125, 0.1796875, 0.310546875, 0.44140625, 0.572265625, 0.703125, 0.833984375, 0.96484375, 1.095703125, 1.2265625, 1.357421875, 1.48828125, 1.619140625, 1.75, 1.880859375, 2.01171875, 2.142578125, 2.2734375, 2.404296875, 2.53515625, 2.666015625, 2.796875, 2.927734375, 3.05859375, 3.189453125, 3.3203125, 3.451171875, 3.58203125, 3.712890625, 3.84375, 3.974609375, 4.10546875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 6.0, 7.0, 12.0, 22.0, 59.0, 103.0, 424.0, 1872.0, 1188.0, 232.0, 81.0, 35.0, 14.0, 10.0, 5.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.94921875, -4.841094970703125, -4.73297119140625, -4.624847412109375, -4.5167236328125, -4.408599853515625, -4.30047607421875, -4.192352294921875, -4.084228515625, -3.976104736328125, -3.86798095703125, -3.759857177734375, -3.6517333984375, -3.543609619140625, -3.43548583984375, -3.327362060546875, -3.21923828125, -3.111114501953125, -3.00299072265625, -2.894866943359375, -2.7867431640625, -2.678619384765625, -2.57049560546875, -2.462371826171875, -2.354248046875, -2.246124267578125, -2.13800048828125, -2.029876708984375, -1.9217529296875, -1.813629150390625, -1.70550537109375, -1.597381591796875, -1.4892578125, -1.381134033203125, -1.27301025390625, -1.164886474609375, -1.0567626953125, -0.948638916015625, -0.84051513671875, -0.732391357421875, -0.624267578125, -0.516143798828125, -0.40802001953125, -0.299896240234375, -0.1917724609375, -0.083648681640625, 0.02447509765625, 0.132598876953125, 0.24072265625, 0.348846435546875, 0.45697021484375, 0.565093994140625, 0.6732177734375, 0.781341552734375, 0.88946533203125, 0.997589111328125, 1.105712890625, 1.213836669921875, 1.32196044921875, 1.430084228515625, 1.5382080078125, 1.646331787109375, 1.75445556640625, 1.862579345703125, 1.970703125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 2.0, 10.0, 12.0, 30.0, 41.0, 84.0, 130.0, 216.0, 190.0, 124.0, 77.0, 37.0, 21.0, 10.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.27149486541748, -13.719356536865234, -13.167217254638672, -12.615078926086426, -12.06294059753418, -11.510801315307617, -10.958662986755371, -10.406524658203125, -9.854385375976562, -9.302247047424316, -8.750107765197754, -8.197969436645508, -7.6458306312561035, -7.093691825866699, -6.541553497314453, -5.989414691925049, -5.4372758865356445, -4.88513708114624, -4.332998275756836, -3.78085994720459, -3.2287211418151855, -2.6765823364257812, -2.124443769454956, -1.5723052024841309, -1.0201663970947266, -0.4680277109146118, 0.08411097526550293, 0.6362496614456177, 1.1883883476257324, 1.7405271530151367, 2.292665719985962, 2.844804286956787, 3.396942138671875, 3.9490809440612793, 4.501219749450684, 5.05335807800293, 5.605496883392334, 6.157635688781738, 6.709774017333984, 7.261912822723389, 7.814051628112793, 8.366189956665039, 8.918329238891602, 9.470467567443848, 10.022605895996094, 10.574745178222656, 11.126883506774902, 11.679021835327148, 12.231161117553711, 12.783299446105957, 13.33543872833252, 13.887577056884766, 14.439716339111328, 14.991854667663574, 15.54399299621582, 16.096132278442383, 16.648269653320312, 17.200408935546875, 17.752546310424805, 18.304685592651367, 18.85682487487793, 19.40896224975586, 19.961101531982422, 20.513240814208984, 21.065380096435547]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 11.0, 9.0, 10.0, 7.0, 16.0, 21.0, 14.0, 17.0, 29.0, 29.0, 26.0, 35.0, 28.0, 33.0, 41.0, 39.0, 63.0, 56.0, 71.0, 63.0, 49.0, 47.0, 44.0, 35.0, 27.0, 29.0, 26.0, 22.0, 22.0, 20.0, 13.0, 10.0, 11.0, 3.0, 10.0, 3.0, 3.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.990432262420654, -6.754762649536133, -6.5190935134887695, -6.283424377441406, -6.047754764556885, -5.812085151672363, -5.576416015625, -5.340746879577637, -5.105077266693115, -4.869407653808594, -4.6337385177612305, -4.398069381713867, -4.162399768829346, -3.9267303943634033, -3.691061019897461, -3.4553916454315186, -3.219722270965576, -2.984052896499634, -2.7483835220336914, -2.512714147567749, -2.2770447731018066, -2.0413753986358643, -1.8057060241699219, -1.5700366497039795, -1.334367275238037, -1.0986979007720947, -0.8630285263061523, -0.62735915184021, -0.3916897773742676, -0.1560204029083252, 0.07964897155761719, 0.31531834602355957, 0.5509881973266602, 0.7866575717926025, 1.022326946258545, 1.2579963207244873, 1.4936656951904297, 1.729335069656372, 1.9650044441223145, 2.200673818588257, 2.436343193054199, 2.6720125675201416, 2.907681941986084, 3.1433513164520264, 3.3790206909179688, 3.614690065383911, 3.8503594398498535, 4.086029052734375, 4.321698188781738, 4.557367324829102, 4.793036937713623, 5.0287065505981445, 5.264375686645508, 5.500044822692871, 5.735714435577393, 5.971384048461914, 6.207053184509277, 6.442722320556641, 6.678391933441162, 6.914061546325684, 7.149730682373047, 7.38539981842041, 7.621069431304932, 7.856739044189453, 8.092408180236816]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 5.0, 6.0, 12.0, 13.0, 20.0, 24.0, 48.0, 79.0, 114.0, 194.0, 360.0, 553.0, 1060.0, 1999.0, 4006.0, 8065.0, 17660.0, 41354.0, 109146.0, 316606.0, 344854.0, 120220.0, 45260.0, 19038.0, 8897.0, 4226.0, 2117.0, 1122.0, 629.0, 326.0, 194.0, 133.0, 75.0, 54.0, 23.0, 25.0, 13.0, 12.0, 3.0, 7.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6171875, -0.591522216796875, -0.56585693359375, -0.540191650390625, -0.5145263671875, -0.488861083984375, -0.46319580078125, -0.437530517578125, -0.411865234375, -0.386199951171875, -0.36053466796875, -0.334869384765625, -0.3092041015625, -0.283538818359375, -0.25787353515625, -0.232208251953125, -0.20654296875, -0.180877685546875, -0.15521240234375, -0.129547119140625, -0.1038818359375, -0.078216552734375, -0.05255126953125, -0.026885986328125, -0.001220703125, 0.024444580078125, 0.05010986328125, 0.075775146484375, 0.1014404296875, 0.127105712890625, 0.15277099609375, 0.178436279296875, 0.2041015625, 0.229766845703125, 0.25543212890625, 0.281097412109375, 0.3067626953125, 0.332427978515625, 0.35809326171875, 0.383758544921875, 0.409423828125, 0.435089111328125, 0.46075439453125, 0.486419677734375, 0.5120849609375, 0.537750244140625, 0.56341552734375, 0.589080810546875, 0.61474609375, 0.640411376953125, 0.66607666015625, 0.691741943359375, 0.7174072265625, 0.743072509765625, 0.76873779296875, 0.794403076171875, 0.820068359375, 0.845733642578125, 0.87139892578125, 0.897064208984375, 0.9227294921875, 0.948394775390625, 0.97406005859375, 0.999725341796875, 1.025390625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 5.0, 5.0, 5.0, 8.0, 6.0, 6.0, 17.0, 20.0, 20.0, 23.0, 33.0, 49.0, 34.0, 41.0, 50.0, 49.0, 46.0, 58.0, 45.0, 58.0, 55.0, 50.0, 58.0, 46.0, 50.0, 39.0, 22.0, 22.0, 22.0, 14.0, 11.0, 11.0, 4.0, 3.0, 4.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.78173828125, -0.7617149353027344, -0.7416915893554688, -0.7216682434082031, -0.7016448974609375, -0.6816215515136719, -0.6615982055664062, -0.6415748596191406, -0.621551513671875, -0.6015281677246094, -0.5815048217773438, -0.5614814758300781, -0.5414581298828125, -0.5214347839355469, -0.5014114379882812, -0.4813880920410156, -0.46136474609375, -0.4413414001464844, -0.42131805419921875, -0.4012947082519531, -0.3812713623046875, -0.3612480163574219, -0.34122467041015625, -0.3212013244628906, -0.301177978515625, -0.2811546325683594, -0.26113128662109375, -0.24110794067382812, -0.2210845947265625, -0.20106124877929688, -0.18103790283203125, -0.16101455688476562, -0.1409912109375, -0.12096786499023438, -0.10094451904296875, -0.08092117309570312, -0.0608978271484375, -0.040874481201171875, -0.02085113525390625, -0.000827789306640625, 0.019195556640625, 0.039218902587890625, 0.05924224853515625, 0.07926559448242188, 0.0992889404296875, 0.11931228637695312, 0.13933563232421875, 0.15935897827148438, 0.17938232421875, 0.19940567016601562, 0.21942901611328125, 0.23945236206054688, 0.2594757080078125, 0.2794990539550781, 0.29952239990234375, 0.3195457458496094, 0.339569091796875, 0.3595924377441406, 0.37961578369140625, 0.3996391296386719, 0.4196624755859375, 0.4396858215332031, 0.45970916748046875, 0.4797325134277344, 0.499755859375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 4.0, 5.0, 7.0, 11.0, 12.0, 16.0, 13.0, 32.0, 33.0, 45.0, 70.0, 83.0, 137.0, 181.0, 292.0, 489.0, 874.0, 1725.0, 4340.0, 14180.0, 65679.0, 692736.0, 220223.0, 33101.0, 8267.0, 2864.0, 1289.0, 630.0, 387.0, 241.0, 174.0, 101.0, 99.0, 55.0, 34.0, 31.0, 19.0, 16.0, 14.0, 12.0, 7.0, 7.0, 7.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.806640625, -1.74981689453125, -1.6929931640625, -1.63616943359375, -1.579345703125, -1.52252197265625, -1.4656982421875, -1.40887451171875, -1.35205078125, -1.29522705078125, -1.2384033203125, -1.18157958984375, -1.124755859375, -1.06793212890625, -1.0111083984375, -0.95428466796875, -0.8974609375, -0.84063720703125, -0.7838134765625, -0.72698974609375, -0.670166015625, -0.61334228515625, -0.5565185546875, -0.49969482421875, -0.44287109375, -0.38604736328125, -0.3292236328125, -0.27239990234375, -0.215576171875, -0.15875244140625, -0.1019287109375, -0.04510498046875, 0.01171875, 0.06854248046875, 0.1253662109375, 0.18218994140625, 0.239013671875, 0.29583740234375, 0.3526611328125, 0.40948486328125, 0.46630859375, 0.52313232421875, 0.5799560546875, 0.63677978515625, 0.693603515625, 0.75042724609375, 0.8072509765625, 0.86407470703125, 0.9208984375, 0.97772216796875, 1.0345458984375, 1.09136962890625, 1.148193359375, 1.20501708984375, 1.2618408203125, 1.31866455078125, 1.37548828125, 1.43231201171875, 1.4891357421875, 1.54595947265625, 1.602783203125, 1.65960693359375, 1.7164306640625, 1.77325439453125, 1.830078125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 7.0, 7.0, 10.0, 10.0, 8.0, 12.0, 21.0, 15.0, 17.0, 29.0, 27.0, 42.0, 47.0, 51.0, 59.0, 51.0, 47.0, 63.0, 44.0, 53.0, 60.0, 51.0, 32.0, 38.0, 31.0, 26.0, 20.0, 26.0, 22.0, 16.0, 15.0, 13.0, 2.0, 11.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0], "bins": [-2.755859375, -2.6802978515625, -2.604736328125, -2.5291748046875, -2.45361328125, -2.3780517578125, -2.302490234375, -2.2269287109375, -2.1513671875, -2.0758056640625, -2.000244140625, -1.9246826171875, -1.84912109375, -1.7735595703125, -1.697998046875, -1.6224365234375, -1.546875, -1.4713134765625, -1.395751953125, -1.3201904296875, -1.24462890625, -1.1690673828125, -1.093505859375, -1.0179443359375, -0.9423828125, -0.8668212890625, -0.791259765625, -0.7156982421875, -0.64013671875, -0.5645751953125, -0.489013671875, -0.4134521484375, -0.337890625, -0.2623291015625, -0.186767578125, -0.1112060546875, -0.03564453125, 0.0399169921875, 0.115478515625, 0.1910400390625, 0.2666015625, 0.3421630859375, 0.417724609375, 0.4932861328125, 0.56884765625, 0.6444091796875, 0.719970703125, 0.7955322265625, 0.87109375, 0.9466552734375, 1.022216796875, 1.0977783203125, 1.17333984375, 1.2489013671875, 1.324462890625, 1.4000244140625, 1.4755859375, 1.5511474609375, 1.626708984375, 1.7022705078125, 1.77783203125, 1.8533935546875, 1.928955078125, 2.0045166015625, 2.080078125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 10.0, 14.0, 1.0, 16.0, 22.0, 19.0, 33.0, 50.0, 53.0, 77.0, 119.0, 118.0, 192.0, 316.0, 398.0, 710.0, 1012.0, 1733.0, 3217.0, 6787.0, 16653.0, 53484.0, 321055.0, 552090.0, 57176.0, 17677.0, 7100.0, 3387.0, 1769.0, 1063.0, 702.0, 428.0, 297.0, 219.0, 145.0, 102.0, 79.0, 47.0, 59.0, 34.0, 35.0, 20.0, 8.0, 8.0, 7.0, 4.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.79345703125, -0.7694320678710938, -0.7454071044921875, -0.7213821411132812, -0.697357177734375, -0.6733322143554688, -0.6493072509765625, -0.6252822875976562, -0.60125732421875, -0.5772323608398438, -0.5532073974609375, -0.5291824340820312, -0.505157470703125, -0.48113250732421875, -0.4571075439453125, -0.43308258056640625, -0.4090576171875, -0.38503265380859375, -0.3610076904296875, -0.33698272705078125, -0.312957763671875, -0.28893280029296875, -0.2649078369140625, -0.24088287353515625, -0.21685791015625, -0.19283294677734375, -0.1688079833984375, -0.14478302001953125, -0.120758056640625, -0.09673309326171875, -0.0727081298828125, -0.04868316650390625, -0.024658203125, -0.00063323974609375, 0.0233917236328125, 0.04741668701171875, 0.071441650390625, 0.09546661376953125, 0.1194915771484375, 0.14351654052734375, 0.16754150390625, 0.19156646728515625, 0.2155914306640625, 0.23961639404296875, 0.263641357421875, 0.28766632080078125, 0.3116912841796875, 0.33571624755859375, 0.3597412109375, 0.38376617431640625, 0.4077911376953125, 0.43181610107421875, 0.455841064453125, 0.47986602783203125, 0.5038909912109375, 0.5279159545898438, 0.55194091796875, 0.5759658813476562, 0.5999908447265625, 0.6240158081054688, 0.648040771484375, 0.6720657348632812, 0.6960906982421875, 0.7201156616210938, 0.744140625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 9.0, 8.0, 12.0, 18.0, 25.0, 27.0, 41.0, 78.0, 128.0, 248.0, 169.0, 91.0, 60.0, 23.0, 21.0, 11.0, 8.0, 7.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005178451538085938, -0.0005004033446311951, -0.0004829615354537964, -0.0004655197262763977, -0.000448077917098999, -0.00043063610792160034, -0.00041319429874420166, -0.000395752489566803, -0.0003783106803894043, -0.0003608688712120056, -0.00034342706203460693, -0.00032598525285720825, -0.00030854344367980957, -0.0002911016345024109, -0.0002736598253250122, -0.0002562180161476135, -0.00023877620697021484, -0.00022133439779281616, -0.00020389258861541748, -0.0001864507794380188, -0.00016900897026062012, -0.00015156716108322144, -0.00013412535190582275, -0.00011668354272842407, -9.924173355102539e-05, -8.179992437362671e-05, -6.435811519622803e-05, -4.6916306018829346e-05, -2.9474496841430664e-05, -1.2032687664031982e-05, 5.409121513366699e-06, 2.285093069076538e-05, 4.029273986816406e-05, 5.7734549045562744e-05, 7.517635822296143e-05, 9.261816740036011e-05, 0.00011005997657775879, 0.00012750178575515747, 0.00014494359493255615, 0.00016238540410995483, 0.00017982721328735352, 0.0001972690224647522, 0.00021471083164215088, 0.00023215264081954956, 0.00024959444999694824, 0.0002670362591743469, 0.0002844780683517456, 0.0003019198775291443, 0.00031936168670654297, 0.00033680349588394165, 0.00035424530506134033, 0.000371687114238739, 0.0003891289234161377, 0.0004065707325935364, 0.00042401254177093506, 0.00044145435094833374, 0.0004588961601257324, 0.0004763379693031311, 0.0004937797784805298, 0.0005112215876579285, 0.0005286633968353271, 0.0005461052060127258, 0.0005635470151901245, 0.0005809888243675232, 0.0005984306335449219]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 9.0, 2.0, 4.0, 11.0, 18.0, 28.0, 39.0, 71.0, 100.0, 177.0, 375.0, 774.0, 2002.0, 6425.0, 28169.0, 252772.0, 701438.0, 42924.0, 8739.0, 2523.0, 952.0, 464.0, 230.0, 102.0, 64.0, 37.0, 28.0, 21.0, 13.0, 14.0, 7.0, 8.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0712890625, -1.0331878662109375, -0.995086669921875, -0.9569854736328125, -0.91888427734375, -0.8807830810546875, -0.842681884765625, -0.8045806884765625, -0.7664794921875, -0.7283782958984375, -0.690277099609375, -0.6521759033203125, -0.61407470703125, -0.5759735107421875, -0.537872314453125, -0.4997711181640625, -0.461669921875, -0.4235687255859375, -0.385467529296875, -0.3473663330078125, -0.30926513671875, -0.2711639404296875, -0.233062744140625, -0.1949615478515625, -0.1568603515625, -0.1187591552734375, -0.080657958984375, -0.0425567626953125, -0.00445556640625, 0.0336456298828125, 0.071746826171875, 0.1098480224609375, 0.14794921875, 0.1860504150390625, 0.224151611328125, 0.2622528076171875, 0.30035400390625, 0.3384552001953125, 0.376556396484375, 0.4146575927734375, 0.4527587890625, 0.4908599853515625, 0.528961181640625, 0.5670623779296875, 0.60516357421875, 0.6432647705078125, 0.681365966796875, 0.7194671630859375, 0.757568359375, 0.7956695556640625, 0.833770751953125, 0.8718719482421875, 0.90997314453125, 0.9480743408203125, 0.986175537109375, 1.0242767333984375, 1.0623779296875, 1.1004791259765625, 1.138580322265625, 1.1766815185546875, 1.21478271484375, 1.2528839111328125, 1.290985107421875, 1.3290863037109375, 1.3671875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 8.0, 6.0, 9.0, 12.0, 25.0, 16.0, 26.0, 40.0, 47.0, 64.0, 107.0, 132.0, 116.0, 96.0, 72.0, 56.0, 35.0, 32.0, 21.0, 18.0, 13.0, 15.0, 8.0, 6.0, 8.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.123046875, -1.0950393676757812, -1.0670318603515625, -1.0390243530273438, -1.011016845703125, -0.9830093383789062, -0.9550018310546875, -0.9269943237304688, -0.89898681640625, -0.8709793090820312, -0.8429718017578125, -0.8149642944335938, -0.786956787109375, -0.7589492797851562, -0.7309417724609375, -0.7029342651367188, -0.6749267578125, -0.6469192504882812, -0.6189117431640625, -0.5909042358398438, -0.562896728515625, -0.5348892211914062, -0.5068817138671875, -0.47887420654296875, -0.45086669921875, -0.42285919189453125, -0.3948516845703125, -0.36684417724609375, -0.338836669921875, -0.31082916259765625, -0.2828216552734375, -0.25481414794921875, -0.226806640625, -0.19879913330078125, -0.1707916259765625, -0.14278411865234375, -0.114776611328125, -0.08676910400390625, -0.0587615966796875, -0.03075408935546875, -0.00274658203125, 0.02526092529296875, 0.0532684326171875, 0.08127593994140625, 0.109283447265625, 0.13729095458984375, 0.1652984619140625, 0.19330596923828125, 0.2213134765625, 0.24932098388671875, 0.2773284912109375, 0.30533599853515625, 0.333343505859375, 0.36135101318359375, 0.3893585205078125, 0.41736602783203125, 0.44537353515625, 0.47338104248046875, 0.5013885498046875, 0.5293960571289062, 0.557403564453125, 0.5854110717773438, 0.6134185791015625, 0.6414260864257812, 0.66943359375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 8.0, 16.0, 53.0, 140.0, 480.0, 232.0, 63.0, 5.0, 9.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.801151275634766, -45.6234245300293, -44.44569778442383, -43.26797103881836, -42.090248107910156, -40.91252136230469, -39.73479461669922, -38.55706787109375, -37.37934112548828, -36.20161437988281, -35.023887634277344, -33.846160888671875, -32.668434143066406, -31.49070930480957, -30.312984466552734, -29.135257720947266, -27.957530975341797, -26.779804229736328, -25.60207748413086, -24.424352645874023, -23.246625900268555, -22.068899154663086, -20.89117431640625, -19.71344757080078, -18.535720825195312, -17.357994079589844, -16.180267333984375, -15.002542495727539, -13.82481575012207, -12.647089004516602, -11.46936321258545, -10.291637420654297, -9.113910675048828, -7.936184406280518, -6.758458137512207, -5.5807318687438965, -4.403005599975586, -3.2252793312072754, -2.047553062438965, -0.8698272705078125, 0.30789947509765625, 1.4856257438659668, 2.6633520126342773, 3.841078281402588, 5.018804550170898, 6.196530818939209, 7.3742570877075195, 8.551982879638672, 9.72970962524414, 10.90743637084961, 12.085162162780762, 13.262887954711914, 14.440614700317383, 15.618341445922852, 16.796066284179688, 17.973793029785156, 19.151519775390625, 20.329246520996094, 21.506973266601562, 22.6846981048584, 23.862424850463867, 25.040151596069336, 26.217876434326172, 27.39560317993164, 28.57332992553711]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 6.0, 14.0, 10.0, 23.0, 12.0, 23.0, 30.0, 31.0, 21.0, 27.0, 27.0, 33.0, 30.0, 43.0, 56.0, 102.0, 110.0, 61.0, 49.0, 31.0, 33.0, 30.0, 26.0, 18.0, 19.0, 21.0, 12.0, 11.0, 17.0, 11.0, 17.0, 10.0, 5.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-9.112117767333984, -8.818464279174805, -8.524810791015625, -8.231157302856445, -7.937503814697266, -7.643850326538086, -7.350196838378906, -7.056543350219727, -6.762889862060547, -6.469236373901367, -6.1755828857421875, -5.881929397583008, -5.588275909423828, -5.294622421264648, -5.000968933105469, -4.707315444946289, -4.413661956787109, -4.12000846862793, -3.82635498046875, -3.5327014923095703, -3.2390480041503906, -2.945394515991211, -2.6517410278320312, -2.3580875396728516, -2.064434051513672, -1.7707805633544922, -1.4771270751953125, -1.1834735870361328, -0.8898200988769531, -0.5961666107177734, -0.30251312255859375, -0.008859634399414062, 0.2847938537597656, 0.5784473419189453, 0.872100830078125, 1.1657543182373047, 1.4594078063964844, 1.753061294555664, 2.0467147827148438, 2.3403682708740234, 2.634021759033203, 2.927675247192383, 3.2213287353515625, 3.514982223510742, 3.808635711669922, 4.102289199829102, 4.395942687988281, 4.689596176147461, 4.983249664306641, 5.27690315246582, 5.570556640625, 5.86421012878418, 6.157863616943359, 6.451517105102539, 6.745170593261719, 7.038824081420898, 7.332477569580078, 7.626131057739258, 7.9197845458984375, 8.213438034057617, 8.507091522216797, 8.800745010375977, 9.094398498535156, 9.388051986694336, 9.681705474853516]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 13.0, 7.0, 17.0, 14.0, 19.0, 25.0, 24.0, 43.0, 52.0, 92.0, 145.0, 221.0, 400.0, 629.0, 1079.0, 2005.0, 3759.0, 8700.0, 34004.0, 699625.0, 3214161.0, 196065.0, 19562.0, 6407.0, 3012.0, 1723.0, 955.0, 589.0, 348.0, 213.0, 146.0, 75.0, 44.0, 31.0, 22.0, 18.0, 9.0, 11.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.451171875, -1.4048309326171875, -1.358489990234375, -1.3121490478515625, -1.26580810546875, -1.2194671630859375, -1.173126220703125, -1.1267852783203125, -1.0804443359375, -1.0341033935546875, -0.987762451171875, -0.9414215087890625, -0.89508056640625, -0.8487396240234375, -0.802398681640625, -0.7560577392578125, -0.709716796875, -0.6633758544921875, -0.617034912109375, -0.5706939697265625, -0.52435302734375, -0.4780120849609375, -0.431671142578125, -0.3853302001953125, -0.3389892578125, -0.2926483154296875, -0.246307373046875, -0.1999664306640625, -0.15362548828125, -0.1072845458984375, -0.060943603515625, -0.0146026611328125, 0.03173828125, 0.0780792236328125, 0.124420166015625, 0.1707611083984375, 0.21710205078125, 0.2634429931640625, 0.309783935546875, 0.3561248779296875, 0.4024658203125, 0.4488067626953125, 0.495147705078125, 0.5414886474609375, 0.58782958984375, 0.6341705322265625, 0.680511474609375, 0.7268524169921875, 0.773193359375, 0.8195343017578125, 0.865875244140625, 0.9122161865234375, 0.95855712890625, 1.0048980712890625, 1.051239013671875, 1.0975799560546875, 1.1439208984375, 1.1902618408203125, 1.236602783203125, 1.2829437255859375, 1.32928466796875, 1.3756256103515625, 1.421966552734375, 1.4683074951171875, 1.5146484375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 4.0, 7.0, 5.0, 4.0, 14.0, 4.0, 12.0, 17.0, 19.0, 12.0, 19.0, 34.0, 30.0, 41.0, 27.0, 33.0, 39.0, 39.0, 42.0, 51.0, 32.0, 54.0, 46.0, 45.0, 45.0, 47.0, 49.0, 30.0, 35.0, 30.0, 24.0, 15.0, 23.0, 10.0, 20.0, 10.0, 7.0, 8.0, 5.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5263671875, -0.5102996826171875, -0.494232177734375, -0.4781646728515625, -0.46209716796875, -0.4460296630859375, -0.429962158203125, -0.4138946533203125, -0.3978271484375, -0.3817596435546875, -0.365692138671875, -0.3496246337890625, -0.33355712890625, -0.3174896240234375, -0.301422119140625, -0.2853546142578125, -0.269287109375, -0.2532196044921875, -0.237152099609375, -0.2210845947265625, -0.20501708984375, -0.1889495849609375, -0.172882080078125, -0.1568145751953125, -0.1407470703125, -0.1246795654296875, -0.108612060546875, -0.0925445556640625, -0.07647705078125, -0.0604095458984375, -0.044342041015625, -0.0282745361328125, -0.01220703125, 0.0038604736328125, 0.019927978515625, 0.0359954833984375, 0.05206298828125, 0.0681304931640625, 0.084197998046875, 0.1002655029296875, 0.1163330078125, 0.1324005126953125, 0.148468017578125, 0.1645355224609375, 0.18060302734375, 0.1966705322265625, 0.212738037109375, 0.2288055419921875, 0.244873046875, 0.2609405517578125, 0.277008056640625, 0.2930755615234375, 0.30914306640625, 0.3252105712890625, 0.341278076171875, 0.3573455810546875, 0.3734130859375, 0.3894805908203125, 0.405548095703125, 0.4216156005859375, 0.43768310546875, 0.4537506103515625, 0.469818115234375, 0.4858856201171875, 0.501953125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 4.0, 7.0, 4.0, 12.0, 27.0, 55.0, 126.0, 198.0, 477.0, 942.0, 3025.0, 33778.0, 4100633.0, 49277.0, 3687.0, 1091.0, 496.0, 222.0, 119.0, 40.0, 26.0, 19.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.953125, -4.79095458984375, -4.6287841796875, -4.46661376953125, -4.304443359375, -4.14227294921875, -3.9801025390625, -3.81793212890625, -3.65576171875, -3.49359130859375, -3.3314208984375, -3.16925048828125, -3.007080078125, -2.84490966796875, -2.6827392578125, -2.52056884765625, -2.3583984375, -2.19622802734375, -2.0340576171875, -1.87188720703125, -1.709716796875, -1.54754638671875, -1.3853759765625, -1.22320556640625, -1.06103515625, -0.89886474609375, -0.7366943359375, -0.57452392578125, -0.412353515625, -0.25018310546875, -0.0880126953125, 0.07415771484375, 0.236328125, 0.39849853515625, 0.5606689453125, 0.72283935546875, 0.885009765625, 1.04718017578125, 1.2093505859375, 1.37152099609375, 1.53369140625, 1.69586181640625, 1.8580322265625, 2.02020263671875, 2.182373046875, 2.34454345703125, 2.5067138671875, 2.66888427734375, 2.8310546875, 2.99322509765625, 3.1553955078125, 3.31756591796875, 3.479736328125, 3.64190673828125, 3.8040771484375, 3.96624755859375, 4.12841796875, 4.29058837890625, 4.4527587890625, 4.61492919921875, 4.777099609375, 4.93927001953125, 5.1014404296875, 5.26361083984375, 5.42578125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 7.0, 21.0, 48.0, 74.0, 201.0, 569.0, 1625.0, 1031.0, 277.0, 104.0, 45.0, 24.0, 15.0, 6.0, 7.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.861328125, -3.749908447265625, -3.63848876953125, -3.527069091796875, -3.4156494140625, -3.304229736328125, -3.19281005859375, -3.081390380859375, -2.969970703125, -2.858551025390625, -2.74713134765625, -2.635711669921875, -2.5242919921875, -2.412872314453125, -2.30145263671875, -2.190032958984375, -2.07861328125, -1.967193603515625, -1.85577392578125, -1.744354248046875, -1.6329345703125, -1.521514892578125, -1.41009521484375, -1.298675537109375, -1.187255859375, -1.075836181640625, -0.96441650390625, -0.852996826171875, -0.7415771484375, -0.630157470703125, -0.51873779296875, -0.407318115234375, -0.2958984375, -0.184478759765625, -0.07305908203125, 0.038360595703125, 0.1497802734375, 0.261199951171875, 0.37261962890625, 0.484039306640625, 0.595458984375, 0.706878662109375, 0.81829833984375, 0.929718017578125, 1.0411376953125, 1.152557373046875, 1.26397705078125, 1.375396728515625, 1.48681640625, 1.598236083984375, 1.70965576171875, 1.821075439453125, 1.9324951171875, 2.043914794921875, 2.15533447265625, 2.266754150390625, 2.378173828125, 2.489593505859375, 2.60101318359375, 2.712432861328125, 2.8238525390625, 2.935272216796875, 3.04669189453125, 3.158111572265625, 3.26953125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 13.0, 12.0, 20.0, 28.0, 50.0, 94.0, 140.0, 196.0, 157.0, 113.0, 65.0, 40.0, 27.0, 13.0, 8.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.471111297607422, -11.894577026367188, -11.318042755126953, -10.741509437561035, -10.1649751663208, -9.588440895080566, -9.011907577514648, -8.435373306274414, -7.85883903503418, -7.282304763793945, -6.705770969390869, -6.129237174987793, -5.552702903747559, -4.976168632507324, -4.399634838104248, -3.823101043701172, -3.2465667724609375, -2.6700327396392822, -2.093498706817627, -1.5169646739959717, -0.9404306411743164, -0.36389660835266113, 0.21263742446899414, 0.7891712188720703, 1.3657054901123047, 1.94223952293396, 2.5187735557556152, 3.0953075885772705, 3.671841621398926, 4.24837589263916, 4.824909687042236, 5.4014434814453125, 5.977977752685547, 6.554512023925781, 7.131045818328857, 7.707579612731934, 8.284113883972168, 8.860648155212402, 9.43718147277832, 10.013715744018555, 10.590250015258789, 11.166784286499023, 11.743318557739258, 12.319851875305176, 12.89638614654541, 13.472920417785645, 14.049453735351562, 14.625988006591797, 15.202522277832031, 15.779056549072266, 16.3555908203125, 16.932125091552734, 17.50865936279297, 18.08519172668457, 18.661725997924805, 19.23826026916504, 19.814794540405273, 20.391328811645508, 20.967863082885742, 21.544397354125977, 22.120929718017578, 22.697463989257812, 23.273998260498047, 23.85053253173828, 24.427066802978516]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 6.0, 3.0, 4.0, 8.0, 6.0, 17.0, 15.0, 15.0, 29.0, 26.0, 31.0, 18.0, 42.0, 44.0, 47.0, 65.0, 55.0, 68.0, 63.0, 71.0, 46.0, 46.0, 44.0, 35.0, 33.0, 33.0, 20.0, 19.0, 14.0, 18.0, 15.0, 8.0, 9.0, 6.0, 4.0, 5.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.278467178344727, -7.967028617858887, -7.655590057373047, -7.344151496887207, -7.032712936401367, -6.721274375915527, -6.409836292266846, -6.098397731781006, -5.786959171295166, -5.475520610809326, -5.164082050323486, -4.8526434898376465, -4.541205406188965, -4.229766845703125, -3.918328285217285, -3.6068897247314453, -3.2954511642456055, -2.9840126037597656, -2.672574043273926, -2.361135721206665, -2.049697160720825, -1.7382586002349854, -1.426820158958435, -1.1153817176818848, -0.8039431571960449, -0.49250465631484985, -0.18106615543365479, 0.13037234544754028, 0.44181084632873535, 0.7532494068145752, 1.0646878480911255, 1.3761262893676758, 1.6875648498535156, 1.9990034103393555, 2.3104419708251953, 2.621880292892456, 2.933318853378296, 3.2447574138641357, 3.5561957359313965, 3.8676342964172363, 4.179072856903076, 4.490511417388916, 4.801949977874756, 5.113388538360596, 5.424826622009277, 5.736265182495117, 6.047703742980957, 6.359142303466797, 6.670580863952637, 6.982019424438477, 7.293457984924316, 7.604896545410156, 7.916335105895996, 8.227773666381836, 8.539212226867676, 8.850650787353516, 9.162088394165039, 9.473526954650879, 9.784965515136719, 10.096404075622559, 10.407842636108398, 10.719281196594238, 11.030719757080078, 11.342157363891602, 11.653596878051758]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 4.0, 16.0, 18.0, 9.0, 24.0, 47.0, 44.0, 73.0, 119.0, 186.0, 288.0, 383.0, 651.0, 1083.0, 1654.0, 2944.0, 5004.0, 9176.0, 17209.0, 34868.0, 77354.0, 193205.0, 369175.0, 187694.0, 75087.0, 34241.0, 16599.0, 9069.0, 4878.0, 2906.0, 1709.0, 1028.0, 690.0, 397.0, 249.0, 152.0, 101.0, 73.0, 38.0, 32.0, 26.0, 13.0, 15.0, 9.0, 6.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.0, -0.9692153930664062, -0.9384307861328125, -0.9076461791992188, -0.876861572265625, -0.8460769653320312, -0.8152923583984375, -0.7845077514648438, -0.75372314453125, -0.7229385375976562, -0.6921539306640625, -0.6613693237304688, -0.630584716796875, -0.5998001098632812, -0.5690155029296875, -0.5382308959960938, -0.5074462890625, -0.47666168212890625, -0.4458770751953125, -0.41509246826171875, -0.384307861328125, -0.35352325439453125, -0.3227386474609375, -0.29195404052734375, -0.26116943359375, -0.23038482666015625, -0.1996002197265625, -0.16881561279296875, -0.138031005859375, -0.10724639892578125, -0.0764617919921875, -0.04567718505859375, -0.014892578125, 0.01589202880859375, 0.0466766357421875, 0.07746124267578125, 0.108245849609375, 0.13903045654296875, 0.1698150634765625, 0.20059967041015625, 0.23138427734375, 0.26216888427734375, 0.2929534912109375, 0.32373809814453125, 0.354522705078125, 0.38530731201171875, 0.4160919189453125, 0.44687652587890625, 0.4776611328125, 0.5084457397460938, 0.5392303466796875, 0.5700149536132812, 0.600799560546875, 0.6315841674804688, 0.6623687744140625, 0.6931533813476562, 0.72393798828125, 0.7547225952148438, 0.7855072021484375, 0.8162918090820312, 0.847076416015625, 0.8778610229492188, 0.9086456298828125, 0.9394302368164062, 0.97021484375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 8.0, 7.0, 5.0, 14.0, 9.0, 12.0, 12.0, 13.0, 18.0, 34.0, 25.0, 24.0, 41.0, 32.0, 31.0, 45.0, 42.0, 39.0, 37.0, 45.0, 52.0, 53.0, 51.0, 49.0, 29.0, 46.0, 22.0, 37.0, 40.0, 22.0, 19.0, 14.0, 12.0, 16.0, 9.0, 7.0, 8.0, 6.0, 4.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.72216796875, -0.70135498046875, -0.6805419921875, -0.65972900390625, -0.638916015625, -0.61810302734375, -0.5972900390625, -0.57647705078125, -0.5556640625, -0.53485107421875, -0.5140380859375, -0.49322509765625, -0.472412109375, -0.45159912109375, -0.4307861328125, -0.40997314453125, -0.38916015625, -0.36834716796875, -0.3475341796875, -0.32672119140625, -0.305908203125, -0.28509521484375, -0.2642822265625, -0.24346923828125, -0.22265625, -0.20184326171875, -0.1810302734375, -0.16021728515625, -0.139404296875, -0.11859130859375, -0.0977783203125, -0.07696533203125, -0.05615234375, -0.03533935546875, -0.0145263671875, 0.00628662109375, 0.027099609375, 0.04791259765625, 0.0687255859375, 0.08953857421875, 0.1103515625, 0.13116455078125, 0.1519775390625, 0.17279052734375, 0.193603515625, 0.21441650390625, 0.2352294921875, 0.25604248046875, 0.27685546875, 0.29766845703125, 0.3184814453125, 0.33929443359375, 0.360107421875, 0.38092041015625, 0.4017333984375, 0.42254638671875, 0.443359375, 0.46417236328125, 0.4849853515625, 0.50579833984375, 0.526611328125, 0.54742431640625, 0.5682373046875, 0.58905029296875, 0.60986328125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 8.0, 10.0, 9.0, 26.0, 23.0, 26.0, 48.0, 75.0, 76.0, 113.0, 171.0, 227.0, 320.0, 534.0, 884.0, 1715.0, 4233.0, 15703.0, 113338.0, 821190.0, 70932.0, 11658.0, 3388.0, 1502.0, 810.0, 512.0, 318.0, 195.0, 132.0, 108.0, 76.0, 53.0, 43.0, 21.0, 30.0, 20.0, 12.0, 13.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.09375, -3.008758544921875, -2.92376708984375, -2.838775634765625, -2.7537841796875, -2.668792724609375, -2.58380126953125, -2.498809814453125, -2.413818359375, -2.328826904296875, -2.24383544921875, -2.158843994140625, -2.0738525390625, -1.988861083984375, -1.90386962890625, -1.818878173828125, -1.73388671875, -1.648895263671875, -1.56390380859375, -1.478912353515625, -1.3939208984375, -1.308929443359375, -1.22393798828125, -1.138946533203125, -1.053955078125, -0.968963623046875, -0.88397216796875, -0.798980712890625, -0.7139892578125, -0.628997802734375, -0.54400634765625, -0.459014892578125, -0.3740234375, -0.289031982421875, -0.20404052734375, -0.119049072265625, -0.0340576171875, 0.050933837890625, 0.13592529296875, 0.220916748046875, 0.305908203125, 0.390899658203125, 0.47589111328125, 0.560882568359375, 0.6458740234375, 0.730865478515625, 0.81585693359375, 0.900848388671875, 0.98583984375, 1.070831298828125, 1.15582275390625, 1.240814208984375, 1.3258056640625, 1.410797119140625, 1.49578857421875, 1.580780029296875, 1.665771484375, 1.750762939453125, 1.83575439453125, 1.920745849609375, 2.0057373046875, 2.090728759765625, 2.17572021484375, 2.260711669921875, 2.345703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 3.0, 9.0, 10.0, 8.0, 8.0, 13.0, 12.0, 10.0, 19.0, 26.0, 22.0, 27.0, 44.0, 35.0, 44.0, 31.0, 60.0, 51.0, 48.0, 77.0, 61.0, 56.0, 44.0, 43.0, 38.0, 22.0, 25.0, 23.0, 21.0, 25.0, 15.0, 11.0, 6.0, 8.0, 8.0, 4.0, 4.0, 6.0, 2.0, 0.0, 5.0, 0.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.580078125, -2.4906005859375, -2.401123046875, -2.3116455078125, -2.22216796875, -2.1326904296875, -2.043212890625, -1.9537353515625, -1.8642578125, -1.7747802734375, -1.685302734375, -1.5958251953125, -1.50634765625, -1.4168701171875, -1.327392578125, -1.2379150390625, -1.1484375, -1.0589599609375, -0.969482421875, -0.8800048828125, -0.79052734375, -0.7010498046875, -0.611572265625, -0.5220947265625, -0.4326171875, -0.3431396484375, -0.253662109375, -0.1641845703125, -0.07470703125, 0.0147705078125, 0.104248046875, 0.1937255859375, 0.283203125, 0.3726806640625, 0.462158203125, 0.5516357421875, 0.64111328125, 0.7305908203125, 0.820068359375, 0.9095458984375, 0.9990234375, 1.0885009765625, 1.177978515625, 1.2674560546875, 1.35693359375, 1.4464111328125, 1.535888671875, 1.6253662109375, 1.71484375, 1.8043212890625, 1.893798828125, 1.9832763671875, 2.07275390625, 2.1622314453125, 2.251708984375, 2.3411865234375, 2.4306640625, 2.5201416015625, 2.609619140625, 2.6990966796875, 2.78857421875, 2.8780517578125, 2.967529296875, 3.0570068359375, 3.146484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 11.0, 6.0, 4.0, 11.0, 10.0, 19.0, 15.0, 39.0, 58.0, 83.0, 121.0, 216.0, 283.0, 571.0, 1039.0, 2161.0, 5190.0, 15881.0, 66861.0, 732081.0, 177286.0, 31089.0, 8895.0, 3268.0, 1460.0, 740.0, 449.0, 225.0, 162.0, 100.0, 58.0, 39.0, 31.0, 22.0, 23.0, 8.0, 7.0, 11.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.7900390625, -0.7651596069335938, -0.7402801513671875, -0.7154006958007812, -0.690521240234375, -0.6656417846679688, -0.6407623291015625, -0.6158828735351562, -0.59100341796875, -0.5661239624023438, -0.5412445068359375, -0.5163650512695312, -0.491485595703125, -0.46660614013671875, -0.4417266845703125, -0.41684722900390625, -0.3919677734375, -0.36708831787109375, -0.3422088623046875, -0.31732940673828125, -0.292449951171875, -0.26757049560546875, -0.2426910400390625, -0.21781158447265625, -0.19293212890625, -0.16805267333984375, -0.1431732177734375, -0.11829376220703125, -0.093414306640625, -0.06853485107421875, -0.0436553955078125, -0.01877593994140625, 0.006103515625, 0.03098297119140625, 0.0558624267578125, 0.08074188232421875, 0.105621337890625, 0.13050079345703125, 0.1553802490234375, 0.18025970458984375, 0.20513916015625, 0.23001861572265625, 0.2548980712890625, 0.27977752685546875, 0.304656982421875, 0.32953643798828125, 0.3544158935546875, 0.37929534912109375, 0.4041748046875, 0.42905426025390625, 0.4539337158203125, 0.47881317138671875, 0.503692626953125, 0.5285720825195312, 0.5534515380859375, 0.5783309936523438, 0.60321044921875, 0.6280899047851562, 0.6529693603515625, 0.6778488159179688, 0.702728271484375, 0.7276077270507812, 0.7524871826171875, 0.7773666381835938, 0.80224609375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 4.0, 4.0, 9.0, 8.0, 4.0, 10.0, 15.0, 20.0, 18.0, 28.0, 27.0, 55.0, 61.0, 79.0, 103.0, 163.0, 99.0, 61.0, 57.0, 37.0, 37.0, 19.0, 12.0, 6.0, 13.0, 10.0, 6.0, 6.0, 8.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00031447410583496094, -0.0003055669367313385, -0.00029665976762771606, -0.00028775259852409363, -0.0002788454294204712, -0.00026993826031684875, -0.0002610310912132263, -0.0002521239221096039, -0.00024321675300598145, -0.000234309583902359, -0.00022540241479873657, -0.00021649524569511414, -0.0002075880765914917, -0.00019868090748786926, -0.00018977373838424683, -0.0001808665692806244, -0.00017195940017700195, -0.00016305223107337952, -0.00015414506196975708, -0.00014523789286613464, -0.0001363307237625122, -0.00012742355465888977, -0.00011851638555526733, -0.0001096092164516449, -0.00010070204734802246, -9.179487824440002e-05, -8.288770914077759e-05, -7.398054003715515e-05, -6.507337093353271e-05, -5.616620182991028e-05, -4.725903272628784e-05, -3.8351863622665405e-05, -2.944469451904297e-05, -2.0537525415420532e-05, -1.1630356311798096e-05, -2.723187208175659e-06, 6.183981895446777e-06, 1.5091150999069214e-05, 2.399832010269165e-05, 3.290548920631409e-05, 4.1812658309936523e-05, 5.071982741355896e-05, 5.9626996517181396e-05, 6.853416562080383e-05, 7.744133472442627e-05, 8.63485038280487e-05, 9.525567293167114e-05, 0.00010416284203529358, 0.00011307001113891602, 0.00012197718024253845, 0.0001308843493461609, 0.00013979151844978333, 0.00014869868755340576, 0.0001576058566570282, 0.00016651302576065063, 0.00017542019486427307, 0.0001843273639678955, 0.00019323453307151794, 0.00020214170217514038, 0.00021104887127876282, 0.00021995604038238525, 0.0002288632094860077, 0.00023777037858963013, 0.00024667754769325256, 0.000255584716796875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 3.0, 4.0, 7.0, 11.0, 20.0, 24.0, 28.0, 33.0, 79.0, 107.0, 160.0, 224.0, 430.0, 844.0, 1668.0, 4315.0, 13870.0, 64100.0, 725720.0, 192955.0, 30673.0, 7777.0, 2772.0, 1163.0, 595.0, 332.0, 185.0, 150.0, 85.0, 71.0, 45.0, 25.0, 21.0, 16.0, 8.0, 6.0, 8.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.697265625, -0.67303466796875, -0.6488037109375, -0.62457275390625, -0.600341796875, -0.57611083984375, -0.5518798828125, -0.52764892578125, -0.50341796875, -0.47918701171875, -0.4549560546875, -0.43072509765625, -0.406494140625, -0.38226318359375, -0.3580322265625, -0.33380126953125, -0.3095703125, -0.28533935546875, -0.2611083984375, -0.23687744140625, -0.212646484375, -0.18841552734375, -0.1641845703125, -0.13995361328125, -0.11572265625, -0.09149169921875, -0.0672607421875, -0.04302978515625, -0.018798828125, 0.00543212890625, 0.0296630859375, 0.05389404296875, 0.078125, 0.10235595703125, 0.1265869140625, 0.15081787109375, 0.175048828125, 0.19927978515625, 0.2235107421875, 0.24774169921875, 0.27197265625, 0.29620361328125, 0.3204345703125, 0.34466552734375, 0.368896484375, 0.39312744140625, 0.4173583984375, 0.44158935546875, 0.4658203125, 0.49005126953125, 0.5142822265625, 0.53851318359375, 0.562744140625, 0.58697509765625, 0.6112060546875, 0.63543701171875, 0.65966796875, 0.68389892578125, 0.7081298828125, 0.73236083984375, 0.756591796875, 0.78082275390625, 0.8050537109375, 0.82928466796875, 0.853515625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 4.0, 5.0, 7.0, 4.0, 9.0, 10.0, 17.0, 25.0, 20.0, 28.0, 42.0, 37.0, 42.0, 58.0, 72.0, 109.0, 108.0, 85.0, 67.0, 51.0, 38.0, 34.0, 27.0, 15.0, 9.0, 15.0, 9.0, 13.0, 9.0, 15.0, 9.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.666015625, -0.6470413208007812, -0.6280670166015625, -0.6090927124023438, -0.590118408203125, -0.5711441040039062, -0.5521697998046875, -0.5331954956054688, -0.51422119140625, -0.49524688720703125, -0.4762725830078125, -0.45729827880859375, -0.438323974609375, -0.41934967041015625, -0.4003753662109375, -0.38140106201171875, -0.3624267578125, -0.34345245361328125, -0.3244781494140625, -0.30550384521484375, -0.286529541015625, -0.26755523681640625, -0.2485809326171875, -0.22960662841796875, -0.21063232421875, -0.19165802001953125, -0.1726837158203125, -0.15370941162109375, -0.134735107421875, -0.11576080322265625, -0.0967864990234375, -0.07781219482421875, -0.058837890625, -0.03986358642578125, -0.0208892822265625, -0.00191497802734375, 0.017059326171875, 0.03603363037109375, 0.0550079345703125, 0.07398223876953125, 0.09295654296875, 0.11193084716796875, 0.1309051513671875, 0.14987945556640625, 0.168853759765625, 0.18782806396484375, 0.2068023681640625, 0.22577667236328125, 0.2447509765625, 0.26372528076171875, 0.2826995849609375, 0.30167388916015625, 0.320648193359375, 0.33962249755859375, 0.3585968017578125, 0.37757110595703125, 0.39654541015625, 0.41551971435546875, 0.4344940185546875, 0.45346832275390625, 0.472442626953125, 0.49141693115234375, 0.5103912353515625, 0.5293655395507812, 0.54833984375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 13.0, 32.0, 113.0, 349.0, 320.0, 100.0, 45.0, 16.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.54279327392578, -41.529170989990234, -40.51555252075195, -39.501930236816406, -38.488311767578125, -37.47468948364258, -36.46106719970703, -35.44744873046875, -34.4338264465332, -33.420204162597656, -32.406585693359375, -31.392963409423828, -30.379343032836914, -29.36572265625, -28.352102279663086, -27.338481903076172, -26.324861526489258, -25.311241149902344, -24.29762077331543, -23.284000396728516, -22.27037811279297, -21.256757736206055, -20.24313735961914, -19.229516983032227, -18.215896606445312, -17.2022762298584, -16.188655853271484, -15.175034523010254, -14.161413192749023, -13.14779281616211, -12.134172439575195, -11.120552062988281, -10.106929779052734, -9.09330940246582, -8.07968807220459, -7.066067695617676, -6.0524468421936035, -5.038825988769531, -4.025205612182617, -3.011584758758545, -1.9979639053344727, -0.9843431711196899, 0.029277563095092773, 1.042898178100586, 2.056519031524658, 3.0701398849487305, 4.0837602615356445, 5.097381114959717, 6.111001968383789, 7.124622821807861, 8.138243675231934, 9.151864051818848, 10.165485382080078, 11.179105758666992, 12.192726135253906, 13.20634651184082, 14.21996784210205, 15.233588218688965, 16.247209548950195, 17.26082992553711, 18.274450302124023, 19.288070678710938, 20.301692962646484, 21.3153133392334, 22.328933715820312]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 5.0, 7.0, 9.0, 9.0, 11.0, 9.0, 15.0, 11.0, 14.0, 17.0, 15.0, 29.0, 35.0, 31.0, 35.0, 29.0, 38.0, 63.0, 180.0, 109.0, 45.0, 37.0, 29.0, 28.0, 24.0, 25.0, 24.0, 17.0, 18.0, 16.0, 19.0, 13.0, 5.0, 8.0, 7.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.030384063720703, -14.596818923950195, -14.163253784179688, -13.72968864440918, -13.296123504638672, -12.862558364868164, -12.42899227142334, -11.995427131652832, -11.561861991882324, -11.128296852111816, -10.694731712341309, -10.2611665725708, -9.827600479125977, -9.394035339355469, -8.960470199584961, -8.526905059814453, -8.093339920043945, -7.6597747802734375, -7.22620964050293, -6.792644023895264, -6.359078884124756, -5.925513744354248, -5.491948127746582, -5.058382987976074, -4.624817848205566, -4.191252708435059, -3.7576873302459717, -3.3241219520568848, -2.890556812286377, -2.456991672515869, -2.0234262943267822, -1.5898609161376953, -1.156296730041504, -0.7227314710617065, -0.2891662120819092, 0.14439904689788818, 0.5779643058776855, 1.0115294456481934, 1.4450948238372803, 1.8786602020263672, 2.312225341796875, 2.745790481567383, 3.1793558597564697, 3.6129212379455566, 4.0464863777160645, 4.480051517486572, 4.913617134094238, 5.347182273864746, 5.780747413635254, 6.214312553405762, 6.6478776931762695, 7.0814433097839355, 7.515008449554443, 7.948573589324951, 8.382139205932617, 8.815704345703125, 9.249269485473633, 9.68283462524414, 10.116399765014648, 10.549964904785156, 10.983530044555664, 11.417095184326172, 11.850661277770996, 12.284226417541504, 12.717791557312012]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 8.0, 11.0, 7.0, 7.0, 10.0, 22.0, 30.0, 29.0, 41.0, 59.0, 119.0, 180.0, 317.0, 513.0, 1034.0, 2205.0, 5265.0, 15154.0, 74637.0, 1331726.0, 2584543.0, 142533.0, 22917.0, 7263.0, 2837.0, 1274.0, 685.0, 328.0, 207.0, 103.0, 60.0, 59.0, 35.0, 19.0, 16.0, 9.0, 5.0, 5.0, 2.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.568359375, -2.501007080078125, -2.43365478515625, -2.366302490234375, -2.2989501953125, -2.231597900390625, -2.16424560546875, -2.096893310546875, -2.029541015625, -1.962188720703125, -1.89483642578125, -1.827484130859375, -1.7601318359375, -1.692779541015625, -1.62542724609375, -1.558074951171875, -1.49072265625, -1.423370361328125, -1.35601806640625, -1.288665771484375, -1.2213134765625, -1.153961181640625, -1.08660888671875, -1.019256591796875, -0.951904296875, -0.884552001953125, -0.81719970703125, -0.749847412109375, -0.6824951171875, -0.615142822265625, -0.54779052734375, -0.480438232421875, -0.4130859375, -0.345733642578125, -0.27838134765625, -0.211029052734375, -0.1436767578125, -0.076324462890625, -0.00897216796875, 0.058380126953125, 0.125732421875, 0.193084716796875, 0.26043701171875, 0.327789306640625, 0.3951416015625, 0.462493896484375, 0.52984619140625, 0.597198486328125, 0.66455078125, 0.731903076171875, 0.79925537109375, 0.866607666015625, 0.9339599609375, 1.001312255859375, 1.06866455078125, 1.136016845703125, 1.203369140625, 1.270721435546875, 1.33807373046875, 1.405426025390625, 1.4727783203125, 1.540130615234375, 1.60748291015625, 1.674835205078125, 1.7421875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 5.0, 5.0, 4.0, 10.0, 9.0, 13.0, 13.0, 15.0, 13.0, 32.0, 34.0, 31.0, 30.0, 38.0, 48.0, 51.0, 53.0, 40.0, 52.0, 54.0, 53.0, 44.0, 56.0, 31.0, 43.0, 39.0, 19.0, 26.0, 19.0, 30.0, 19.0, 11.0, 19.0, 8.0, 8.0, 9.0, 3.0, 4.0, 8.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.74072265625, -0.7195816040039062, -0.6984405517578125, -0.6772994995117188, -0.656158447265625, -0.6350173950195312, -0.6138763427734375, -0.5927352905273438, -0.57159423828125, -0.5504531860351562, -0.5293121337890625, -0.5081710815429688, -0.487030029296875, -0.46588897705078125, -0.4447479248046875, -0.42360687255859375, -0.4024658203125, -0.38132476806640625, -0.3601837158203125, -0.33904266357421875, -0.317901611328125, -0.29676055908203125, -0.2756195068359375, -0.25447845458984375, -0.23333740234375, -0.21219635009765625, -0.1910552978515625, -0.16991424560546875, -0.148773193359375, -0.12763214111328125, -0.1064910888671875, -0.08535003662109375, -0.064208984375, -0.04306793212890625, -0.0219268798828125, -0.00078582763671875, 0.020355224609375, 0.04149627685546875, 0.0626373291015625, 0.08377838134765625, 0.10491943359375, 0.12606048583984375, 0.1472015380859375, 0.16834259033203125, 0.189483642578125, 0.21062469482421875, 0.2317657470703125, 0.25290679931640625, 0.2740478515625, 0.29518890380859375, 0.3163299560546875, 0.33747100830078125, 0.358612060546875, 0.37975311279296875, 0.4008941650390625, 0.42203521728515625, 0.44317626953125, 0.46431732177734375, 0.4854583740234375, 0.5065994262695312, 0.527740478515625, 0.5488815307617188, 0.5700225830078125, 0.5911636352539062, 0.6123046875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 8.0, 17.0, 12.0, 15.0, 18.0, 39.0, 54.0, 87.0, 185.0, 309.0, 663.0, 1736.0, 7853.0, 210098.0, 3944732.0, 23254.0, 3145.0, 996.0, 405.0, 237.0, 131.0, 84.0, 52.0, 39.0, 32.0, 21.0, 9.0, 14.0, 6.0, 0.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.473388671875, -6.25927734375, -6.045166015625, -5.8310546875, -5.616943359375, -5.40283203125, -5.188720703125, -4.974609375, -4.760498046875, -4.54638671875, -4.332275390625, -4.1181640625, -3.904052734375, -3.68994140625, -3.475830078125, -3.26171875, -3.047607421875, -2.83349609375, -2.619384765625, -2.4052734375, -2.191162109375, -1.97705078125, -1.762939453125, -1.548828125, -1.334716796875, -1.12060546875, -0.906494140625, -0.6923828125, -0.478271484375, -0.26416015625, -0.050048828125, 0.1640625, 0.378173828125, 0.59228515625, 0.806396484375, 1.0205078125, 1.234619140625, 1.44873046875, 1.662841796875, 1.876953125, 2.091064453125, 2.30517578125, 2.519287109375, 2.7333984375, 2.947509765625, 3.16162109375, 3.375732421875, 3.58984375, 3.803955078125, 4.01806640625, 4.232177734375, 4.4462890625, 4.660400390625, 4.87451171875, 5.088623046875, 5.302734375, 5.516845703125, 5.73095703125, 5.945068359375, 6.1591796875, 6.373291015625, 6.58740234375, 6.801513671875, 7.015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 8.0, 10.0, 9.0, 18.0, 18.0, 25.0, 36.0, 56.0, 61.0, 115.0, 156.0, 211.0, 421.0, 724.0, 871.0, 497.0, 283.0, 176.0, 122.0, 76.0, 48.0, 36.0, 22.0, 18.0, 14.0, 11.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.076171875, -2.98046875, -2.884765625, -2.7890625, -2.693359375, -2.59765625, -2.501953125, -2.40625, -2.310546875, -2.21484375, -2.119140625, -2.0234375, -1.927734375, -1.83203125, -1.736328125, -1.640625, -1.544921875, -1.44921875, -1.353515625, -1.2578125, -1.162109375, -1.06640625, -0.970703125, -0.875, -0.779296875, -0.68359375, -0.587890625, -0.4921875, -0.396484375, -0.30078125, -0.205078125, -0.109375, -0.013671875, 0.08203125, 0.177734375, 0.2734375, 0.369140625, 0.46484375, 0.560546875, 0.65625, 0.751953125, 0.84765625, 0.943359375, 1.0390625, 1.134765625, 1.23046875, 1.326171875, 1.421875, 1.517578125, 1.61328125, 1.708984375, 1.8046875, 1.900390625, 1.99609375, 2.091796875, 2.1875, 2.283203125, 2.37890625, 2.474609375, 2.5703125, 2.666015625, 2.76171875, 2.857421875, 2.953125, 3.048828125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 13.0, 33.0, 71.0, 155.0, 333.0, 243.0, 90.0, 31.0, 14.0, 7.0, 5.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.54647827148438, -87.66806030273438, -85.78964233398438, -83.91122436523438, -82.03280639648438, -80.15438842773438, -78.27597045898438, -76.39754486083984, -74.51912689208984, -72.64070892333984, -70.76229095458984, -68.88387298583984, -67.00545501708984, -65.12702941894531, -63.24861526489258, -61.37019729614258, -59.49177932739258, -57.61336135864258, -55.73494338989258, -53.85652160644531, -51.97810363769531, -50.09968566894531, -48.22126770019531, -46.34284973144531, -44.46443176269531, -42.58601379394531, -40.70759582519531, -38.82917785644531, -36.95075607299805, -35.07233810424805, -33.19392013549805, -31.315502166748047, -29.437076568603516, -27.558658599853516, -25.680238723754883, -23.801820755004883, -21.92340087890625, -20.04498291015625, -18.16656494140625, -16.28814697265625, -14.409727096557617, -12.5313081741333, -10.652889251708984, -8.774471282958984, -6.896052360534668, -5.017633438110352, -3.1392154693603516, -1.2607965469360352, 0.6176223754882812, 2.4960410594940186, 4.374459743499756, 6.252878189086914, 8.13129711151123, 10.009716033935547, 11.888134002685547, 13.766552925109863, 15.64497184753418, 17.52338981628418, 19.401809692382812, 21.280227661132812, 23.158645629882812, 25.037065505981445, 26.915483474731445, 28.793903350830078, 30.672321319580078]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 9.0, 11.0, 10.0, 20.0, 13.0, 24.0, 21.0, 35.0, 35.0, 44.0, 50.0, 43.0, 50.0, 67.0, 76.0, 57.0, 76.0, 52.0, 50.0, 34.0, 44.0, 35.0, 29.0, 20.0, 32.0, 14.0, 11.0, 8.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-25.032047271728516, -24.416133880615234, -23.800222396850586, -23.184309005737305, -22.568397521972656, -21.952484130859375, -21.336570739746094, -20.720657348632812, -20.104745864868164, -19.488832473754883, -18.872920989990234, -18.257007598876953, -17.641094207763672, -17.025182723999023, -16.409269332885742, -15.793356895446777, -15.177444458007812, -14.561532020568848, -13.945619583129883, -13.329706192016602, -12.713793754577637, -12.097881317138672, -11.48196792602539, -10.866055488586426, -10.250143051147461, -9.634230613708496, -9.018318176269531, -8.40240478515625, -7.786492347717285, -7.17057991027832, -6.554666996002197, -5.938754081726074, -5.322840690612793, -4.706928253173828, -4.091015338897705, -3.475102663040161, -2.859189987182617, -2.2432773113250732, -1.6273646354675293, -1.0114517211914062, -0.3955392837524414, 0.22037339210510254, 0.8362860679626465, 1.4521987438201904, 2.0681114196777344, 2.6840240955352783, 3.2999367713928223, 3.9158496856689453, 4.53176212310791, 5.147674560546875, 5.763587474822998, 6.379500389099121, 6.995412826538086, 7.611325263977051, 8.227237701416016, 8.843151092529297, 9.459063529968262, 10.074975967407227, 10.690889358520508, 11.306801795959473, 11.922714233398438, 12.538626670837402, 13.154539108276367, 13.770452499389648, 14.386364936828613]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 7.0, 9.0, 5.0, 15.0, 23.0, 33.0, 48.0, 81.0, 121.0, 171.0, 276.0, 523.0, 1002.0, 1815.0, 3682.0, 8726.0, 24226.0, 99175.0, 709441.0, 147916.0, 31592.0, 10663.0, 4407.0, 2035.0, 1046.0, 585.0, 342.0, 202.0, 122.0, 77.0, 60.0, 27.0, 34.0, 14.0, 14.0, 16.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.37109375, -2.300537109375, -2.22998046875, -2.159423828125, -2.0888671875, -2.018310546875, -1.94775390625, -1.877197265625, -1.806640625, -1.736083984375, -1.66552734375, -1.594970703125, -1.5244140625, -1.453857421875, -1.38330078125, -1.312744140625, -1.2421875, -1.171630859375, -1.10107421875, -1.030517578125, -0.9599609375, -0.889404296875, -0.81884765625, -0.748291015625, -0.677734375, -0.607177734375, -0.53662109375, -0.466064453125, -0.3955078125, -0.324951171875, -0.25439453125, -0.183837890625, -0.11328125, -0.042724609375, 0.02783203125, 0.098388671875, 0.1689453125, 0.239501953125, 0.31005859375, 0.380615234375, 0.451171875, 0.521728515625, 0.59228515625, 0.662841796875, 0.7333984375, 0.803955078125, 0.87451171875, 0.945068359375, 1.015625, 1.086181640625, 1.15673828125, 1.227294921875, 1.2978515625, 1.368408203125, 1.43896484375, 1.509521484375, 1.580078125, 1.650634765625, 1.72119140625, 1.791748046875, 1.8623046875, 1.932861328125, 2.00341796875, 2.073974609375, 2.14453125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 9.0, 10.0, 10.0, 11.0, 28.0, 27.0, 23.0, 46.0, 50.0, 64.0, 64.0, 89.0, 88.0, 84.0, 79.0, 57.0, 61.0, 48.0, 38.0, 28.0, 22.0, 13.0, 13.0, 9.0, 8.0, 12.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8544921875, -1.80267333984375, -1.7508544921875, -1.69903564453125, -1.647216796875, -1.59539794921875, -1.5435791015625, -1.49176025390625, -1.43994140625, -1.38812255859375, -1.3363037109375, -1.28448486328125, -1.232666015625, -1.18084716796875, -1.1290283203125, -1.07720947265625, -1.025390625, -0.97357177734375, -0.9217529296875, -0.86993408203125, -0.818115234375, -0.76629638671875, -0.7144775390625, -0.66265869140625, -0.61083984375, -0.55902099609375, -0.5072021484375, -0.45538330078125, -0.403564453125, -0.35174560546875, -0.2999267578125, -0.24810791015625, -0.1962890625, -0.14447021484375, -0.0926513671875, -0.04083251953125, 0.010986328125, 0.06280517578125, 0.1146240234375, 0.16644287109375, 0.21826171875, 0.27008056640625, 0.3218994140625, 0.37371826171875, 0.425537109375, 0.47735595703125, 0.5291748046875, 0.58099365234375, 0.6328125, 0.68463134765625, 0.7364501953125, 0.78826904296875, 0.840087890625, 0.89190673828125, 0.9437255859375, 0.99554443359375, 1.04736328125, 1.09918212890625, 1.1510009765625, 1.20281982421875, 1.254638671875, 1.30645751953125, 1.3582763671875, 1.41009521484375, 1.4619140625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 1.0, 5.0, 5.0, 6.0, 2.0, 15.0, 18.0, 16.0, 20.0, 30.0, 41.0, 55.0, 83.0, 110.0, 155.0, 266.0, 459.0, 863.0, 2104.0, 6772.0, 34849.0, 886839.0, 96658.0, 12837.0, 3456.0, 1281.0, 580.0, 340.0, 201.0, 158.0, 99.0, 57.0, 44.0, 31.0, 17.0, 19.0, 13.0, 14.0, 9.0, 6.0, 8.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.697265625, -2.60650634765625, -2.5157470703125, -2.42498779296875, -2.334228515625, -2.24346923828125, -2.1527099609375, -2.06195068359375, -1.97119140625, -1.88043212890625, -1.7896728515625, -1.69891357421875, -1.608154296875, -1.51739501953125, -1.4266357421875, -1.33587646484375, -1.2451171875, -1.15435791015625, -1.0635986328125, -0.97283935546875, -0.882080078125, -0.79132080078125, -0.7005615234375, -0.60980224609375, -0.51904296875, -0.42828369140625, -0.3375244140625, -0.24676513671875, -0.156005859375, -0.06524658203125, 0.0255126953125, 0.11627197265625, 0.20703125, 0.29779052734375, 0.3885498046875, 0.47930908203125, 0.570068359375, 0.66082763671875, 0.7515869140625, 0.84234619140625, 0.93310546875, 1.02386474609375, 1.1146240234375, 1.20538330078125, 1.296142578125, 1.38690185546875, 1.4776611328125, 1.56842041015625, 1.6591796875, 1.74993896484375, 1.8406982421875, 1.93145751953125, 2.022216796875, 2.11297607421875, 2.2037353515625, 2.29449462890625, 2.38525390625, 2.47601318359375, 2.5667724609375, 2.65753173828125, 2.748291015625, 2.83905029296875, 2.9298095703125, 3.02056884765625, 3.111328125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 6.0, 6.0, 12.0, 14.0, 18.0, 19.0, 16.0, 21.0, 35.0, 26.0, 34.0, 33.0, 42.0, 70.0, 68.0, 91.0, 83.0, 46.0, 52.0, 54.0, 43.0, 30.0, 31.0, 17.0, 22.0, 17.0, 15.0, 13.0, 12.0, 6.0, 3.0, 7.0, 3.0, 6.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.59765625, -4.456298828125, -4.31494140625, -4.173583984375, -4.0322265625, -3.890869140625, -3.74951171875, -3.608154296875, -3.466796875, -3.325439453125, -3.18408203125, -3.042724609375, -2.9013671875, -2.760009765625, -2.61865234375, -2.477294921875, -2.3359375, -2.194580078125, -2.05322265625, -1.911865234375, -1.7705078125, -1.629150390625, -1.48779296875, -1.346435546875, -1.205078125, -1.063720703125, -0.92236328125, -0.781005859375, -0.6396484375, -0.498291015625, -0.35693359375, -0.215576171875, -0.07421875, 0.067138671875, 0.20849609375, 0.349853515625, 0.4912109375, 0.632568359375, 0.77392578125, 0.915283203125, 1.056640625, 1.197998046875, 1.33935546875, 1.480712890625, 1.6220703125, 1.763427734375, 1.90478515625, 2.046142578125, 2.1875, 2.328857421875, 2.47021484375, 2.611572265625, 2.7529296875, 2.894287109375, 3.03564453125, 3.177001953125, 3.318359375, 3.459716796875, 3.60107421875, 3.742431640625, 3.8837890625, 4.025146484375, 4.16650390625, 4.307861328125, 4.44921875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 8.0, 13.0, 12.0, 20.0, 22.0, 34.0, 42.0, 70.0, 113.0, 230.0, 479.0, 1263.0, 3541.0, 16883.0, 934494.0, 79128.0, 8301.0, 2332.0, 782.0, 354.0, 134.0, 91.0, 53.0, 33.0, 19.0, 23.0, 14.0, 13.0, 13.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.169921875, -1.131927490234375, -1.09393310546875, -1.055938720703125, -1.0179443359375, -0.979949951171875, -0.94195556640625, -0.903961181640625, -0.865966796875, -0.827972412109375, -0.78997802734375, -0.751983642578125, -0.7139892578125, -0.675994873046875, -0.63800048828125, -0.600006103515625, -0.56201171875, -0.524017333984375, -0.48602294921875, -0.448028564453125, -0.4100341796875, -0.372039794921875, -0.33404541015625, -0.296051025390625, -0.258056640625, -0.220062255859375, -0.18206787109375, -0.144073486328125, -0.1060791015625, -0.068084716796875, -0.03009033203125, 0.007904052734375, 0.0458984375, 0.083892822265625, 0.12188720703125, 0.159881591796875, 0.1978759765625, 0.235870361328125, 0.27386474609375, 0.311859130859375, 0.349853515625, 0.387847900390625, 0.42584228515625, 0.463836669921875, 0.5018310546875, 0.539825439453125, 0.57781982421875, 0.615814208984375, 0.65380859375, 0.691802978515625, 0.72979736328125, 0.767791748046875, 0.8057861328125, 0.843780517578125, 0.88177490234375, 0.919769287109375, 0.957763671875, 0.995758056640625, 1.03375244140625, 1.071746826171875, 1.1097412109375, 1.147735595703125, 1.18572998046875, 1.223724365234375, 1.26171875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 0.0, 2.0, 4.0, 5.0, 5.0, 7.0, 8.0, 18.0, 19.0, 23.0, 22.0, 32.0, 65.0, 132.0, 200.0, 162.0, 88.0, 60.0, 36.0, 27.0, 17.0, 11.0, 11.0, 11.0, 9.0, 3.0, 3.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00028586387634277344, -0.00027718767523765564, -0.00026851147413253784, -0.00025983527302742004, -0.00025115907192230225, -0.00024248287081718445, -0.00023380666971206665, -0.00022513046860694885, -0.00021645426750183105, -0.00020777806639671326, -0.00019910186529159546, -0.00019042566418647766, -0.00018174946308135986, -0.00017307326197624207, -0.00016439706087112427, -0.00015572085976600647, -0.00014704465866088867, -0.00013836845755577087, -0.00012969225645065308, -0.00012101605534553528, -0.00011233985424041748, -0.00010366365313529968, -9.498745203018188e-05, -8.631125092506409e-05, -7.763504981994629e-05, -6.895884871482849e-05, -6.028264760971069e-05, -5.1606446504592896e-05, -4.29302453994751e-05, -3.42540442943573e-05, -2.5577843189239502e-05, -1.6901642084121704e-05, -8.225440979003906e-06, 4.507601261138916e-07, 9.12696123123169e-06, 1.7803162336349487e-05, 2.6479363441467285e-05, 3.515556454658508e-05, 4.383176565170288e-05, 5.250796675682068e-05, 6.118416786193848e-05, 6.986036896705627e-05, 7.853657007217407e-05, 8.721277117729187e-05, 9.588897228240967e-05, 0.00010456517338752747, 0.00011324137449264526, 0.00012191757559776306, 0.00013059377670288086, 0.00013926997780799866, 0.00014794617891311646, 0.00015662238001823425, 0.00016529858112335205, 0.00017397478222846985, 0.00018265098333358765, 0.00019132718443870544, 0.00020000338554382324, 0.00020867958664894104, 0.00021735578775405884, 0.00022603198885917664, 0.00023470818996429443, 0.00024338439106941223, 0.00025206059217453003, 0.00026073679327964783, 0.0002694129943847656]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 7.0, 9.0, 6.0, 11.0, 20.0, 27.0, 35.0, 66.0, 95.0, 206.0, 432.0, 1523.0, 9170.0, 981434.0, 50518.0, 3640.0, 805.0, 283.0, 109.0, 59.0, 35.0, 20.0, 9.0, 11.0, 8.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.046875, -1.9879913330078125, -1.929107666015625, -1.8702239990234375, -1.81134033203125, -1.7524566650390625, -1.693572998046875, -1.6346893310546875, -1.5758056640625, -1.5169219970703125, -1.458038330078125, -1.3991546630859375, -1.34027099609375, -1.2813873291015625, -1.222503662109375, -1.1636199951171875, -1.104736328125, -1.0458526611328125, -0.986968994140625, -0.9280853271484375, -0.86920166015625, -0.8103179931640625, -0.751434326171875, -0.6925506591796875, -0.6336669921875, -0.5747833251953125, -0.515899658203125, -0.4570159912109375, -0.39813232421875, -0.3392486572265625, -0.280364990234375, -0.2214813232421875, -0.16259765625, -0.1037139892578125, -0.044830322265625, 0.0140533447265625, 0.07293701171875, 0.1318206787109375, 0.190704345703125, 0.2495880126953125, 0.3084716796875, 0.3673553466796875, 0.426239013671875, 0.4851226806640625, 0.54400634765625, 0.6028900146484375, 0.661773681640625, 0.7206573486328125, 0.779541015625, 0.8384246826171875, 0.897308349609375, 0.9561920166015625, 1.01507568359375, 1.0739593505859375, 1.132843017578125, 1.1917266845703125, 1.2506103515625, 1.3094940185546875, 1.368377685546875, 1.4272613525390625, 1.48614501953125, 1.5450286865234375, 1.603912353515625, 1.6627960205078125, 1.7216796875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 11.0, 3.0, 7.0, 9.0, 13.0, 11.0, 12.0, 17.0, 25.0, 48.0, 134.0, 235.0, 229.0, 82.0, 43.0, 30.0, 24.0, 12.0, 16.0, 15.0, 14.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.25390625, -1.2178497314453125, -1.181793212890625, -1.1457366943359375, -1.10968017578125, -1.0736236572265625, -1.037567138671875, -1.0015106201171875, -0.9654541015625, -0.9293975830078125, -0.893341064453125, -0.8572845458984375, -0.82122802734375, -0.7851715087890625, -0.749114990234375, -0.7130584716796875, -0.677001953125, -0.6409454345703125, -0.604888916015625, -0.5688323974609375, -0.53277587890625, -0.4967193603515625, -0.460662841796875, -0.4246063232421875, -0.3885498046875, -0.3524932861328125, -0.316436767578125, -0.2803802490234375, -0.24432373046875, -0.2082672119140625, -0.172210693359375, -0.1361541748046875, -0.10009765625, -0.0640411376953125, -0.027984619140625, 0.0080718994140625, 0.04412841796875, 0.0801849365234375, 0.116241455078125, 0.1522979736328125, 0.1883544921875, 0.2244110107421875, 0.260467529296875, 0.2965240478515625, 0.33258056640625, 0.3686370849609375, 0.404693603515625, 0.4407501220703125, 0.476806640625, 0.5128631591796875, 0.548919677734375, 0.5849761962890625, 0.62103271484375, 0.6570892333984375, 0.693145751953125, 0.7292022705078125, 0.7652587890625, 0.8013153076171875, 0.837371826171875, 0.8734283447265625, 0.90948486328125, 0.9455413818359375, 0.981597900390625, 1.0176544189453125, 1.0537109375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 20.0, 52.0, 78.0, 580.0, 144.0, 60.0, 33.0, 12.0, 10.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.29560852050781, -34.217350006103516, -33.13909149169922, -32.060829162597656, -30.98257064819336, -29.904312133789062, -28.826051712036133, -27.747791290283203, -26.669532775878906, -25.59127426147461, -24.51301383972168, -23.43475341796875, -22.356494903564453, -21.278236389160156, -20.199975967407227, -19.121715545654297, -18.04345703125, -16.965198516845703, -15.886938095092773, -14.80867862701416, -13.730419158935547, -12.652159690856934, -11.57390022277832, -10.495640754699707, -9.417381286621094, -8.33912181854248, -7.260862350463867, -6.182602882385254, -5.104343414306641, -4.026083946228027, -2.947824478149414, -1.8695650100708008, -0.7913093566894531, 0.28695011138916016, 1.3652095794677734, 2.4434690475463867, 3.521728515625, 4.599987983703613, 5.678247451782227, 6.75650691986084, 7.834766387939453, 8.913025856018066, 9.99128532409668, 11.069544792175293, 12.147804260253906, 13.22606372833252, 14.304323196411133, 15.382582664489746, 16.46084213256836, 17.539100646972656, 18.617361068725586, 19.695621490478516, 20.773880004882812, 21.85213851928711, 22.93039894104004, 24.00865936279297, 25.086917877197266, 26.165176391601562, 27.243436813354492, 28.321697235107422, 29.39995574951172, 30.478214263916016, 31.556474685668945, 32.634735107421875, 33.71299362182617]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 5.0, 13.0, 16.0, 6.0, 19.0, 14.0, 16.0, 31.0, 24.0, 14.0, 30.0, 36.0, 56.0, 325.0, 140.0, 31.0, 28.0, 25.0, 17.0, 20.0, 16.0, 24.0, 21.0, 8.0, 15.0, 12.0, 12.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-19.801328659057617, -19.290637969970703, -18.77994728088379, -18.269256591796875, -17.75856590270996, -17.247875213623047, -16.737184524536133, -16.22649383544922, -15.715802192687988, -15.205111503601074, -14.69442081451416, -14.183730125427246, -13.673038482666016, -13.162347793579102, -12.651657104492188, -12.140966415405273, -11.63027572631836, -11.119585037231445, -10.608894348144531, -10.098203659057617, -9.587512969970703, -9.076822280883789, -8.566130638122559, -8.055439949035645, -7.5447492599487305, -7.034058570861816, -6.523367881774902, -6.01267671585083, -5.501986026763916, -4.991295337677002, -4.48060417175293, -3.9699134826660156, -3.4592208862304688, -2.9485301971435547, -2.4378392696380615, -1.927148461341858, -1.4164576530456543, -0.9057669639587402, -0.39507603645324707, 0.1156148910522461, 0.6263055801391602, 1.1369963884353638, 1.6476871967315674, 2.1583781242370605, 2.6690688133239746, 3.1797595024108887, 3.690450429916382, 4.201141357421875, 4.711832046508789, 5.222522735595703, 5.733213424682617, 6.2439045906066895, 6.7545952796936035, 7.265285968780518, 7.77597713470459, 8.286667823791504, 8.797358512878418, 9.308049201965332, 9.818739891052246, 10.32943058013916, 10.84012222290039, 11.350812911987305, 11.861503601074219, 12.372194290161133, 12.882884979248047]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 4.0, 8.0, 1.0, 5.0, 20.0, 16.0, 31.0, 32.0, 62.0, 60.0, 99.0, 308.0, 117.0, 53.0, 52.0, 31.0, 21.0, 30.0, 17.0, 12.0, 10.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.306640625, -2.2437744140625, -2.180908203125, -2.1180419921875, -2.05517578125, -1.9923095703125, -1.929443359375, -1.8665771484375, -1.8037109375, -1.7408447265625, -1.677978515625, -1.6151123046875, -1.55224609375, -1.4893798828125, -1.426513671875, -1.3636474609375, -1.30078125, -1.2379150390625, -1.175048828125, -1.1121826171875, -1.04931640625, -0.9864501953125, -0.923583984375, -0.8607177734375, -0.7978515625, -0.7349853515625, -0.672119140625, -0.6092529296875, -0.54638671875, -0.4835205078125, -0.420654296875, -0.3577880859375, -0.294921875, -0.2320556640625, -0.169189453125, -0.1063232421875, -0.04345703125, 0.0194091796875, 0.082275390625, 0.1451416015625, 0.2080078125, 0.2708740234375, 0.333740234375, 0.3966064453125, 0.45947265625, 0.5223388671875, 0.585205078125, 0.6480712890625, 0.7109375, 0.7738037109375, 0.836669921875, 0.8995361328125, 0.96240234375, 1.0252685546875, 1.088134765625, 1.1510009765625, 1.2138671875, 1.2767333984375, 1.339599609375, 1.4024658203125, 1.46533203125, 1.5281982421875, 1.591064453125, 1.6539306640625, 1.716796875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 7.0, 5.0, 3.0, 5.0, 6.0, 13.0, 12.0, 11.0, 6.0, 19.0, 44.0, 35.0, 73.0, 113.0, 174.0, 297.0, 633.0, 1487.0, 4767.0, 43857.0, 8320232.0, 11859.0, 2777.0, 981.0, 453.0, 244.0, 128.0, 97.0, 61.0, 33.0, 30.0, 28.0, 16.0, 18.0, 8.0, 8.0, 5.0, 4.0, 5.0, 6.0, 4.0, 7.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0], "bins": [-9.084898948669434, -8.834385871887207, -8.583873748779297, -8.33336067199707, -8.082847595214844, -7.832334518432617, -7.581821918487549, -7.3313093185424805, -7.080796241760254, -6.830283164978027, -6.579770565032959, -6.329257965087891, -6.078744888305664, -5.8282318115234375, -5.577719211578369, -5.327206611633301, -5.076693534851074, -4.826180458068848, -4.575667858123779, -4.325155258178711, -4.074642181396484, -3.824129343032837, -3.5736165046691895, -3.323103666305542, -3.0725908279418945, -2.822077989578247, -2.5715651512145996, -2.321052312850952, -2.0705394744873047, -1.8200266361236572, -1.5695137977600098, -1.3190009593963623, -1.0684871673583984, -0.817974328994751, -0.5674614906311035, -0.31694865226745605, -0.0664358139038086, 0.18407702445983887, 0.43458986282348633, 0.6851027011871338, 0.9356155395507812, 1.1861283779144287, 1.4366412162780762, 1.6871540546417236, 1.937666893005371, 2.1881797313690186, 2.438692569732666, 2.6892054080963135, 2.939718246459961, 3.1902310848236084, 3.440743923187256, 3.6912567615509033, 3.941769599914551, 4.192282676696777, 4.442795276641846, 4.693307876586914, 4.943820953369141, 5.194334030151367, 5.4448466300964355, 5.695359230041504, 5.9458723068237305, 6.196385383605957, 6.446897983551025, 6.697410583496094, 6.94792366027832]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 6.0, 2.0, 2.0, 8.0, 8.0, 2.0, 3.0, 7.0, 7.0, 5.0, 8.0, 5.0, 3.0, 6.0, 5.0, 1.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.012498378753662, -5.805891036987305, -5.5992841720581055, -5.392677307128906, -5.186069965362549, -4.979462623596191, -4.772855758666992, -4.566248893737793, -4.3596415519714355, -4.153034210205078, -3.946427345275879, -3.7398202419281006, -3.5332131385803223, -3.326606035232544, -3.1199989318847656, -2.9133918285369873, -2.706784725189209, -2.5001776218414307, -2.2935705184936523, -2.086963415145874, -1.8803563117980957, -1.6737492084503174, -1.467142105102539, -1.2605350017547607, -1.0539278984069824, -0.8473207950592041, -0.6407136917114258, -0.43410658836364746, -0.22749948501586914, -0.02089238166809082, 0.1857147216796875, 0.3923218250274658, 0.5989289283752441, 0.8055360317230225, 1.0121431350708008, 1.218750238418579, 1.4253573417663574, 1.6319644451141357, 1.838571548461914, 2.0451786518096924, 2.2517857551574707, 2.458392858505249, 2.6649999618530273, 2.8716070652008057, 3.078214168548584, 3.2848212718963623, 3.4914283752441406, 3.698035478591919, 3.9046425819396973, 4.111249923706055, 4.317856788635254, 4.524463653564453, 4.7310709953308105, 4.937678337097168, 5.144285202026367, 5.350892066955566, 5.557499408721924, 5.764106750488281, 5.9707136154174805, 6.17732048034668, 6.383927822113037, 6.5905351638793945, 6.797142028808594, 7.003748893737793, 7.21035623550415]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 5.0, 19.0, 13.0, 28.0, 37.0, 52.0, 98.0, 129.0, 226.0, 395.0, 854.0, 1695.0, 4110.0, 11199.0, 39395.0, 167426.0, 218376.0, 55521.0, 15112.0, 5125.0, 2183.0, 1002.0, 485.0, 291.0, 167.0, 108.0, 76.0, 41.0, 24.0, 22.0, 9.0, 10.0, 5.0, 7.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3671875, -8.106689453125, -7.84619140625, -7.585693359375, -7.3251953125, -7.064697265625, -6.80419921875, -6.543701171875, -6.283203125, -6.022705078125, -5.76220703125, -5.501708984375, -5.2412109375, -4.980712890625, -4.72021484375, -4.459716796875, -4.19921875, -3.938720703125, -3.67822265625, -3.417724609375, -3.1572265625, -2.896728515625, -2.63623046875, -2.375732421875, -2.115234375, -1.854736328125, -1.59423828125, -1.333740234375, -1.0732421875, -0.812744140625, -0.55224609375, -0.291748046875, -0.03125, 0.229248046875, 0.48974609375, 0.750244140625, 1.0107421875, 1.271240234375, 1.53173828125, 1.792236328125, 2.052734375, 2.313232421875, 2.57373046875, 2.834228515625, 3.0947265625, 3.355224609375, 3.61572265625, 3.876220703125, 4.13671875, 4.397216796875, 4.65771484375, 4.918212890625, 5.1787109375, 5.439208984375, 5.69970703125, 5.960205078125, 6.220703125, 6.481201171875, 6.74169921875, 7.002197265625, 7.2626953125, 7.523193359375, 7.78369140625, 8.044189453125, 8.3046875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 7.0, 9.0, 9.0, 11.0, 13.0, 18.0, 26.0, 59.0, 50.0, 59.0, 67.0, 75.0, 90.0, 96.0, 98.0, 58.0, 62.0, 45.0, 46.0, 23.0, 14.0, 19.0, 9.0, 13.0, 5.0, 9.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.68359375, -1.6350860595703125, -1.586578369140625, -1.5380706787109375, -1.48956298828125, -1.4410552978515625, -1.392547607421875, -1.3440399169921875, -1.2955322265625, -1.2470245361328125, -1.198516845703125, -1.1500091552734375, -1.10150146484375, -1.0529937744140625, -1.004486083984375, -0.9559783935546875, -0.907470703125, -0.8589630126953125, -0.810455322265625, -0.7619476318359375, -0.71343994140625, -0.6649322509765625, -0.616424560546875, -0.5679168701171875, -0.5194091796875, -0.4709014892578125, -0.422393798828125, -0.3738861083984375, -0.32537841796875, -0.2768707275390625, -0.228363037109375, -0.1798553466796875, -0.13134765625, -0.0828399658203125, -0.034332275390625, 0.0141754150390625, 0.06268310546875, 0.1111907958984375, 0.159698486328125, 0.2082061767578125, 0.2567138671875, 0.3052215576171875, 0.353729248046875, 0.4022369384765625, 0.45074462890625, 0.4992523193359375, 0.547760009765625, 0.5962677001953125, 0.644775390625, 0.6932830810546875, 0.741790771484375, 0.7902984619140625, 0.83880615234375, 0.8873138427734375, 0.935821533203125, 0.9843292236328125, 1.0328369140625, 1.0813446044921875, 1.129852294921875, 1.1783599853515625, 1.22686767578125, 1.2753753662109375, 1.323883056640625, 1.3723907470703125, 1.4208984375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 6.0, 6.0, 14.0, 56.0, 96.0, 167.0, 67.0, 26.0, 17.0, 8.0, 10.0, 4.0, 5.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.818387985229492, -8.407612800598145, -7.9968366622924805, -7.586061477661133, -7.175285339355469, -6.764510154724121, -6.353734493255615, -5.942958831787109, -5.5321831703186035, -5.121407508850098, -4.710631847381592, -4.299856185913086, -3.889080762863159, -3.4783051013946533, -3.0675296783447266, -2.6567540168762207, -2.245978355407715, -1.835202693939209, -1.4244271516799927, -1.0136516094207764, -0.6028759479522705, -0.19210028648376465, 0.2186751365661621, 0.629450798034668, 1.0402264595031738, 1.4510021209716797, 1.861777663230896, 2.2725532054901123, 2.683328866958618, 3.094104528427124, 3.504879951477051, 3.9156556129455566, 4.3264312744140625, 4.737206935882568, 5.147982597351074, 5.558757781982422, 5.969533920288086, 6.380309104919434, 6.7910847663879395, 7.201860427856445, 7.612636089324951, 8.023411750793457, 8.434186935424805, 8.844963073730469, 9.255738258361816, 9.66651439666748, 10.077289581298828, 10.488065719604492, 10.89884090423584, 11.309616088867188, 11.720392227172852, 12.1311674118042, 12.541943550109863, 12.952718734741211, 13.363494873046875, 13.774270057678223, 14.18504524230957, 14.595820426940918, 15.006596565246582, 15.41737174987793, 15.828147888183594, 16.238924026489258, 16.64969825744629, 17.060474395751953, 17.471250534057617]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 1.0, 5.0, 6.0, 5.0, 5.0, 5.0, 9.0, 14.0, 20.0, 34.0, 89.0, 104.0, 78.0, 43.0, 18.0, 14.0, 3.0, 3.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.792799472808838, -7.552576065063477, -7.312352657318115, -7.072129249572754, -6.831905841827393, -6.591682434082031, -6.351458549499512, -6.111235618591309, -5.871011734008789, -5.630788326263428, -5.390564918518066, -5.150341510772705, -4.910118103027344, -4.669894695281982, -4.429671287536621, -4.189447402954102, -3.9492244720458984, -3.709001064300537, -3.468777656555176, -3.2285542488098145, -2.988330841064453, -2.748107433319092, -2.5078837871551514, -2.26766037940979, -2.0274369716644287, -1.7872135639190674, -1.546990156173706, -1.3067666292190552, -1.0665432214736938, -0.8263198137283325, -0.5860962867736816, -0.3458728790283203, -0.10564947128295898, 0.13457396626472473, 0.37479740381240845, 0.6150208711624146, 0.8552442789077759, 1.0954676866531372, 1.335691213607788, 1.5759146213531494, 1.8161380290985107, 2.056361436843872, 2.2965848445892334, 2.536808490753174, 2.777031898498535, 3.0172553062438965, 3.257478713989258, 3.497702121734619, 3.7379255294799805, 3.978148937225342, 4.218372344970703, 4.4585957527160645, 4.698819160461426, 4.939042568206787, 5.179265975952148, 5.419489860534668, 5.659712791442871, 5.899936199188232, 6.140159606933594, 6.380383014678955, 6.620606422424316, 6.860829830169678, 7.101053237915039, 7.341277122497559, 7.58150053024292]}, "eval/loss": 4.228886127471924, "eval/wer": 1.9632883776279255, "eval/runtime": 974.9232, "eval/samples_per_second": 2.71, "eval/steps_per_second": 0.34} \ No newline at end of file