diff --git "a/wandb/run-20220315_200222-14cfddr6/files/wandb-summary.json" "b/wandb/run-20220315_200222-14cfddr6/files/wandb-summary.json" --- "a/wandb/run-20220315_200222-14cfddr6/files/wandb-summary.json" +++ "b/wandb/run-20220315_200222-14cfddr6/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.5352, "train/learning_rate": 7.740498812351543e-06, "train/epoch": 15.13, "train/global_step": 13500, "_runtime": 82090, "_timestamp": 1647456632, "_step": 13508, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 11.0, 13.0, 13.0, 11.0, 11.0, 20.0, 23.0, 31.0, 27.0, 31.0, 50.0, 48.0, 37.0, 60.0, 56.0, 69.0, 55.0, 56.0, 64.0, 39.0, 45.0, 52.0, 38.0, 35.0, 25.0, 16.0, 23.0, 15.0, 14.0, 13.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.53314781188965, -23.069297790527344, -22.60544776916504, -22.141597747802734, -21.67774772644043, -21.213897705078125, -20.750045776367188, -20.286195755004883, -19.822345733642578, -19.358495712280273, -18.89464569091797, -18.430795669555664, -17.96694564819336, -17.503093719482422, -17.03924560546875, -16.575393676757812, -16.11154556274414, -15.647695541381836, -15.183845520019531, -14.719995498657227, -14.256144523620605, -13.7922945022583, -13.328444480895996, -12.864594459533691, -12.40074348449707, -11.936893463134766, -11.473043441772461, -11.009193420410156, -10.545342445373535, -10.08149242401123, -9.617642402648926, -9.153792381286621, -8.689942359924316, -8.226092338562012, -7.762241840362549, -7.298391819000244, -6.834541320800781, -6.370691299438477, -5.906841278076172, -5.442991256713867, -4.979140758514404, -4.5152907371521, -4.051440238952637, -3.587590217590332, -3.1237399578094482, -2.6598896980285645, -2.1960396766662598, -1.732189416885376, -1.2683391571044922, -0.8044889569282532, -0.34063875675201416, 0.12321138381958008, 0.5870616436004639, 1.0509119033813477, 1.5147619247436523, 1.9786121845245361, 2.44246244430542, 2.9063127040863037, 3.3701629638671875, 3.834012985229492, 4.297863006591797, 4.76171350479126, 5.2255635261535645, 5.689414024353027, 6.153264045715332]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 7.0, 8.0, 10.0, 7.0, 14.0, 16.0, 30.0, 15.0, 25.0, 27.0, 34.0, 40.0, 42.0, 37.0, 54.0, 40.0, 29.0, 36.0, 43.0, 45.0, 45.0, 44.0, 45.0, 44.0, 33.0, 34.0, 28.0, 32.0, 24.0, 23.0, 15.0, 15.0, 12.0, 8.0, 6.0, 10.0, 4.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.69301986694336, -11.303744316101074, -10.914467811584473, -10.525192260742188, -10.135916709899902, -9.746641159057617, -9.357364654541016, -8.96808910369873, -8.578813552856445, -8.18953800201416, -7.800261974334717, -7.410985946655273, -7.021710395812988, -6.632434368133545, -6.243158340454102, -5.853882789611816, -5.464606761932373, -5.07533073425293, -4.6860551834106445, -4.296779155731201, -3.907503604888916, -3.5182275772094727, -3.1289517879486084, -2.739675998687744, -2.35040020942688, -1.9611244201660156, -1.5718486309051514, -1.1825727224349976, -0.7932969331741333, -0.40402114391326904, -0.014745235443115234, 0.374530553817749, 0.7638063430786133, 1.1530821323394775, 1.5423579216003418, 1.9316338300704956, 2.3209095001220703, 2.7101855278015137, 3.099461317062378, 3.488737106323242, 3.8780128955841064, 4.267288684844971, 4.656564712524414, 5.045840263366699, 5.435116291046143, 5.824391841888428, 6.213667869567871, 6.602943420410156, 6.9922194480896, 7.381495475769043, 7.770771026611328, 8.160046577453613, 8.549323081970215, 8.9385986328125, 9.327874183654785, 9.71714973449707, 10.106426239013672, 10.495701789855957, 10.884978294372559, 11.274253845214844, 11.663529396057129, 12.052804946899414, 12.442081451416016, 12.8313570022583, 13.220632553100586]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 6.0, 10.0, 12.0, 21.0, 22.0, 51.0, 83.0, 108.0, 196.0, 367.0, 556.0, 956.0, 1620.0, 2634.0, 4230.0, 6946.0, 11469.0, 18413.0, 29022.0, 46131.0, 71197.0, 106964.0, 157228.0, 221410.0, 300073.0, 379571.0, 443117.0, 472918.0, 454154.0, 398748.0, 319959.0, 240289.0, 171844.0, 118277.0, 78849.0, 50957.0, 32867.0, 20458.0, 12618.0, 7650.0, 4808.0, 2961.0, 1806.0, 1090.0, 640.0, 378.0, 248.0, 133.0, 91.0, 51.0, 36.0, 22.0, 10.0, 15.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-15.375, -14.8887939453125, -14.402587890625, -13.9163818359375, -13.43017578125, -12.9439697265625, -12.457763671875, -11.9715576171875, -11.4853515625, -10.9991455078125, -10.512939453125, -10.0267333984375, -9.54052734375, -9.0543212890625, -8.568115234375, -8.0819091796875, -7.595703125, -7.1094970703125, -6.623291015625, -6.1370849609375, -5.65087890625, -5.1646728515625, -4.678466796875, -4.1922607421875, -3.7060546875, -3.2198486328125, -2.733642578125, -2.2474365234375, -1.76123046875, -1.2750244140625, -0.788818359375, -0.3026123046875, 0.18359375, 0.6697998046875, 1.156005859375, 1.6422119140625, 2.12841796875, 2.6146240234375, 3.100830078125, 3.5870361328125, 4.0732421875, 4.5594482421875, 5.045654296875, 5.5318603515625, 6.01806640625, 6.5042724609375, 6.990478515625, 7.4766845703125, 7.962890625, 8.4490966796875, 8.935302734375, 9.4215087890625, 9.90771484375, 10.3939208984375, 10.880126953125, 11.3663330078125, 11.8525390625, 12.3387451171875, 12.824951171875, 13.3111572265625, 13.79736328125, 14.2835693359375, 14.769775390625, 15.2559814453125, 15.7421875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 10.0, 10.0, 14.0, 23.0, 17.0, 18.0, 19.0, 26.0, 29.0, 35.0, 34.0, 37.0, 39.0, 47.0, 53.0, 47.0, 34.0, 44.0, 44.0, 39.0, 35.0, 35.0, 36.0, 40.0, 42.0, 31.0, 21.0, 23.0, 19.0, 18.0, 11.0, 17.0, 9.0, 7.0, 5.0, 5.0, 4.0, 8.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.8125, -12.409423828125, -12.00634765625, -11.603271484375, -11.2001953125, -10.797119140625, -10.39404296875, -9.990966796875, -9.587890625, -9.184814453125, -8.78173828125, -8.378662109375, -7.9755859375, -7.572509765625, -7.16943359375, -6.766357421875, -6.36328125, -5.960205078125, -5.55712890625, -5.154052734375, -4.7509765625, -4.347900390625, -3.94482421875, -3.541748046875, -3.138671875, -2.735595703125, -2.33251953125, -1.929443359375, -1.5263671875, -1.123291015625, -0.72021484375, -0.317138671875, 0.0859375, 0.489013671875, 0.89208984375, 1.295166015625, 1.6982421875, 2.101318359375, 2.50439453125, 2.907470703125, 3.310546875, 3.713623046875, 4.11669921875, 4.519775390625, 4.9228515625, 5.325927734375, 5.72900390625, 6.132080078125, 6.53515625, 6.938232421875, 7.34130859375, 7.744384765625, 8.1474609375, 8.550537109375, 8.95361328125, 9.356689453125, 9.759765625, 10.162841796875, 10.56591796875, 10.968994140625, 11.3720703125, 11.775146484375, 12.17822265625, 12.581298828125, 12.984375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 8.0, 12.0, 17.0, 28.0, 48.0, 64.0, 119.0, 215.0, 361.0, 600.0, 949.0, 1573.0, 2653.0, 4204.0, 6731.0, 10421.0, 16829.0, 25248.0, 38331.0, 55354.0, 81524.0, 113855.0, 153372.0, 201125.0, 253390.0, 303189.0, 346007.0, 371338.0, 378735.0, 363203.0, 328410.0, 282163.0, 231069.0, 180146.0, 136147.0, 98634.0, 69972.0, 48119.0, 32024.0, 21562.0, 13842.0, 8707.0, 5376.0, 3351.0, 1995.0, 1287.0, 812.0, 475.0, 287.0, 162.0, 100.0, 78.0, 31.0, 19.0, 11.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.484375, -10.1492919921875, -9.814208984375, -9.4791259765625, -9.14404296875, -8.8089599609375, -8.473876953125, -8.1387939453125, -7.8037109375, -7.4686279296875, -7.133544921875, -6.7984619140625, -6.46337890625, -6.1282958984375, -5.793212890625, -5.4581298828125, -5.123046875, -4.7879638671875, -4.452880859375, -4.1177978515625, -3.78271484375, -3.4476318359375, -3.112548828125, -2.7774658203125, -2.4423828125, -2.1072998046875, -1.772216796875, -1.4371337890625, -1.10205078125, -0.7669677734375, -0.431884765625, -0.0968017578125, 0.23828125, 0.5733642578125, 0.908447265625, 1.2435302734375, 1.57861328125, 1.9136962890625, 2.248779296875, 2.5838623046875, 2.9189453125, 3.2540283203125, 3.589111328125, 3.9241943359375, 4.25927734375, 4.5943603515625, 4.929443359375, 5.2645263671875, 5.599609375, 5.9346923828125, 6.269775390625, 6.6048583984375, 6.93994140625, 7.2750244140625, 7.610107421875, 7.9451904296875, 8.2802734375, 8.6153564453125, 8.950439453125, 9.2855224609375, 9.62060546875, 9.9556884765625, 10.290771484375, 10.6258544921875, 10.9609375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 5.0, 5.0, 13.0, 17.0, 19.0, 20.0, 22.0, 52.0, 39.0, 55.0, 71.0, 93.0, 77.0, 84.0, 108.0, 153.0, 142.0, 176.0, 152.0, 161.0, 211.0, 186.0, 186.0, 189.0, 199.0, 171.0, 189.0, 182.0, 137.0, 144.0, 134.0, 122.0, 96.0, 81.0, 75.0, 55.0, 49.0, 40.0, 38.0, 30.0, 22.0, 15.0, 17.0, 9.0, 8.0, 8.0, 3.0, 3.0, 3.0, 0.0, 5.0, 4.0, 1.0, 2.0, 1.0], "bins": [-6.3046875, -6.1083984375, -5.912109375, -5.7158203125, -5.51953125, -5.3232421875, -5.126953125, -4.9306640625, -4.734375, -4.5380859375, -4.341796875, -4.1455078125, -3.94921875, -3.7529296875, -3.556640625, -3.3603515625, -3.1640625, -2.9677734375, -2.771484375, -2.5751953125, -2.37890625, -2.1826171875, -1.986328125, -1.7900390625, -1.59375, -1.3974609375, -1.201171875, -1.0048828125, -0.80859375, -0.6123046875, -0.416015625, -0.2197265625, -0.0234375, 0.1728515625, 0.369140625, 0.5654296875, 0.76171875, 0.9580078125, 1.154296875, 1.3505859375, 1.546875, 1.7431640625, 1.939453125, 2.1357421875, 2.33203125, 2.5283203125, 2.724609375, 2.9208984375, 3.1171875, 3.3134765625, 3.509765625, 3.7060546875, 3.90234375, 4.0986328125, 4.294921875, 4.4912109375, 4.6875, 4.8837890625, 5.080078125, 5.2763671875, 5.47265625, 5.6689453125, 5.865234375, 6.0615234375, 6.2578125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 2.0, 8.0, 10.0, 8.0, 12.0, 22.0, 17.0, 16.0, 23.0, 19.0, 26.0, 30.0, 41.0, 32.0, 32.0, 52.0, 35.0, 47.0, 34.0, 54.0, 44.0, 33.0, 38.0, 47.0, 29.0, 35.0, 38.0, 23.0, 30.0, 22.0, 18.0, 21.0, 15.0, 16.0, 17.0, 7.0, 6.0, 9.0, 6.0, 5.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.3939208984375, -12.969406127929688, -12.544891357421875, -12.120376586914062, -11.69586181640625, -11.271347045898438, -10.846832275390625, -10.422317504882812, -9.997802734375, -9.573287963867188, -9.148773193359375, -8.724258422851562, -8.29974365234375, -7.8752288818359375, -7.450714111328125, -7.0261993408203125, -6.6016845703125, -6.1771697998046875, -5.752655029296875, -5.3281402587890625, -4.90362548828125, -4.4791107177734375, -4.054595947265625, -3.6300811767578125, -3.20556640625, -2.7810516357421875, -2.356536865234375, -1.9320220947265625, -1.50750732421875, -1.0829925537109375, -0.658477783203125, -0.2339630126953125, 0.1905517578125, 0.6150665283203125, 1.039581298828125, 1.4640960693359375, 1.88861083984375, 2.3131256103515625, 2.737640380859375, 3.1621551513671875, 3.586669921875, 4.0111846923828125, 4.435699462890625, 4.8602142333984375, 5.28472900390625, 5.7092437744140625, 6.133758544921875, 6.5582733154296875, 6.9827880859375, 7.4073028564453125, 7.831817626953125, 8.256332397460938, 8.68084716796875, 9.105361938476562, 9.529876708984375, 9.954391479492188, 10.37890625, 10.803421020507812, 11.227935791015625, 11.652450561523438, 12.07696533203125, 12.501480102539062, 12.925994873046875, 13.350509643554688, 13.7750244140625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 8.0, 15.0, 7.0, 11.0, 15.0, 15.0, 19.0, 22.0, 33.0, 22.0, 26.0, 29.0, 29.0, 24.0, 33.0, 36.0, 36.0, 46.0, 47.0, 37.0, 37.0, 48.0, 50.0, 34.0, 40.0, 39.0, 29.0, 27.0, 32.0, 22.0, 24.0, 19.0, 11.0, 20.0, 9.0, 6.0, 11.0, 4.0, 8.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.140398025512695, -15.619043350219727, -15.097688674926758, -14.576333999633789, -14.05497932434082, -13.533624649047852, -13.012269973754883, -12.490915298461914, -11.969560623168945, -11.448205947875977, -10.926851272583008, -10.405496597290039, -9.88414192199707, -9.362787246704102, -8.841432571411133, -8.320077896118164, -7.798724174499512, -7.277369499206543, -6.756014823913574, -6.2346601486206055, -5.713305473327637, -5.191950798034668, -4.670596599578857, -4.149241924285889, -3.62788724899292, -3.106532573699951, -2.5851778984069824, -2.0638234615325928, -1.542468786239624, -1.0211141109466553, -0.4997596740722656, 0.021595001220703125, 0.5429496765136719, 1.0643043518066406, 1.5856589078903198, 2.107013463973999, 2.6283681392669678, 3.1497228145599365, 3.671077251434326, 4.192431926727295, 4.713786602020264, 5.235141277313232, 5.756495952606201, 6.277850151062012, 6.7992048263549805, 7.320559501647949, 7.841914176940918, 8.363268852233887, 8.884623527526855, 9.405978202819824, 9.927332878112793, 10.448687553405762, 10.97004222869873, 11.4913969039917, 12.012750625610352, 12.53410530090332, 13.055459976196289, 13.576814651489258, 14.098169326782227, 14.619524002075195, 15.140878677368164, 15.662233352661133, 16.1835880279541, 16.70494270324707, 17.22629737854004]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 6.0, 7.0, 6.0, 7.0, 12.0, 22.0, 35.0, 42.0, 63.0, 98.0, 133.0, 216.0, 344.0, 467.0, 762.0, 1060.0, 1556.0, 2450.0, 3880.0, 5968.0, 9190.0, 14370.0, 21840.0, 32488.0, 47639.0, 66966.0, 89332.0, 110623.0, 124714.0, 123433.0, 107611.0, 85408.0, 63815.0, 44964.0, 30618.0, 20457.0, 13223.0, 8586.0, 5679.0, 3638.0, 2353.0, 1518.0, 995.0, 659.0, 433.0, 297.0, 161.0, 134.0, 94.0, 59.0, 41.0, 28.0, 32.0, 14.0, 12.0, 5.0, 2.0, 1.0, 2.0, 3.0], "bins": [-4.95703125, -4.80645751953125, -4.6558837890625, -4.50531005859375, -4.354736328125, -4.20416259765625, -4.0535888671875, -3.90301513671875, -3.75244140625, -3.60186767578125, -3.4512939453125, -3.30072021484375, -3.150146484375, -2.99957275390625, -2.8489990234375, -2.69842529296875, -2.5478515625, -2.39727783203125, -2.2467041015625, -2.09613037109375, -1.945556640625, -1.79498291015625, -1.6444091796875, -1.49383544921875, -1.34326171875, -1.19268798828125, -1.0421142578125, -0.89154052734375, -0.740966796875, -0.59039306640625, -0.4398193359375, -0.28924560546875, -0.138671875, 0.01190185546875, 0.1624755859375, 0.31304931640625, 0.463623046875, 0.61419677734375, 0.7647705078125, 0.91534423828125, 1.06591796875, 1.21649169921875, 1.3670654296875, 1.51763916015625, 1.668212890625, 1.81878662109375, 1.9693603515625, 2.11993408203125, 2.2705078125, 2.42108154296875, 2.5716552734375, 2.72222900390625, 2.872802734375, 3.02337646484375, 3.1739501953125, 3.32452392578125, 3.47509765625, 3.62567138671875, 3.7762451171875, 3.92681884765625, 4.077392578125, 4.22796630859375, 4.3785400390625, 4.52911376953125, 4.6796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 6.0, 13.0, 10.0, 9.0, 9.0, 18.0, 13.0, 20.0, 24.0, 32.0, 21.0, 30.0, 29.0, 27.0, 24.0, 33.0, 39.0, 32.0, 45.0, 53.0, 31.0, 40.0, 47.0, 49.0, 31.0, 45.0, 36.0, 28.0, 29.0, 29.0, 24.0, 25.0, 15.0, 13.0, 21.0, 6.0, 8.0, 9.0, 5.0, 9.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.125, -15.60107421875, -15.0771484375, -14.55322265625, -14.029296875, -13.50537109375, -12.9814453125, -12.45751953125, -11.93359375, -11.40966796875, -10.8857421875, -10.36181640625, -9.837890625, -9.31396484375, -8.7900390625, -8.26611328125, -7.7421875, -7.21826171875, -6.6943359375, -6.17041015625, -5.646484375, -5.12255859375, -4.5986328125, -4.07470703125, -3.55078125, -3.02685546875, -2.5029296875, -1.97900390625, -1.455078125, -0.93115234375, -0.4072265625, 0.11669921875, 0.640625, 1.16455078125, 1.6884765625, 2.21240234375, 2.736328125, 3.26025390625, 3.7841796875, 4.30810546875, 4.83203125, 5.35595703125, 5.8798828125, 6.40380859375, 6.927734375, 7.45166015625, 7.9755859375, 8.49951171875, 9.0234375, 9.54736328125, 10.0712890625, 10.59521484375, 11.119140625, 11.64306640625, 12.1669921875, 12.69091796875, 13.21484375, 13.73876953125, 14.2626953125, 14.78662109375, 15.310546875, 15.83447265625, 16.3583984375, 16.88232421875, 17.40625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 5.0, 6.0, 2.0, 7.0, 6.0, 13.0, 24.0, 30.0, 34.0, 46.0, 84.0, 95.0, 174.0, 229.0, 384.0, 674.0, 1220.0, 2122.0, 3698.0, 6852.0, 13294.0, 27715.0, 287311.0, 642397.0, 30601.0, 14620.0, 7426.0, 4037.0, 2210.0, 1275.0, 723.0, 436.0, 250.0, 182.0, 110.0, 69.0, 58.0, 46.0, 22.0, 13.0, 13.0, 8.0, 8.0, 7.0, 2.0, 4.0, 3.0, 4.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-16.578125, -16.06103515625, -15.5439453125, -15.02685546875, -14.509765625, -13.99267578125, -13.4755859375, -12.95849609375, -12.44140625, -11.92431640625, -11.4072265625, -10.89013671875, -10.373046875, -9.85595703125, -9.3388671875, -8.82177734375, -8.3046875, -7.78759765625, -7.2705078125, -6.75341796875, -6.236328125, -5.71923828125, -5.2021484375, -4.68505859375, -4.16796875, -3.65087890625, -3.1337890625, -2.61669921875, -2.099609375, -1.58251953125, -1.0654296875, -0.54833984375, -0.03125, 0.48583984375, 1.0029296875, 1.52001953125, 2.037109375, 2.55419921875, 3.0712890625, 3.58837890625, 4.10546875, 4.62255859375, 5.1396484375, 5.65673828125, 6.173828125, 6.69091796875, 7.2080078125, 7.72509765625, 8.2421875, 8.75927734375, 9.2763671875, 9.79345703125, 10.310546875, 10.82763671875, 11.3447265625, 11.86181640625, 12.37890625, 12.89599609375, 13.4130859375, 13.93017578125, 14.447265625, 14.96435546875, 15.4814453125, 15.99853515625, 16.515625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 4.0, 4.0, 5.0, 6.0, 4.0, 8.0, 5.0, 8.0, 13.0, 13.0, 14.0, 16.0, 20.0, 22.0, 17.0, 33.0, 29.0, 39.0, 40.0, 24.0, 44.0, 33.0, 37.0, 49.0, 48.0, 26.0, 34.0, 37.0, 41.0, 30.0, 44.0, 38.0, 34.0, 22.0, 24.0, 18.0, 19.0, 15.0, 17.0, 14.0, 9.0, 14.0, 6.0, 9.0, 4.0, 4.0, 1.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-12.3828125, -12.010498046875, -11.63818359375, -11.265869140625, -10.8935546875, -10.521240234375, -10.14892578125, -9.776611328125, -9.404296875, -9.031982421875, -8.65966796875, -8.287353515625, -7.9150390625, -7.542724609375, -7.17041015625, -6.798095703125, -6.42578125, -6.053466796875, -5.68115234375, -5.308837890625, -4.9365234375, -4.564208984375, -4.19189453125, -3.819580078125, -3.447265625, -3.074951171875, -2.70263671875, -2.330322265625, -1.9580078125, -1.585693359375, -1.21337890625, -0.841064453125, -0.46875, -0.096435546875, 0.27587890625, 0.648193359375, 1.0205078125, 1.392822265625, 1.76513671875, 2.137451171875, 2.509765625, 2.882080078125, 3.25439453125, 3.626708984375, 3.9990234375, 4.371337890625, 4.74365234375, 5.115966796875, 5.48828125, 5.860595703125, 6.23291015625, 6.605224609375, 6.9775390625, 7.349853515625, 7.72216796875, 8.094482421875, 8.466796875, 8.839111328125, 9.21142578125, 9.583740234375, 9.9560546875, 10.328369140625, 10.70068359375, 11.072998046875, 11.4453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 6.0, 4.0, 5.0, 4.0, 8.0, 11.0, 9.0, 16.0, 15.0, 15.0, 22.0, 40.0, 35.0, 52.0, 83.0, 122.0, 155.0, 239.0, 403.0, 773.0, 1996.0, 7608.0, 40610.0, 942834.0, 41647.0, 7829.0, 2068.0, 741.0, 381.0, 237.0, 149.0, 117.0, 68.0, 44.0, 57.0, 35.0, 26.0, 25.0, 18.0, 8.0, 10.0, 10.0, 6.0, 8.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.51953125, -3.4112548828125, -3.302978515625, -3.1947021484375, -3.08642578125, -2.9781494140625, -2.869873046875, -2.7615966796875, -2.6533203125, -2.5450439453125, -2.436767578125, -2.3284912109375, -2.22021484375, -2.1119384765625, -2.003662109375, -1.8953857421875, -1.787109375, -1.6788330078125, -1.570556640625, -1.4622802734375, -1.35400390625, -1.2457275390625, -1.137451171875, -1.0291748046875, -0.9208984375, -0.8126220703125, -0.704345703125, -0.5960693359375, -0.48779296875, -0.3795166015625, -0.271240234375, -0.1629638671875, -0.0546875, 0.0535888671875, 0.161865234375, 0.2701416015625, 0.37841796875, 0.4866943359375, 0.594970703125, 0.7032470703125, 0.8115234375, 0.9197998046875, 1.028076171875, 1.1363525390625, 1.24462890625, 1.3529052734375, 1.461181640625, 1.5694580078125, 1.677734375, 1.7860107421875, 1.894287109375, 2.0025634765625, 2.11083984375, 2.2191162109375, 2.327392578125, 2.4356689453125, 2.5439453125, 2.6522216796875, 2.760498046875, 2.8687744140625, 2.97705078125, 3.0853271484375, 3.193603515625, 3.3018798828125, 3.41015625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 9.0, 16.0, 12.0, 9.0, 20.0, 17.0, 29.0, 20.0, 22.0, 46.0, 44.0, 40.0, 49.0, 70.0, 68.0, 57.0, 69.0, 65.0, 62.0, 55.0, 29.0, 30.0, 26.0, 21.0, 20.0, 17.0, 7.0, 15.0, 6.0, 8.0, 4.0, 12.0, 3.0, 3.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0001175999641418457, -0.00011423882097005844, -0.00011087767779827118, -0.00010751653462648392, -0.00010415539145469666, -0.0001007942482829094, -9.743310511112213e-05, -9.407196193933487e-05, -9.071081876754761e-05, -8.734967559576035e-05, -8.398853242397308e-05, -8.062738925218582e-05, -7.726624608039856e-05, -7.39051029086113e-05, -7.054395973682404e-05, -6.718281656503677e-05, -6.382167339324951e-05, -6.046053022146225e-05, -5.709938704967499e-05, -5.3738243877887726e-05, -5.0377100706100464e-05, -4.70159575343132e-05, -4.365481436252594e-05, -4.029367119073868e-05, -3.6932528018951416e-05, -3.3571384847164154e-05, -3.0210241675376892e-05, -2.684909850358963e-05, -2.3487955331802368e-05, -2.0126812160015106e-05, -1.6765668988227844e-05, -1.3404525816440582e-05, -1.004338264465332e-05, -6.682239472866058e-06, -3.3210963010787964e-06, 4.0046870708465576e-08, 3.4011900424957275e-06, 6.7623332142829895e-06, 1.0123476386070251e-05, 1.3484619557857513e-05, 1.6845762729644775e-05, 2.0206905901432037e-05, 2.35680490732193e-05, 2.692919224500656e-05, 3.0290335416793823e-05, 3.3651478588581085e-05, 3.701262176036835e-05, 4.037376493215561e-05, 4.373490810394287e-05, 4.709605127573013e-05, 5.0457194447517395e-05, 5.381833761930466e-05, 5.717948079109192e-05, 6.054062396287918e-05, 6.390176713466644e-05, 6.72629103064537e-05, 7.062405347824097e-05, 7.398519665002823e-05, 7.734633982181549e-05, 8.070748299360275e-05, 8.406862616539001e-05, 8.742976933717728e-05, 9.079091250896454e-05, 9.41520556807518e-05, 9.751319885253906e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 5.0, 4.0, 18.0, 15.0, 23.0, 20.0, 23.0, 37.0, 46.0, 72.0, 114.0, 147.0, 212.0, 326.0, 542.0, 974.0, 1814.0, 4450.0, 14262.0, 52583.0, 177317.0, 361680.0, 286637.0, 103871.0, 28921.0, 8292.0, 2929.0, 1255.0, 717.0, 392.0, 251.0, 192.0, 112.0, 79.0, 55.0, 44.0, 27.0, 33.0, 10.0, 25.0, 12.0, 8.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.544921875, -2.464813232421875, -2.38470458984375, -2.304595947265625, -2.2244873046875, -2.144378662109375, -2.06427001953125, -1.984161376953125, -1.904052734375, -1.823944091796875, -1.74383544921875, -1.663726806640625, -1.5836181640625, -1.503509521484375, -1.42340087890625, -1.343292236328125, -1.26318359375, -1.183074951171875, -1.10296630859375, -1.022857666015625, -0.9427490234375, -0.862640380859375, -0.78253173828125, -0.702423095703125, -0.622314453125, -0.542205810546875, -0.46209716796875, -0.381988525390625, -0.3018798828125, -0.221771240234375, -0.14166259765625, -0.061553955078125, 0.0185546875, 0.098663330078125, 0.17877197265625, 0.258880615234375, 0.3389892578125, 0.419097900390625, 0.49920654296875, 0.579315185546875, 0.659423828125, 0.739532470703125, 0.81964111328125, 0.899749755859375, 0.9798583984375, 1.059967041015625, 1.14007568359375, 1.220184326171875, 1.30029296875, 1.380401611328125, 1.46051025390625, 1.540618896484375, 1.6207275390625, 1.700836181640625, 1.78094482421875, 1.861053466796875, 1.941162109375, 2.021270751953125, 2.10137939453125, 2.181488037109375, 2.2615966796875, 2.341705322265625, 2.42181396484375, 2.501922607421875, 2.58203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 10.0, 13.0, 4.0, 15.0, 9.0, 13.0, 13.0, 21.0, 29.0, 28.0, 34.0, 35.0, 43.0, 56.0, 54.0, 68.0, 76.0, 62.0, 68.0, 61.0, 44.0, 44.0, 36.0, 28.0, 22.0, 21.0, 11.0, 15.0, 8.0, 9.0, 14.0, 10.0, 3.0, 2.0, 15.0, 8.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.50830078125, -0.49446868896484375, -0.4806365966796875, -0.46680450439453125, -0.452972412109375, -0.43914031982421875, -0.4253082275390625, -0.41147613525390625, -0.39764404296875, -0.38381195068359375, -0.3699798583984375, -0.35614776611328125, -0.342315673828125, -0.32848358154296875, -0.3146514892578125, -0.30081939697265625, -0.2869873046875, -0.27315521240234375, -0.2593231201171875, -0.24549102783203125, -0.231658935546875, -0.21782684326171875, -0.2039947509765625, -0.19016265869140625, -0.17633056640625, -0.16249847412109375, -0.1486663818359375, -0.13483428955078125, -0.121002197265625, -0.10717010498046875, -0.0933380126953125, -0.07950592041015625, -0.065673828125, -0.05184173583984375, -0.0380096435546875, -0.02417755126953125, -0.010345458984375, 0.00348663330078125, 0.0173187255859375, 0.03115081787109375, 0.04498291015625, 0.05881500244140625, 0.0726470947265625, 0.08647918701171875, 0.100311279296875, 0.11414337158203125, 0.1279754638671875, 0.14180755615234375, 0.1556396484375, 0.16947174072265625, 0.1833038330078125, 0.19713592529296875, 0.210968017578125, 0.22480010986328125, 0.2386322021484375, 0.25246429443359375, 0.26629638671875, 0.28012847900390625, 0.2939605712890625, 0.30779266357421875, 0.321624755859375, 0.33545684814453125, 0.3492889404296875, 0.36312103271484375, 0.376953125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 4.0, 7.0, 1.0, 6.0, 6.0, 5.0, 9.0, 14.0, 16.0, 17.0, 18.0, 27.0, 22.0, 28.0, 28.0, 34.0, 39.0, 44.0, 47.0, 55.0, 31.0, 47.0, 41.0, 39.0, 34.0, 44.0, 41.0, 35.0, 32.0, 46.0, 25.0, 18.0, 27.0, 21.0, 17.0, 14.0, 18.0, 11.0, 4.0, 8.0, 8.0, 2.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.269243240356445, -13.825632095336914, -13.382019996643066, -12.938408851623535, -12.494796752929688, -12.051185607910156, -11.607574462890625, -11.163962364196777, -10.72035026550293, -10.276739120483398, -9.83312702178955, -9.38951587677002, -8.945903778076172, -8.50229263305664, -8.05868148803711, -7.615069389343262, -7.1714582443237305, -6.727846622467041, -6.284235000610352, -5.84062385559082, -5.397011756896973, -4.953400611877441, -4.509788990020752, -4.0661773681640625, -3.622565746307373, -3.1789541244506836, -2.735342502593994, -2.291731119155884, -1.8481194972991943, -1.4045078754425049, -0.9608964920043945, -0.5172848701477051, -0.07367324829101562, 0.36993831396102905, 0.8135498762130737, 1.2571613788604736, 1.700773000717163, 2.1443846225738525, 2.587996006011963, 3.0316076278686523, 3.475219249725342, 3.9188308715820312, 4.362442493438721, 4.80605411529541, 5.249665260314941, 5.693277359008789, 6.13688850402832, 6.58050012588501, 7.024111747741699, 7.467723369598389, 7.911334991455078, 8.35494613647461, 8.798558235168457, 9.242169380187988, 9.685781478881836, 10.129392623901367, 10.573003768920898, 11.01661491394043, 11.460227012634277, 11.903838157653809, 12.347450256347656, 12.791061401367188, 13.234672546386719, 13.678284645080566, 14.121896743774414]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 9.0, 8.0, 13.0, 9.0, 10.0, 17.0, 16.0, 20.0, 19.0, 33.0, 20.0, 31.0, 24.0, 30.0, 22.0, 33.0, 38.0, 35.0, 40.0, 56.0, 35.0, 37.0, 44.0, 49.0, 36.0, 42.0, 33.0, 29.0, 25.0, 38.0, 20.0, 25.0, 17.0, 15.0, 13.0, 11.0, 11.0, 8.0, 8.0, 7.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.000316619873047, -15.481047630310059, -14.96177864074707, -14.442509651184082, -13.923240661621094, -13.403971672058105, -12.884702682495117, -12.365433692932129, -11.84616470336914, -11.326895713806152, -10.807626724243164, -10.288357734680176, -9.769088745117188, -9.2498197555542, -8.730550765991211, -8.211281776428223, -7.692012786865234, -7.172743797302246, -6.653474807739258, -6.1342058181762695, -5.614936828613281, -5.095667839050293, -4.576398849487305, -4.057129859924316, -3.537860870361328, -3.01859188079834, -2.4993228912353516, -1.9800539016723633, -1.460784912109375, -0.9415159225463867, -0.42224693298339844, 0.09702205657958984, 0.6162929534912109, 1.1355619430541992, 1.6548309326171875, 2.174099922180176, 2.693368911743164, 3.2126379013061523, 3.7319068908691406, 4.251175880432129, 4.770444869995117, 5.2897138595581055, 5.808982849121094, 6.328251838684082, 6.84752082824707, 7.366789817810059, 7.886058807373047, 8.405327796936035, 8.924596786499023, 9.443865776062012, 9.963134765625, 10.482403755187988, 11.001672744750977, 11.520941734313965, 12.040210723876953, 12.559479713439941, 13.07874870300293, 13.598017692565918, 14.117286682128906, 14.636555671691895, 15.155824661254883, 15.675093650817871, 16.19436264038086, 16.71363067626953, 17.232900619506836]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 8.0, 6.0, 37.0, 49.0, 96.0, 126.0, 254.0, 351.0, 647.0, 917.0, 1513.0, 2466.0, 3621.0, 5432.0, 8365.0, 12513.0, 17683.0, 25190.0, 34163.0, 45819.0, 57892.0, 69922.0, 81726.0, 89910.0, 93880.0, 91936.0, 85134.0, 75121.0, 63146.0, 50129.0, 38841.0, 28648.0, 20329.0, 14376.0, 9797.0, 6452.0, 4358.0, 2807.0, 1814.0, 1149.0, 753.0, 435.0, 310.0, 183.0, 107.0, 65.0, 28.0, 22.0, 11.0, 9.0, 4.0, 8.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.875, -9.5533447265625, -9.231689453125, -8.9100341796875, -8.58837890625, -8.2667236328125, -7.945068359375, -7.6234130859375, -7.3017578125, -6.9801025390625, -6.658447265625, -6.3367919921875, -6.01513671875, -5.6934814453125, -5.371826171875, -5.0501708984375, -4.728515625, -4.4068603515625, -4.085205078125, -3.7635498046875, -3.44189453125, -3.1202392578125, -2.798583984375, -2.4769287109375, -2.1552734375, -1.8336181640625, -1.511962890625, -1.1903076171875, -0.86865234375, -0.5469970703125, -0.225341796875, 0.0963134765625, 0.41796875, 0.7396240234375, 1.061279296875, 1.3829345703125, 1.70458984375, 2.0262451171875, 2.347900390625, 2.6695556640625, 2.9912109375, 3.3128662109375, 3.634521484375, 3.9561767578125, 4.27783203125, 4.5994873046875, 4.921142578125, 5.2427978515625, 5.564453125, 5.8861083984375, 6.207763671875, 6.5294189453125, 6.85107421875, 7.1727294921875, 7.494384765625, 7.8160400390625, 8.1376953125, 8.4593505859375, 8.781005859375, 9.1026611328125, 9.42431640625, 9.7459716796875, 10.067626953125, 10.3892822265625, 10.7109375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 8.0, 10.0, 11.0, 9.0, 11.0, 18.0, 14.0, 22.0, 19.0, 37.0, 20.0, 29.0, 27.0, 25.0, 28.0, 33.0, 38.0, 35.0, 40.0, 57.0, 27.0, 43.0, 41.0, 52.0, 37.0, 37.0, 36.0, 26.0, 28.0, 33.0, 21.0, 30.0, 12.0, 13.0, 18.0, 6.0, 13.0, 7.0, 7.0, 8.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.0, -15.478271484375, -14.95654296875, -14.434814453125, -13.9130859375, -13.391357421875, -12.86962890625, -12.347900390625, -11.826171875, -11.304443359375, -10.78271484375, -10.260986328125, -9.7392578125, -9.217529296875, -8.69580078125, -8.174072265625, -7.65234375, -7.130615234375, -6.60888671875, -6.087158203125, -5.5654296875, -5.043701171875, -4.52197265625, -4.000244140625, -3.478515625, -2.956787109375, -2.43505859375, -1.913330078125, -1.3916015625, -0.869873046875, -0.34814453125, 0.173583984375, 0.6953125, 1.217041015625, 1.73876953125, 2.260498046875, 2.7822265625, 3.303955078125, 3.82568359375, 4.347412109375, 4.869140625, 5.390869140625, 5.91259765625, 6.434326171875, 6.9560546875, 7.477783203125, 7.99951171875, 8.521240234375, 9.04296875, 9.564697265625, 10.08642578125, 10.608154296875, 11.1298828125, 11.651611328125, 12.17333984375, 12.695068359375, 13.216796875, 13.738525390625, 14.26025390625, 14.781982421875, 15.3037109375, 15.825439453125, 16.34716796875, 16.868896484375, 17.390625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 9.0, 16.0, 23.0, 23.0, 50.0, 90.0, 146.0, 213.0, 314.0, 514.0, 767.0, 1227.0, 1924.0, 3139.0, 4724.0, 7278.0, 11261.0, 16759.0, 24461.0, 34202.0, 46735.0, 60967.0, 74880.0, 88348.0, 97832.0, 100522.0, 97656.0, 87690.0, 75317.0, 60493.0, 45747.0, 33658.0, 23918.0, 16329.0, 11009.0, 7326.0, 4662.0, 3028.0, 1928.0, 1252.0, 789.0, 469.0, 325.0, 199.0, 112.0, 66.0, 58.0, 32.0, 28.0, 14.0, 7.0, 11.0, 6.0, 4.0, 2.0, 0.0, 3.0], "bins": [-12.1953125, -11.81982421875, -11.4443359375, -11.06884765625, -10.693359375, -10.31787109375, -9.9423828125, -9.56689453125, -9.19140625, -8.81591796875, -8.4404296875, -8.06494140625, -7.689453125, -7.31396484375, -6.9384765625, -6.56298828125, -6.1875, -5.81201171875, -5.4365234375, -5.06103515625, -4.685546875, -4.31005859375, -3.9345703125, -3.55908203125, -3.18359375, -2.80810546875, -2.4326171875, -2.05712890625, -1.681640625, -1.30615234375, -0.9306640625, -0.55517578125, -0.1796875, 0.19580078125, 0.5712890625, 0.94677734375, 1.322265625, 1.69775390625, 2.0732421875, 2.44873046875, 2.82421875, 3.19970703125, 3.5751953125, 3.95068359375, 4.326171875, 4.70166015625, 5.0771484375, 5.45263671875, 5.828125, 6.20361328125, 6.5791015625, 6.95458984375, 7.330078125, 7.70556640625, 8.0810546875, 8.45654296875, 8.83203125, 9.20751953125, 9.5830078125, 9.95849609375, 10.333984375, 10.70947265625, 11.0849609375, 11.46044921875, 11.8359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 4.0, 7.0, 9.0, 3.0, 9.0, 10.0, 20.0, 16.0, 28.0, 14.0, 25.0, 33.0, 21.0, 35.0, 41.0, 38.0, 29.0, 36.0, 33.0, 47.0, 35.0, 36.0, 32.0, 39.0, 47.0, 42.0, 29.0, 36.0, 29.0, 33.0, 32.0, 29.0, 20.0, 12.0, 19.0, 15.0, 10.0, 13.0, 9.0, 4.0, 8.0, 2.0, 8.0, 1.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5078125, -10.1484375, -9.7890625, -9.4296875, -9.0703125, -8.7109375, -8.3515625, -7.9921875, -7.6328125, -7.2734375, -6.9140625, -6.5546875, -6.1953125, -5.8359375, -5.4765625, -5.1171875, -4.7578125, -4.3984375, -4.0390625, -3.6796875, -3.3203125, -2.9609375, -2.6015625, -2.2421875, -1.8828125, -1.5234375, -1.1640625, -0.8046875, -0.4453125, -0.0859375, 0.2734375, 0.6328125, 0.9921875, 1.3515625, 1.7109375, 2.0703125, 2.4296875, 2.7890625, 3.1484375, 3.5078125, 3.8671875, 4.2265625, 4.5859375, 4.9453125, 5.3046875, 5.6640625, 6.0234375, 6.3828125, 6.7421875, 7.1015625, 7.4609375, 7.8203125, 8.1796875, 8.5390625, 8.8984375, 9.2578125, 9.6171875, 9.9765625, 10.3359375, 10.6953125, 11.0546875, 11.4140625, 11.7734375, 12.1328125, 12.4921875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 5.0, 14.0, 24.0, 30.0, 57.0, 72.0, 133.0, 208.0, 338.0, 622.0, 1046.0, 1696.0, 2987.0, 5147.0, 8609.0, 14766.0, 24238.0, 39167.0, 59647.0, 84694.0, 109975.0, 128324.0, 133447.0, 123542.0, 100522.0, 75016.0, 50948.0, 33308.0, 20387.0, 12180.0, 7141.0, 4177.0, 2438.0, 1441.0, 828.0, 538.0, 335.0, 202.0, 119.0, 74.0, 41.0, 28.0, 13.0, 10.0, 9.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.7421875, -4.599853515625, -4.45751953125, -4.315185546875, -4.1728515625, -4.030517578125, -3.88818359375, -3.745849609375, -3.603515625, -3.461181640625, -3.31884765625, -3.176513671875, -3.0341796875, -2.891845703125, -2.74951171875, -2.607177734375, -2.46484375, -2.322509765625, -2.18017578125, -2.037841796875, -1.8955078125, -1.753173828125, -1.61083984375, -1.468505859375, -1.326171875, -1.183837890625, -1.04150390625, -0.899169921875, -0.7568359375, -0.614501953125, -0.47216796875, -0.329833984375, -0.1875, -0.045166015625, 0.09716796875, 0.239501953125, 0.3818359375, 0.524169921875, 0.66650390625, 0.808837890625, 0.951171875, 1.093505859375, 1.23583984375, 1.378173828125, 1.5205078125, 1.662841796875, 1.80517578125, 1.947509765625, 2.08984375, 2.232177734375, 2.37451171875, 2.516845703125, 2.6591796875, 2.801513671875, 2.94384765625, 3.086181640625, 3.228515625, 3.370849609375, 3.51318359375, 3.655517578125, 3.7978515625, 3.940185546875, 4.08251953125, 4.224853515625, 4.3671875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 9.0, 10.0, 11.0, 14.0, 17.0, 27.0, 33.0, 28.0, 41.0, 49.0, 59.0, 62.0, 65.0, 52.0, 85.0, 51.0, 59.0, 53.0, 47.0, 47.0, 39.0, 34.0, 18.0, 25.0, 11.0, 13.0, 10.0, 14.0, 5.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000576019287109375, -0.0005540177226066589, -0.0005320161581039429, -0.0005100145936012268, -0.00048801302909851074, -0.0004660114645957947, -0.0004440099000930786, -0.00042200833559036255, -0.0004000067710876465, -0.0003780052065849304, -0.00035600364208221436, -0.0003340020775794983, -0.0003120005130767822, -0.00028999894857406616, -0.0002679973840713501, -0.00024599581956863403, -0.00022399425506591797, -0.0002019926905632019, -0.00017999112606048584, -0.00015798956155776978, -0.0001359879970550537, -0.00011398643255233765, -9.198486804962158e-05, -6.998330354690552e-05, -4.798173904418945e-05, -2.598017454147339e-05, -3.978610038757324e-06, 1.802295446395874e-05, 4.0024518966674805e-05, 6.202608346939087e-05, 8.402764797210693e-05, 0.000106029212474823, 0.00012803077697753906, 0.00015003234148025513, 0.0001720339059829712, 0.00019403547048568726, 0.00021603703498840332, 0.00023803859949111938, 0.00026004016399383545, 0.0002820417284965515, 0.0003040432929992676, 0.00032604485750198364, 0.0003480464220046997, 0.00037004798650741577, 0.00039204955101013184, 0.0004140511155128479, 0.00043605268001556396, 0.00045805424451828003, 0.0004800558090209961, 0.0005020573735237122, 0.0005240589380264282, 0.0005460605025291443, 0.0005680620670318604, 0.0005900636315345764, 0.0006120651960372925, 0.0006340667605400085, 0.0006560683250427246, 0.0006780698895454407, 0.0007000714540481567, 0.0007220730185508728, 0.0007440745830535889, 0.0007660761475563049, 0.000788077712059021, 0.0008100792765617371, 0.0008320808410644531]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 3.0, 6.0, 9.0, 13.0, 27.0, 33.0, 35.0, 65.0, 108.0, 148.0, 234.0, 339.0, 492.0, 801.0, 1174.0, 1788.0, 2766.0, 4230.0, 6353.0, 9691.0, 14854.0, 22278.0, 32383.0, 46019.0, 62429.0, 79261.0, 94976.0, 106321.0, 109210.0, 103497.0, 90866.0, 73792.0, 56636.0, 41386.0, 28760.0, 19624.0, 13230.0, 8672.0, 5519.0, 3635.0, 2366.0, 1524.0, 1017.0, 657.0, 428.0, 301.0, 179.0, 146.0, 90.0, 73.0, 39.0, 30.0, 20.0, 10.0, 5.0, 8.0, 6.0, 3.0, 1.0, 0.0, 3.0], "bins": [-3.853515625, -3.730560302734375, -3.60760498046875, -3.484649658203125, -3.3616943359375, -3.238739013671875, -3.11578369140625, -2.992828369140625, -2.869873046875, -2.746917724609375, -2.62396240234375, -2.501007080078125, -2.3780517578125, -2.255096435546875, -2.13214111328125, -2.009185791015625, -1.88623046875, -1.763275146484375, -1.64031982421875, -1.517364501953125, -1.3944091796875, -1.271453857421875, -1.14849853515625, -1.025543212890625, -0.902587890625, -0.779632568359375, -0.65667724609375, -0.533721923828125, -0.4107666015625, -0.287811279296875, -0.16485595703125, -0.041900634765625, 0.0810546875, 0.204010009765625, 0.32696533203125, 0.449920654296875, 0.5728759765625, 0.695831298828125, 0.81878662109375, 0.941741943359375, 1.064697265625, 1.187652587890625, 1.31060791015625, 1.433563232421875, 1.5565185546875, 1.679473876953125, 1.80242919921875, 1.925384521484375, 2.04833984375, 2.171295166015625, 2.29425048828125, 2.417205810546875, 2.5401611328125, 2.663116455078125, 2.78607177734375, 2.909027099609375, 3.031982421875, 3.154937744140625, 3.27789306640625, 3.400848388671875, 3.5238037109375, 3.646759033203125, 3.76971435546875, 3.892669677734375, 4.015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 3.0, 3.0, 8.0, 4.0, 8.0, 8.0, 12.0, 10.0, 17.0, 21.0, 21.0, 25.0, 28.0, 36.0, 34.0, 40.0, 38.0, 48.0, 48.0, 48.0, 51.0, 38.0, 44.0, 53.0, 46.0, 39.0, 45.0, 40.0, 25.0, 26.0, 24.0, 19.0, 15.0, 17.0, 13.0, 9.0, 9.0, 6.0, 10.0, 4.0, 4.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.83203125, -1.768585205078125, -1.70513916015625, -1.641693115234375, -1.5782470703125, -1.514801025390625, -1.45135498046875, -1.387908935546875, -1.324462890625, -1.261016845703125, -1.19757080078125, -1.134124755859375, -1.0706787109375, -1.007232666015625, -0.94378662109375, -0.880340576171875, -0.81689453125, -0.753448486328125, -0.69000244140625, -0.626556396484375, -0.5631103515625, -0.499664306640625, -0.43621826171875, -0.372772216796875, -0.309326171875, -0.245880126953125, -0.18243408203125, -0.118988037109375, -0.0555419921875, 0.007904052734375, 0.07135009765625, 0.134796142578125, 0.1982421875, 0.261688232421875, 0.32513427734375, 0.388580322265625, 0.4520263671875, 0.515472412109375, 0.57891845703125, 0.642364501953125, 0.705810546875, 0.769256591796875, 0.83270263671875, 0.896148681640625, 0.9595947265625, 1.023040771484375, 1.08648681640625, 1.149932861328125, 1.21337890625, 1.276824951171875, 1.34027099609375, 1.403717041015625, 1.4671630859375, 1.530609130859375, 1.59405517578125, 1.657501220703125, 1.720947265625, 1.784393310546875, 1.84783935546875, 1.911285400390625, 1.9747314453125, 2.038177490234375, 2.10162353515625, 2.165069580078125, 2.228515625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 9.0, 8.0, 13.0, 20.0, 18.0, 20.0, 26.0, 31.0, 30.0, 28.0, 34.0, 45.0, 45.0, 55.0, 50.0, 41.0, 60.0, 51.0, 43.0, 56.0, 38.0, 44.0, 37.0, 42.0, 32.0, 24.0, 15.0, 20.0, 21.0, 10.0, 5.0, 3.0, 9.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.70073127746582, -17.165332794189453, -16.629934310913086, -16.09453582763672, -15.559137344360352, -15.023738861083984, -14.488340377807617, -13.95294189453125, -13.417543411254883, -12.882144927978516, -12.346746444702148, -11.811347961425781, -11.275949478149414, -10.740550994873047, -10.20515251159668, -9.669754028320312, -9.134355545043945, -8.598957061767578, -8.063558578491211, -7.528160095214844, -6.992761611938477, -6.457363128662109, -5.921964645385742, -5.386566162109375, -4.851167678833008, -4.315769195556641, -3.7803707122802734, -3.2449722290039062, -2.709573745727539, -2.174175262451172, -1.6387767791748047, -1.1033782958984375, -0.5679817199707031, -0.03258323669433594, 0.5028152465820312, 1.0382137298583984, 1.5736122131347656, 2.109010696411133, 2.6444091796875, 3.179807662963867, 3.7152061462402344, 4.250604629516602, 4.786003112792969, 5.321401596069336, 5.856800079345703, 6.39219856262207, 6.9275970458984375, 7.462995529174805, 7.998394012451172, 8.533792495727539, 9.069190979003906, 9.604589462280273, 10.13998794555664, 10.675386428833008, 11.210784912109375, 11.746183395385742, 12.28158187866211, 12.816980361938477, 13.352378845214844, 13.887777328491211, 14.423175811767578, 14.958574295043945, 15.493972778320312, 16.02937126159668, 16.564769744873047]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 4.0, 3.0, 7.0, 7.0, 6.0, 12.0, 10.0, 10.0, 13.0, 18.0, 16.0, 13.0, 21.0, 27.0, 24.0, 29.0, 22.0, 24.0, 37.0, 40.0, 38.0, 45.0, 54.0, 40.0, 30.0, 34.0, 41.0, 43.0, 31.0, 33.0, 26.0, 32.0, 30.0, 23.0, 17.0, 23.0, 16.0, 20.0, 12.0, 18.0, 13.0, 13.0, 9.0, 6.0, 7.0, 2.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.744568824768066, -15.233253479003906, -14.721938133239746, -14.210622787475586, -13.69930648803711, -13.18799114227295, -12.676675796508789, -12.165360450744629, -11.654045104980469, -11.142729759216309, -10.631414413452148, -10.120098114013672, -9.608782768249512, -9.097467422485352, -8.586152076721191, -8.074836730957031, -7.563520431518555, -7.0522050857543945, -6.540889263153076, -6.029573917388916, -5.518258094787598, -5.0069427490234375, -4.495627403259277, -3.984311819076538, -3.472996234893799, -2.9616806507110596, -2.4503650665283203, -1.9390497207641602, -1.427734136581421, -0.9164185523986816, -0.4051032066345215, 0.10621237754821777, 0.6175270080566406, 1.1288425922393799, 1.6401580572128296, 2.1514735221862793, 2.6627891063690186, 3.174104690551758, 3.685420036315918, 4.196735382080078, 4.7080512046813965, 5.219366550445557, 5.730682373046875, 6.241997718811035, 6.753313064575195, 7.264628887176514, 7.775944232940674, 8.287260055541992, 8.798575401306152, 9.309890747070312, 9.821206092834473, 10.332521438598633, 10.84383773803711, 11.35515308380127, 11.86646842956543, 12.37778377532959, 12.88909912109375, 13.40041446685791, 13.91172981262207, 14.423046112060547, 14.934361457824707, 15.445676803588867, 15.956992149353027, 16.468307495117188, 16.979623794555664]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [4.0, 0.0, 10.0, 11.0, 14.0, 25.0, 46.0, 75.0, 155.0, 238.0, 404.0, 680.0, 1093.0, 1758.0, 2832.0, 4622.0, 7306.0, 11485.0, 17661.0, 27544.0, 41717.0, 62965.0, 92189.0, 133255.0, 186400.0, 248617.0, 317671.0, 381587.0, 425782.0, 435985.0, 410916.0, 357859.0, 291090.0, 222501.0, 163635.0, 115944.0, 79599.0, 53132.0, 35038.0, 22866.0, 14287.0, 9307.0, 6058.0, 3731.0, 2283.0, 1512.0, 942.0, 596.0, 334.0, 218.0, 126.0, 86.0, 42.0, 34.0, 14.0, 11.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.1953125, -11.779052734375, -11.36279296875, -10.946533203125, -10.5302734375, -10.114013671875, -9.69775390625, -9.281494140625, -8.865234375, -8.448974609375, -8.03271484375, -7.616455078125, -7.2001953125, -6.783935546875, -6.36767578125, -5.951416015625, -5.53515625, -5.118896484375, -4.70263671875, -4.286376953125, -3.8701171875, -3.453857421875, -3.03759765625, -2.621337890625, -2.205078125, -1.788818359375, -1.37255859375, -0.956298828125, -0.5400390625, -0.123779296875, 0.29248046875, 0.708740234375, 1.125, 1.541259765625, 1.95751953125, 2.373779296875, 2.7900390625, 3.206298828125, 3.62255859375, 4.038818359375, 4.455078125, 4.871337890625, 5.28759765625, 5.703857421875, 6.1201171875, 6.536376953125, 6.95263671875, 7.368896484375, 7.78515625, 8.201416015625, 8.61767578125, 9.033935546875, 9.4501953125, 9.866455078125, 10.28271484375, 10.698974609375, 11.115234375, 11.531494140625, 11.94775390625, 12.364013671875, 12.7802734375, 13.196533203125, 13.61279296875, 14.029052734375, 14.4453125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 4.0, 5.0, 11.0, 8.0, 14.0, 10.0, 21.0, 14.0, 16.0, 22.0, 19.0, 23.0, 23.0, 30.0, 23.0, 28.0, 41.0, 41.0, 50.0, 44.0, 42.0, 35.0, 32.0, 37.0, 45.0, 35.0, 27.0, 35.0, 29.0, 29.0, 28.0, 20.0, 23.0, 15.0, 20.0, 12.0, 17.0, 14.0, 15.0, 7.0, 8.0, 6.0, 3.0, 3.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.5625, -13.1275634765625, -12.692626953125, -12.2576904296875, -11.82275390625, -11.3878173828125, -10.952880859375, -10.5179443359375, -10.0830078125, -9.6480712890625, -9.213134765625, -8.7781982421875, -8.34326171875, -7.9083251953125, -7.473388671875, -7.0384521484375, -6.603515625, -6.1685791015625, -5.733642578125, -5.2987060546875, -4.86376953125, -4.4288330078125, -3.993896484375, -3.5589599609375, -3.1240234375, -2.6890869140625, -2.254150390625, -1.8192138671875, -1.38427734375, -0.9493408203125, -0.514404296875, -0.0794677734375, 0.35546875, 0.7904052734375, 1.225341796875, 1.6602783203125, 2.09521484375, 2.5301513671875, 2.965087890625, 3.4000244140625, 3.8349609375, 4.2698974609375, 4.704833984375, 5.1397705078125, 5.57470703125, 6.0096435546875, 6.444580078125, 6.8795166015625, 7.314453125, 7.7493896484375, 8.184326171875, 8.6192626953125, 9.05419921875, 9.4891357421875, 9.924072265625, 10.3590087890625, 10.7939453125, 11.2288818359375, 11.663818359375, 12.0987548828125, 12.53369140625, 12.9686279296875, 13.403564453125, 13.8385009765625, 14.2734375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 14.0, 17.0, 34.0, 41.0, 95.0, 136.0, 249.0, 412.0, 689.0, 1142.0, 1992.0, 3209.0, 5357.0, 8892.0, 14524.0, 23432.0, 36690.0, 56037.0, 84491.0, 122558.0, 173219.0, 232053.0, 294147.0, 354749.0, 398549.0, 419177.0, 409500.0, 371827.0, 317128.0, 253806.0, 192536.0, 139641.0, 96951.0, 65345.0, 43445.0, 27869.0, 17398.0, 10718.0, 6469.0, 3931.0, 2361.0, 1411.0, 787.0, 550.0, 299.0, 171.0, 96.0, 58.0, 38.0, 26.0, 12.0, 9.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-12.765625, -12.375, -11.984375, -11.59375, -11.203125, -10.8125, -10.421875, -10.03125, -9.640625, -9.25, -8.859375, -8.46875, -8.078125, -7.6875, -7.296875, -6.90625, -6.515625, -6.125, -5.734375, -5.34375, -4.953125, -4.5625, -4.171875, -3.78125, -3.390625, -3.0, -2.609375, -2.21875, -1.828125, -1.4375, -1.046875, -0.65625, -0.265625, 0.125, 0.515625, 0.90625, 1.296875, 1.6875, 2.078125, 2.46875, 2.859375, 3.25, 3.640625, 4.03125, 4.421875, 4.8125, 5.203125, 5.59375, 5.984375, 6.375, 6.765625, 7.15625, 7.546875, 7.9375, 8.328125, 8.71875, 9.109375, 9.5, 9.890625, 10.28125, 10.671875, 11.0625, 11.453125, 11.84375, 12.234375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 1.0, 8.0, 7.0, 6.0, 14.0, 14.0, 12.0, 18.0, 27.0, 31.0, 31.0, 56.0, 66.0, 62.0, 98.0, 106.0, 125.0, 156.0, 162.0, 176.0, 190.0, 190.0, 205.0, 201.0, 214.0, 242.0, 202.0, 192.0, 197.0, 146.0, 165.0, 138.0, 122.0, 105.0, 82.0, 59.0, 60.0, 49.0, 35.0, 30.0, 23.0, 19.0, 11.0, 11.0, 4.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.83203125, -6.59185791015625, -6.3516845703125, -6.11151123046875, -5.871337890625, -5.63116455078125, -5.3909912109375, -5.15081787109375, -4.91064453125, -4.67047119140625, -4.4302978515625, -4.19012451171875, -3.949951171875, -3.70977783203125, -3.4696044921875, -3.22943115234375, -2.9892578125, -2.74908447265625, -2.5089111328125, -2.26873779296875, -2.028564453125, -1.78839111328125, -1.5482177734375, -1.30804443359375, -1.06787109375, -0.82769775390625, -0.5875244140625, -0.34735107421875, -0.107177734375, 0.13299560546875, 0.3731689453125, 0.61334228515625, 0.853515625, 1.09368896484375, 1.3338623046875, 1.57403564453125, 1.814208984375, 2.05438232421875, 2.2945556640625, 2.53472900390625, 2.77490234375, 3.01507568359375, 3.2552490234375, 3.49542236328125, 3.735595703125, 3.97576904296875, 4.2159423828125, 4.45611572265625, 4.6962890625, 4.93646240234375, 5.1766357421875, 5.41680908203125, 5.656982421875, 5.89715576171875, 6.1373291015625, 6.37750244140625, 6.61767578125, 6.85784912109375, 7.0980224609375, 7.33819580078125, 7.578369140625, 7.81854248046875, 8.0587158203125, 8.29888916015625, 8.5390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 8.0, 10.0, 12.0, 12.0, 14.0, 18.0, 16.0, 25.0, 25.0, 22.0, 29.0, 31.0, 24.0, 30.0, 32.0, 34.0, 60.0, 44.0, 43.0, 42.0, 44.0, 35.0, 37.0, 38.0, 35.0, 28.0, 28.0, 31.0, 24.0, 22.0, 22.0, 12.0, 17.0, 13.0, 9.0, 8.0, 12.0, 7.0, 6.0, 11.0, 8.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-15.44028377532959, -14.9876127243042, -14.534941673278809, -14.082270622253418, -13.629599571228027, -13.176928520202637, -12.724257469177246, -12.271586418151855, -11.818915367126465, -11.366244316101074, -10.913573265075684, -10.460902214050293, -10.008231163024902, -9.555560111999512, -9.102889060974121, -8.65021800994873, -8.19754695892334, -7.744875907897949, -7.292204856872559, -6.839533805847168, -6.386862754821777, -5.934191703796387, -5.481520652770996, -5.0288496017456055, -4.576178550720215, -4.123507499694824, -3.6708364486694336, -3.218165397644043, -2.7654943466186523, -2.3128232955932617, -1.860152244567871, -1.4074811935424805, -0.9548101425170898, -0.5021390914916992, -0.049468040466308594, 0.40320301055908203, 0.8558740615844727, 1.3085451126098633, 1.761216163635254, 2.2138872146606445, 2.666558265686035, 3.119229316711426, 3.5719003677368164, 4.024571418762207, 4.477242469787598, 4.929913520812988, 5.382584571838379, 5.8352556228637695, 6.28792667388916, 6.740597724914551, 7.193268775939941, 7.645939826965332, 8.098610877990723, 8.551281929016113, 9.003952980041504, 9.456624031066895, 9.909295082092285, 10.361966133117676, 10.814637184143066, 11.267308235168457, 11.719979286193848, 12.172650337219238, 12.625321388244629, 13.07799243927002, 13.53066349029541]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 3.0, 3.0, 4.0, 8.0, 17.0, 13.0, 10.0, 15.0, 13.0, 18.0, 21.0, 25.0, 31.0, 28.0, 45.0, 28.0, 35.0, 32.0, 41.0, 36.0, 36.0, 33.0, 33.0, 23.0, 42.0, 49.0, 25.0, 40.0, 27.0, 25.0, 37.0, 25.0, 24.0, 18.0, 14.0, 19.0, 16.0, 14.0, 16.0, 8.0, 6.0, 11.0, 7.0, 2.0, 4.0, 5.0, 3.0, 4.0, 4.0, 6.0], "bins": [-19.3382568359375, -18.801128387451172, -18.263999938964844, -17.726871490478516, -17.189743041992188, -16.65261459350586, -16.11548614501953, -15.578357696533203, -15.041229248046875, -14.504100799560547, -13.966972351074219, -13.42984390258789, -12.892715454101562, -12.355587005615234, -11.818458557128906, -11.281330108642578, -10.744200706481934, -10.207072257995605, -9.669943809509277, -9.13281536102295, -8.595686912536621, -8.058558464050293, -7.521429538726807, -6.9843010902404785, -6.44717264175415, -5.910044193267822, -5.372915744781494, -4.835786819458008, -4.29865837097168, -3.7615301609039307, -3.2244014739990234, -2.6872730255126953, -2.150143623352051, -1.6130151748657227, -1.075886607170105, -0.5387580394744873, -0.0016295909881591797, 0.535498857498169, 1.0726275444030762, 1.6097559928894043, 2.1468844413757324, 2.6840128898620605, 3.2211413383483887, 3.758270025253296, 4.295398712158203, 4.832527160644531, 5.369655609130859, 5.9067840576171875, 6.443912506103516, 6.981040954589844, 7.518169403076172, 8.0552978515625, 8.592426300048828, 9.129554748535156, 9.666683197021484, 10.203811645507812, 10.74094009399414, 11.278068542480469, 11.815196990966797, 12.352325439453125, 12.889453887939453, 13.426582336425781, 13.96371078491211, 14.500839233398438, 15.037968635559082]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 9.0, 14.0, 23.0, 34.0, 45.0, 70.0, 101.0, 162.0, 246.0, 392.0, 668.0, 1021.0, 1738.0, 2840.0, 4824.0, 7796.0, 12427.0, 19495.0, 30033.0, 44036.0, 61576.0, 80573.0, 98672.0, 110680.0, 115043.0, 108874.0, 95454.0, 76997.0, 57829.0, 41244.0, 27837.0, 18263.0, 11511.0, 6960.0, 4259.0, 2567.0, 1697.0, 952.0, 624.0, 361.0, 222.0, 138.0, 93.0, 55.0, 31.0, 27.0, 17.0, 9.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.2265625, -6.9888916015625, -6.751220703125, -6.5135498046875, -6.27587890625, -6.0382080078125, -5.800537109375, -5.5628662109375, -5.3251953125, -5.0875244140625, -4.849853515625, -4.6121826171875, -4.37451171875, -4.1368408203125, -3.899169921875, -3.6614990234375, -3.423828125, -3.1861572265625, -2.948486328125, -2.7108154296875, -2.47314453125, -2.2354736328125, -1.997802734375, -1.7601318359375, -1.5224609375, -1.2847900390625, -1.047119140625, -0.8094482421875, -0.57177734375, -0.3341064453125, -0.096435546875, 0.1412353515625, 0.37890625, 0.6165771484375, 0.854248046875, 1.0919189453125, 1.32958984375, 1.5672607421875, 1.804931640625, 2.0426025390625, 2.2802734375, 2.5179443359375, 2.755615234375, 2.9932861328125, 3.23095703125, 3.4686279296875, 3.706298828125, 3.9439697265625, 4.181640625, 4.4193115234375, 4.656982421875, 4.8946533203125, 5.13232421875, 5.3699951171875, 5.607666015625, 5.8453369140625, 6.0830078125, 6.3206787109375, 6.558349609375, 6.7960205078125, 7.03369140625, 7.2713623046875, 7.509033203125, 7.7467041015625, 7.984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 3.0, 3.0, 3.0, 5.0, 7.0, 18.0, 13.0, 11.0, 14.0, 13.0, 21.0, 17.0, 30.0, 29.0, 27.0, 42.0, 33.0, 32.0, 37.0, 37.0, 34.0, 34.0, 40.0, 30.0, 23.0, 40.0, 50.0, 29.0, 39.0, 24.0, 27.0, 35.0, 29.0, 16.0, 26.0, 15.0, 15.0, 11.0, 18.0, 14.0, 8.0, 6.0, 14.0, 5.0, 2.0, 4.0, 6.0, 3.0, 4.0, 3.0, 6.0], "bins": [-19.625, -19.0799560546875, -18.534912109375, -17.9898681640625, -17.44482421875, -16.8997802734375, -16.354736328125, -15.8096923828125, -15.2646484375, -14.7196044921875, -14.174560546875, -13.6295166015625, -13.08447265625, -12.5394287109375, -11.994384765625, -11.4493408203125, -10.904296875, -10.3592529296875, -9.814208984375, -9.2691650390625, -8.72412109375, -8.1790771484375, -7.634033203125, -7.0889892578125, -6.5439453125, -5.9989013671875, -5.453857421875, -4.9088134765625, -4.36376953125, -3.8187255859375, -3.273681640625, -2.7286376953125, -2.18359375, -1.6385498046875, -1.093505859375, -0.5484619140625, -0.00341796875, 0.5416259765625, 1.086669921875, 1.6317138671875, 2.1767578125, 2.7218017578125, 3.266845703125, 3.8118896484375, 4.35693359375, 4.9019775390625, 5.447021484375, 5.9920654296875, 6.537109375, 7.0821533203125, 7.627197265625, 8.1722412109375, 8.71728515625, 9.2623291015625, 9.807373046875, 10.3524169921875, 10.8974609375, 11.4425048828125, 11.987548828125, 12.5325927734375, 13.07763671875, 13.6226806640625, 14.167724609375, 14.7127685546875, 15.2578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 7.0, 11.0, 11.0, 25.0, 30.0, 30.0, 62.0, 84.0, 134.0, 176.0, 264.0, 382.0, 547.0, 783.0, 1110.0, 1603.0, 2389.0, 3624.0, 5206.0, 7558.0, 11256.0, 16775.0, 26696.0, 128541.0, 737799.0, 38567.0, 21109.0, 13856.0, 9419.0, 6407.0, 4449.0, 2982.0, 2046.0, 1463.0, 994.0, 654.0, 462.0, 340.0, 198.0, 165.0, 100.0, 66.0, 58.0, 42.0, 24.0, 18.0, 10.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-15.6640625, -15.193359375, -14.72265625, -14.251953125, -13.78125, -13.310546875, -12.83984375, -12.369140625, -11.8984375, -11.427734375, -10.95703125, -10.486328125, -10.015625, -9.544921875, -9.07421875, -8.603515625, -8.1328125, -7.662109375, -7.19140625, -6.720703125, -6.25, -5.779296875, -5.30859375, -4.837890625, -4.3671875, -3.896484375, -3.42578125, -2.955078125, -2.484375, -2.013671875, -1.54296875, -1.072265625, -0.6015625, -0.130859375, 0.33984375, 0.810546875, 1.28125, 1.751953125, 2.22265625, 2.693359375, 3.1640625, 3.634765625, 4.10546875, 4.576171875, 5.046875, 5.517578125, 5.98828125, 6.458984375, 6.9296875, 7.400390625, 7.87109375, 8.341796875, 8.8125, 9.283203125, 9.75390625, 10.224609375, 10.6953125, 11.166015625, 11.63671875, 12.107421875, 12.578125, 13.048828125, 13.51953125, 13.990234375, 14.4609375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 7.0, 3.0, 11.0, 8.0, 10.0, 7.0, 14.0, 23.0, 21.0, 17.0, 20.0, 34.0, 19.0, 29.0, 38.0, 39.0, 32.0, 41.0, 38.0, 37.0, 40.0, 52.0, 35.0, 48.0, 33.0, 39.0, 46.0, 38.0, 33.0, 21.0, 24.0, 20.0, 16.0, 15.0, 17.0, 10.0, 14.0, 11.0, 9.0, 10.0, 7.0, 2.0, 5.0, 1.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.8828125, -15.3963623046875, -14.909912109375, -14.4234619140625, -13.93701171875, -13.4505615234375, -12.964111328125, -12.4776611328125, -11.9912109375, -11.5047607421875, -11.018310546875, -10.5318603515625, -10.04541015625, -9.5589599609375, -9.072509765625, -8.5860595703125, -8.099609375, -7.6131591796875, -7.126708984375, -6.6402587890625, -6.15380859375, -5.6673583984375, -5.180908203125, -4.6944580078125, -4.2080078125, -3.7215576171875, -3.235107421875, -2.7486572265625, -2.26220703125, -1.7757568359375, -1.289306640625, -0.8028564453125, -0.31640625, 0.1700439453125, 0.656494140625, 1.1429443359375, 1.62939453125, 2.1158447265625, 2.602294921875, 3.0887451171875, 3.5751953125, 4.0616455078125, 4.548095703125, 5.0345458984375, 5.52099609375, 6.0074462890625, 6.493896484375, 6.9803466796875, 7.466796875, 7.9532470703125, 8.439697265625, 8.9261474609375, 9.41259765625, 9.8990478515625, 10.385498046875, 10.8719482421875, 11.3583984375, 11.8448486328125, 12.331298828125, 12.8177490234375, 13.30419921875, 13.7906494140625, 14.277099609375, 14.7635498046875, 15.25]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 4.0, 7.0, 12.0, 10.0, 18.0, 25.0, 36.0, 51.0, 68.0, 90.0, 159.0, 205.0, 263.0, 399.0, 552.0, 829.0, 1267.0, 1884.0, 2726.0, 4169.0, 6568.0, 10610.0, 17040.0, 29616.0, 186617.0, 685130.0, 43221.0, 20825.0, 12802.0, 8095.0, 5073.0, 3269.0, 2145.0, 1505.0, 969.0, 716.0, 471.0, 323.0, 228.0, 167.0, 120.0, 64.0, 66.0, 37.0, 38.0, 18.0, 14.0, 9.0, 8.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-2.349609375, -2.27667236328125, -2.2037353515625, -2.13079833984375, -2.057861328125, -1.98492431640625, -1.9119873046875, -1.83905029296875, -1.76611328125, -1.69317626953125, -1.6202392578125, -1.54730224609375, -1.474365234375, -1.40142822265625, -1.3284912109375, -1.25555419921875, -1.1826171875, -1.10968017578125, -1.0367431640625, -0.96380615234375, -0.890869140625, -0.81793212890625, -0.7449951171875, -0.67205810546875, -0.59912109375, -0.52618408203125, -0.4532470703125, -0.38031005859375, -0.307373046875, -0.23443603515625, -0.1614990234375, -0.08856201171875, -0.015625, 0.05731201171875, 0.1302490234375, 0.20318603515625, 0.276123046875, 0.34906005859375, 0.4219970703125, 0.49493408203125, 0.56787109375, 0.64080810546875, 0.7137451171875, 0.78668212890625, 0.859619140625, 0.93255615234375, 1.0054931640625, 1.07843017578125, 1.1513671875, 1.22430419921875, 1.2972412109375, 1.37017822265625, 1.443115234375, 1.51605224609375, 1.5889892578125, 1.66192626953125, 1.73486328125, 1.80780029296875, 1.8807373046875, 1.95367431640625, 2.026611328125, 2.09954833984375, 2.1724853515625, 2.24542236328125, 2.318359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 3.0, 5.0, 9.0, 7.0, 12.0, 10.0, 11.0, 21.0, 25.0, 27.0, 42.0, 31.0, 43.0, 54.0, 54.0, 75.0, 68.0, 50.0, 69.0, 54.0, 56.0, 59.0, 41.0, 31.0, 22.0, 27.0, 14.0, 18.0, 10.0, 10.0, 9.0, 8.0, 4.0, 5.0, 6.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000545501708984375, -0.000528089702129364, -0.000510677695274353, -0.000493265688419342, -0.00047585368156433105, -0.00045844167470932007, -0.0004410296678543091, -0.0004236176609992981, -0.0004062056541442871, -0.0003887936472892761, -0.00037138164043426514, -0.00035396963357925415, -0.00033655762672424316, -0.0003191456198692322, -0.0003017336130142212, -0.0002843216061592102, -0.0002669095993041992, -0.00024949759244918823, -0.00023208558559417725, -0.00021467357873916626, -0.00019726157188415527, -0.0001798495650291443, -0.0001624375581741333, -0.00014502555131912231, -0.00012761354446411133, -0.00011020153760910034, -9.278953075408936e-05, -7.537752389907837e-05, -5.796551704406738e-05, -4.0553510189056396e-05, -2.314150333404541e-05, -5.729496479034424e-06, 1.1682510375976562e-05, 2.909451723098755e-05, 4.6506524085998535e-05, 6.391853094100952e-05, 8.133053779602051e-05, 9.87425446510315e-05, 0.00011615455150604248, 0.00013356655836105347, 0.00015097856521606445, 0.00016839057207107544, 0.00018580257892608643, 0.0002032145857810974, 0.0002206265926361084, 0.00023803859949111938, 0.00025545060634613037, 0.00027286261320114136, 0.00029027462005615234, 0.00030768662691116333, 0.0003250986337661743, 0.0003425106406211853, 0.0003599226474761963, 0.0003773346543312073, 0.00039474666118621826, 0.00041215866804122925, 0.00042957067489624023, 0.0004469826817512512, 0.0004643946886062622, 0.0004818066954612732, 0.0004992187023162842, 0.0005166307091712952, 0.0005340427160263062, 0.0005514547228813171, 0.0005688667297363281]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 11.0, 7.0, 19.0, 30.0, 43.0, 76.0, 125.0, 189.0, 360.0, 493.0, 829.0, 1400.0, 2287.0, 3544.0, 5518.0, 8870.0, 13795.0, 21479.0, 33475.0, 49996.0, 71907.0, 96014.0, 118181.0, 129504.0, 125472.0, 107214.0, 83263.0, 60109.0, 40606.0, 26606.0, 17352.0, 11003.0, 6950.0, 4437.0, 2811.0, 1732.0, 1090.0, 691.0, 435.0, 244.0, 144.0, 95.0, 55.0, 39.0, 23.0, 17.0, 7.0, 7.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8720703125, -0.8454360961914062, -0.8188018798828125, -0.7921676635742188, -0.765533447265625, -0.7388992309570312, -0.7122650146484375, -0.6856307983398438, -0.65899658203125, -0.6323623657226562, -0.6057281494140625, -0.5790939331054688, -0.552459716796875, -0.5258255004882812, -0.4991912841796875, -0.47255706787109375, -0.4459228515625, -0.41928863525390625, -0.3926544189453125, -0.36602020263671875, -0.339385986328125, -0.31275177001953125, -0.2861175537109375, -0.25948333740234375, -0.23284912109375, -0.20621490478515625, -0.1795806884765625, -0.15294647216796875, -0.126312255859375, -0.09967803955078125, -0.0730438232421875, -0.04640960693359375, -0.019775390625, 0.00685882568359375, 0.0334930419921875, 0.06012725830078125, 0.086761474609375, 0.11339569091796875, 0.1400299072265625, 0.16666412353515625, 0.19329833984375, 0.21993255615234375, 0.2465667724609375, 0.27320098876953125, 0.299835205078125, 0.32646942138671875, 0.3531036376953125, 0.37973785400390625, 0.4063720703125, 0.43300628662109375, 0.4596405029296875, 0.48627471923828125, 0.512908935546875, 0.5395431518554688, 0.5661773681640625, 0.5928115844726562, 0.61944580078125, 0.6460800170898438, 0.6727142333984375, 0.6993484497070312, 0.725982666015625, 0.7526168823242188, 0.7792510986328125, 0.8058853149414062, 0.83251953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 6.0, 6.0, 3.0, 5.0, 5.0, 6.0, 7.0, 10.0, 14.0, 16.0, 12.0, 17.0, 21.0, 24.0, 41.0, 44.0, 45.0, 41.0, 50.0, 27.0, 45.0, 46.0, 47.0, 39.0, 37.0, 51.0, 36.0, 43.0, 40.0, 32.0, 25.0, 29.0, 25.0, 22.0, 15.0, 14.0, 7.0, 6.0, 6.0, 5.0, 7.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.388671875, -0.3764762878417969, -0.36428070068359375, -0.3520851135253906, -0.3398895263671875, -0.3276939392089844, -0.31549835205078125, -0.3033027648925781, -0.291107177734375, -0.2789115905761719, -0.26671600341796875, -0.2545204162597656, -0.2423248291015625, -0.23012924194335938, -0.21793365478515625, -0.20573806762695312, -0.19354248046875, -0.18134689331054688, -0.16915130615234375, -0.15695571899414062, -0.1447601318359375, -0.13256454467773438, -0.12036895751953125, -0.10817337036132812, -0.095977783203125, -0.08378219604492188, -0.07158660888671875, -0.059391021728515625, -0.0471954345703125, -0.034999847412109375, -0.02280426025390625, -0.010608673095703125, 0.0015869140625, 0.013782501220703125, 0.02597808837890625, 0.038173675537109375, 0.0503692626953125, 0.06256484985351562, 0.07476043701171875, 0.08695602416992188, 0.099151611328125, 0.11134719848632812, 0.12354278564453125, 0.13573837280273438, 0.1479339599609375, 0.16012954711914062, 0.17232513427734375, 0.18452072143554688, 0.19671630859375, 0.20891189575195312, 0.22110748291015625, 0.23330307006835938, 0.2454986572265625, 0.2576942443847656, 0.26988983154296875, 0.2820854187011719, 0.294281005859375, 0.3064765930175781, 0.31867218017578125, 0.3308677673339844, 0.3430633544921875, 0.3552589416503906, 0.36745452880859375, 0.3796501159667969, 0.391845703125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 3.0, 4.0, 7.0, 10.0, 6.0, 16.0, 17.0, 22.0, 28.0, 23.0, 38.0, 18.0, 31.0, 29.0, 46.0, 55.0, 44.0, 53.0, 41.0, 42.0, 55.0, 38.0, 53.0, 35.0, 40.0, 34.0, 28.0, 27.0, 16.0, 23.0, 25.0, 20.0, 11.0, 13.0, 5.0, 5.0, 12.0, 7.0, 0.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.711380004882812, -17.18816375732422, -16.664947509765625, -16.14173126220703, -15.618515014648438, -15.095298767089844, -14.57208251953125, -14.048866271972656, -13.525650024414062, -13.002433776855469, -12.479217529296875, -11.956001281738281, -11.432785034179688, -10.909568786621094, -10.3863525390625, -9.863136291503906, -9.339920997619629, -8.816704750061035, -8.293488502502441, -7.770272254943848, -7.247056007385254, -6.72383975982666, -6.200623989105225, -5.677407741546631, -5.154191493988037, -4.630975246429443, -4.10775899887085, -3.584542989730835, -3.061326742172241, -2.5381104946136475, -2.014894485473633, -1.491678237915039, -0.9684629440307617, -0.44524675607681274, 0.07796943187713623, 0.6011855602264404, 1.1244018077850342, 1.647618055343628, 2.1708340644836426, 2.6940503120422363, 3.21726655960083, 3.740482807159424, 4.263699054718018, 4.786914825439453, 5.310131072998047, 5.833347320556641, 6.356563568115234, 6.879779815673828, 7.402996063232422, 7.926212310791016, 8.44942855834961, 8.972644805908203, 9.495861053466797, 10.01907730102539, 10.542293548583984, 11.065509796142578, 11.588726043701172, 12.111942291259766, 12.63515853881836, 13.158374786376953, 13.681591033935547, 14.20480728149414, 14.728023529052734, 15.251239776611328, 15.774455070495605]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 7.0, 3.0, 7.0, 3.0, 14.0, 12.0, 8.0, 17.0, 14.0, 21.0, 13.0, 17.0, 33.0, 35.0, 24.0, 27.0, 40.0, 45.0, 27.0, 39.0, 42.0, 24.0, 36.0, 35.0, 37.0, 38.0, 42.0, 42.0, 28.0, 32.0, 25.0, 35.0, 21.0, 19.0, 22.0, 17.0, 12.0, 15.0, 20.0, 7.0, 9.0, 7.0, 7.0, 7.0, 2.0, 7.0, 2.0, 4.0, 5.0, 1.0, 5.0], "bins": [-19.915565490722656, -19.358291625976562, -18.80101776123047, -18.243743896484375, -17.68647003173828, -17.129196166992188, -16.571922302246094, -16.0146484375, -15.45737361907959, -14.900099754333496, -14.342825889587402, -13.785552024841309, -13.228277206420898, -12.671003341674805, -12.113729476928711, -11.556455612182617, -10.999181747436523, -10.44190788269043, -9.884634017944336, -9.327360153198242, -8.770086288452148, -8.212812423706055, -7.6555376052856445, -7.098263740539551, -6.540989875793457, -5.983716011047363, -5.4264421463012695, -4.869167804718018, -4.311893939971924, -3.75462007522583, -3.1973459720611572, -2.6400718688964844, -2.0827980041503906, -1.5255240201950073, -0.968250036239624, -0.4109760522842407, 0.14629793167114258, 0.7035717964172363, 1.2608458995819092, 1.818120002746582, 2.375393867492676, 2.9326677322387695, 3.4899418354034424, 4.047215938568115, 4.604489803314209, 5.161763668060303, 5.719038009643555, 6.276311874389648, 6.833585739135742, 7.390859603881836, 7.94813346862793, 8.505407333374023, 9.062681198120117, 9.619955062866211, 10.177229881286621, 10.734503746032715, 11.291777610778809, 11.849051475524902, 12.406325340270996, 12.96359920501709, 13.5208740234375, 14.078147888183594, 14.635421752929688, 15.192695617675781, 15.749969482421875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 5.0, 4.0, 3.0, 6.0, 12.0, 21.0, 44.0, 49.0, 69.0, 107.0, 168.0, 262.0, 365.0, 570.0, 874.0, 1357.0, 2180.0, 3466.0, 5388.0, 8616.0, 13029.0, 19395.0, 29226.0, 41299.0, 56425.0, 73774.0, 89506.0, 101445.0, 107133.0, 104729.0, 95373.0, 80095.0, 64162.0, 47923.0, 34012.0, 23278.0, 15762.0, 10242.0, 6676.0, 4186.0, 2650.0, 1664.0, 1068.0, 647.0, 468.0, 254.0, 171.0, 139.0, 83.0, 57.0, 44.0, 32.0, 19.0, 10.0, 8.0, 8.0, 3.0, 3.0, 3.0, 2.0], "bins": [-13.1875, -12.784423828125, -12.38134765625, -11.978271484375, -11.5751953125, -11.172119140625, -10.76904296875, -10.365966796875, -9.962890625, -9.559814453125, -9.15673828125, -8.753662109375, -8.3505859375, -7.947509765625, -7.54443359375, -7.141357421875, -6.73828125, -6.335205078125, -5.93212890625, -5.529052734375, -5.1259765625, -4.722900390625, -4.31982421875, -3.916748046875, -3.513671875, -3.110595703125, -2.70751953125, -2.304443359375, -1.9013671875, -1.498291015625, -1.09521484375, -0.692138671875, -0.2890625, 0.114013671875, 0.51708984375, 0.920166015625, 1.3232421875, 1.726318359375, 2.12939453125, 2.532470703125, 2.935546875, 3.338623046875, 3.74169921875, 4.144775390625, 4.5478515625, 4.950927734375, 5.35400390625, 5.757080078125, 6.16015625, 6.563232421875, 6.96630859375, 7.369384765625, 7.7724609375, 8.175537109375, 8.57861328125, 8.981689453125, 9.384765625, 9.787841796875, 10.19091796875, 10.593994140625, 10.9970703125, 11.400146484375, 11.80322265625, 12.206298828125, 12.609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 6.0, 2.0, 16.0, 13.0, 5.0, 16.0, 17.0, 22.0, 14.0, 19.0, 29.0, 36.0, 26.0, 28.0, 43.0, 40.0, 29.0, 42.0, 38.0, 25.0, 36.0, 36.0, 34.0, 39.0, 38.0, 44.0, 30.0, 33.0, 23.0, 38.0, 20.0, 18.0, 18.0, 17.0, 17.0, 15.0, 15.0, 7.0, 8.0, 9.0, 5.0, 5.0, 5.0, 5.0, 2.0, 4.0, 5.0, 2.0, 4.0], "bins": [-18.921875, -18.3892822265625, -17.856689453125, -17.3240966796875, -16.79150390625, -16.2589111328125, -15.726318359375, -15.1937255859375, -14.6611328125, -14.1285400390625, -13.595947265625, -13.0633544921875, -12.53076171875, -11.9981689453125, -11.465576171875, -10.9329833984375, -10.400390625, -9.8677978515625, -9.335205078125, -8.8026123046875, -8.27001953125, -7.7374267578125, -7.204833984375, -6.6722412109375, -6.1396484375, -5.6070556640625, -5.074462890625, -4.5418701171875, -4.00927734375, -3.4766845703125, -2.944091796875, -2.4114990234375, -1.87890625, -1.3463134765625, -0.813720703125, -0.2811279296875, 0.25146484375, 0.7840576171875, 1.316650390625, 1.8492431640625, 2.3818359375, 2.9144287109375, 3.447021484375, 3.9796142578125, 4.51220703125, 5.0447998046875, 5.577392578125, 6.1099853515625, 6.642578125, 7.1751708984375, 7.707763671875, 8.2403564453125, 8.77294921875, 9.3055419921875, 9.838134765625, 10.3707275390625, 10.9033203125, 11.4359130859375, 11.968505859375, 12.5010986328125, 13.03369140625, 13.5662841796875, 14.098876953125, 14.6314697265625, 15.1640625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 3.0, 3.0, 4.0, 2.0, 8.0, 10.0, 20.0, 20.0, 49.0, 73.0, 77.0, 121.0, 179.0, 304.0, 450.0, 732.0, 1164.0, 1885.0, 2966.0, 4918.0, 7955.0, 13014.0, 20699.0, 32366.0, 48397.0, 68893.0, 91366.0, 112161.0, 123502.0, 122251.0, 110113.0, 88827.0, 66311.0, 46385.0, 30994.0, 19872.0, 12379.0, 7688.0, 4553.0, 2938.0, 1837.0, 1127.0, 688.0, 446.0, 266.0, 179.0, 127.0, 106.0, 53.0, 33.0, 17.0, 18.0, 12.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.9765625, -15.4603271484375, -14.944091796875, -14.4278564453125, -13.91162109375, -13.3953857421875, -12.879150390625, -12.3629150390625, -11.8466796875, -11.3304443359375, -10.814208984375, -10.2979736328125, -9.78173828125, -9.2655029296875, -8.749267578125, -8.2330322265625, -7.716796875, -7.2005615234375, -6.684326171875, -6.1680908203125, -5.65185546875, -5.1356201171875, -4.619384765625, -4.1031494140625, -3.5869140625, -3.0706787109375, -2.554443359375, -2.0382080078125, -1.52197265625, -1.0057373046875, -0.489501953125, 0.0267333984375, 0.54296875, 1.0592041015625, 1.575439453125, 2.0916748046875, 2.60791015625, 3.1241455078125, 3.640380859375, 4.1566162109375, 4.6728515625, 5.1890869140625, 5.705322265625, 6.2215576171875, 6.73779296875, 7.2540283203125, 7.770263671875, 8.2864990234375, 8.802734375, 9.3189697265625, 9.835205078125, 10.3514404296875, 10.86767578125, 11.3839111328125, 11.900146484375, 12.4163818359375, 12.9326171875, 13.4488525390625, 13.965087890625, 14.4813232421875, 14.99755859375, 15.5137939453125, 16.030029296875, 16.5462646484375, 17.0625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 5.0, 3.0, 7.0, 11.0, 16.0, 17.0, 23.0, 24.0, 31.0, 32.0, 32.0, 29.0, 28.0, 29.0, 51.0, 41.0, 35.0, 53.0, 54.0, 39.0, 36.0, 30.0, 47.0, 30.0, 34.0, 28.0, 40.0, 37.0, 23.0, 22.0, 20.0, 17.0, 10.0, 14.0, 10.0, 12.0, 5.0, 5.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.8515625, -12.441650390625, -12.03173828125, -11.621826171875, -11.2119140625, -10.802001953125, -10.39208984375, -9.982177734375, -9.572265625, -9.162353515625, -8.75244140625, -8.342529296875, -7.9326171875, -7.522705078125, -7.11279296875, -6.702880859375, -6.29296875, -5.883056640625, -5.47314453125, -5.063232421875, -4.6533203125, -4.243408203125, -3.83349609375, -3.423583984375, -3.013671875, -2.603759765625, -2.19384765625, -1.783935546875, -1.3740234375, -0.964111328125, -0.55419921875, -0.144287109375, 0.265625, 0.675537109375, 1.08544921875, 1.495361328125, 1.9052734375, 2.315185546875, 2.72509765625, 3.135009765625, 3.544921875, 3.954833984375, 4.36474609375, 4.774658203125, 5.1845703125, 5.594482421875, 6.00439453125, 6.414306640625, 6.82421875, 7.234130859375, 7.64404296875, 8.053955078125, 8.4638671875, 8.873779296875, 9.28369140625, 9.693603515625, 10.103515625, 10.513427734375, 10.92333984375, 11.333251953125, 11.7431640625, 12.153076171875, 12.56298828125, 12.972900390625, 13.3828125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 10.0, 14.0, 20.0, 36.0, 44.0, 69.0, 99.0, 129.0, 180.0, 270.0, 436.0, 672.0, 1075.0, 1662.0, 2575.0, 4150.0, 6973.0, 11651.0, 19917.0, 34413.0, 57562.0, 90913.0, 129323.0, 157012.0, 158523.0, 131335.0, 93359.0, 59421.0, 35195.0, 20574.0, 11977.0, 7238.0, 4240.0, 2677.0, 1646.0, 1101.0, 670.0, 466.0, 316.0, 181.0, 150.0, 100.0, 58.0, 33.0, 33.0, 12.0, 17.0, 9.0, 10.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.4765625, -6.27435302734375, -6.0721435546875, -5.86993408203125, -5.667724609375, -5.46551513671875, -5.2633056640625, -5.06109619140625, -4.85888671875, -4.65667724609375, -4.4544677734375, -4.25225830078125, -4.050048828125, -3.84783935546875, -3.6456298828125, -3.44342041015625, -3.2412109375, -3.03900146484375, -2.8367919921875, -2.63458251953125, -2.432373046875, -2.23016357421875, -2.0279541015625, -1.82574462890625, -1.62353515625, -1.42132568359375, -1.2191162109375, -1.01690673828125, -0.814697265625, -0.61248779296875, -0.4102783203125, -0.20806884765625, -0.005859375, 0.19635009765625, 0.3985595703125, 0.60076904296875, 0.802978515625, 1.00518798828125, 1.2073974609375, 1.40960693359375, 1.61181640625, 1.81402587890625, 2.0162353515625, 2.21844482421875, 2.420654296875, 2.62286376953125, 2.8250732421875, 3.02728271484375, 3.2294921875, 3.43170166015625, 3.6339111328125, 3.83612060546875, 4.038330078125, 4.24053955078125, 4.4427490234375, 4.64495849609375, 4.84716796875, 5.04937744140625, 5.2515869140625, 5.45379638671875, 5.656005859375, 5.85821533203125, 6.0604248046875, 6.26263427734375, 6.46484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 14.0, 14.0, 15.0, 18.0, 25.0, 29.0, 29.0, 46.0, 48.0, 58.0, 70.0, 85.0, 59.0, 61.0, 71.0, 58.0, 64.0, 47.0, 33.0, 38.0, 31.0, 22.0, 16.0, 10.0, 10.0, 4.0, 7.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0010061264038085938, -0.0009785667061805725, -0.0009510070085525513, -0.00092344731092453, -0.0008958876132965088, -0.0008683279156684875, -0.0008407682180404663, -0.0008132085204124451, -0.0007856488227844238, -0.0007580891251564026, -0.0007305294275283813, -0.0007029697299003601, -0.0006754100322723389, -0.0006478503346443176, -0.0006202906370162964, -0.0005927309393882751, -0.0005651712417602539, -0.0005376115441322327, -0.0005100518465042114, -0.0004824921488761902, -0.00045493245124816895, -0.0004273727536201477, -0.00039981305599212646, -0.0003722533583641052, -0.000344693660736084, -0.00031713396310806274, -0.0002895742654800415, -0.00026201456785202026, -0.00023445487022399902, -0.00020689517259597778, -0.00017933547496795654, -0.0001517757773399353, -0.00012421607971191406, -9.665638208389282e-05, -6.909668445587158e-05, -4.153698682785034e-05, -1.3977289199829102e-05, 1.3582408428192139e-05, 4.114210605621338e-05, 6.870180368423462e-05, 9.626150131225586e-05, 0.0001238211989402771, 0.00015138089656829834, 0.00017894059419631958, 0.00020650029182434082, 0.00023405998945236206, 0.0002616196870803833, 0.00028917938470840454, 0.0003167390823364258, 0.000344298779964447, 0.00037185847759246826, 0.0003994181752204895, 0.00042697787284851074, 0.000454537570476532, 0.0004820972681045532, 0.0005096569657325745, 0.0005372166633605957, 0.0005647763609886169, 0.0005923360586166382, 0.0006198957562446594, 0.0006474554538726807, 0.0006750151515007019, 0.0007025748491287231, 0.0007301345467567444, 0.0007576942443847656]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 14.0, 10.0, 24.0, 20.0, 38.0, 56.0, 96.0, 104.0, 162.0, 229.0, 327.0, 457.0, 697.0, 930.0, 1527.0, 2223.0, 3380.0, 5258.0, 8530.0, 13173.0, 20888.0, 31852.0, 48262.0, 69902.0, 95216.0, 118006.0, 130153.0, 126313.0, 108808.0, 84485.0, 60624.0, 41196.0, 27181.0, 17230.0, 11023.0, 7043.0, 4516.0, 2855.0, 1875.0, 1199.0, 808.0, 563.0, 398.0, 280.0, 199.0, 139.0, 87.0, 64.0, 32.0, 33.0, 22.0, 23.0, 12.0, 6.0, 3.0, 6.0, 2.0, 2.0], "bins": [-5.47265625, -5.3057861328125, -5.138916015625, -4.9720458984375, -4.80517578125, -4.6383056640625, -4.471435546875, -4.3045654296875, -4.1376953125, -3.9708251953125, -3.803955078125, -3.6370849609375, -3.47021484375, -3.3033447265625, -3.136474609375, -2.9696044921875, -2.802734375, -2.6358642578125, -2.468994140625, -2.3021240234375, -2.13525390625, -1.9683837890625, -1.801513671875, -1.6346435546875, -1.4677734375, -1.3009033203125, -1.134033203125, -0.9671630859375, -0.80029296875, -0.6334228515625, -0.466552734375, -0.2996826171875, -0.1328125, 0.0340576171875, 0.200927734375, 0.3677978515625, 0.53466796875, 0.7015380859375, 0.868408203125, 1.0352783203125, 1.2021484375, 1.3690185546875, 1.535888671875, 1.7027587890625, 1.86962890625, 2.0364990234375, 2.203369140625, 2.3702392578125, 2.537109375, 2.7039794921875, 2.870849609375, 3.0377197265625, 3.20458984375, 3.3714599609375, 3.538330078125, 3.7052001953125, 3.8720703125, 4.0389404296875, 4.205810546875, 4.3726806640625, 4.53955078125, 4.7064208984375, 4.873291015625, 5.0401611328125, 5.20703125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 6.0, 6.0, 6.0, 9.0, 10.0, 14.0, 14.0, 20.0, 32.0, 24.0, 36.0, 35.0, 48.0, 59.0, 55.0, 65.0, 69.0, 70.0, 48.0, 63.0, 55.0, 47.0, 29.0, 39.0, 28.0, 20.0, 13.0, 18.0, 9.0, 10.0, 8.0, 10.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.6015625, -3.497772216796875, -3.39398193359375, -3.290191650390625, -3.1864013671875, -3.082611083984375, -2.97882080078125, -2.875030517578125, -2.771240234375, -2.667449951171875, -2.56365966796875, -2.459869384765625, -2.3560791015625, -2.252288818359375, -2.14849853515625, -2.044708251953125, -1.94091796875, -1.837127685546875, -1.73333740234375, -1.629547119140625, -1.5257568359375, -1.421966552734375, -1.31817626953125, -1.214385986328125, -1.110595703125, -1.006805419921875, -0.90301513671875, -0.799224853515625, -0.6954345703125, -0.591644287109375, -0.48785400390625, -0.384063720703125, -0.2802734375, -0.176483154296875, -0.07269287109375, 0.031097412109375, 0.1348876953125, 0.238677978515625, 0.34246826171875, 0.446258544921875, 0.550048828125, 0.653839111328125, 0.75762939453125, 0.861419677734375, 0.9652099609375, 1.069000244140625, 1.17279052734375, 1.276580810546875, 1.38037109375, 1.484161376953125, 1.58795166015625, 1.691741943359375, 1.7955322265625, 1.899322509765625, 2.00311279296875, 2.106903076171875, 2.210693359375, 2.314483642578125, 2.41827392578125, 2.522064208984375, 2.6258544921875, 2.729644775390625, 2.83343505859375, 2.937225341796875, 3.041015625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 3.0, 5.0, 2.0, 15.0, 10.0, 9.0, 20.0, 21.0, 23.0, 19.0, 25.0, 32.0, 31.0, 30.0, 42.0, 47.0, 56.0, 47.0, 61.0, 39.0, 40.0, 50.0, 45.0, 40.0, 39.0, 37.0, 35.0, 30.0, 17.0, 21.0, 25.0, 18.0, 15.0, 14.0, 8.0, 5.0, 4.0, 3.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.075115203857422, -19.527956008911133, -18.980798721313477, -18.433639526367188, -17.88648223876953, -17.339323043823242, -16.792165756225586, -16.245006561279297, -15.69784927368164, -15.150691032409668, -14.603532791137695, -14.056374549865723, -13.50921630859375, -12.962058067321777, -12.414899826049805, -11.867740631103516, -11.320582389831543, -10.77342414855957, -10.226265907287598, -9.679107666015625, -9.131949424743652, -8.58479118347168, -8.03763198852539, -7.490474224090576, -6.9433159828186035, -6.396157741546631, -5.848999500274658, -5.301840782165527, -4.754682540893555, -4.207524299621582, -3.6603660583496094, -3.1132078170776367, -2.5660486221313477, -2.018890380859375, -1.4717320203781128, -0.9245736598968506, -0.37741541862487793, 0.16974282264709473, 0.7169013023376465, 1.2640595436096191, 1.8112177848815918, 2.3583760261535645, 2.905534267425537, 3.452692747116089, 3.9998509883880615, 4.547009468078613, 5.094167709350586, 5.641325950622559, 6.188484191894531, 6.735642433166504, 7.282800674438477, 7.829958915710449, 8.377117156982422, 8.924275398254395, 9.471433639526367, 10.018592834472656, 10.565750122070312, 11.112908363342285, 11.660066604614258, 12.20722484588623, 12.754383087158203, 13.301541328430176, 13.848699569702148, 14.395858764648438, 14.94301700592041]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 8.0, 5.0, 5.0, 9.0, 8.0, 12.0, 10.0, 24.0, 15.0, 27.0, 19.0, 26.0, 35.0, 31.0, 36.0, 31.0, 31.0, 44.0, 44.0, 39.0, 37.0, 39.0, 45.0, 39.0, 38.0, 29.0, 39.0, 33.0, 28.0, 27.0, 27.0, 16.0, 23.0, 24.0, 6.0, 14.0, 14.0, 14.0, 9.0, 3.0, 6.0, 7.0, 5.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.2109375, -17.617185592651367, -17.023433685302734, -16.42967987060547, -15.835927963256836, -15.242176055908203, -14.648423194885254, -14.054670333862305, -13.460918426513672, -12.867166519165039, -12.27341365814209, -11.67966079711914, -11.085908889770508, -10.492156982421875, -9.898404121398926, -9.304651260375977, -8.710899353027344, -8.117147445678711, -7.523394584655762, -6.929642200469971, -6.33588981628418, -5.742137432098389, -5.148385047912598, -4.554632663726807, -3.9608802795410156, -3.3671278953552246, -2.7733755111694336, -2.1796231269836426, -1.5858707427978516, -0.9921183586120605, -0.39836597442626953, 0.19538640975952148, 0.7891368865966797, 1.3828892707824707, 1.9766416549682617, 2.5703940391540527, 3.1641464233398438, 3.7578988075256348, 4.351651191711426, 4.945403575897217, 5.539155960083008, 6.132908344268799, 6.72666072845459, 7.320413112640381, 7.914165496826172, 8.507917404174805, 9.101670265197754, 9.695423126220703, 10.289175033569336, 10.882926940917969, 11.476679801940918, 12.070432662963867, 12.6641845703125, 13.257936477661133, 13.851689338684082, 14.445442199707031, 15.039194107055664, 15.632946014404297, 16.226699829101562, 16.820451736450195, 17.414203643798828, 18.00795555114746, 18.601707458496094, 19.19546127319336, 19.789213180541992]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [3.0, 3.0, 8.0, 10.0, 13.0, 20.0, 39.0, 71.0, 86.0, 147.0, 234.0, 372.0, 548.0, 878.0, 1400.0, 2188.0, 3388.0, 5351.0, 8256.0, 12341.0, 18994.0, 28130.0, 42113.0, 61024.0, 88994.0, 123689.0, 171619.0, 225883.0, 284791.0, 342914.0, 385923.0, 407092.0, 398334.0, 362379.0, 310302.0, 249395.0, 191751.0, 142227.0, 102004.0, 71993.0, 49987.0, 33086.0, 22667.0, 15261.0, 9744.0, 6566.0, 4239.0, 2748.0, 1812.0, 1205.0, 774.0, 468.0, 299.0, 195.0, 131.0, 80.0, 35.0, 42.0, 23.0, 15.0, 8.0, 5.0, 5.0, 2.0], "bins": [-11.625, -11.2584228515625, -10.891845703125, -10.5252685546875, -10.15869140625, -9.7921142578125, -9.425537109375, -9.0589599609375, -8.6923828125, -8.3258056640625, -7.959228515625, -7.5926513671875, -7.22607421875, -6.8594970703125, -6.492919921875, -6.1263427734375, -5.759765625, -5.3931884765625, -5.026611328125, -4.6600341796875, -4.29345703125, -3.9268798828125, -3.560302734375, -3.1937255859375, -2.8271484375, -2.4605712890625, -2.093994140625, -1.7274169921875, -1.36083984375, -0.9942626953125, -0.627685546875, -0.2611083984375, 0.10546875, 0.4720458984375, 0.838623046875, 1.2052001953125, 1.57177734375, 1.9383544921875, 2.304931640625, 2.6715087890625, 3.0380859375, 3.4046630859375, 3.771240234375, 4.1378173828125, 4.50439453125, 4.8709716796875, 5.237548828125, 5.6041259765625, 5.970703125, 6.3372802734375, 6.703857421875, 7.0704345703125, 7.43701171875, 7.8035888671875, 8.170166015625, 8.5367431640625, 8.9033203125, 9.2698974609375, 9.636474609375, 10.0030517578125, 10.36962890625, 10.7362060546875, 11.102783203125, 11.4693603515625, 11.8359375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 7.0, 7.0, 5.0, 9.0, 6.0, 12.0, 12.0, 10.0, 20.0, 18.0, 23.0, 27.0, 23.0, 37.0, 33.0, 31.0, 25.0, 43.0, 39.0, 35.0, 42.0, 39.0, 37.0, 50.0, 30.0, 40.0, 35.0, 37.0, 30.0, 32.0, 25.0, 24.0, 15.0, 27.0, 18.0, 9.0, 16.0, 13.0, 11.0, 10.0, 5.0, 9.0, 6.0, 2.0, 8.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-16.359375, -15.845947265625, -15.33251953125, -14.819091796875, -14.3056640625, -13.792236328125, -13.27880859375, -12.765380859375, -12.251953125, -11.738525390625, -11.22509765625, -10.711669921875, -10.1982421875, -9.684814453125, -9.17138671875, -8.657958984375, -8.14453125, -7.631103515625, -7.11767578125, -6.604248046875, -6.0908203125, -5.577392578125, -5.06396484375, -4.550537109375, -4.037109375, -3.523681640625, -3.01025390625, -2.496826171875, -1.9833984375, -1.469970703125, -0.95654296875, -0.443115234375, 0.0703125, 0.583740234375, 1.09716796875, 1.610595703125, 2.1240234375, 2.637451171875, 3.15087890625, 3.664306640625, 4.177734375, 4.691162109375, 5.20458984375, 5.718017578125, 6.2314453125, 6.744873046875, 7.25830078125, 7.771728515625, 8.28515625, 8.798583984375, 9.31201171875, 9.825439453125, 10.3388671875, 10.852294921875, 11.36572265625, 11.879150390625, 12.392578125, 12.906005859375, 13.41943359375, 13.932861328125, 14.4462890625, 14.959716796875, 15.47314453125, 15.986572265625, 16.5]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 7.0, 9.0, 22.0, 24.0, 55.0, 65.0, 127.0, 204.0, 320.0, 526.0, 891.0, 1486.0, 2439.0, 4118.0, 6500.0, 10806.0, 17043.0, 27179.0, 42268.0, 64067.0, 94016.0, 136423.0, 188698.0, 249492.0, 312554.0, 370272.0, 407229.0, 418581.0, 400524.0, 356285.0, 298661.0, 233855.0, 175755.0, 126083.0, 86998.0, 58575.0, 38025.0, 24200.0, 15369.0, 9496.0, 5909.0, 3593.0, 2185.0, 1338.0, 811.0, 474.0, 278.0, 191.0, 114.0, 62.0, 44.0, 17.0, 9.0, 9.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0], "bins": [-12.9296875, -12.5177001953125, -12.105712890625, -11.6937255859375, -11.28173828125, -10.8697509765625, -10.457763671875, -10.0457763671875, -9.6337890625, -9.2218017578125, -8.809814453125, -8.3978271484375, -7.98583984375, -7.5738525390625, -7.161865234375, -6.7498779296875, -6.337890625, -5.9259033203125, -5.513916015625, -5.1019287109375, -4.68994140625, -4.2779541015625, -3.865966796875, -3.4539794921875, -3.0419921875, -2.6300048828125, -2.218017578125, -1.8060302734375, -1.39404296875, -0.9820556640625, -0.570068359375, -0.1580810546875, 0.25390625, 0.6658935546875, 1.077880859375, 1.4898681640625, 1.90185546875, 2.3138427734375, 2.725830078125, 3.1378173828125, 3.5498046875, 3.9617919921875, 4.373779296875, 4.7857666015625, 5.19775390625, 5.6097412109375, 6.021728515625, 6.4337158203125, 6.845703125, 7.2576904296875, 7.669677734375, 8.0816650390625, 8.49365234375, 8.9056396484375, 9.317626953125, 9.7296142578125, 10.1416015625, 10.5535888671875, 10.965576171875, 11.3775634765625, 11.78955078125, 12.2015380859375, 12.613525390625, 13.0255126953125, 13.4375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 8.0, 7.0, 11.0, 7.0, 16.0, 23.0, 19.0, 37.0, 58.0, 54.0, 68.0, 85.0, 86.0, 130.0, 149.0, 163.0, 175.0, 202.0, 193.0, 214.0, 231.0, 231.0, 202.0, 191.0, 211.0, 202.0, 176.0, 167.0, 139.0, 107.0, 99.0, 82.0, 77.0, 65.0, 39.0, 35.0, 29.0, 27.0, 16.0, 16.0, 12.0, 8.0, 8.0, 5.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.171875, -8.8990478515625, -8.626220703125, -8.3533935546875, -8.08056640625, -7.8077392578125, -7.534912109375, -7.2620849609375, -6.9892578125, -6.7164306640625, -6.443603515625, -6.1707763671875, -5.89794921875, -5.6251220703125, -5.352294921875, -5.0794677734375, -4.806640625, -4.5338134765625, -4.260986328125, -3.9881591796875, -3.71533203125, -3.4425048828125, -3.169677734375, -2.8968505859375, -2.6240234375, -2.3511962890625, -2.078369140625, -1.8055419921875, -1.53271484375, -1.2598876953125, -0.987060546875, -0.7142333984375, -0.44140625, -0.1685791015625, 0.104248046875, 0.3770751953125, 0.64990234375, 0.9227294921875, 1.195556640625, 1.4683837890625, 1.7412109375, 2.0140380859375, 2.286865234375, 2.5596923828125, 2.83251953125, 3.1053466796875, 3.378173828125, 3.6510009765625, 3.923828125, 4.1966552734375, 4.469482421875, 4.7423095703125, 5.01513671875, 5.2879638671875, 5.560791015625, 5.8336181640625, 6.1064453125, 6.3792724609375, 6.652099609375, 6.9249267578125, 7.19775390625, 7.4705810546875, 7.743408203125, 8.0162353515625, 8.2890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 11.0, 16.0, 17.0, 18.0, 21.0, 14.0, 25.0, 26.0, 31.0, 35.0, 35.0, 50.0, 34.0, 39.0, 39.0, 49.0, 52.0, 49.0, 46.0, 48.0, 40.0, 35.0, 36.0, 40.0, 30.0, 31.0, 15.0, 27.0, 16.0, 12.0, 10.0, 8.0, 9.0, 9.0, 3.0, 4.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.445018768310547, -19.851511001586914, -19.25800132751465, -18.664493560791016, -18.070985794067383, -17.47747802734375, -16.883968353271484, -16.29046058654785, -15.696951866149902, -15.103443145751953, -14.50993537902832, -13.916426658630371, -13.322917938232422, -12.729410171508789, -12.13590145111084, -11.54239273071289, -10.948884963989258, -10.355376243591309, -9.761868476867676, -9.168359756469727, -8.574851989746094, -7.9813432693481445, -7.387834548950195, -6.794326305389404, -6.200818061828613, -5.607309818267822, -5.013801574707031, -4.420292854309082, -3.826784610748291, -3.2332763671875, -2.63976788520813, -2.0462594032287598, -1.4527511596679688, -0.8592427968978882, -0.2657344341278076, 0.32777392864227295, 0.9212822914123535, 1.5147905349731445, 2.1082990169525146, 2.7018074989318848, 3.295315742492676, 3.888823986053467, 4.482332229614258, 5.075840950012207, 5.669349193572998, 6.262857437133789, 6.856366157531738, 7.449874401092529, 8.04338264465332, 8.63689136505127, 9.230399131774902, 9.823907852172852, 10.417415618896484, 11.010924339294434, 11.604433059692383, 12.197940826416016, 12.791449546813965, 13.384958267211914, 13.978466033935547, 14.571974754333496, 15.165483474731445, 15.758991241455078, 16.35249900817871, 16.946008682250977, 17.53951644897461]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 6.0, 6.0, 3.0, 11.0, 6.0, 10.0, 11.0, 14.0, 19.0, 19.0, 20.0, 31.0, 21.0, 28.0, 33.0, 37.0, 33.0, 43.0, 38.0, 36.0, 40.0, 30.0, 39.0, 27.0, 52.0, 28.0, 33.0, 35.0, 39.0, 29.0, 25.0, 27.0, 26.0, 25.0, 27.0, 16.0, 14.0, 8.0, 12.0, 5.0, 7.0, 6.0, 7.0, 3.0, 6.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-21.0124568939209, -20.368844985961914, -19.725234985351562, -19.081623077392578, -18.438011169433594, -17.79439926147461, -17.150787353515625, -16.507177352905273, -15.863565444946289, -15.219953536987305, -14.576342582702637, -13.932731628417969, -13.289119720458984, -12.6455078125, -12.001896858215332, -11.358285903930664, -10.71467399597168, -10.071062088012695, -9.427451133728027, -8.78384017944336, -8.140228271484375, -7.496616840362549, -6.853005409240723, -6.2093939781188965, -5.56578254699707, -4.922171115875244, -4.278559684753418, -3.634948253631592, -2.9913368225097656, -2.3477253913879395, -1.7041139602661133, -1.060502529144287, -0.41689300537109375, 0.22671842575073242, 0.8703298568725586, 1.5139412879943848, 2.157552719116211, 2.801164150238037, 3.4447755813598633, 4.0883870124816895, 4.731998443603516, 5.375609874725342, 6.019221305847168, 6.662832736968994, 7.30644416809082, 7.9500555992126465, 8.593667030334473, 9.23727798461914, 9.880889892578125, 10.52450180053711, 11.168112754821777, 11.811723709106445, 12.45533561706543, 13.098947525024414, 13.742558479309082, 14.38616943359375, 15.029781341552734, 15.673393249511719, 16.317005157470703, 16.960615158081055, 17.60422706604004, 18.247838973999023, 18.891448974609375, 19.53506088256836, 20.178672790527344]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 10.0, 6.0, 12.0, 18.0, 30.0, 33.0, 79.0, 84.0, 197.0, 263.0, 467.0, 705.0, 1164.0, 1701.0, 2726.0, 4032.0, 6429.0, 9508.0, 13753.0, 19891.0, 28567.0, 39039.0, 51060.0, 65030.0, 78152.0, 88801.0, 96606.0, 96611.0, 92050.0, 82165.0, 69623.0, 56086.0, 42697.0, 31353.0, 22362.0, 15830.0, 10752.0, 7205.0, 4757.0, 3114.0, 1969.0, 1300.0, 851.0, 570.0, 311.0, 209.0, 141.0, 93.0, 64.0, 37.0, 20.0, 14.0, 7.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-7.57421875, -7.3387451171875, -7.103271484375, -6.8677978515625, -6.63232421875, -6.3968505859375, -6.161376953125, -5.9259033203125, -5.6904296875, -5.4549560546875, -5.219482421875, -4.9840087890625, -4.74853515625, -4.5130615234375, -4.277587890625, -4.0421142578125, -3.806640625, -3.5711669921875, -3.335693359375, -3.1002197265625, -2.86474609375, -2.6292724609375, -2.393798828125, -2.1583251953125, -1.9228515625, -1.6873779296875, -1.451904296875, -1.2164306640625, -0.98095703125, -0.7454833984375, -0.510009765625, -0.2745361328125, -0.0390625, 0.1964111328125, 0.431884765625, 0.6673583984375, 0.90283203125, 1.1383056640625, 1.373779296875, 1.6092529296875, 1.8447265625, 2.0802001953125, 2.315673828125, 2.5511474609375, 2.78662109375, 3.0220947265625, 3.257568359375, 3.4930419921875, 3.728515625, 3.9639892578125, 4.199462890625, 4.4349365234375, 4.67041015625, 4.9058837890625, 5.141357421875, 5.3768310546875, 5.6123046875, 5.8477783203125, 6.083251953125, 6.3187255859375, 6.55419921875, 6.7896728515625, 7.025146484375, 7.2606201171875, 7.49609375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 3.0, 8.0, 5.0, 3.0, 12.0, 5.0, 13.0, 10.0, 16.0, 21.0, 20.0, 17.0, 30.0, 21.0, 32.0, 35.0, 31.0, 42.0, 41.0, 36.0, 35.0, 40.0, 29.0, 36.0, 29.0, 52.0, 31.0, 32.0, 39.0, 32.0, 32.0, 24.0, 26.0, 25.0, 32.0, 21.0, 13.0, 12.0, 11.0, 9.0, 8.0, 5.0, 5.0, 8.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-21.390625, -20.7373046875, -20.083984375, -19.4306640625, -18.77734375, -18.1240234375, -17.470703125, -16.8173828125, -16.1640625, -15.5107421875, -14.857421875, -14.2041015625, -13.55078125, -12.8974609375, -12.244140625, -11.5908203125, -10.9375, -10.2841796875, -9.630859375, -8.9775390625, -8.32421875, -7.6708984375, -7.017578125, -6.3642578125, -5.7109375, -5.0576171875, -4.404296875, -3.7509765625, -3.09765625, -2.4443359375, -1.791015625, -1.1376953125, -0.484375, 0.1689453125, 0.822265625, 1.4755859375, 2.12890625, 2.7822265625, 3.435546875, 4.0888671875, 4.7421875, 5.3955078125, 6.048828125, 6.7021484375, 7.35546875, 8.0087890625, 8.662109375, 9.3154296875, 9.96875, 10.6220703125, 11.275390625, 11.9287109375, 12.58203125, 13.2353515625, 13.888671875, 14.5419921875, 15.1953125, 15.8486328125, 16.501953125, 17.1552734375, 17.80859375, 18.4619140625, 19.115234375, 19.7685546875, 20.421875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 6.0, 13.0, 13.0, 24.0, 33.0, 37.0, 69.0, 93.0, 111.0, 167.0, 240.0, 329.0, 401.0, 594.0, 813.0, 1230.0, 1646.0, 2234.0, 3213.0, 4569.0, 6428.0, 9136.0, 12935.0, 18615.0, 30164.0, 392375.0, 466553.0, 31547.0, 19403.0, 13318.0, 9432.0, 6503.0, 4633.0, 3389.0, 2314.0, 1728.0, 1221.0, 845.0, 621.0, 446.0, 338.0, 225.0, 153.0, 108.0, 84.0, 70.0, 40.0, 31.0, 17.0, 21.0, 11.0, 2.0, 9.0, 3.0, 2.0, 2.0, 2.0], "bins": [-16.90625, -16.3944091796875, -15.882568359375, -15.3707275390625, -14.85888671875, -14.3470458984375, -13.835205078125, -13.3233642578125, -12.8115234375, -12.2996826171875, -11.787841796875, -11.2760009765625, -10.76416015625, -10.2523193359375, -9.740478515625, -9.2286376953125, -8.716796875, -8.2049560546875, -7.693115234375, -7.1812744140625, -6.66943359375, -6.1575927734375, -5.645751953125, -5.1339111328125, -4.6220703125, -4.1102294921875, -3.598388671875, -3.0865478515625, -2.57470703125, -2.0628662109375, -1.551025390625, -1.0391845703125, -0.52734375, -0.0155029296875, 0.496337890625, 1.0081787109375, 1.52001953125, 2.0318603515625, 2.543701171875, 3.0555419921875, 3.5673828125, 4.0792236328125, 4.591064453125, 5.1029052734375, 5.61474609375, 6.1265869140625, 6.638427734375, 7.1502685546875, 7.662109375, 8.1739501953125, 8.685791015625, 9.1976318359375, 9.70947265625, 10.2213134765625, 10.733154296875, 11.2449951171875, 11.7568359375, 12.2686767578125, 12.780517578125, 13.2923583984375, 13.80419921875, 14.3160400390625, 14.827880859375, 15.3397216796875, 15.8515625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 8.0, 4.0, 6.0, 8.0, 5.0, 12.0, 13.0, 18.0, 14.0, 16.0, 18.0, 37.0, 25.0, 25.0, 30.0, 29.0, 26.0, 33.0, 28.0, 42.0, 38.0, 49.0, 32.0, 32.0, 38.0, 37.0, 36.0, 52.0, 26.0, 30.0, 26.0, 31.0, 23.0, 34.0, 20.0, 14.0, 15.0, 13.0, 13.0, 8.0, 6.0, 9.0, 9.0, 4.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0], "bins": [-20.328125, -19.718994140625, -19.10986328125, -18.500732421875, -17.8916015625, -17.282470703125, -16.67333984375, -16.064208984375, -15.455078125, -14.845947265625, -14.23681640625, -13.627685546875, -13.0185546875, -12.409423828125, -11.80029296875, -11.191162109375, -10.58203125, -9.972900390625, -9.36376953125, -8.754638671875, -8.1455078125, -7.536376953125, -6.92724609375, -6.318115234375, -5.708984375, -5.099853515625, -4.49072265625, -3.881591796875, -3.2724609375, -2.663330078125, -2.05419921875, -1.445068359375, -0.8359375, -0.226806640625, 0.38232421875, 0.991455078125, 1.6005859375, 2.209716796875, 2.81884765625, 3.427978515625, 4.037109375, 4.646240234375, 5.25537109375, 5.864501953125, 6.4736328125, 7.082763671875, 7.69189453125, 8.301025390625, 8.91015625, 9.519287109375, 10.12841796875, 10.737548828125, 11.3466796875, 11.955810546875, 12.56494140625, 13.174072265625, 13.783203125, 14.392333984375, 15.00146484375, 15.610595703125, 16.2197265625, 16.828857421875, 17.43798828125, 18.047119140625, 18.65625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 11.0, 11.0, 8.0, 17.0, 21.0, 20.0, 31.0, 51.0, 64.0, 94.0, 123.0, 169.0, 260.0, 370.0, 498.0, 668.0, 1054.0, 1528.0, 2307.0, 3396.0, 5132.0, 8244.0, 13574.0, 26069.0, 109525.0, 771280.0, 51376.0, 20654.0, 11445.0, 6856.0, 4468.0, 2849.0, 1933.0, 1276.0, 913.0, 652.0, 480.0, 319.0, 224.0, 150.0, 125.0, 98.0, 60.0, 41.0, 43.0, 22.0, 12.0, 10.0, 10.0, 7.0, 4.0, 8.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-5.8828125, -5.70086669921875, -5.5189208984375, -5.33697509765625, -5.155029296875, -4.97308349609375, -4.7911376953125, -4.60919189453125, -4.42724609375, -4.24530029296875, -4.0633544921875, -3.88140869140625, -3.699462890625, -3.51751708984375, -3.3355712890625, -3.15362548828125, -2.9716796875, -2.78973388671875, -2.6077880859375, -2.42584228515625, -2.243896484375, -2.06195068359375, -1.8800048828125, -1.69805908203125, -1.51611328125, -1.33416748046875, -1.1522216796875, -0.97027587890625, -0.788330078125, -0.60638427734375, -0.4244384765625, -0.24249267578125, -0.060546875, 0.12139892578125, 0.3033447265625, 0.48529052734375, 0.667236328125, 0.84918212890625, 1.0311279296875, 1.21307373046875, 1.39501953125, 1.57696533203125, 1.7589111328125, 1.94085693359375, 2.122802734375, 2.30474853515625, 2.4866943359375, 2.66864013671875, 2.8505859375, 3.03253173828125, 3.2144775390625, 3.39642333984375, 3.578369140625, 3.76031494140625, 3.9422607421875, 4.12420654296875, 4.30615234375, 4.48809814453125, 4.6700439453125, 4.85198974609375, 5.033935546875, 5.21588134765625, 5.3978271484375, 5.57977294921875, 5.76171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 8.0, 12.0, 7.0, 13.0, 13.0, 18.0, 19.0, 15.0, 26.0, 36.0, 41.0, 51.0, 66.0, 64.0, 57.0, 66.0, 83.0, 60.0, 55.0, 55.0, 51.0, 30.0, 24.0, 29.0, 13.0, 15.0, 9.0, 6.0, 9.0, 12.0, 6.0, 9.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00119781494140625, -0.0011629760265350342, -0.0011281371116638184, -0.0010932981967926025, -0.0010584592819213867, -0.001023620367050171, -0.000988781452178955, -0.0009539425373077393, -0.0009191036224365234, -0.0008842647075653076, -0.0008494257926940918, -0.000814586877822876, -0.0007797479629516602, -0.0007449090480804443, -0.0007100701332092285, -0.0006752312183380127, -0.0006403923034667969, -0.0006055533885955811, -0.0005707144737243652, -0.0005358755588531494, -0.0005010366439819336, -0.0004661977291107178, -0.00043135881423950195, -0.00039651989936828613, -0.0003616809844970703, -0.0003268420696258545, -0.00029200315475463867, -0.00025716423988342285, -0.00022232532501220703, -0.0001874864101409912, -0.0001526474952697754, -0.00011780858039855957, -8.296966552734375e-05, -4.813075065612793e-05, -1.329183578491211e-05, 2.154707908630371e-05, 5.638599395751953e-05, 9.122490882873535e-05, 0.00012606382369995117, 0.000160902738571167, 0.0001957416534423828, 0.00023058056831359863, 0.00026541948318481445, 0.0003002583980560303, 0.0003350973129272461, 0.0003699362277984619, 0.00040477514266967773, 0.00043961405754089355, 0.0004744529724121094, 0.0005092918872833252, 0.000544130802154541, 0.0005789697170257568, 0.0006138086318969727, 0.0006486475467681885, 0.0006834864616394043, 0.0007183253765106201, 0.0007531642913818359, 0.0007880032062530518, 0.0008228421211242676, 0.0008576810359954834, 0.0008925199508666992, 0.000927358865737915, 0.0009621977806091309, 0.0009970366954803467, 0.0010318756103515625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [6.0, 7.0, 4.0, 11.0, 17.0, 21.0, 40.0, 59.0, 93.0, 93.0, 168.0, 253.0, 378.0, 552.0, 782.0, 1130.0, 1738.0, 2484.0, 3753.0, 5668.0, 8535.0, 12672.0, 18812.0, 28592.0, 43037.0, 64500.0, 93609.0, 127957.0, 151666.0, 141232.0, 109095.0, 76998.0, 51348.0, 34522.0, 22845.0, 15234.0, 10175.0, 6671.0, 4492.0, 2992.0, 2045.0, 1403.0, 942.0, 585.0, 436.0, 297.0, 213.0, 122.0, 102.0, 52.0, 47.0, 32.0, 13.0, 15.0, 9.0, 6.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6748046875, -1.6165008544921875, -1.558197021484375, -1.4998931884765625, -1.44158935546875, -1.3832855224609375, -1.324981689453125, -1.2666778564453125, -1.2083740234375, -1.1500701904296875, -1.091766357421875, -1.0334625244140625, -0.97515869140625, -0.9168548583984375, -0.858551025390625, -0.8002471923828125, -0.741943359375, -0.6836395263671875, -0.625335693359375, -0.5670318603515625, -0.50872802734375, -0.4504241943359375, -0.392120361328125, -0.3338165283203125, -0.2755126953125, -0.2172088623046875, -0.158905029296875, -0.1006011962890625, -0.04229736328125, 0.0160064697265625, 0.074310302734375, 0.1326141357421875, 0.19091796875, 0.2492218017578125, 0.307525634765625, 0.3658294677734375, 0.42413330078125, 0.4824371337890625, 0.540740966796875, 0.5990447998046875, 0.6573486328125, 0.7156524658203125, 0.773956298828125, 0.8322601318359375, 0.89056396484375, 0.9488677978515625, 1.007171630859375, 1.0654754638671875, 1.123779296875, 1.1820831298828125, 1.240386962890625, 1.2986907958984375, 1.35699462890625, 1.4152984619140625, 1.473602294921875, 1.5319061279296875, 1.5902099609375, 1.6485137939453125, 1.706817626953125, 1.7651214599609375, 1.82342529296875, 1.8817291259765625, 1.940032958984375, 1.9983367919921875, 2.056640625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 3.0, 2.0, 3.0, 11.0, 13.0, 14.0, 18.0, 14.0, 21.0, 24.0, 23.0, 31.0, 22.0, 25.0, 32.0, 34.0, 32.0, 11.0, 21.0, 22.0, 22.0, 33.0, 40.0, 40.0, 28.0, 21.0, 24.0, 29.0, 23.0, 30.0, 27.0, 28.0, 23.0, 35.0, 23.0, 35.0, 20.0, 19.0, 23.0, 19.0, 17.0, 17.0, 12.0, 17.0, 6.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.63671875, -0.616912841796875, -0.59710693359375, -0.577301025390625, -0.5574951171875, -0.537689208984375, -0.51788330078125, -0.498077392578125, -0.478271484375, -0.458465576171875, -0.43865966796875, -0.418853759765625, -0.3990478515625, -0.379241943359375, -0.35943603515625, -0.339630126953125, -0.31982421875, -0.300018310546875, -0.28021240234375, -0.260406494140625, -0.2406005859375, -0.220794677734375, -0.20098876953125, -0.181182861328125, -0.161376953125, -0.141571044921875, -0.12176513671875, -0.101959228515625, -0.0821533203125, -0.062347412109375, -0.04254150390625, -0.022735595703125, -0.0029296875, 0.016876220703125, 0.03668212890625, 0.056488037109375, 0.0762939453125, 0.096099853515625, 0.11590576171875, 0.135711669921875, 0.155517578125, 0.175323486328125, 0.19512939453125, 0.214935302734375, 0.2347412109375, 0.254547119140625, 0.27435302734375, 0.294158935546875, 0.31396484375, 0.333770751953125, 0.35357666015625, 0.373382568359375, 0.3931884765625, 0.412994384765625, 0.43280029296875, 0.452606201171875, 0.472412109375, 0.492218017578125, 0.51202392578125, 0.531829833984375, 0.5516357421875, 0.571441650390625, 0.59124755859375, 0.611053466796875, 0.630859375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 4.0, 11.0, 10.0, 20.0, 19.0, 15.0, 28.0, 26.0, 30.0, 32.0, 38.0, 41.0, 37.0, 52.0, 55.0, 55.0, 55.0, 48.0, 40.0, 52.0, 45.0, 57.0, 37.0, 38.0, 28.0, 22.0, 27.0, 9.0, 16.0, 12.0, 10.0, 5.0, 7.0, 3.0, 3.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.899293899536133, -25.20945930480957, -24.51962661743164, -23.829792022705078, -23.139957427978516, -22.450122833251953, -21.76028823852539, -21.07045555114746, -20.3806209564209, -19.690786361694336, -19.000953674316406, -18.311119079589844, -17.62128448486328, -16.93144989013672, -16.241615295410156, -15.551782608032227, -14.861948013305664, -14.172113418579102, -13.482279777526855, -12.79244613647461, -12.102611541748047, -11.412776947021484, -10.722943305969238, -10.033109664916992, -9.34327507019043, -8.653440475463867, -7.963606834411621, -7.273772716522217, -6.5839385986328125, -5.894104480743408, -5.204270362854004, -4.5144362449646, -3.8246021270751953, -3.134768009185791, -2.4449338912963867, -1.7550997734069824, -1.0652656555175781, -0.37543153762817383, 0.31440258026123047, 1.0042366981506348, 1.694070816040039, 2.3839049339294434, 3.0737390518188477, 3.763573169708252, 4.453407287597656, 5.1432414054870605, 5.833075523376465, 6.522909641265869, 7.212743759155273, 7.902577877044678, 8.592411994934082, 9.282245635986328, 9.97208023071289, 10.661914825439453, 11.3517484664917, 12.041582107543945, 12.731416702270508, 13.42125129699707, 14.111084938049316, 14.800918579101562, 15.490753173828125, 16.180587768554688, 16.87042236328125, 17.56025505065918, 18.250089645385742]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 7.0, 5.0, 3.0, 3.0, 10.0, 9.0, 15.0, 14.0, 15.0, 24.0, 21.0, 34.0, 23.0, 23.0, 47.0, 42.0, 32.0, 30.0, 39.0, 38.0, 26.0, 38.0, 43.0, 32.0, 39.0, 44.0, 38.0, 36.0, 27.0, 21.0, 28.0, 31.0, 23.0, 32.0, 15.0, 16.0, 14.0, 14.0, 12.0, 10.0, 5.0, 3.0, 4.0, 2.0, 4.0, 4.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0], "bins": [-23.2727108001709, -22.58209228515625, -21.89147186279297, -21.20085334777832, -20.510234832763672, -19.81961441040039, -19.128995895385742, -18.438377380371094, -17.747756958007812, -17.057138442993164, -16.366518020629883, -15.675899505615234, -14.98528003692627, -14.294660568237305, -13.604042053222656, -12.913422584533691, -12.222803115844727, -11.532183647155762, -10.841564178466797, -10.150945663452148, -9.460326194763184, -8.769706726074219, -8.07908821105957, -7.3884687423706055, -6.697849273681641, -6.007229804992676, -5.316610813140869, -4.6259918212890625, -3.9353723526000977, -3.244753122329712, -2.554133892059326, -1.8635149002075195, -1.1728973388671875, -0.48227810859680176, 0.20834112167358398, 0.8989603519439697, 1.5895795822143555, 2.280198812484741, 2.970818042755127, 3.6614370346069336, 4.352056503295898, 5.042675971984863, 5.73329496383667, 6.423913955688477, 7.114533424377441, 7.805152893066406, 8.495771408081055, 9.18639087677002, 9.877010345458984, 10.56762981414795, 11.258249282836914, 11.948867797851562, 12.639487266540527, 13.330106735229492, 14.02072525024414, 14.711344718933105, 15.40196418762207, 16.09258270263672, 16.783203125, 17.47382164001465, 18.164440155029297, 18.855060577392578, 19.545679092407227, 20.236297607421875, 20.926918029785156]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 5.0, 10.0, 9.0, 16.0, 27.0, 38.0, 38.0, 105.0, 142.0, 260.0, 462.0, 677.0, 1145.0, 1966.0, 3314.0, 5634.0, 9363.0, 16091.0, 26447.0, 42161.0, 63803.0, 90691.0, 115490.0, 133145.0, 134937.0, 120540.0, 95177.0, 68821.0, 45766.0, 29164.0, 17587.0, 10309.0, 6216.0, 3616.0, 2149.0, 1272.0, 704.0, 457.0, 312.0, 180.0, 103.0, 78.0, 42.0, 29.0, 22.0, 20.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.234375, -17.64794921875, -17.0615234375, -16.47509765625, -15.888671875, -15.30224609375, -14.7158203125, -14.12939453125, -13.54296875, -12.95654296875, -12.3701171875, -11.78369140625, -11.197265625, -10.61083984375, -10.0244140625, -9.43798828125, -8.8515625, -8.26513671875, -7.6787109375, -7.09228515625, -6.505859375, -5.91943359375, -5.3330078125, -4.74658203125, -4.16015625, -3.57373046875, -2.9873046875, -2.40087890625, -1.814453125, -1.22802734375, -0.6416015625, -0.05517578125, 0.53125, 1.11767578125, 1.7041015625, 2.29052734375, 2.876953125, 3.46337890625, 4.0498046875, 4.63623046875, 5.22265625, 5.80908203125, 6.3955078125, 6.98193359375, 7.568359375, 8.15478515625, 8.7412109375, 9.32763671875, 9.9140625, 10.50048828125, 11.0869140625, 11.67333984375, 12.259765625, 12.84619140625, 13.4326171875, 14.01904296875, 14.60546875, 15.19189453125, 15.7783203125, 16.36474609375, 16.951171875, 17.53759765625, 18.1240234375, 18.71044921875, 19.296875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 6.0, 4.0, 5.0, 5.0, 7.0, 9.0, 14.0, 11.0, 18.0, 26.0, 21.0, 28.0, 27.0, 19.0, 52.0, 38.0, 34.0, 31.0, 35.0, 38.0, 29.0, 37.0, 40.0, 34.0, 41.0, 43.0, 37.0, 39.0, 23.0, 30.0, 19.0, 36.0, 27.0, 28.0, 13.0, 18.0, 16.0, 12.0, 12.0, 11.0, 6.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-21.6875, -21.046630859375, -20.40576171875, -19.764892578125, -19.1240234375, -18.483154296875, -17.84228515625, -17.201416015625, -16.560546875, -15.919677734375, -15.27880859375, -14.637939453125, -13.9970703125, -13.356201171875, -12.71533203125, -12.074462890625, -11.43359375, -10.792724609375, -10.15185546875, -9.510986328125, -8.8701171875, -8.229248046875, -7.58837890625, -6.947509765625, -6.306640625, -5.665771484375, -5.02490234375, -4.384033203125, -3.7431640625, -3.102294921875, -2.46142578125, -1.820556640625, -1.1796875, -0.538818359375, 0.10205078125, 0.742919921875, 1.3837890625, 2.024658203125, 2.66552734375, 3.306396484375, 3.947265625, 4.588134765625, 5.22900390625, 5.869873046875, 6.5107421875, 7.151611328125, 7.79248046875, 8.433349609375, 9.07421875, 9.715087890625, 10.35595703125, 10.996826171875, 11.6376953125, 12.278564453125, 12.91943359375, 13.560302734375, 14.201171875, 14.842041015625, 15.48291015625, 16.123779296875, 16.7646484375, 17.405517578125, 18.04638671875, 18.687255859375, 19.328125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 6.0, 12.0, 14.0, 23.0, 21.0, 31.0, 45.0, 76.0, 94.0, 186.0, 335.0, 597.0, 1040.0, 1887.0, 3183.0, 5792.0, 10145.0, 18436.0, 32490.0, 55188.0, 88288.0, 126221.0, 156168.0, 160630.0, 136508.0, 98946.0, 63991.0, 38304.0, 21982.0, 12120.0, 6882.0, 3794.0, 2193.0, 1197.0, 718.0, 430.0, 212.0, 135.0, 76.0, 42.0, 35.0, 30.0, 15.0, 17.0, 11.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.78125, -22.992431640625, -22.20361328125, -21.414794921875, -20.6259765625, -19.837158203125, -19.04833984375, -18.259521484375, -17.470703125, -16.681884765625, -15.89306640625, -15.104248046875, -14.3154296875, -13.526611328125, -12.73779296875, -11.948974609375, -11.16015625, -10.371337890625, -9.58251953125, -8.793701171875, -8.0048828125, -7.216064453125, -6.42724609375, -5.638427734375, -4.849609375, -4.060791015625, -3.27197265625, -2.483154296875, -1.6943359375, -0.905517578125, -0.11669921875, 0.672119140625, 1.4609375, 2.249755859375, 3.03857421875, 3.827392578125, 4.6162109375, 5.405029296875, 6.19384765625, 6.982666015625, 7.771484375, 8.560302734375, 9.34912109375, 10.137939453125, 10.9267578125, 11.715576171875, 12.50439453125, 13.293212890625, 14.08203125, 14.870849609375, 15.65966796875, 16.448486328125, 17.2373046875, 18.026123046875, 18.81494140625, 19.603759765625, 20.392578125, 21.181396484375, 21.97021484375, 22.759033203125, 23.5478515625, 24.336669921875, 25.12548828125, 25.914306640625, 26.703125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 8.0, 7.0, 13.0, 8.0, 11.0, 14.0, 17.0, 15.0, 16.0, 20.0, 22.0, 25.0, 32.0, 33.0, 40.0, 33.0, 50.0, 54.0, 43.0, 45.0, 51.0, 40.0, 46.0, 44.0, 29.0, 25.0, 40.0, 26.0, 29.0, 23.0, 25.0, 21.0, 22.0, 13.0, 12.0, 10.0, 7.0, 4.0, 9.0, 8.0, 5.0, 6.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-19.8125, -19.2701416015625, -18.727783203125, -18.1854248046875, -17.64306640625, -17.1007080078125, -16.558349609375, -16.0159912109375, -15.4736328125, -14.9312744140625, -14.388916015625, -13.8465576171875, -13.30419921875, -12.7618408203125, -12.219482421875, -11.6771240234375, -11.134765625, -10.5924072265625, -10.050048828125, -9.5076904296875, -8.96533203125, -8.4229736328125, -7.880615234375, -7.3382568359375, -6.7958984375, -6.2535400390625, -5.711181640625, -5.1688232421875, -4.62646484375, -4.0841064453125, -3.541748046875, -2.9993896484375, -2.45703125, -1.9146728515625, -1.372314453125, -0.8299560546875, -0.28759765625, 0.2547607421875, 0.797119140625, 1.3394775390625, 1.8818359375, 2.4241943359375, 2.966552734375, 3.5089111328125, 4.05126953125, 4.5936279296875, 5.135986328125, 5.6783447265625, 6.220703125, 6.7630615234375, 7.305419921875, 7.8477783203125, 8.39013671875, 8.9324951171875, 9.474853515625, 10.0172119140625, 10.5595703125, 11.1019287109375, 11.644287109375, 12.1866455078125, 12.72900390625, 13.2713623046875, 13.813720703125, 14.3560791015625, 14.8984375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 6.0, 5.0, 9.0, 10.0, 15.0, 21.0, 31.0, 28.0, 32.0, 64.0, 90.0, 132.0, 158.0, 231.0, 342.0, 495.0, 728.0, 1078.0, 1513.0, 2146.0, 3387.0, 5113.0, 8084.0, 13425.0, 22151.0, 39115.0, 71078.0, 126436.0, 193308.0, 207602.0, 149477.0, 85793.0, 47000.0, 26575.0, 15545.0, 9460.0, 5939.0, 3882.0, 2567.0, 1774.0, 1116.0, 785.0, 540.0, 371.0, 255.0, 182.0, 133.0, 97.0, 62.0, 45.0, 36.0, 24.0, 24.0, 20.0, 15.0, 3.0, 4.0, 3.0, 2.0, 5.0, 2.0, 1.0], "bins": [-14.046875, -13.5960693359375, -13.145263671875, -12.6944580078125, -12.24365234375, -11.7928466796875, -11.342041015625, -10.8912353515625, -10.4404296875, -9.9896240234375, -9.538818359375, -9.0880126953125, -8.63720703125, -8.1864013671875, -7.735595703125, -7.2847900390625, -6.833984375, -6.3831787109375, -5.932373046875, -5.4815673828125, -5.03076171875, -4.5799560546875, -4.129150390625, -3.6783447265625, -3.2275390625, -2.7767333984375, -2.325927734375, -1.8751220703125, -1.42431640625, -0.9735107421875, -0.522705078125, -0.0718994140625, 0.37890625, 0.8297119140625, 1.280517578125, 1.7313232421875, 2.18212890625, 2.6329345703125, 3.083740234375, 3.5345458984375, 3.9853515625, 4.4361572265625, 4.886962890625, 5.3377685546875, 5.78857421875, 6.2393798828125, 6.690185546875, 7.1409912109375, 7.591796875, 8.0426025390625, 8.493408203125, 8.9442138671875, 9.39501953125, 9.8458251953125, 10.296630859375, 10.7474365234375, 11.1982421875, 11.6490478515625, 12.099853515625, 12.5506591796875, 13.00146484375, 13.4522705078125, 13.903076171875, 14.3538818359375, 14.8046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 6.0, 2.0, 7.0, 10.0, 14.0, 13.0, 17.0, 20.0, 24.0, 45.0, 47.0, 51.0, 49.0, 61.0, 60.0, 85.0, 64.0, 72.0, 63.0, 44.0, 54.0, 29.0, 40.0, 30.0, 24.0, 12.0, 14.0, 16.0, 5.0, 4.0, 4.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012912750244140625, -0.0012479126453399658, -0.0012045502662658691, -0.0011611878871917725, -0.0011178255081176758, -0.001074463129043579, -0.0010311007499694824, -0.0009877383708953857, -0.0009443759918212891, -0.0009010136127471924, -0.0008576512336730957, -0.000814288854598999, -0.0007709264755249023, -0.0007275640964508057, -0.000684201717376709, -0.0006408393383026123, -0.0005974769592285156, -0.0005541145801544189, -0.0005107522010803223, -0.0004673898220062256, -0.0004240274429321289, -0.0003806650638580322, -0.00033730268478393555, -0.00029394030570983887, -0.0002505779266357422, -0.0002072155475616455, -0.00016385316848754883, -0.00012049078941345215, -7.712841033935547e-05, -3.376603126525879e-05, 9.59634780883789e-06, 5.295872688293457e-05, 9.632110595703125e-05, 0.00013968348503112793, 0.0001830458641052246, 0.0002264082431793213, 0.00026977062225341797, 0.00031313300132751465, 0.00035649538040161133, 0.000399857759475708, 0.0004432201385498047, 0.00048658251762390137, 0.000529944896697998, 0.0005733072757720947, 0.0006166696548461914, 0.0006600320339202881, 0.0007033944129943848, 0.0007467567920684814, 0.0007901191711425781, 0.0008334815502166748, 0.0008768439292907715, 0.0009202063083648682, 0.0009635686874389648, 0.0010069310665130615, 0.0010502934455871582, 0.0010936558246612549, 0.0011370182037353516, 0.0011803805828094482, 0.001223742961883545, 0.0012671053409576416, 0.0013104677200317383, 0.001353830099105835, 0.0013971924781799316, 0.0014405548572540283, 0.001483917236328125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 5.0, 6.0, 13.0, 11.0, 19.0, 37.0, 57.0, 95.0, 146.0, 207.0, 283.0, 473.0, 720.0, 1085.0, 1676.0, 2336.0, 3547.0, 5142.0, 7817.0, 11957.0, 18213.0, 28900.0, 45706.0, 70769.0, 104115.0, 136933.0, 152829.0, 139945.0, 107401.0, 73834.0, 47346.0, 30317.0, 19285.0, 12597.0, 8179.0, 5457.0, 3702.0, 2455.0, 1640.0, 1073.0, 750.0, 461.0, 373.0, 222.0, 157.0, 98.0, 56.0, 44.0, 24.0, 13.0, 16.0, 7.0, 3.0, 6.0, 0.0, 2.0, 3.0, 1.0], "bins": [-10.3828125, -10.0638427734375, -9.744873046875, -9.4259033203125, -9.10693359375, -8.7879638671875, -8.468994140625, -8.1500244140625, -7.8310546875, -7.5120849609375, -7.193115234375, -6.8741455078125, -6.55517578125, -6.2362060546875, -5.917236328125, -5.5982666015625, -5.279296875, -4.9603271484375, -4.641357421875, -4.3223876953125, -4.00341796875, -3.6844482421875, -3.365478515625, -3.0465087890625, -2.7275390625, -2.4085693359375, -2.089599609375, -1.7706298828125, -1.45166015625, -1.1326904296875, -0.813720703125, -0.4947509765625, -0.17578125, 0.1431884765625, 0.462158203125, 0.7811279296875, 1.10009765625, 1.4190673828125, 1.738037109375, 2.0570068359375, 2.3759765625, 2.6949462890625, 3.013916015625, 3.3328857421875, 3.65185546875, 3.9708251953125, 4.289794921875, 4.6087646484375, 4.927734375, 5.2467041015625, 5.565673828125, 5.8846435546875, 6.20361328125, 6.5225830078125, 6.841552734375, 7.1605224609375, 7.4794921875, 7.7984619140625, 8.117431640625, 8.4364013671875, 8.75537109375, 9.0743408203125, 9.393310546875, 9.7122802734375, 10.03125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 6.0, 7.0, 7.0, 14.0, 13.0, 16.0, 15.0, 14.0, 19.0, 34.0, 28.0, 40.0, 43.0, 29.0, 46.0, 48.0, 48.0, 52.0, 57.0, 62.0, 45.0, 48.0, 36.0, 38.0, 33.0, 25.0, 32.0, 14.0, 21.0, 16.0, 16.0, 15.0, 14.0, 7.0, 8.0, 6.0, 9.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.3828125, -5.20440673828125, -5.0260009765625, -4.84759521484375, -4.669189453125, -4.49078369140625, -4.3123779296875, -4.13397216796875, -3.95556640625, -3.77716064453125, -3.5987548828125, -3.42034912109375, -3.241943359375, -3.06353759765625, -2.8851318359375, -2.70672607421875, -2.5283203125, -2.34991455078125, -2.1715087890625, -1.99310302734375, -1.814697265625, -1.63629150390625, -1.4578857421875, -1.27947998046875, -1.10107421875, -0.92266845703125, -0.7442626953125, -0.56585693359375, -0.387451171875, -0.20904541015625, -0.0306396484375, 0.14776611328125, 0.326171875, 0.50457763671875, 0.6829833984375, 0.86138916015625, 1.039794921875, 1.21820068359375, 1.3966064453125, 1.57501220703125, 1.75341796875, 1.93182373046875, 2.1102294921875, 2.28863525390625, 2.467041015625, 2.64544677734375, 2.8238525390625, 3.00225830078125, 3.1806640625, 3.35906982421875, 3.5374755859375, 3.71588134765625, 3.894287109375, 4.07269287109375, 4.2510986328125, 4.42950439453125, 4.60791015625, 4.78631591796875, 4.9647216796875, 5.14312744140625, 5.321533203125, 5.49993896484375, 5.6783447265625, 5.85675048828125, 6.03515625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 4.0, 8.0, 5.0, 7.0, 9.0, 12.0, 22.0, 18.0, 22.0, 29.0, 27.0, 33.0, 43.0, 41.0, 36.0, 39.0, 46.0, 42.0, 45.0, 43.0, 49.0, 44.0, 27.0, 43.0, 47.0, 33.0, 34.0, 32.0, 18.0, 31.0, 20.0, 26.0, 15.0, 10.0, 7.0, 9.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-21.286012649536133, -20.6816349029541, -20.077255249023438, -19.472877502441406, -18.868499755859375, -18.26412010192871, -17.65974235534668, -17.055362701416016, -16.450984954833984, -15.846606254577637, -15.242228507995605, -14.637849807739258, -14.03347110748291, -13.429092407226562, -12.824714660644531, -12.220335960388184, -11.615958213806152, -11.011579513549805, -10.407201766967773, -9.802823066711426, -9.198444366455078, -8.594066619873047, -7.989687919616699, -7.385309219360352, -6.780930995941162, -6.176552772521973, -5.572174072265625, -4.9677958488464355, -4.363417625427246, -3.7590389251708984, -3.154660701751709, -2.5502820014953613, -1.9459037780761719, -1.3415253162384033, -0.7371469736099243, -0.1327686309814453, 0.47160983085632324, 1.0759882926940918, 1.6803665161132812, 2.284745216369629, 2.8891234397888184, 3.493501901626587, 4.0978803634643555, 4.702258586883545, 5.306636810302734, 5.911015510559082, 6.5153937339782715, 7.119772434234619, 7.724150657653809, 8.328529357910156, 8.932907104492188, 9.537285804748535, 10.141664505004883, 10.746042251586914, 11.350420951843262, 11.95479965209961, 12.55917739868164, 13.163556098937988, 13.76793384552002, 14.372312545776367, 14.976691246032715, 15.581069946289062, 16.185447692871094, 16.789825439453125, 17.39420509338379]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 14.0, 8.0, 13.0, 14.0, 15.0, 17.0, 35.0, 30.0, 28.0, 43.0, 40.0, 33.0, 44.0, 50.0, 52.0, 44.0, 51.0, 50.0, 56.0, 37.0, 29.0, 36.0, 43.0, 52.0, 25.0, 28.0, 19.0, 17.0, 20.0, 11.0, 10.0, 5.0, 3.0, 4.0, 6.0, 5.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.364789962768555, -24.430877685546875, -23.496965408325195, -22.563053131103516, -21.629138946533203, -20.695226669311523, -19.761314392089844, -18.827402114868164, -17.893489837646484, -16.959577560424805, -16.025665283203125, -15.091752052307129, -14.157838821411133, -13.223926544189453, -12.290014266967773, -11.356101989746094, -10.422187805175781, -9.488275527954102, -8.554362297058105, -7.620450019836426, -6.686537265777588, -5.75262451171875, -4.81871223449707, -3.8847994804382324, -2.9508867263793945, -2.0169739723205566, -1.0830614566802979, -0.14914894104003906, 0.7847638130187988, 1.7186765670776367, 2.6525888442993164, 3.5865015983581543, 4.520412445068359, 5.454325199127197, 6.388237953186035, 7.322150230407715, 8.256063461303711, 9.18997573852539, 10.12388801574707, 11.05780029296875, 11.991713523864746, 12.925625801086426, 13.859539031982422, 14.793451309204102, 15.727363586425781, 16.661277770996094, 17.59518814086914, 18.529102325439453, 19.463014602661133, 20.396926879882812, 21.330839157104492, 22.264751434326172, 23.198665618896484, 24.132577896118164, 25.066490173339844, 26.000402450561523, 26.934314727783203, 27.868227005004883, 28.802139282226562, 29.736053466796875, 30.669965744018555, 31.603878021240234, 32.53778839111328, 33.471702575683594, 34.405616760253906]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 9.0, 8.0, 9.0, 24.0, 40.0, 37.0, 81.0, 104.0, 228.0, 361.0, 522.0, 833.0, 1381.0, 2165.0, 3483.0, 5526.0, 8530.0, 13828.0, 21367.0, 32786.0, 49458.0, 73929.0, 106768.0, 153337.0, 208999.0, 273051.0, 339278.0, 392401.0, 422852.0, 423334.0, 387737.0, 334823.0, 268620.0, 204083.0, 149682.0, 104507.0, 71884.0, 48522.0, 31982.0, 21034.0, 13280.0, 8353.0, 5490.0, 3436.0, 2296.0, 1430.0, 896.0, 555.0, 338.0, 206.0, 165.0, 85.0, 50.0, 48.0, 23.0, 13.0, 6.0, 9.0, 7.0, 1.0, 4.0], "bins": [-12.21875, -11.8365478515625, -11.454345703125, -11.0721435546875, -10.68994140625, -10.3077392578125, -9.925537109375, -9.5433349609375, -9.1611328125, -8.7789306640625, -8.396728515625, -8.0145263671875, -7.63232421875, -7.2501220703125, -6.867919921875, -6.4857177734375, -6.103515625, -5.7213134765625, -5.339111328125, -4.9569091796875, -4.57470703125, -4.1925048828125, -3.810302734375, -3.4281005859375, -3.0458984375, -2.6636962890625, -2.281494140625, -1.8992919921875, -1.51708984375, -1.1348876953125, -0.752685546875, -0.3704833984375, 0.01171875, 0.3939208984375, 0.776123046875, 1.1583251953125, 1.54052734375, 1.9227294921875, 2.304931640625, 2.6871337890625, 3.0693359375, 3.4515380859375, 3.833740234375, 4.2159423828125, 4.59814453125, 4.9803466796875, 5.362548828125, 5.7447509765625, 6.126953125, 6.5091552734375, 6.891357421875, 7.2735595703125, 7.65576171875, 8.0379638671875, 8.420166015625, 8.8023681640625, 9.1845703125, 9.5667724609375, 9.948974609375, 10.3311767578125, 10.71337890625, 11.0955810546875, 11.477783203125, 11.8599853515625, 12.2421875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 8.0, 11.0, 10.0, 12.0, 15.0, 18.0, 19.0, 24.0, 35.0, 31.0, 36.0, 47.0, 32.0, 39.0, 57.0, 42.0, 50.0, 64.0, 48.0, 42.0, 34.0, 41.0, 39.0, 41.0, 47.0, 31.0, 28.0, 20.0, 17.0, 14.0, 11.0, 14.0, 4.0, 3.0, 3.0, 4.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.25, -22.4248046875, -21.599609375, -20.7744140625, -19.94921875, -19.1240234375, -18.298828125, -17.4736328125, -16.6484375, -15.8232421875, -14.998046875, -14.1728515625, -13.34765625, -12.5224609375, -11.697265625, -10.8720703125, -10.046875, -9.2216796875, -8.396484375, -7.5712890625, -6.74609375, -5.9208984375, -5.095703125, -4.2705078125, -3.4453125, -2.6201171875, -1.794921875, -0.9697265625, -0.14453125, 0.6806640625, 1.505859375, 2.3310546875, 3.15625, 3.9814453125, 4.806640625, 5.6318359375, 6.45703125, 7.2822265625, 8.107421875, 8.9326171875, 9.7578125, 10.5830078125, 11.408203125, 12.2333984375, 13.05859375, 13.8837890625, 14.708984375, 15.5341796875, 16.359375, 17.1845703125, 18.009765625, 18.8349609375, 19.66015625, 20.4853515625, 21.310546875, 22.1357421875, 22.9609375, 23.7861328125, 24.611328125, 25.4365234375, 26.26171875, 27.0869140625, 27.912109375, 28.7373046875, 29.5625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 3.0, 5.0, 7.0, 17.0, 24.0, 54.0, 87.0, 133.0, 239.0, 411.0, 648.0, 1062.0, 1833.0, 3179.0, 5155.0, 9035.0, 15206.0, 24864.0, 40772.0, 65648.0, 101944.0, 152861.0, 219253.0, 295182.0, 374128.0, 436426.0, 468046.0, 456571.0, 407335.0, 334810.0, 256845.0, 182952.0, 126019.0, 82006.0, 51521.0, 32055.0, 19440.0, 11525.0, 6776.0, 4159.0, 2408.0, 1489.0, 834.0, 505.0, 336.0, 183.0, 116.0, 71.0, 43.0, 21.0, 23.0, 12.0, 9.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6015625, -14.1107177734375, -13.619873046875, -13.1290283203125, -12.63818359375, -12.1473388671875, -11.656494140625, -11.1656494140625, -10.6748046875, -10.1839599609375, -9.693115234375, -9.2022705078125, -8.71142578125, -8.2205810546875, -7.729736328125, -7.2388916015625, -6.748046875, -6.2572021484375, -5.766357421875, -5.2755126953125, -4.78466796875, -4.2938232421875, -3.802978515625, -3.3121337890625, -2.8212890625, -2.3304443359375, -1.839599609375, -1.3487548828125, -0.85791015625, -0.3670654296875, 0.123779296875, 0.6146240234375, 1.10546875, 1.5963134765625, 2.087158203125, 2.5780029296875, 3.06884765625, 3.5596923828125, 4.050537109375, 4.5413818359375, 5.0322265625, 5.5230712890625, 6.013916015625, 6.5047607421875, 6.99560546875, 7.4864501953125, 7.977294921875, 8.4681396484375, 8.958984375, 9.4498291015625, 9.940673828125, 10.4315185546875, 10.92236328125, 11.4132080078125, 11.904052734375, 12.3948974609375, 12.8857421875, 13.3765869140625, 13.867431640625, 14.3582763671875, 14.84912109375, 15.3399658203125, 15.830810546875, 16.3216552734375, 16.8125]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 9.0, 5.0, 13.0, 9.0, 22.0, 24.0, 35.0, 46.0, 54.0, 67.0, 77.0, 109.0, 110.0, 127.0, 143.0, 163.0, 187.0, 202.0, 208.0, 216.0, 198.0, 194.0, 205.0, 208.0, 179.0, 198.0, 183.0, 145.0, 127.0, 103.0, 104.0, 78.0, 61.0, 50.0, 40.0, 44.0, 35.0, 23.0, 15.0, 10.0, 8.0, 7.0, 8.0, 4.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.484375, -9.1719970703125, -8.859619140625, -8.5472412109375, -8.23486328125, -7.9224853515625, -7.610107421875, -7.2977294921875, -6.9853515625, -6.6729736328125, -6.360595703125, -6.0482177734375, -5.73583984375, -5.4234619140625, -5.111083984375, -4.7987060546875, -4.486328125, -4.1739501953125, -3.861572265625, -3.5491943359375, -3.23681640625, -2.9244384765625, -2.612060546875, -2.2996826171875, -1.9873046875, -1.6749267578125, -1.362548828125, -1.0501708984375, -0.73779296875, -0.4254150390625, -0.113037109375, 0.1993408203125, 0.51171875, 0.8240966796875, 1.136474609375, 1.4488525390625, 1.76123046875, 2.0736083984375, 2.385986328125, 2.6983642578125, 3.0107421875, 3.3231201171875, 3.635498046875, 3.9478759765625, 4.26025390625, 4.5726318359375, 4.885009765625, 5.1973876953125, 5.509765625, 5.8221435546875, 6.134521484375, 6.4468994140625, 6.75927734375, 7.0716552734375, 7.384033203125, 7.6964111328125, 8.0087890625, 8.3211669921875, 8.633544921875, 8.9459228515625, 9.25830078125, 9.5706787109375, 9.883056640625, 10.1954345703125, 10.5078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 8.0, 9.0, 5.0, 10.0, 16.0, 8.0, 17.0, 12.0, 22.0, 28.0, 23.0, 35.0, 43.0, 39.0, 45.0, 49.0, 46.0, 47.0, 47.0, 55.0, 41.0, 50.0, 50.0, 41.0, 32.0, 29.0, 35.0, 33.0, 20.0, 21.0, 21.0, 16.0, 11.0, 8.0, 7.0, 7.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-23.45985984802246, -22.79401206970215, -22.128162384033203, -21.46231460571289, -20.796466827392578, -20.130619049072266, -19.464771270751953, -18.798921585083008, -18.133073806762695, -17.467226028442383, -16.801376342773438, -16.135528564453125, -15.469680786132812, -14.8038330078125, -14.137984275817871, -13.472135543823242, -12.80628776550293, -12.140439987182617, -11.474591255187988, -10.80874252319336, -10.142894744873047, -9.477046966552734, -8.811198234558105, -8.145349502563477, -7.479501724243164, -6.813653469085693, -6.147805213928223, -5.481956958770752, -4.816108703613281, -4.1502604484558105, -3.48441219329834, -2.818563938140869, -2.1527156829833984, -1.4868674278259277, -0.821019172668457, -0.15517091751098633, 0.5106773376464844, 1.176525592803955, 1.8423738479614258, 2.5082221031188965, 3.174070358276367, 3.839918613433838, 4.505766868591309, 5.171615123748779, 5.83746337890625, 6.503311634063721, 7.169159889221191, 7.835008144378662, 8.500856399536133, 9.166704177856445, 9.832552909851074, 10.498401641845703, 11.164249420166016, 11.830097198486328, 12.495945930480957, 13.161794662475586, 13.827642440795898, 14.493490219116211, 15.15933895111084, 15.825187683105469, 16.49103546142578, 17.156883239746094, 17.822731018066406, 18.48858070373535, 19.154428482055664]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 4.0, 9.0, 5.0, 9.0, 17.0, 12.0, 20.0, 20.0, 30.0, 40.0, 37.0, 36.0, 38.0, 51.0, 38.0, 32.0, 40.0, 42.0, 49.0, 49.0, 33.0, 62.0, 45.0, 33.0, 41.0, 26.0, 25.0, 28.0, 22.0, 19.0, 13.0, 21.0, 9.0, 10.0, 6.0, 4.0, 10.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.593290328979492, -24.69228172302246, -23.791275024414062, -22.89026641845703, -21.9892578125, -21.08824920654297, -20.18724250793457, -19.28623390197754, -18.38522720336914, -17.48421859741211, -16.58321189880371, -15.68220329284668, -14.781194686889648, -13.880187034606934, -12.979179382324219, -12.078170776367188, -11.177162170410156, -10.276154518127441, -9.37514591217041, -8.474138259887695, -7.573130130767822, -6.672122001647949, -5.771114349365234, -4.870106220245361, -3.9690980911254883, -3.0680899620056152, -2.1670820713043213, -1.2660741806030273, -0.3650660514831543, 0.5359420776367188, 1.4369497299194336, 2.3379578590393066, 3.2389678955078125, 4.1399760246276855, 5.040984153747559, 5.941991806030273, 6.8429999351501465, 7.7440080642700195, 8.645015716552734, 9.546024322509766, 10.44703197479248, 11.348039627075195, 12.249048233032227, 13.150055885314941, 14.051063537597656, 14.952072143554688, 15.853079795837402, 16.754087448120117, 17.65509605407715, 18.55610466003418, 19.457111358642578, 20.35811996459961, 21.25912857055664, 22.160137176513672, 23.06114387512207, 23.9621524810791, 24.8631591796875, 25.76416778564453, 26.66517448425293, 27.56618309020996, 28.467191696166992, 29.36819839477539, 30.269207000732422, 31.170215606689453, 32.071224212646484]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 9.0, 16.0, 22.0, 25.0, 59.0, 70.0, 130.0, 184.0, 278.0, 417.0, 671.0, 1053.0, 1689.0, 2523.0, 3876.0, 5907.0, 8887.0, 13473.0, 19563.0, 28018.0, 39095.0, 52085.0, 66612.0, 81226.0, 92006.0, 99127.0, 99529.0, 93539.0, 82777.0, 68322.0, 54309.0, 40699.0, 29505.0, 20749.0, 14285.0, 9567.0, 6284.0, 4250.0, 2632.0, 1796.0, 1192.0, 721.0, 475.0, 303.0, 217.0, 151.0, 87.0, 59.0, 33.0, 27.0, 16.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0], "bins": [-8.171875, -7.9248046875, -7.677734375, -7.4306640625, -7.18359375, -6.9365234375, -6.689453125, -6.4423828125, -6.1953125, -5.9482421875, -5.701171875, -5.4541015625, -5.20703125, -4.9599609375, -4.712890625, -4.4658203125, -4.21875, -3.9716796875, -3.724609375, -3.4775390625, -3.23046875, -2.9833984375, -2.736328125, -2.4892578125, -2.2421875, -1.9951171875, -1.748046875, -1.5009765625, -1.25390625, -1.0068359375, -0.759765625, -0.5126953125, -0.265625, -0.0185546875, 0.228515625, 0.4755859375, 0.72265625, 0.9697265625, 1.216796875, 1.4638671875, 1.7109375, 1.9580078125, 2.205078125, 2.4521484375, 2.69921875, 2.9462890625, 3.193359375, 3.4404296875, 3.6875, 3.9345703125, 4.181640625, 4.4287109375, 4.67578125, 4.9228515625, 5.169921875, 5.4169921875, 5.6640625, 5.9111328125, 6.158203125, 6.4052734375, 6.65234375, 6.8994140625, 7.146484375, 7.3935546875, 7.640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 4.0, 9.0, 4.0, 10.0, 16.0, 13.0, 18.0, 21.0, 30.0, 42.0, 34.0, 35.0, 37.0, 55.0, 36.0, 30.0, 43.0, 41.0, 53.0, 44.0, 35.0, 60.0, 46.0, 35.0, 40.0, 27.0, 24.0, 26.0, 25.0, 17.0, 16.0, 19.0, 10.0, 10.0, 5.0, 6.0, 9.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.90625, -24.9921875, -24.078125, -23.1640625, -22.25, -21.3359375, -20.421875, -19.5078125, -18.59375, -17.6796875, -16.765625, -15.8515625, -14.9375, -14.0234375, -13.109375, -12.1953125, -11.28125, -10.3671875, -9.453125, -8.5390625, -7.625, -6.7109375, -5.796875, -4.8828125, -3.96875, -3.0546875, -2.140625, -1.2265625, -0.3125, 0.6015625, 1.515625, 2.4296875, 3.34375, 4.2578125, 5.171875, 6.0859375, 7.0, 7.9140625, 8.828125, 9.7421875, 10.65625, 11.5703125, 12.484375, 13.3984375, 14.3125, 15.2265625, 16.140625, 17.0546875, 17.96875, 18.8828125, 19.796875, 20.7109375, 21.625, 22.5390625, 23.453125, 24.3671875, 25.28125, 26.1953125, 27.109375, 28.0234375, 28.9375, 29.8515625, 30.765625, 31.6796875, 32.59375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 3.0, 7.0, 12.0, 19.0, 20.0, 30.0, 52.0, 71.0, 97.0, 142.0, 228.0, 292.0, 402.0, 573.0, 835.0, 1122.0, 1531.0, 2067.0, 3116.0, 4426.0, 5986.0, 8415.0, 12103.0, 17641.0, 27328.0, 214430.0, 642474.0, 37031.0, 20643.0, 13822.0, 9690.0, 6926.0, 4996.0, 3457.0, 2493.0, 1812.0, 1271.0, 890.0, 609.0, 454.0, 264.0, 203.0, 174.0, 115.0, 88.0, 58.0, 40.0, 28.0, 29.0, 16.0, 9.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0], "bins": [-17.375, -16.8515625, -16.328125, -15.8046875, -15.28125, -14.7578125, -14.234375, -13.7109375, -13.1875, -12.6640625, -12.140625, -11.6171875, -11.09375, -10.5703125, -10.046875, -9.5234375, -9.0, -8.4765625, -7.953125, -7.4296875, -6.90625, -6.3828125, -5.859375, -5.3359375, -4.8125, -4.2890625, -3.765625, -3.2421875, -2.71875, -2.1953125, -1.671875, -1.1484375, -0.625, -0.1015625, 0.421875, 0.9453125, 1.46875, 1.9921875, 2.515625, 3.0390625, 3.5625, 4.0859375, 4.609375, 5.1328125, 5.65625, 6.1796875, 6.703125, 7.2265625, 7.75, 8.2734375, 8.796875, 9.3203125, 9.84375, 10.3671875, 10.890625, 11.4140625, 11.9375, 12.4609375, 12.984375, 13.5078125, 14.03125, 14.5546875, 15.078125, 15.6015625, 16.125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 12.0, 5.0, 3.0, 7.0, 11.0, 15.0, 14.0, 17.0, 19.0, 22.0, 22.0, 34.0, 32.0, 22.0, 36.0, 40.0, 38.0, 43.0, 29.0, 31.0, 45.0, 27.0, 44.0, 34.0, 33.0, 38.0, 32.0, 26.0, 36.0, 24.0, 22.0, 35.0, 14.0, 15.0, 15.0, 11.0, 16.0, 17.0, 15.0, 9.0, 7.0, 10.0, 5.0, 2.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-18.703125, -18.063720703125, -17.42431640625, -16.784912109375, -16.1455078125, -15.506103515625, -14.86669921875, -14.227294921875, -13.587890625, -12.948486328125, -12.30908203125, -11.669677734375, -11.0302734375, -10.390869140625, -9.75146484375, -9.112060546875, -8.47265625, -7.833251953125, -7.19384765625, -6.554443359375, -5.9150390625, -5.275634765625, -4.63623046875, -3.996826171875, -3.357421875, -2.718017578125, -2.07861328125, -1.439208984375, -0.7998046875, -0.160400390625, 0.47900390625, 1.118408203125, 1.7578125, 2.397216796875, 3.03662109375, 3.676025390625, 4.3154296875, 4.954833984375, 5.59423828125, 6.233642578125, 6.873046875, 7.512451171875, 8.15185546875, 8.791259765625, 9.4306640625, 10.070068359375, 10.70947265625, 11.348876953125, 11.98828125, 12.627685546875, 13.26708984375, 13.906494140625, 14.5458984375, 15.185302734375, 15.82470703125, 16.464111328125, 17.103515625, 17.742919921875, 18.38232421875, 19.021728515625, 19.6611328125, 20.300537109375, 20.93994140625, 21.579345703125, 22.21875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 10.0, 10.0, 12.0, 25.0, 30.0, 40.0, 74.0, 91.0, 128.0, 182.0, 304.0, 496.0, 702.0, 1089.0, 1569.0, 2308.0, 3800.0, 5989.0, 10072.0, 18022.0, 35628.0, 593328.0, 301966.0, 31249.0, 16198.0, 9361.0, 5512.0, 3548.0, 2310.0, 1541.0, 974.0, 674.0, 421.0, 298.0, 192.0, 135.0, 92.0, 64.0, 44.0, 21.0, 14.0, 9.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0], "bins": [-4.7890625, -4.65191650390625, -4.5147705078125, -4.37762451171875, -4.240478515625, -4.10333251953125, -3.9661865234375, -3.82904052734375, -3.69189453125, -3.55474853515625, -3.4176025390625, -3.28045654296875, -3.143310546875, -3.00616455078125, -2.8690185546875, -2.73187255859375, -2.5947265625, -2.45758056640625, -2.3204345703125, -2.18328857421875, -2.046142578125, -1.90899658203125, -1.7718505859375, -1.63470458984375, -1.49755859375, -1.36041259765625, -1.2232666015625, -1.08612060546875, -0.948974609375, -0.81182861328125, -0.6746826171875, -0.53753662109375, -0.400390625, -0.26324462890625, -0.1260986328125, 0.01104736328125, 0.148193359375, 0.28533935546875, 0.4224853515625, 0.55963134765625, 0.69677734375, 0.83392333984375, 0.9710693359375, 1.10821533203125, 1.245361328125, 1.38250732421875, 1.5196533203125, 1.65679931640625, 1.7939453125, 1.93109130859375, 2.0682373046875, 2.20538330078125, 2.342529296875, 2.47967529296875, 2.6168212890625, 2.75396728515625, 2.89111328125, 3.02825927734375, 3.1654052734375, 3.30255126953125, 3.439697265625, 3.57684326171875, 3.7139892578125, 3.85113525390625, 3.98828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 5.0, 6.0, 6.0, 10.0, 7.0, 11.0, 12.0, 24.0, 39.0, 43.0, 40.0, 36.0, 64.0, 37.0, 52.0, 68.0, 74.0, 67.0, 78.0, 51.0, 42.0, 47.0, 43.0, 24.0, 21.0, 14.0, 17.0, 14.0, 7.0, 10.0, 7.0, 1.0, 4.0, 1.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0007719993591308594, -0.0007489696145057678, -0.0007259398698806763, -0.0007029101252555847, -0.0006798803806304932, -0.0006568506360054016, -0.0006338208913803101, -0.0006107911467552185, -0.000587761402130127, -0.0005647316575050354, -0.0005417019128799438, -0.0005186721682548523, -0.0004956424236297607, -0.0004726126790046692, -0.00044958293437957764, -0.0004265531897544861, -0.00040352344512939453, -0.000380493700504303, -0.0003574639558792114, -0.0003344342112541199, -0.0003114044666290283, -0.00028837472200393677, -0.0002653449773788452, -0.00024231523275375366, -0.0002192854881286621, -0.00019625574350357056, -0.000173225998878479, -0.00015019625425338745, -0.0001271665096282959, -0.00010413676500320435, -8.110702037811279e-05, -5.807727575302124e-05, -3.504753112792969e-05, -1.2017786502838135e-05, 1.1011958122253418e-05, 3.404170274734497e-05, 5.7071447372436523e-05, 8.010119199752808e-05, 0.00010313093662261963, 0.00012616068124771118, 0.00014919042587280273, 0.0001722201704978943, 0.00019524991512298584, 0.0002182796597480774, 0.00024130940437316895, 0.0002643391489982605, 0.00028736889362335205, 0.0003103986382484436, 0.00033342838287353516, 0.0003564581274986267, 0.00037948787212371826, 0.0004025176167488098, 0.00042554736137390137, 0.0004485771059989929, 0.00047160685062408447, 0.000494636595249176, 0.0005176663398742676, 0.0005406960844993591, 0.0005637258291244507, 0.0005867555737495422, 0.0006097853183746338, 0.0006328150629997253, 0.0006558448076248169, 0.0006788745522499084, 0.000701904296875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 4.0, 7.0, 9.0, 10.0, 28.0, 37.0, 51.0, 86.0, 107.0, 146.0, 224.0, 343.0, 545.0, 778.0, 1082.0, 1708.0, 2550.0, 3650.0, 5430.0, 8175.0, 12107.0, 18118.0, 26217.0, 38124.0, 54974.0, 75394.0, 97880.0, 115732.0, 122834.0, 115935.0, 96818.0, 75139.0, 54492.0, 38543.0, 26170.0, 17971.0, 12252.0, 8067.0, 5461.0, 3646.0, 2512.0, 1672.0, 1160.0, 754.0, 505.0, 384.0, 252.0, 161.0, 111.0, 62.0, 57.0, 29.0, 25.0, 22.0, 9.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.375, -1.3313446044921875, -1.287689208984375, -1.2440338134765625, -1.20037841796875, -1.1567230224609375, -1.113067626953125, -1.0694122314453125, -1.0257568359375, -0.9821014404296875, -0.938446044921875, -0.8947906494140625, -0.85113525390625, -0.8074798583984375, -0.763824462890625, -0.7201690673828125, -0.676513671875, -0.6328582763671875, -0.589202880859375, -0.5455474853515625, -0.50189208984375, -0.4582366943359375, -0.414581298828125, -0.3709259033203125, -0.3272705078125, -0.2836151123046875, -0.239959716796875, -0.1963043212890625, -0.15264892578125, -0.1089935302734375, -0.065338134765625, -0.0216827392578125, 0.02197265625, 0.0656280517578125, 0.109283447265625, 0.1529388427734375, 0.19659423828125, 0.2402496337890625, 0.283905029296875, 0.3275604248046875, 0.3712158203125, 0.4148712158203125, 0.458526611328125, 0.5021820068359375, 0.54583740234375, 0.5894927978515625, 0.633148193359375, 0.6768035888671875, 0.720458984375, 0.7641143798828125, 0.807769775390625, 0.8514251708984375, 0.89508056640625, 0.9387359619140625, 0.982391357421875, 1.0260467529296875, 1.0697021484375, 1.1133575439453125, 1.157012939453125, 1.2006683349609375, 1.24432373046875, 1.2879791259765625, 1.331634521484375, 1.3752899169921875, 1.4189453125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 5.0, 9.0, 11.0, 18.0, 7.0, 26.0, 16.0, 30.0, 24.0, 39.0, 34.0, 26.0, 24.0, 19.0, 25.0, 28.0, 23.0, 28.0, 21.0, 30.0, 26.0, 19.0, 25.0, 29.0, 31.0, 21.0, 27.0, 31.0, 26.0, 37.0, 32.0, 26.0, 42.0, 32.0, 26.0, 19.0, 23.0, 19.0, 20.0, 12.0, 15.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.79833984375, -0.7733688354492188, -0.7483978271484375, -0.7234268188476562, -0.698455810546875, -0.6734848022460938, -0.6485137939453125, -0.6235427856445312, -0.59857177734375, -0.5736007690429688, -0.5486297607421875, -0.5236587524414062, -0.498687744140625, -0.47371673583984375, -0.4487457275390625, -0.42377471923828125, -0.3988037109375, -0.37383270263671875, -0.3488616943359375, -0.32389068603515625, -0.298919677734375, -0.27394866943359375, -0.2489776611328125, -0.22400665283203125, -0.19903564453125, -0.17406463623046875, -0.1490936279296875, -0.12412261962890625, -0.099151611328125, -0.07418060302734375, -0.0492095947265625, -0.02423858642578125, 0.000732421875, 0.02570343017578125, 0.0506744384765625, 0.07564544677734375, 0.100616455078125, 0.12558746337890625, 0.1505584716796875, 0.17552947998046875, 0.20050048828125, 0.22547149658203125, 0.2504425048828125, 0.27541351318359375, 0.300384521484375, 0.32535552978515625, 0.3503265380859375, 0.37529754638671875, 0.4002685546875, 0.42523956298828125, 0.4502105712890625, 0.47518157958984375, 0.500152587890625, 0.5251235961914062, 0.5500946044921875, 0.5750656127929688, 0.60003662109375, 0.6250076293945312, 0.6499786376953125, 0.6749496459960938, 0.699920654296875, 0.7248916625976562, 0.7498626708984375, 0.7748336791992188, 0.7998046875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 3.0, 5.0, 9.0, 10.0, 10.0, 16.0, 8.0, 13.0, 25.0, 22.0, 30.0, 26.0, 37.0, 44.0, 46.0, 41.0, 51.0, 44.0, 62.0, 41.0, 51.0, 45.0, 51.0, 47.0, 34.0, 37.0, 26.0, 32.0, 24.0, 25.0, 17.0, 17.0, 14.0, 6.0, 7.0, 6.0, 5.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0], "bins": [-27.527786254882812, -26.825218200683594, -26.122648239135742, -25.42007827758789, -24.717510223388672, -24.014942169189453, -23.3123722076416, -22.60980224609375, -21.90723419189453, -21.204666137695312, -20.50209617614746, -19.79952621459961, -19.09695816040039, -18.394390106201172, -17.69182014465332, -16.98925018310547, -16.28668212890625, -15.584113121032715, -14.88154411315918, -14.178975105285645, -13.47640609741211, -12.773837089538574, -12.071268081665039, -11.368699073791504, -10.666130065917969, -9.963561058044434, -9.260992050170898, -8.558423042297363, -7.855854034423828, -7.153285026550293, -6.450716018676758, -5.748147010803223, -5.04557991027832, -4.343010902404785, -3.64044189453125, -2.937872886657715, -2.2353038787841797, -1.5327348709106445, -0.8301658630371094, -0.12759685516357422, 0.5749721527099609, 1.277541160583496, 1.9801101684570312, 2.6826791763305664, 3.3852481842041016, 4.087817192077637, 4.790386199951172, 5.492955207824707, 6.195524215698242, 6.898093223571777, 7.6006622314453125, 8.303231239318848, 9.005800247192383, 9.708369255065918, 10.410938262939453, 11.113507270812988, 11.816076278686523, 12.518645286560059, 13.221214294433594, 13.923783302307129, 14.626352310180664, 15.3289213180542, 16.031490325927734, 16.734058380126953, 17.436628341674805]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 6.0, 3.0, 7.0, 6.0, 15.0, 13.0, 19.0, 32.0, 29.0, 41.0, 39.0, 38.0, 34.0, 41.0, 43.0, 35.0, 53.0, 34.0, 54.0, 48.0, 41.0, 46.0, 50.0, 37.0, 40.0, 35.0, 18.0, 32.0, 18.0, 18.0, 15.0, 7.0, 15.0, 10.0, 6.0, 6.0, 3.0, 1.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.0915584564209, -27.12256622314453, -26.153575897216797, -25.184585571289062, -24.215593338012695, -23.246601104736328, -22.277610778808594, -21.30862045288086, -20.339628219604492, -19.370635986328125, -18.40164566040039, -17.432655334472656, -16.46366310119629, -15.494671821594238, -14.525680541992188, -13.556689262390137, -12.587697982788086, -11.618706703186035, -10.649715423583984, -9.680724143981934, -8.711732864379883, -7.742741584777832, -6.773750305175781, -5.8047590255737305, -4.83576774597168, -3.866776466369629, -2.897785186767578, -1.9287939071655273, -0.9598026275634766, 0.009188652038574219, 0.978179931640625, 1.9471712112426758, 2.9161643981933594, 3.88515567779541, 4.854146957397461, 5.823138236999512, 6.7921295166015625, 7.761120796203613, 8.730112075805664, 9.699103355407715, 10.668094635009766, 11.637085914611816, 12.606077194213867, 13.575068473815918, 14.544059753417969, 15.51305103302002, 16.48204231262207, 17.451034545898438, 18.420024871826172, 19.389015197753906, 20.358007431030273, 21.32699966430664, 22.295989990234375, 23.26498031616211, 24.233972549438477, 25.202964782714844, 26.171955108642578, 27.140945434570312, 28.10993766784668, 29.078929901123047, 30.04792022705078, 31.016910552978516, 31.985902786254883, 32.95489501953125, 33.923885345458984]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 13.0, 12.0, 6.0, 20.0, 28.0, 40.0, 42.0, 95.0, 153.0, 238.0, 427.0, 781.0, 1340.0, 2421.0, 4484.0, 8282.0, 15231.0, 27957.0, 48573.0, 79314.0, 116299.0, 149023.0, 161388.0, 145534.0, 111043.0, 74357.0, 44963.0, 25843.0, 13784.0, 7623.0, 4050.0, 2195.0, 1220.0, 677.0, 430.0, 228.0, 149.0, 102.0, 60.0, 46.0, 23.0, 15.0, 16.0, 8.0, 6.0, 4.0, 3.0, 5.0, 4.0, 0.0, 1.0], "bins": [-26.5625, -25.812744140625, -25.06298828125, -24.313232421875, -23.5634765625, -22.813720703125, -22.06396484375, -21.314208984375, -20.564453125, -19.814697265625, -19.06494140625, -18.315185546875, -17.5654296875, -16.815673828125, -16.06591796875, -15.316162109375, -14.56640625, -13.816650390625, -13.06689453125, -12.317138671875, -11.5673828125, -10.817626953125, -10.06787109375, -9.318115234375, -8.568359375, -7.818603515625, -7.06884765625, -6.319091796875, -5.5693359375, -4.819580078125, -4.06982421875, -3.320068359375, -2.5703125, -1.820556640625, -1.07080078125, -0.321044921875, 0.4287109375, 1.178466796875, 1.92822265625, 2.677978515625, 3.427734375, 4.177490234375, 4.92724609375, 5.677001953125, 6.4267578125, 7.176513671875, 7.92626953125, 8.676025390625, 9.42578125, 10.175537109375, 10.92529296875, 11.675048828125, 12.4248046875, 13.174560546875, 13.92431640625, 14.674072265625, 15.423828125, 16.173583984375, 16.92333984375, 17.673095703125, 18.4228515625, 19.172607421875, 19.92236328125, 20.672119140625, 21.421875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 3.0, 6.0, 9.0, 12.0, 14.0, 20.0, 28.0, 32.0, 41.0, 32.0, 43.0, 33.0, 42.0, 42.0, 35.0, 45.0, 46.0, 52.0, 43.0, 52.0, 40.0, 51.0, 35.0, 37.0, 38.0, 22.0, 30.0, 16.0, 20.0, 13.0, 10.0, 13.0, 12.0, 3.0, 8.0, 3.0, 1.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.640625, -25.723876953125, -24.80712890625, -23.890380859375, -22.9736328125, -22.056884765625, -21.14013671875, -20.223388671875, -19.306640625, -18.389892578125, -17.47314453125, -16.556396484375, -15.6396484375, -14.722900390625, -13.80615234375, -12.889404296875, -11.97265625, -11.055908203125, -10.13916015625, -9.222412109375, -8.3056640625, -7.388916015625, -6.47216796875, -5.555419921875, -4.638671875, -3.721923828125, -2.80517578125, -1.888427734375, -0.9716796875, -0.054931640625, 0.86181640625, 1.778564453125, 2.6953125, 3.612060546875, 4.52880859375, 5.445556640625, 6.3623046875, 7.279052734375, 8.19580078125, 9.112548828125, 10.029296875, 10.946044921875, 11.86279296875, 12.779541015625, 13.6962890625, 14.613037109375, 15.52978515625, 16.446533203125, 17.36328125, 18.280029296875, 19.19677734375, 20.113525390625, 21.0302734375, 21.947021484375, 22.86376953125, 23.780517578125, 24.697265625, 25.614013671875, 26.53076171875, 27.447509765625, 28.3642578125, 29.281005859375, 30.19775390625, 31.114501953125, 32.03125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 8.0, 15.0, 21.0, 35.0, 44.0, 74.0, 121.0, 171.0, 246.0, 396.0, 608.0, 1021.0, 1537.0, 2509.0, 3789.0, 6230.0, 9876.0, 16058.0, 25769.0, 40446.0, 60244.0, 86267.0, 112805.0, 131600.0, 133498.0, 120552.0, 96380.0, 69998.0, 46853.0, 30260.0, 19318.0, 11787.0, 7364.0, 4662.0, 2866.0, 1879.0, 1135.0, 708.0, 476.0, 336.0, 216.0, 127.0, 86.0, 57.0, 33.0, 30.0, 18.0, 9.0, 5.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.890625, -20.220703125, -19.55078125, -18.880859375, -18.2109375, -17.541015625, -16.87109375, -16.201171875, -15.53125, -14.861328125, -14.19140625, -13.521484375, -12.8515625, -12.181640625, -11.51171875, -10.841796875, -10.171875, -9.501953125, -8.83203125, -8.162109375, -7.4921875, -6.822265625, -6.15234375, -5.482421875, -4.8125, -4.142578125, -3.47265625, -2.802734375, -2.1328125, -1.462890625, -0.79296875, -0.123046875, 0.546875, 1.216796875, 1.88671875, 2.556640625, 3.2265625, 3.896484375, 4.56640625, 5.236328125, 5.90625, 6.576171875, 7.24609375, 7.916015625, 8.5859375, 9.255859375, 9.92578125, 10.595703125, 11.265625, 11.935546875, 12.60546875, 13.275390625, 13.9453125, 14.615234375, 15.28515625, 15.955078125, 16.625, 17.294921875, 17.96484375, 18.634765625, 19.3046875, 19.974609375, 20.64453125, 21.314453125, 21.984375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 1.0, 6.0, 8.0, 6.0, 10.0, 10.0, 15.0, 10.0, 17.0, 21.0, 17.0, 17.0, 32.0, 28.0, 27.0, 33.0, 33.0, 39.0, 45.0, 28.0, 32.0, 47.0, 40.0, 29.0, 43.0, 36.0, 31.0, 25.0, 30.0, 27.0, 34.0, 40.0, 23.0, 20.0, 14.0, 16.0, 14.0, 16.0, 19.0, 11.0, 14.0, 3.0, 6.0, 5.0, 8.0, 6.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-16.78125, -16.25439453125, -15.7275390625, -15.20068359375, -14.673828125, -14.14697265625, -13.6201171875, -13.09326171875, -12.56640625, -12.03955078125, -11.5126953125, -10.98583984375, -10.458984375, -9.93212890625, -9.4052734375, -8.87841796875, -8.3515625, -7.82470703125, -7.2978515625, -6.77099609375, -6.244140625, -5.71728515625, -5.1904296875, -4.66357421875, -4.13671875, -3.60986328125, -3.0830078125, -2.55615234375, -2.029296875, -1.50244140625, -0.9755859375, -0.44873046875, 0.078125, 0.60498046875, 1.1318359375, 1.65869140625, 2.185546875, 2.71240234375, 3.2392578125, 3.76611328125, 4.29296875, 4.81982421875, 5.3466796875, 5.87353515625, 6.400390625, 6.92724609375, 7.4541015625, 7.98095703125, 8.5078125, 9.03466796875, 9.5615234375, 10.08837890625, 10.615234375, 11.14208984375, 11.6689453125, 12.19580078125, 12.72265625, 13.24951171875, 13.7763671875, 14.30322265625, 14.830078125, 15.35693359375, 15.8837890625, 16.41064453125, 16.9375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 6.0, 7.0, 3.0, 13.0, 19.0, 15.0, 28.0, 36.0, 54.0, 74.0, 120.0, 159.0, 239.0, 349.0, 558.0, 994.0, 1815.0, 3290.0, 6313.0, 12199.0, 25187.0, 54684.0, 114892.0, 202961.0, 245776.0, 185565.0, 100784.0, 47223.0, 22031.0, 10641.0, 5391.0, 2998.0, 1582.0, 985.0, 553.0, 316.0, 226.0, 139.0, 87.0, 69.0, 48.0, 33.0, 28.0, 24.0, 11.0, 4.0, 7.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 4.0], "bins": [-14.3984375, -13.9674072265625, -13.536376953125, -13.1053466796875, -12.67431640625, -12.2432861328125, -11.812255859375, -11.3812255859375, -10.9501953125, -10.5191650390625, -10.088134765625, -9.6571044921875, -9.22607421875, -8.7950439453125, -8.364013671875, -7.9329833984375, -7.501953125, -7.0709228515625, -6.639892578125, -6.2088623046875, -5.77783203125, -5.3468017578125, -4.915771484375, -4.4847412109375, -4.0537109375, -3.6226806640625, -3.191650390625, -2.7606201171875, -2.32958984375, -1.8985595703125, -1.467529296875, -1.0364990234375, -0.60546875, -0.1744384765625, 0.256591796875, 0.6876220703125, 1.11865234375, 1.5496826171875, 1.980712890625, 2.4117431640625, 2.8427734375, 3.2738037109375, 3.704833984375, 4.1358642578125, 4.56689453125, 4.9979248046875, 5.428955078125, 5.8599853515625, 6.291015625, 6.7220458984375, 7.153076171875, 7.5841064453125, 8.01513671875, 8.4461669921875, 8.877197265625, 9.3082275390625, 9.7392578125, 10.1702880859375, 10.601318359375, 11.0323486328125, 11.46337890625, 11.8944091796875, 12.325439453125, 12.7564697265625, 13.1875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 2.0, 2.0, 3.0, 5.0, 10.0, 7.0, 15.0, 17.0, 16.0, 21.0, 27.0, 26.0, 40.0, 40.0, 57.0, 62.0, 53.0, 56.0, 45.0, 60.0, 57.0, 47.0, 46.0, 44.0, 34.0, 31.0, 40.0, 30.0, 23.0, 24.0, 17.0, 12.0, 6.0, 6.0, 4.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0010356903076171875, -0.0010070279240608215, -0.0009783655405044556, -0.0009497031569480896, -0.0009210407733917236, -0.0008923783898353577, -0.0008637160062789917, -0.0008350536227226257, -0.0008063912391662598, -0.0007777288556098938, -0.0007490664720535278, -0.0007204040884971619, -0.0006917417049407959, -0.0006630793213844299, -0.000634416937828064, -0.000605754554271698, -0.000577092170715332, -0.0005484297871589661, -0.0005197674036026001, -0.0004911050200462341, -0.00046244263648986816, -0.0004337802529335022, -0.00040511786937713623, -0.00037645548582077026, -0.0003477931022644043, -0.00031913071870803833, -0.00029046833515167236, -0.0002618059515953064, -0.00023314356803894043, -0.00020448118448257446, -0.0001758188009262085, -0.00014715641736984253, -0.00011849403381347656, -8.98316502571106e-05, -6.116926670074463e-05, -3.250688314437866e-05, -3.844499588012695e-06, 2.481788396835327e-05, 5.348026752471924e-05, 8.21426510810852e-05, 0.00011080503463745117, 0.00013946741819381714, 0.0001681298017501831, 0.00019679218530654907, 0.00022545456886291504, 0.000254116952419281, 0.00028277933597564697, 0.00031144171953201294, 0.0003401041030883789, 0.0003687664866447449, 0.00039742887020111084, 0.0004260912537574768, 0.0004547536373138428, 0.00048341602087020874, 0.0005120784044265747, 0.0005407407879829407, 0.0005694031715393066, 0.0005980655550956726, 0.0006267279386520386, 0.0006553903222084045, 0.0006840527057647705, 0.0007127150893211365, 0.0007413774728775024, 0.0007700398564338684, 0.0007987022399902344]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 8.0, 18.0, 10.0, 11.0, 28.0, 38.0, 53.0, 59.0, 113.0, 173.0, 248.0, 376.0, 544.0, 821.0, 1211.0, 1889.0, 2848.0, 4745.0, 7955.0, 13461.0, 22925.0, 38663.0, 64219.0, 100147.0, 139252.0, 162188.0, 154827.0, 121820.0, 82796.0, 51194.0, 30398.0, 18027.0, 10453.0, 6266.0, 3868.0, 2305.0, 1503.0, 955.0, 720.0, 439.0, 304.0, 204.0, 147.0, 113.0, 72.0, 34.0, 36.0, 19.0, 18.0, 17.0, 5.0, 2.0, 4.0, 4.0, 3.0, 4.0, 0.0, 1.0], "bins": [-9.1953125, -8.9058837890625, -8.616455078125, -8.3270263671875, -8.03759765625, -7.7481689453125, -7.458740234375, -7.1693115234375, -6.8798828125, -6.5904541015625, -6.301025390625, -6.0115966796875, -5.72216796875, -5.4327392578125, -5.143310546875, -4.8538818359375, -4.564453125, -4.2750244140625, -3.985595703125, -3.6961669921875, -3.40673828125, -3.1173095703125, -2.827880859375, -2.5384521484375, -2.2490234375, -1.9595947265625, -1.670166015625, -1.3807373046875, -1.09130859375, -0.8018798828125, -0.512451171875, -0.2230224609375, 0.06640625, 0.3558349609375, 0.645263671875, 0.9346923828125, 1.22412109375, 1.5135498046875, 1.802978515625, 2.0924072265625, 2.3818359375, 2.6712646484375, 2.960693359375, 3.2501220703125, 3.53955078125, 3.8289794921875, 4.118408203125, 4.4078369140625, 4.697265625, 4.9866943359375, 5.276123046875, 5.5655517578125, 5.85498046875, 6.1444091796875, 6.433837890625, 6.7232666015625, 7.0126953125, 7.3021240234375, 7.591552734375, 7.8809814453125, 8.17041015625, 8.4598388671875, 8.749267578125, 9.0386962890625, 9.328125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 7.0, 5.0, 4.0, 8.0, 14.0, 7.0, 22.0, 23.0, 26.0, 32.0, 20.0, 33.0, 41.0, 44.0, 59.0, 41.0, 55.0, 56.0, 74.0, 49.0, 54.0, 50.0, 36.0, 52.0, 29.0, 31.0, 20.0, 24.0, 17.0, 11.0, 9.0, 11.0, 8.0, 5.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.73828125, -4.58880615234375, -4.4393310546875, -4.28985595703125, -4.140380859375, -3.99090576171875, -3.8414306640625, -3.69195556640625, -3.54248046875, -3.39300537109375, -3.2435302734375, -3.09405517578125, -2.944580078125, -2.79510498046875, -2.6456298828125, -2.49615478515625, -2.3466796875, -2.19720458984375, -2.0477294921875, -1.89825439453125, -1.748779296875, -1.59930419921875, -1.4498291015625, -1.30035400390625, -1.15087890625, -1.00140380859375, -0.8519287109375, -0.70245361328125, -0.552978515625, -0.40350341796875, -0.2540283203125, -0.10455322265625, 0.044921875, 0.19439697265625, 0.3438720703125, 0.49334716796875, 0.642822265625, 0.79229736328125, 0.9417724609375, 1.09124755859375, 1.24072265625, 1.39019775390625, 1.5396728515625, 1.68914794921875, 1.838623046875, 1.98809814453125, 2.1375732421875, 2.28704833984375, 2.4365234375, 2.58599853515625, 2.7354736328125, 2.88494873046875, 3.034423828125, 3.18389892578125, 3.3333740234375, 3.48284912109375, 3.63232421875, 3.78179931640625, 3.9312744140625, 4.08074951171875, 4.230224609375, 4.37969970703125, 4.5291748046875, 4.67864990234375, 4.828125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 10.0, 5.0, 5.0, 17.0, 12.0, 16.0, 13.0, 28.0, 18.0, 38.0, 40.0, 41.0, 45.0, 37.0, 57.0, 52.0, 57.0, 69.0, 50.0, 42.0, 46.0, 48.0, 48.0, 42.0, 29.0, 31.0, 22.0, 19.0, 22.0, 9.0, 5.0, 3.0, 8.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.964576721191406, -27.2130126953125, -26.461448669433594, -25.709882736206055, -24.95831871032715, -24.206754684448242, -23.455190658569336, -22.703624725341797, -21.95206069946289, -21.200496673583984, -20.448932647705078, -19.69736671447754, -18.945802688598633, -18.194238662719727, -17.44267463684082, -16.69110870361328, -15.939545631408691, -15.187981605529785, -14.436416625976562, -13.684852600097656, -12.933287620544434, -12.181723594665527, -11.430158615112305, -10.678594589233398, -9.927030563354492, -9.175466537475586, -8.423901557922363, -7.672337532043457, -6.920772552490234, -6.169208526611328, -5.417644023895264, -4.666079521179199, -3.9145145416259766, -3.162950038909912, -2.4113855361938477, -1.6598212718963623, -0.9082567691802979, -0.1566922664642334, 0.594871997833252, 1.3464365005493164, 2.098001003265381, 2.8495655059814453, 3.6011300086975098, 4.352694511413574, 5.1042585372924805, 5.855823516845703, 6.607387542724609, 7.358952045440674, 8.110516548156738, 8.862080574035645, 9.613645553588867, 10.365209579467773, 11.116774559020996, 11.868338584899902, 12.619903564453125, 13.371467590332031, 14.123031616210938, 14.874595642089844, 15.626160621643066, 16.37772560119629, 17.129289627075195, 17.8808536529541, 18.632417678833008, 19.383983612060547, 20.135547637939453]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 3.0, 11.0, 10.0, 6.0, 7.0, 15.0, 21.0, 19.0, 19.0, 25.0, 24.0, 32.0, 40.0, 40.0, 35.0, 37.0, 45.0, 48.0, 49.0, 48.0, 48.0, 44.0, 46.0, 51.0, 44.0, 33.0, 22.0, 30.0, 18.0, 17.0, 19.0, 18.0, 14.0, 16.0, 7.0, 11.0, 7.0, 3.0, 3.0, 6.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.197891235351562, -26.273113250732422, -25.34833526611328, -24.42355728149414, -23.498779296875, -22.57400131225586, -21.64922523498535, -20.72444725036621, -19.79966926574707, -18.87489128112793, -17.95011329650879, -17.02533531188965, -16.10055923461914, -15.175780296325684, -14.25100326538086, -13.326225280761719, -12.401447296142578, -11.476669311523438, -10.551891326904297, -9.627114295959473, -8.702336311340332, -7.777558326721191, -6.852780818939209, -5.928003311157227, -5.003225326538086, -4.078447341918945, -3.153669834136963, -2.2288920879364014, -1.3041143417358398, -0.3793363571166992, 0.5454411506652832, 1.4702186584472656, 2.3949947357177734, 3.319772481918335, 4.2445502281188965, 5.169327735900879, 6.0941057205200195, 7.01888370513916, 7.943661212921143, 8.868438720703125, 9.793216705322266, 10.717994689941406, 11.642772674560547, 12.567549705505371, 13.492327690124512, 14.417105674743652, 15.341882705688477, 16.266660690307617, 17.191438674926758, 18.1162166595459, 19.04099464416504, 19.96577262878418, 20.890548706054688, 21.815326690673828, 22.74010467529297, 23.66488265991211, 24.58966064453125, 25.51443862915039, 26.43921661376953, 27.363994598388672, 28.288772583007812, 29.213550567626953, 30.13832664489746, 31.0631046295166, 31.987882614135742]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 4.0, 6.0, 8.0, 20.0, 16.0, 33.0, 78.0, 104.0, 153.0, 289.0, 461.0, 769.0, 1314.0, 2212.0, 3497.0, 5735.0, 9713.0, 15316.0, 25636.0, 41193.0, 64613.0, 98575.0, 147954.0, 211014.0, 287024.0, 364506.0, 428616.0, 462314.0, 455178.0, 410418.0, 340272.0, 261072.0, 188871.0, 130833.0, 86482.0, 56009.0, 35452.0, 22213.0, 14090.0, 8273.0, 5309.0, 3323.0, 2043.0, 1235.0, 784.0, 450.0, 312.0, 200.0, 109.0, 71.0, 47.0, 27.0, 23.0, 11.0, 11.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.171875, -12.744873046875, -12.31787109375, -11.890869140625, -11.4638671875, -11.036865234375, -10.60986328125, -10.182861328125, -9.755859375, -9.328857421875, -8.90185546875, -8.474853515625, -8.0478515625, -7.620849609375, -7.19384765625, -6.766845703125, -6.33984375, -5.912841796875, -5.48583984375, -5.058837890625, -4.6318359375, -4.204833984375, -3.77783203125, -3.350830078125, -2.923828125, -2.496826171875, -2.06982421875, -1.642822265625, -1.2158203125, -0.788818359375, -0.36181640625, 0.065185546875, 0.4921875, 0.919189453125, 1.34619140625, 1.773193359375, 2.2001953125, 2.627197265625, 3.05419921875, 3.481201171875, 3.908203125, 4.335205078125, 4.76220703125, 5.189208984375, 5.6162109375, 6.043212890625, 6.47021484375, 6.897216796875, 7.32421875, 7.751220703125, 8.17822265625, 8.605224609375, 9.0322265625, 9.459228515625, 9.88623046875, 10.313232421875, 10.740234375, 11.167236328125, 11.59423828125, 12.021240234375, 12.4482421875, 12.875244140625, 13.30224609375, 13.729248046875, 14.15625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 12.0, 8.0, 4.0, 12.0, 18.0, 20.0, 21.0, 21.0, 26.0, 25.0, 34.0, 41.0, 35.0, 40.0, 42.0, 44.0, 48.0, 45.0, 48.0, 49.0, 41.0, 47.0, 49.0, 38.0, 38.0, 25.0, 26.0, 13.0, 25.0, 16.0, 14.0, 17.0, 10.0, 9.0, 7.0, 7.0, 4.0, 4.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.265625, -23.453369140625, -22.64111328125, -21.828857421875, -21.0166015625, -20.204345703125, -19.39208984375, -18.579833984375, -17.767578125, -16.955322265625, -16.14306640625, -15.330810546875, -14.5185546875, -13.706298828125, -12.89404296875, -12.081787109375, -11.26953125, -10.457275390625, -9.64501953125, -8.832763671875, -8.0205078125, -7.208251953125, -6.39599609375, -5.583740234375, -4.771484375, -3.959228515625, -3.14697265625, -2.334716796875, -1.5224609375, -0.710205078125, 0.10205078125, 0.914306640625, 1.7265625, 2.538818359375, 3.35107421875, 4.163330078125, 4.9755859375, 5.787841796875, 6.60009765625, 7.412353515625, 8.224609375, 9.036865234375, 9.84912109375, 10.661376953125, 11.4736328125, 12.285888671875, 13.09814453125, 13.910400390625, 14.72265625, 15.534912109375, 16.34716796875, 17.159423828125, 17.9716796875, 18.783935546875, 19.59619140625, 20.408447265625, 21.220703125, 22.032958984375, 22.84521484375, 23.657470703125, 24.4697265625, 25.281982421875, 26.09423828125, 26.906494140625, 27.71875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 10.0, 6.0, 14.0, 25.0, 35.0, 69.0, 98.0, 134.0, 217.0, 369.0, 641.0, 1018.0, 1449.0, 2430.0, 3982.0, 6563.0, 10256.0, 16620.0, 25982.0, 39804.0, 60494.0, 90852.0, 130579.0, 181396.0, 240206.0, 302906.0, 360854.0, 401504.0, 417232.0, 402657.0, 362655.0, 306746.0, 242677.0, 184172.0, 133235.0, 92492.0, 61896.0, 40663.0, 26958.0, 16570.0, 10569.0, 6553.0, 4112.0, 2497.0, 1564.0, 970.0, 581.0, 378.0, 228.0, 144.0, 95.0, 51.0, 37.0, 20.0, 13.0, 8.0, 6.0, 2.0, 2.0], "bins": [-14.8671875, -14.4237060546875, -13.980224609375, -13.5367431640625, -13.09326171875, -12.6497802734375, -12.206298828125, -11.7628173828125, -11.3193359375, -10.8758544921875, -10.432373046875, -9.9888916015625, -9.54541015625, -9.1019287109375, -8.658447265625, -8.2149658203125, -7.771484375, -7.3280029296875, -6.884521484375, -6.4410400390625, -5.99755859375, -5.5540771484375, -5.110595703125, -4.6671142578125, -4.2236328125, -3.7801513671875, -3.336669921875, -2.8931884765625, -2.44970703125, -2.0062255859375, -1.562744140625, -1.1192626953125, -0.67578125, -0.2322998046875, 0.211181640625, 0.6546630859375, 1.09814453125, 1.5416259765625, 1.985107421875, 2.4285888671875, 2.8720703125, 3.3155517578125, 3.759033203125, 4.2025146484375, 4.64599609375, 5.0894775390625, 5.532958984375, 5.9764404296875, 6.419921875, 6.8634033203125, 7.306884765625, 7.7503662109375, 8.19384765625, 8.6373291015625, 9.080810546875, 9.5242919921875, 9.9677734375, 10.4112548828125, 10.854736328125, 11.2982177734375, 11.74169921875, 12.1851806640625, 12.628662109375, 13.0721435546875, 13.515625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 7.0, 4.0, 20.0, 13.0, 29.0, 30.0, 46.0, 54.0, 59.0, 70.0, 102.0, 100.0, 140.0, 155.0, 143.0, 201.0, 201.0, 219.0, 224.0, 201.0, 233.0, 234.0, 226.0, 217.0, 181.0, 158.0, 147.0, 124.0, 105.0, 85.0, 76.0, 56.0, 43.0, 46.0, 41.0, 21.0, 12.0, 13.0, 8.0, 7.0, 9.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-11.40625, -11.0714111328125, -10.736572265625, -10.4017333984375, -10.06689453125, -9.7320556640625, -9.397216796875, -9.0623779296875, -8.7275390625, -8.3927001953125, -8.057861328125, -7.7230224609375, -7.38818359375, -7.0533447265625, -6.718505859375, -6.3836669921875, -6.048828125, -5.7139892578125, -5.379150390625, -5.0443115234375, -4.70947265625, -4.3746337890625, -4.039794921875, -3.7049560546875, -3.3701171875, -3.0352783203125, -2.700439453125, -2.3656005859375, -2.03076171875, -1.6959228515625, -1.361083984375, -1.0262451171875, -0.69140625, -0.3565673828125, -0.021728515625, 0.3131103515625, 0.64794921875, 0.9827880859375, 1.317626953125, 1.6524658203125, 1.9873046875, 2.3221435546875, 2.656982421875, 2.9918212890625, 3.32666015625, 3.6614990234375, 3.996337890625, 4.3311767578125, 4.666015625, 5.0008544921875, 5.335693359375, 5.6705322265625, 6.00537109375, 6.3402099609375, 6.675048828125, 7.0098876953125, 7.3447265625, 7.6795654296875, 8.014404296875, 8.3492431640625, 8.68408203125, 9.0189208984375, 9.353759765625, 9.6885986328125, 10.0234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0, 4.0, 9.0, 12.0, 11.0, 16.0, 29.0, 17.0, 30.0, 33.0, 25.0, 35.0, 30.0, 37.0, 42.0, 49.0, 47.0, 62.0, 37.0, 56.0, 40.0, 48.0, 43.0, 45.0, 41.0, 33.0, 39.0, 30.0, 15.0, 18.0, 13.0, 14.0, 14.0, 6.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.998960494995117, -23.297821044921875, -22.5966796875, -21.895540237426758, -21.194398880004883, -20.49325942993164, -19.792118072509766, -19.090978622436523, -18.38983917236328, -17.68869972229004, -16.987558364868164, -16.286418914794922, -15.585277557373047, -14.884138107299805, -14.182997703552246, -13.481857299804688, -12.780715942382812, -12.079575538635254, -11.378435134887695, -10.677295684814453, -9.976154327392578, -9.275014877319336, -8.573874473571777, -7.872734069824219, -7.17159366607666, -6.470453262329102, -5.769312858581543, -5.068172931671143, -4.367032527923584, -3.6658921241760254, -2.964752197265625, -2.2636117935180664, -1.5624713897705078, -0.8613311052322388, -0.16019082069396973, 0.5409493446350098, 1.2420897483825684, 1.943230152130127, 2.6443700790405273, 3.345510482788086, 4.0466508865356445, 4.747791290283203, 5.448931694030762, 6.150071620941162, 6.851212024688721, 7.552352428436279, 8.25349235534668, 8.954632759094238, 9.655773162841797, 10.356913566589355, 11.058053970336914, 11.759193420410156, 12.460334777832031, 13.161474227905273, 13.862614631652832, 14.56375503540039, 15.26489543914795, 15.966035842895508, 16.66717529296875, 17.368316650390625, 18.069456100463867, 18.770597457885742, 19.471736907958984, 20.17287826538086, 20.8740177154541]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 4.0, 5.0, 7.0, 9.0, 8.0, 14.0, 10.0, 12.0, 24.0, 17.0, 16.0, 25.0, 31.0, 26.0, 37.0, 33.0, 43.0, 45.0, 37.0, 58.0, 43.0, 51.0, 41.0, 34.0, 43.0, 33.0, 40.0, 26.0, 36.0, 23.0, 30.0, 18.0, 15.0, 20.0, 20.0, 17.0, 9.0, 12.0, 8.0, 3.0, 3.0, 7.0, 2.0, 3.0, 0.0, 3.0, 3.0, 4.0, 1.0, 2.0], "bins": [-29.012317657470703, -28.184974670410156, -27.35763168334961, -26.530288696289062, -25.70294761657715, -24.8756046295166, -24.048261642456055, -23.220918655395508, -22.39357566833496, -21.566232681274414, -20.738889694213867, -19.911548614501953, -19.084205627441406, -18.25686264038086, -17.429519653320312, -16.602176666259766, -15.774834632873535, -14.947491645812988, -14.120149612426758, -13.292806625366211, -12.465463638305664, -11.638120651245117, -10.810778617858887, -9.98343563079834, -9.15609359741211, -8.328750610351562, -7.501408100128174, -6.674065589904785, -5.846722602844238, -5.01938009262085, -4.192037582397461, -3.364694595336914, -2.537351608276367, -1.7100088596343994, -0.8826662302017212, -0.05532360076904297, 0.7720191478729248, 1.5993618965148926, 2.4267044067382812, 3.254047393798828, 4.081389904022217, 4.9087324142456055, 5.736075401306152, 6.563417911529541, 7.39076042175293, 8.218103408813477, 9.045446395874023, 9.87278938293457, 10.7001314163208, 11.527474403381348, 12.354816436767578, 13.182159423828125, 14.009502410888672, 14.836845397949219, 15.66418743133545, 16.491531372070312, 17.318872451782227, 18.146215438842773, 18.97355842590332, 19.800899505615234, 20.62824249267578, 21.455585479736328, 22.282928466796875, 23.110271453857422, 23.93761444091797]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 1.0, 3.0, 9.0, 9.0, 16.0, 17.0, 32.0, 50.0, 79.0, 134.0, 229.0, 344.0, 674.0, 1030.0, 1798.0, 3269.0, 5863.0, 10189.0, 17497.0, 29294.0, 47614.0, 73042.0, 101869.0, 128530.0, 142769.0, 137163.0, 114767.0, 85103.0, 57784.0, 36912.0, 21891.0, 13127.0, 7597.0, 4151.0, 2411.0, 1369.0, 786.0, 440.0, 273.0, 158.0, 94.0, 74.0, 30.0, 23.0, 15.0, 18.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.484375, -8.18896484375, -7.8935546875, -7.59814453125, -7.302734375, -7.00732421875, -6.7119140625, -6.41650390625, -6.12109375, -5.82568359375, -5.5302734375, -5.23486328125, -4.939453125, -4.64404296875, -4.3486328125, -4.05322265625, -3.7578125, -3.46240234375, -3.1669921875, -2.87158203125, -2.576171875, -2.28076171875, -1.9853515625, -1.68994140625, -1.39453125, -1.09912109375, -0.8037109375, -0.50830078125, -0.212890625, 0.08251953125, 0.3779296875, 0.67333984375, 0.96875, 1.26416015625, 1.5595703125, 1.85498046875, 2.150390625, 2.44580078125, 2.7412109375, 3.03662109375, 3.33203125, 3.62744140625, 3.9228515625, 4.21826171875, 4.513671875, 4.80908203125, 5.1044921875, 5.39990234375, 5.6953125, 5.99072265625, 6.2861328125, 6.58154296875, 6.876953125, 7.17236328125, 7.4677734375, 7.76318359375, 8.05859375, 8.35400390625, 8.6494140625, 8.94482421875, 9.240234375, 9.53564453125, 9.8310546875, 10.12646484375, 10.421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 6.0, 4.0, 7.0, 8.0, 10.0, 10.0, 12.0, 9.0, 26.0, 19.0, 15.0, 22.0, 34.0, 26.0, 33.0, 34.0, 44.0, 41.0, 39.0, 56.0, 45.0, 51.0, 42.0, 35.0, 40.0, 37.0, 37.0, 31.0, 28.0, 30.0, 24.0, 26.0, 15.0, 13.0, 25.0, 18.0, 10.0, 12.0, 5.0, 6.0, 2.0, 7.0, 2.0, 4.0, 0.0, 3.0, 3.0, 4.0, 1.0, 2.0], "bins": [-29.53125, -28.6943359375, -27.857421875, -27.0205078125, -26.18359375, -25.3466796875, -24.509765625, -23.6728515625, -22.8359375, -21.9990234375, -21.162109375, -20.3251953125, -19.48828125, -18.6513671875, -17.814453125, -16.9775390625, -16.140625, -15.3037109375, -14.466796875, -13.6298828125, -12.79296875, -11.9560546875, -11.119140625, -10.2822265625, -9.4453125, -8.6083984375, -7.771484375, -6.9345703125, -6.09765625, -5.2607421875, -4.423828125, -3.5869140625, -2.75, -1.9130859375, -1.076171875, -0.2392578125, 0.59765625, 1.4345703125, 2.271484375, 3.1083984375, 3.9453125, 4.7822265625, 5.619140625, 6.4560546875, 7.29296875, 8.1298828125, 8.966796875, 9.8037109375, 10.640625, 11.4775390625, 12.314453125, 13.1513671875, 13.98828125, 14.8251953125, 15.662109375, 16.4990234375, 17.3359375, 18.1728515625, 19.009765625, 19.8466796875, 20.68359375, 21.5205078125, 22.357421875, 23.1943359375, 24.03125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 3.0, 7.0, 4.0, 7.0, 12.0, 16.0, 20.0, 35.0, 43.0, 74.0, 83.0, 145.0, 215.0, 306.0, 421.0, 649.0, 930.0, 1339.0, 1951.0, 2832.0, 4281.0, 6253.0, 9486.0, 14458.0, 22858.0, 49963.0, 804709.0, 58723.0, 23778.0, 14903.0, 9757.0, 6579.0, 4397.0, 2999.0, 2034.0, 1351.0, 945.0, 632.0, 438.0, 288.0, 189.0, 149.0, 88.0, 68.0, 43.0, 37.0, 26.0, 12.0, 6.0, 9.0, 5.0, 6.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.59375, -17.017578125, -16.44140625, -15.865234375, -15.2890625, -14.712890625, -14.13671875, -13.560546875, -12.984375, -12.408203125, -11.83203125, -11.255859375, -10.6796875, -10.103515625, -9.52734375, -8.951171875, -8.375, -7.798828125, -7.22265625, -6.646484375, -6.0703125, -5.494140625, -4.91796875, -4.341796875, -3.765625, -3.189453125, -2.61328125, -2.037109375, -1.4609375, -0.884765625, -0.30859375, 0.267578125, 0.84375, 1.419921875, 1.99609375, 2.572265625, 3.1484375, 3.724609375, 4.30078125, 4.876953125, 5.453125, 6.029296875, 6.60546875, 7.181640625, 7.7578125, 8.333984375, 8.91015625, 9.486328125, 10.0625, 10.638671875, 11.21484375, 11.791015625, 12.3671875, 12.943359375, 13.51953125, 14.095703125, 14.671875, 15.248046875, 15.82421875, 16.400390625, 16.9765625, 17.552734375, 18.12890625, 18.705078125, 19.28125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 0.0, 8.0, 7.0, 9.0, 5.0, 11.0, 8.0, 11.0, 21.0, 22.0, 19.0, 16.0, 20.0, 29.0, 26.0, 46.0, 46.0, 42.0, 41.0, 42.0, 42.0, 46.0, 39.0, 33.0, 40.0, 38.0, 36.0, 24.0, 35.0, 43.0, 30.0, 29.0, 18.0, 16.0, 20.0, 18.0, 12.0, 11.0, 8.0, 5.0, 9.0, 7.0, 7.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.609375, -16.992919921875, -16.37646484375, -15.760009765625, -15.1435546875, -14.527099609375, -13.91064453125, -13.294189453125, -12.677734375, -12.061279296875, -11.44482421875, -10.828369140625, -10.2119140625, -9.595458984375, -8.97900390625, -8.362548828125, -7.74609375, -7.129638671875, -6.51318359375, -5.896728515625, -5.2802734375, -4.663818359375, -4.04736328125, -3.430908203125, -2.814453125, -2.197998046875, -1.58154296875, -0.965087890625, -0.3486328125, 0.267822265625, 0.88427734375, 1.500732421875, 2.1171875, 2.733642578125, 3.35009765625, 3.966552734375, 4.5830078125, 5.199462890625, 5.81591796875, 6.432373046875, 7.048828125, 7.665283203125, 8.28173828125, 8.898193359375, 9.5146484375, 10.131103515625, 10.74755859375, 11.364013671875, 11.98046875, 12.596923828125, 13.21337890625, 13.829833984375, 14.4462890625, 15.062744140625, 15.67919921875, 16.295654296875, 16.912109375, 17.528564453125, 18.14501953125, 18.761474609375, 19.3779296875, 19.994384765625, 20.61083984375, 21.227294921875, 21.84375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 0.0, 4.0, 3.0, 1.0, 6.0, 11.0, 12.0, 22.0, 25.0, 29.0, 42.0, 69.0, 87.0, 132.0, 173.0, 221.0, 308.0, 504.0, 769.0, 1150.0, 1705.0, 2585.0, 4133.0, 6832.0, 11570.0, 21147.0, 54327.0, 822563.0, 65695.0, 22581.0, 12183.0, 7037.0, 4390.0, 2707.0, 1785.0, 1139.0, 804.0, 543.0, 364.0, 297.0, 159.0, 123.0, 105.0, 57.0, 49.0, 38.0, 14.0, 21.0, 19.0, 13.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.666015625, -2.581512451171875, -2.49700927734375, -2.412506103515625, -2.3280029296875, -2.243499755859375, -2.15899658203125, -2.074493408203125, -1.989990234375, -1.905487060546875, -1.82098388671875, -1.736480712890625, -1.6519775390625, -1.567474365234375, -1.48297119140625, -1.398468017578125, -1.31396484375, -1.229461669921875, -1.14495849609375, -1.060455322265625, -0.9759521484375, -0.891448974609375, -0.80694580078125, -0.722442626953125, -0.637939453125, -0.553436279296875, -0.46893310546875, -0.384429931640625, -0.2999267578125, -0.215423583984375, -0.13092041015625, -0.046417236328125, 0.0380859375, 0.122589111328125, 0.20709228515625, 0.291595458984375, 0.3760986328125, 0.460601806640625, 0.54510498046875, 0.629608154296875, 0.714111328125, 0.798614501953125, 0.88311767578125, 0.967620849609375, 1.0521240234375, 1.136627197265625, 1.22113037109375, 1.305633544921875, 1.39013671875, 1.474639892578125, 1.55914306640625, 1.643646240234375, 1.7281494140625, 1.812652587890625, 1.89715576171875, 1.981658935546875, 2.066162109375, 2.150665283203125, 2.23516845703125, 2.319671630859375, 2.4041748046875, 2.488677978515625, 2.57318115234375, 2.657684326171875, 2.7421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 7.0, 2.0, 6.0, 6.0, 14.0, 15.0, 17.0, 19.0, 21.0, 30.0, 37.0, 34.0, 41.0, 60.0, 70.0, 62.0, 99.0, 55.0, 69.0, 57.0, 49.0, 44.0, 27.0, 22.0, 27.0, 23.0, 17.0, 13.0, 15.0, 5.0, 6.0, 3.0, 2.0, 3.0, 6.0, 6.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.0003464221954345703, -0.0003360770642757416, -0.00032573193311691284, -0.0003153868019580841, -0.00030504167079925537, -0.00029469653964042664, -0.0002843514084815979, -0.00027400627732276917, -0.00026366114616394043, -0.0002533160150051117, -0.00024297088384628296, -0.00023262575268745422, -0.0002222806215286255, -0.00021193549036979675, -0.00020159035921096802, -0.00019124522805213928, -0.00018090009689331055, -0.0001705549657344818, -0.00016020983457565308, -0.00014986470341682434, -0.0001395195722579956, -0.00012917444109916687, -0.00011882930994033813, -0.0001084841787815094, -9.813904762268066e-05, -8.779391646385193e-05, -7.74487853050232e-05, -6.710365414619446e-05, -5.675852298736572e-05, -4.641339182853699e-05, -3.606826066970825e-05, -2.5723129510879517e-05, -1.537799835205078e-05, -5.032867193222046e-06, 5.3122639656066895e-06, 1.5657395124435425e-05, 2.600252628326416e-05, 3.6347657442092896e-05, 4.669278860092163e-05, 5.7037919759750366e-05, 6.73830509185791e-05, 7.772818207740784e-05, 8.807331323623657e-05, 9.841844439506531e-05, 0.00010876357555389404, 0.00011910870671272278, 0.00012945383787155151, 0.00013979896903038025, 0.00015014410018920898, 0.00016048923134803772, 0.00017083436250686646, 0.0001811794936656952, 0.00019152462482452393, 0.00020186975598335266, 0.0002122148871421814, 0.00022256001830101013, 0.00023290514945983887, 0.0002432502806186676, 0.00025359541177749634, 0.0002639405429363251, 0.0002742856740951538, 0.00028463080525398254, 0.0002949759364128113, 0.00030532106757164, 0.00031566619873046875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 6.0, 8.0, 12.0, 16.0, 16.0, 31.0, 49.0, 67.0, 100.0, 152.0, 275.0, 383.0, 596.0, 928.0, 1452.0, 2302.0, 3685.0, 6161.0, 9864.0, 16225.0, 26736.0, 43217.0, 67590.0, 98757.0, 131693.0, 150569.0, 144845.0, 116323.0, 82714.0, 54476.0, 34420.0, 21510.0, 12639.0, 7902.0, 4770.0, 2972.0, 1869.0, 1139.0, 720.0, 477.0, 296.0, 206.0, 132.0, 81.0, 55.0, 38.0, 26.0, 24.0, 12.0, 12.0, 7.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1474609375, -1.1089019775390625, -1.070343017578125, -1.0317840576171875, -0.99322509765625, -0.9546661376953125, -0.916107177734375, -0.8775482177734375, -0.8389892578125, -0.8004302978515625, -0.761871337890625, -0.7233123779296875, -0.68475341796875, -0.6461944580078125, -0.607635498046875, -0.5690765380859375, -0.530517578125, -0.4919586181640625, -0.453399658203125, -0.4148406982421875, -0.37628173828125, -0.3377227783203125, -0.299163818359375, -0.2606048583984375, -0.2220458984375, -0.1834869384765625, -0.144927978515625, -0.1063690185546875, -0.06781005859375, -0.0292510986328125, 0.009307861328125, 0.0478668212890625, 0.08642578125, 0.1249847412109375, 0.163543701171875, 0.2021026611328125, 0.24066162109375, 0.2792205810546875, 0.317779541015625, 0.3563385009765625, 0.3948974609375, 0.4334564208984375, 0.472015380859375, 0.5105743408203125, 0.54913330078125, 0.5876922607421875, 0.626251220703125, 0.6648101806640625, 0.703369140625, 0.7419281005859375, 0.780487060546875, 0.8190460205078125, 0.85760498046875, 0.8961639404296875, 0.934722900390625, 0.9732818603515625, 1.0118408203125, 1.0503997802734375, 1.088958740234375, 1.1275177001953125, 1.16607666015625, 1.2046356201171875, 1.243194580078125, 1.2817535400390625, 1.3203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 7.0, 8.0, 14.0, 12.0, 16.0, 19.0, 24.0, 25.0, 24.0, 28.0, 38.0, 37.0, 43.0, 41.0, 50.0, 83.0, 61.0, 58.0, 44.0, 50.0, 49.0, 34.0, 38.0, 30.0, 27.0, 27.0, 24.0, 19.0, 16.0, 18.0, 16.0, 6.0, 5.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69775390625, -0.677642822265625, -0.65753173828125, -0.637420654296875, -0.6173095703125, -0.597198486328125, -0.57708740234375, -0.556976318359375, -0.536865234375, -0.516754150390625, -0.49664306640625, -0.476531982421875, -0.4564208984375, -0.436309814453125, -0.41619873046875, -0.396087646484375, -0.3759765625, -0.355865478515625, -0.33575439453125, -0.315643310546875, -0.2955322265625, -0.275421142578125, -0.25531005859375, -0.235198974609375, -0.215087890625, -0.194976806640625, -0.17486572265625, -0.154754638671875, -0.1346435546875, -0.114532470703125, -0.09442138671875, -0.074310302734375, -0.05419921875, -0.034088134765625, -0.01397705078125, 0.006134033203125, 0.0262451171875, 0.046356201171875, 0.06646728515625, 0.086578369140625, 0.106689453125, 0.126800537109375, 0.14691162109375, 0.167022705078125, 0.1871337890625, 0.207244873046875, 0.22735595703125, 0.247467041015625, 0.267578125, 0.287689208984375, 0.30780029296875, 0.327911376953125, 0.3480224609375, 0.368133544921875, 0.38824462890625, 0.408355712890625, 0.428466796875, 0.448577880859375, 0.46868896484375, 0.488800048828125, 0.5089111328125, 0.529022216796875, 0.54913330078125, 0.569244384765625, 0.58935546875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 7.0, 11.0, 19.0, 21.0, 24.0, 29.0, 16.0, 26.0, 24.0, 33.0, 29.0, 47.0, 47.0, 38.0, 39.0, 56.0, 40.0, 53.0, 43.0, 37.0, 37.0, 43.0, 51.0, 38.0, 25.0, 31.0, 25.0, 13.0, 13.0, 10.0, 10.0, 10.0, 15.0, 7.0, 4.0, 2.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.41260528564453, -20.75143051147461, -20.090255737304688, -19.429079055786133, -18.76790428161621, -18.10672950744629, -17.445552825927734, -16.784378051757812, -16.12320327758789, -15.462028503417969, -14.80085277557373, -14.139677047729492, -13.47850227355957, -12.817327499389648, -12.15615177154541, -11.494976043701172, -10.83380126953125, -10.172626495361328, -9.51145076751709, -8.850275039672852, -8.18910026550293, -7.52792501449585, -6.8667497634887695, -6.2055745124816895, -5.544399261474609, -4.883224010467529, -4.222048759460449, -3.560873508453369, -2.899698257446289, -2.238523006439209, -1.577347755432129, -0.9161725044250488, -0.25499534606933594, 0.40617990493774414, 1.0673551559448242, 1.7285304069519043, 2.3897056579589844, 3.0508809089660645, 3.7120561599731445, 4.373231410980225, 5.034406661987305, 5.695581912994385, 6.356757164001465, 7.017932415008545, 7.679107666015625, 8.340282440185547, 9.001458168029785, 9.662633895874023, 10.323808670043945, 10.984983444213867, 11.646159172058105, 12.307334899902344, 12.968509674072266, 13.629684448242188, 14.290860176086426, 14.952035903930664, 15.613210678100586, 16.274385452270508, 16.935562133789062, 17.596736907958984, 18.257911682128906, 18.919086456298828, 19.58026123046875, 20.241437911987305, 20.902612686157227]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 7.0, 6.0, 2.0, 13.0, 10.0, 12.0, 14.0, 9.0, 22.0, 21.0, 20.0, 23.0, 25.0, 33.0, 31.0, 40.0, 41.0, 35.0, 46.0, 46.0, 63.0, 41.0, 35.0, 36.0, 48.0, 36.0, 35.0, 35.0, 32.0, 28.0, 22.0, 18.0, 17.0, 18.0, 23.0, 12.0, 13.0, 7.0, 4.0, 6.0, 7.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-29.228919982910156, -28.371475219726562, -27.51403045654297, -26.656583786010742, -25.79913902282715, -24.941694259643555, -24.084247589111328, -23.226802825927734, -22.36935806274414, -21.511913299560547, -20.654468536376953, -19.797021865844727, -18.939577102661133, -18.08213233947754, -17.224685668945312, -16.36724090576172, -15.509796142578125, -14.652351379394531, -13.794905662536621, -12.937459945678711, -12.080015182495117, -11.222570419311523, -10.365124702453613, -9.507678985595703, -8.65023422241211, -7.792788982391357, -6.9353437423706055, -6.0778985023498535, -5.220453262329102, -4.36300802230835, -3.5055627822875977, -2.6481175422668457, -1.790670394897461, -0.933225154876709, -0.07577991485595703, 0.7816653251647949, 1.6391105651855469, 2.496555805206299, 3.354001045227051, 4.211446285247803, 5.068891525268555, 5.926336765289307, 6.783782005310059, 7.6412272453308105, 8.498672485351562, 9.356117248535156, 10.213562965393066, 11.071008682250977, 11.92845344543457, 12.785898208618164, 13.643343925476074, 14.500789642333984, 15.358234405517578, 16.215679168701172, 17.073123931884766, 17.930570602416992, 18.788015365600586, 19.64546012878418, 20.502906799316406, 21.3603515625, 22.217796325683594, 23.075241088867188, 23.93268585205078, 24.790132522583008, 25.6475772857666]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 8.0, 6.0, 22.0, 21.0, 24.0, 55.0, 70.0, 124.0, 186.0, 296.0, 471.0, 753.0, 1324.0, 2225.0, 3672.0, 6375.0, 10690.0, 18155.0, 29111.0, 45650.0, 66596.0, 91846.0, 114255.0, 128438.0, 128357.0, 115665.0, 93076.0, 68475.0, 46489.0, 30131.0, 18246.0, 11318.0, 6663.0, 3827.0, 2408.0, 1393.0, 821.0, 478.0, 304.0, 205.0, 122.0, 67.0, 49.0, 26.0, 24.0, 17.0, 6.0, 7.0, 5.0, 0.0, 0.0, 2.0, 2.0], "bins": [-21.03125, -20.430908203125, -19.83056640625, -19.230224609375, -18.6298828125, -18.029541015625, -17.42919921875, -16.828857421875, -16.228515625, -15.628173828125, -15.02783203125, -14.427490234375, -13.8271484375, -13.226806640625, -12.62646484375, -12.026123046875, -11.42578125, -10.825439453125, -10.22509765625, -9.624755859375, -9.0244140625, -8.424072265625, -7.82373046875, -7.223388671875, -6.623046875, -6.022705078125, -5.42236328125, -4.822021484375, -4.2216796875, -3.621337890625, -3.02099609375, -2.420654296875, -1.8203125, -1.219970703125, -0.61962890625, -0.019287109375, 0.5810546875, 1.181396484375, 1.78173828125, 2.382080078125, 2.982421875, 3.582763671875, 4.18310546875, 4.783447265625, 5.3837890625, 5.984130859375, 6.58447265625, 7.184814453125, 7.78515625, 8.385498046875, 8.98583984375, 9.586181640625, 10.1865234375, 10.786865234375, 11.38720703125, 11.987548828125, 12.587890625, 13.188232421875, 13.78857421875, 14.388916015625, 14.9892578125, 15.589599609375, 16.18994140625, 16.790283203125, 17.390625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 8.0, 5.0, 4.0, 11.0, 9.0, 14.0, 12.0, 12.0, 17.0, 23.0, 21.0, 23.0, 23.0, 31.0, 35.0, 35.0, 42.0, 38.0, 43.0, 48.0, 56.0, 42.0, 42.0, 35.0, 39.0, 43.0, 36.0, 36.0, 28.0, 22.0, 30.0, 20.0, 15.0, 20.0, 22.0, 10.0, 16.0, 8.0, 5.0, 5.0, 7.0, 6.0, 4.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 0.0, 1.0], "bins": [-27.78125, -26.968994140625, -26.15673828125, -25.344482421875, -24.5322265625, -23.719970703125, -22.90771484375, -22.095458984375, -21.283203125, -20.470947265625, -19.65869140625, -18.846435546875, -18.0341796875, -17.221923828125, -16.40966796875, -15.597412109375, -14.78515625, -13.972900390625, -13.16064453125, -12.348388671875, -11.5361328125, -10.723876953125, -9.91162109375, -9.099365234375, -8.287109375, -7.474853515625, -6.66259765625, -5.850341796875, -5.0380859375, -4.225830078125, -3.41357421875, -2.601318359375, -1.7890625, -0.976806640625, -0.16455078125, 0.647705078125, 1.4599609375, 2.272216796875, 3.08447265625, 3.896728515625, 4.708984375, 5.521240234375, 6.33349609375, 7.145751953125, 7.9580078125, 8.770263671875, 9.58251953125, 10.394775390625, 11.20703125, 12.019287109375, 12.83154296875, 13.643798828125, 14.4560546875, 15.268310546875, 16.08056640625, 16.892822265625, 17.705078125, 18.517333984375, 19.32958984375, 20.141845703125, 20.9541015625, 21.766357421875, 22.57861328125, 23.390869140625, 24.203125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 10.0, 11.0, 19.0, 22.0, 51.0, 76.0, 143.0, 199.0, 374.0, 617.0, 1078.0, 1930.0, 3569.0, 6484.0, 11920.0, 21836.0, 38596.0, 64520.0, 99660.0, 137474.0, 159267.0, 155984.0, 126413.0, 89458.0, 55646.0, 32533.0, 18415.0, 10028.0, 5379.0, 2984.0, 1646.0, 922.0, 524.0, 307.0, 182.0, 99.0, 67.0, 46.0, 25.0, 13.0, 10.0, 5.0, 8.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.578125, -24.799560546875, -24.02099609375, -23.242431640625, -22.4638671875, -21.685302734375, -20.90673828125, -20.128173828125, -19.349609375, -18.571044921875, -17.79248046875, -17.013916015625, -16.2353515625, -15.456787109375, -14.67822265625, -13.899658203125, -13.12109375, -12.342529296875, -11.56396484375, -10.785400390625, -10.0068359375, -9.228271484375, -8.44970703125, -7.671142578125, -6.892578125, -6.114013671875, -5.33544921875, -4.556884765625, -3.7783203125, -2.999755859375, -2.22119140625, -1.442626953125, -0.6640625, 0.114501953125, 0.89306640625, 1.671630859375, 2.4501953125, 3.228759765625, 4.00732421875, 4.785888671875, 5.564453125, 6.343017578125, 7.12158203125, 7.900146484375, 8.6787109375, 9.457275390625, 10.23583984375, 11.014404296875, 11.79296875, 12.571533203125, 13.35009765625, 14.128662109375, 14.9072265625, 15.685791015625, 16.46435546875, 17.242919921875, 18.021484375, 18.800048828125, 19.57861328125, 20.357177734375, 21.1357421875, 21.914306640625, 22.69287109375, 23.471435546875, 24.25]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 8.0, 6.0, 10.0, 8.0, 17.0, 12.0, 11.0, 16.0, 14.0, 31.0, 23.0, 24.0, 20.0, 35.0, 31.0, 33.0, 33.0, 43.0, 36.0, 35.0, 46.0, 42.0, 36.0, 42.0, 43.0, 35.0, 38.0, 34.0, 34.0, 23.0, 22.0, 28.0, 15.0, 20.0, 17.0, 14.0, 9.0, 6.0, 13.0, 12.0, 5.0, 5.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-16.0, -15.47705078125, -14.9541015625, -14.43115234375, -13.908203125, -13.38525390625, -12.8623046875, -12.33935546875, -11.81640625, -11.29345703125, -10.7705078125, -10.24755859375, -9.724609375, -9.20166015625, -8.6787109375, -8.15576171875, -7.6328125, -7.10986328125, -6.5869140625, -6.06396484375, -5.541015625, -5.01806640625, -4.4951171875, -3.97216796875, -3.44921875, -2.92626953125, -2.4033203125, -1.88037109375, -1.357421875, -0.83447265625, -0.3115234375, 0.21142578125, 0.734375, 1.25732421875, 1.7802734375, 2.30322265625, 2.826171875, 3.34912109375, 3.8720703125, 4.39501953125, 4.91796875, 5.44091796875, 5.9638671875, 6.48681640625, 7.009765625, 7.53271484375, 8.0556640625, 8.57861328125, 9.1015625, 9.62451171875, 10.1474609375, 10.67041015625, 11.193359375, 11.71630859375, 12.2392578125, 12.76220703125, 13.28515625, 13.80810546875, 14.3310546875, 14.85400390625, 15.376953125, 15.89990234375, 16.4228515625, 16.94580078125, 17.46875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 16.0, 3.0, 9.0, 22.0, 32.0, 65.0, 72.0, 109.0, 181.0, 304.0, 481.0, 817.0, 1498.0, 3043.0, 7764.0, 29654.0, 176052.0, 528833.0, 241896.0, 40417.0, 9521.0, 3642.0, 1770.0, 945.0, 521.0, 338.0, 217.0, 131.0, 69.0, 47.0, 26.0, 21.0, 13.0, 5.0, 5.0, 4.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-37.90625, -36.84130859375, -35.7763671875, -34.71142578125, -33.646484375, -32.58154296875, -31.5166015625, -30.45166015625, -29.38671875, -28.32177734375, -27.2568359375, -26.19189453125, -25.126953125, -24.06201171875, -22.9970703125, -21.93212890625, -20.8671875, -19.80224609375, -18.7373046875, -17.67236328125, -16.607421875, -15.54248046875, -14.4775390625, -13.41259765625, -12.34765625, -11.28271484375, -10.2177734375, -9.15283203125, -8.087890625, -7.02294921875, -5.9580078125, -4.89306640625, -3.828125, -2.76318359375, -1.6982421875, -0.63330078125, 0.431640625, 1.49658203125, 2.5615234375, 3.62646484375, 4.69140625, 5.75634765625, 6.8212890625, 7.88623046875, 8.951171875, 10.01611328125, 11.0810546875, 12.14599609375, 13.2109375, 14.27587890625, 15.3408203125, 16.40576171875, 17.470703125, 18.53564453125, 19.6005859375, 20.66552734375, 21.73046875, 22.79541015625, 23.8603515625, 24.92529296875, 25.990234375, 27.05517578125, 28.1201171875, 29.18505859375, 30.25]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0, 3.0, 6.0, 1.0, 3.0, 10.0, 10.0, 11.0, 22.0, 22.0, 28.0, 36.0, 39.0, 39.0, 54.0, 60.0, 62.0, 54.0, 75.0, 64.0, 64.0, 58.0, 41.0, 41.0, 43.0, 25.0, 27.0, 18.0, 16.0, 14.0, 13.0, 14.0, 7.0, 9.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0011138916015625, -0.0010805875062942505, -0.001047283411026001, -0.0010139793157577515, -0.000980675220489502, -0.0009473711252212524, -0.0009140670299530029, -0.0008807629346847534, -0.0008474588394165039, -0.0008141547441482544, -0.0007808506488800049, -0.0007475465536117554, -0.0007142424583435059, -0.0006809383630752563, -0.0006476342678070068, -0.0006143301725387573, -0.0005810260772705078, -0.0005477219820022583, -0.0005144178867340088, -0.0004811137914657593, -0.00044780969619750977, -0.00041450560092926025, -0.00038120150566101074, -0.00034789741039276123, -0.0003145933151245117, -0.0002812892198562622, -0.0002479851245880127, -0.00021468102931976318, -0.00018137693405151367, -0.00014807283878326416, -0.00011476874351501465, -8.146464824676514e-05, -4.8160552978515625e-05, -1.4856457710266113e-05, 1.84476375579834e-05, 5.175173282623291e-05, 8.505582809448242e-05, 0.00011835992336273193, 0.00015166401863098145, 0.00018496811389923096, 0.00021827220916748047, 0.00025157630443573, 0.0002848803997039795, 0.000318184494972229, 0.0003514885902404785, 0.00038479268550872803, 0.00041809678077697754, 0.00045140087604522705, 0.00048470497131347656, 0.0005180090665817261, 0.0005513131618499756, 0.0005846172571182251, 0.0006179213523864746, 0.0006512254476547241, 0.0006845295429229736, 0.0007178336381912231, 0.0007511377334594727, 0.0007844418287277222, 0.0008177459239959717, 0.0008510500192642212, 0.0008843541145324707, 0.0009176582098007202, 0.0009509623050689697, 0.0009842664003372192, 0.0010175704956054688]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 3.0, 4.0, 4.0, 11.0, 13.0, 11.0, 16.0, 24.0, 29.0, 49.0, 65.0, 91.0, 140.0, 185.0, 299.0, 475.0, 826.0, 1602.0, 3735.0, 11117.0, 40687.0, 158538.0, 379076.0, 311070.0, 101521.0, 25708.0, 7378.0, 2738.0, 1221.0, 693.0, 437.0, 246.0, 147.0, 91.0, 86.0, 54.0, 44.0, 35.0, 33.0, 16.0, 11.0, 3.0, 12.0, 4.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.71875, -18.955322265625, -18.19189453125, -17.428466796875, -16.6650390625, -15.901611328125, -15.13818359375, -14.374755859375, -13.611328125, -12.847900390625, -12.08447265625, -11.321044921875, -10.5576171875, -9.794189453125, -9.03076171875, -8.267333984375, -7.50390625, -6.740478515625, -5.97705078125, -5.213623046875, -4.4501953125, -3.686767578125, -2.92333984375, -2.159912109375, -1.396484375, -0.633056640625, 0.13037109375, 0.893798828125, 1.6572265625, 2.420654296875, 3.18408203125, 3.947509765625, 4.7109375, 5.474365234375, 6.23779296875, 7.001220703125, 7.7646484375, 8.528076171875, 9.29150390625, 10.054931640625, 10.818359375, 11.581787109375, 12.34521484375, 13.108642578125, 13.8720703125, 14.635498046875, 15.39892578125, 16.162353515625, 16.92578125, 17.689208984375, 18.45263671875, 19.216064453125, 19.9794921875, 20.742919921875, 21.50634765625, 22.269775390625, 23.033203125, 23.796630859375, 24.56005859375, 25.323486328125, 26.0869140625, 26.850341796875, 27.61376953125, 28.377197265625, 29.140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 10.0, 7.0, 8.0, 25.0, 27.0, 48.0, 81.0, 98.0, 114.0, 145.0, 126.0, 98.0, 75.0, 41.0, 28.0, 14.0, 14.0, 8.0, 9.0, 3.0, 4.0, 1.0, 4.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0], "bins": [-14.9609375, -14.599365234375, -14.23779296875, -13.876220703125, -13.5146484375, -13.153076171875, -12.79150390625, -12.429931640625, -12.068359375, -11.706787109375, -11.34521484375, -10.983642578125, -10.6220703125, -10.260498046875, -9.89892578125, -9.537353515625, -9.17578125, -8.814208984375, -8.45263671875, -8.091064453125, -7.7294921875, -7.367919921875, -7.00634765625, -6.644775390625, -6.283203125, -5.921630859375, -5.56005859375, -5.198486328125, -4.8369140625, -4.475341796875, -4.11376953125, -3.752197265625, -3.390625, -3.029052734375, -2.66748046875, -2.305908203125, -1.9443359375, -1.582763671875, -1.22119140625, -0.859619140625, -0.498046875, -0.136474609375, 0.22509765625, 0.586669921875, 0.9482421875, 1.309814453125, 1.67138671875, 2.032958984375, 2.39453125, 2.756103515625, 3.11767578125, 3.479248046875, 3.8408203125, 4.202392578125, 4.56396484375, 4.925537109375, 5.287109375, 5.648681640625, 6.01025390625, 6.371826171875, 6.7333984375, 7.094970703125, 7.45654296875, 7.818115234375, 8.1796875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 18.0, 11.0, 9.0, 24.0, 18.0, 25.0, 27.0, 29.0, 30.0, 30.0, 42.0, 48.0, 46.0, 57.0, 43.0, 48.0, 33.0, 49.0, 44.0, 47.0, 40.0, 39.0, 38.0, 35.0, 28.0, 27.0, 20.0, 15.0, 9.0, 11.0, 6.0, 9.0, 7.0, 5.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-23.234485626220703, -22.5601806640625, -21.88587760925293, -21.211572647094727, -20.537269592285156, -19.862964630126953, -19.18865966796875, -18.51435661315918, -17.84005355834961, -17.165748596191406, -16.491445541381836, -15.817140579223633, -15.142837524414062, -14.46853256225586, -13.794228553771973, -13.119924545288086, -12.445619583129883, -11.771315574645996, -11.09701156616211, -10.422706604003906, -9.748403549194336, -9.074098587036133, -8.399794578552246, -7.725490570068359, -7.051186561584473, -6.376882553100586, -5.702578544616699, -5.028274059295654, -4.353970050811768, -3.679666042327881, -3.005361557006836, -2.331057548522949, -1.6567554473876953, -0.982451319694519, -0.3081471920013428, 0.36615705490112305, 1.0404610633850098, 1.7147650718688965, 2.3890695571899414, 3.063373565673828, 3.737677574157715, 4.411981582641602, 5.086285591125488, 5.760590076446533, 6.43489408493042, 7.109198093414307, 7.783502578735352, 8.457806587219238, 9.132110595703125, 9.806414604187012, 10.480718612670898, 11.155023574829102, 11.829326629638672, 12.503631591796875, 13.177935600280762, 13.852239608764648, 14.526543617248535, 15.200847625732422, 15.875151634216309, 16.549455642700195, 17.2237606048584, 17.89806365966797, 18.572368621826172, 19.246673583984375, 19.920976638793945]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 6.0, 8.0, 13.0, 13.0, 8.0, 17.0, 13.0, 17.0, 22.0, 18.0, 25.0, 21.0, 29.0, 35.0, 31.0, 30.0, 35.0, 41.0, 23.0, 42.0, 49.0, 44.0, 49.0, 35.0, 39.0, 33.0, 34.0, 29.0, 20.0, 23.0, 26.0, 21.0, 19.0, 23.0, 17.0, 15.0, 17.0, 8.0, 12.0, 8.0, 5.0, 4.0, 3.0, 9.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.038774490356445, -24.252986907958984, -23.46719741821289, -22.681407928466797, -21.895620346069336, -21.109832763671875, -20.32404327392578, -19.538253784179688, -18.752466201782227, -17.966678619384766, -17.180889129638672, -16.395099639892578, -15.609312057495117, -14.82352352142334, -14.037734985351562, -13.251946449279785, -12.466157913208008, -11.68036937713623, -10.894580841064453, -10.108792304992676, -9.323003768920898, -8.537215232849121, -7.751426696777344, -6.965638160705566, -6.179849624633789, -5.394061088562012, -4.608272552490234, -3.822484016418457, -3.0366954803466797, -2.2509069442749023, -1.465118408203125, -0.6793298721313477, 0.10645866394042969, 0.892247200012207, 1.6780357360839844, 2.4638242721557617, 3.249612808227539, 4.035401344299316, 4.821189880371094, 5.606978416442871, 6.392766952514648, 7.178555488586426, 7.964344024658203, 8.75013256072998, 9.535921096801758, 10.321709632873535, 11.107498168945312, 11.89328670501709, 12.679075241088867, 13.464863777160645, 14.250652313232422, 15.0364408493042, 15.822229385375977, 16.608016967773438, 17.39380645751953, 18.179595947265625, 18.965383529663086, 19.751171112060547, 20.53696060180664, 21.322750091552734, 22.108537673950195, 22.894325256347656, 23.68011474609375, 24.465904235839844, 25.251691818237305]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 10.0, 20.0, 26.0, 53.0, 85.0, 110.0, 218.0, 339.0, 575.0, 969.0, 1611.0, 2723.0, 4523.0, 7343.0, 11893.0, 18834.0, 30214.0, 47123.0, 72012.0, 108880.0, 156863.0, 217754.0, 287391.0, 355221.0, 412400.0, 439778.0, 433666.0, 393755.0, 332918.0, 261311.0, 195771.0, 138767.0, 93940.0, 62195.0, 40044.0, 25204.0, 15710.0, 9493.0, 5836.0, 3542.0, 2076.0, 1239.0, 767.0, 444.0, 280.0, 150.0, 78.0, 51.0, 33.0, 15.0, 16.0, 6.0, 7.0, 0.0, 4.0, 2.0], "bins": [-14.1875, -13.7679443359375, -13.348388671875, -12.9288330078125, -12.50927734375, -12.0897216796875, -11.670166015625, -11.2506103515625, -10.8310546875, -10.4114990234375, -9.991943359375, -9.5723876953125, -9.15283203125, -8.7332763671875, -8.313720703125, -7.8941650390625, -7.474609375, -7.0550537109375, -6.635498046875, -6.2159423828125, -5.79638671875, -5.3768310546875, -4.957275390625, -4.5377197265625, -4.1181640625, -3.6986083984375, -3.279052734375, -2.8594970703125, -2.43994140625, -2.0203857421875, -1.600830078125, -1.1812744140625, -0.76171875, -0.3421630859375, 0.077392578125, 0.4969482421875, 0.91650390625, 1.3360595703125, 1.755615234375, 2.1751708984375, 2.5947265625, 3.0142822265625, 3.433837890625, 3.8533935546875, 4.27294921875, 4.6925048828125, 5.112060546875, 5.5316162109375, 5.951171875, 6.3707275390625, 6.790283203125, 7.2098388671875, 7.62939453125, 8.0489501953125, 8.468505859375, 8.8880615234375, 9.3076171875, 9.7271728515625, 10.146728515625, 10.5662841796875, 10.98583984375, 11.4053955078125, 11.824951171875, 12.2445068359375, 12.6640625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 5.0, 9.0, 9.0, 9.0, 17.0, 14.0, 12.0, 16.0, 16.0, 29.0, 22.0, 19.0, 28.0, 33.0, 34.0, 27.0, 36.0, 39.0, 28.0, 44.0, 48.0, 48.0, 37.0, 43.0, 33.0, 45.0, 27.0, 25.0, 24.0, 24.0, 23.0, 27.0, 18.0, 24.0, 19.0, 11.0, 13.0, 12.0, 13.0, 7.0, 4.0, 5.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.828125, -21.138916015625, -20.44970703125, -19.760498046875, -19.0712890625, -18.382080078125, -17.69287109375, -17.003662109375, -16.314453125, -15.625244140625, -14.93603515625, -14.246826171875, -13.5576171875, -12.868408203125, -12.17919921875, -11.489990234375, -10.80078125, -10.111572265625, -9.42236328125, -8.733154296875, -8.0439453125, -7.354736328125, -6.66552734375, -5.976318359375, -5.287109375, -4.597900390625, -3.90869140625, -3.219482421875, -2.5302734375, -1.841064453125, -1.15185546875, -0.462646484375, 0.2265625, 0.915771484375, 1.60498046875, 2.294189453125, 2.9833984375, 3.672607421875, 4.36181640625, 5.051025390625, 5.740234375, 6.429443359375, 7.11865234375, 7.807861328125, 8.4970703125, 9.186279296875, 9.87548828125, 10.564697265625, 11.25390625, 11.943115234375, 12.63232421875, 13.321533203125, 14.0107421875, 14.699951171875, 15.38916015625, 16.078369140625, 16.767578125, 17.456787109375, 18.14599609375, 18.835205078125, 19.5244140625, 20.213623046875, 20.90283203125, 21.592041015625, 22.28125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 8.0, 13.0, 36.0, 55.0, 85.0, 116.0, 253.0, 394.0, 691.0, 1184.0, 1973.0, 3292.0, 5547.0, 9141.0, 14878.0, 23899.0, 36874.0, 56069.0, 84462.0, 122457.0, 169353.0, 224660.0, 284753.0, 340809.0, 382987.0, 404770.0, 399203.0, 370230.0, 321832.0, 264253.0, 204906.0, 151326.0, 107768.0, 73456.0, 49096.0, 31859.0, 20103.0, 12541.0, 7733.0, 4608.0, 2673.0, 1665.0, 960.0, 540.0, 328.0, 185.0, 118.0, 56.0, 46.0, 19.0, 13.0, 7.0, 3.0, 4.0, 1.0, 2.0], "bins": [-14.84375, -14.4049072265625, -13.966064453125, -13.5272216796875, -13.08837890625, -12.6495361328125, -12.210693359375, -11.7718505859375, -11.3330078125, -10.8941650390625, -10.455322265625, -10.0164794921875, -9.57763671875, -9.1387939453125, -8.699951171875, -8.2611083984375, -7.822265625, -7.3834228515625, -6.944580078125, -6.5057373046875, -6.06689453125, -5.6280517578125, -5.189208984375, -4.7503662109375, -4.3115234375, -3.8726806640625, -3.433837890625, -2.9949951171875, -2.55615234375, -2.1173095703125, -1.678466796875, -1.2396240234375, -0.80078125, -0.3619384765625, 0.076904296875, 0.5157470703125, 0.95458984375, 1.3934326171875, 1.832275390625, 2.2711181640625, 2.7099609375, 3.1488037109375, 3.587646484375, 4.0264892578125, 4.46533203125, 4.9041748046875, 5.343017578125, 5.7818603515625, 6.220703125, 6.6595458984375, 7.098388671875, 7.5372314453125, 7.97607421875, 8.4149169921875, 8.853759765625, 9.2926025390625, 9.7314453125, 10.1702880859375, 10.609130859375, 11.0479736328125, 11.48681640625, 11.9256591796875, 12.364501953125, 12.8033447265625, 13.2421875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 6.0, 6.0, 9.0, 18.0, 20.0, 23.0, 25.0, 27.0, 33.0, 56.0, 53.0, 68.0, 97.0, 121.0, 116.0, 142.0, 137.0, 188.0, 182.0, 154.0, 200.0, 200.0, 202.0, 198.0, 183.0, 171.0, 193.0, 170.0, 149.0, 136.0, 125.0, 121.0, 95.0, 68.0, 93.0, 70.0, 38.0, 38.0, 40.0, 24.0, 12.0, 19.0, 14.0, 13.0, 6.0, 5.0, 7.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.0390625, -8.7552490234375, -8.471435546875, -8.1876220703125, -7.90380859375, -7.6199951171875, -7.336181640625, -7.0523681640625, -6.7685546875, -6.4847412109375, -6.200927734375, -5.9171142578125, -5.63330078125, -5.3494873046875, -5.065673828125, -4.7818603515625, -4.498046875, -4.2142333984375, -3.930419921875, -3.6466064453125, -3.36279296875, -3.0789794921875, -2.795166015625, -2.5113525390625, -2.2275390625, -1.9437255859375, -1.659912109375, -1.3760986328125, -1.09228515625, -0.8084716796875, -0.524658203125, -0.2408447265625, 0.04296875, 0.3267822265625, 0.610595703125, 0.8944091796875, 1.17822265625, 1.4620361328125, 1.745849609375, 2.0296630859375, 2.3134765625, 2.5972900390625, 2.881103515625, 3.1649169921875, 3.44873046875, 3.7325439453125, 4.016357421875, 4.3001708984375, 4.583984375, 4.8677978515625, 5.151611328125, 5.4354248046875, 5.71923828125, 6.0030517578125, 6.286865234375, 6.5706787109375, 6.8544921875, 7.1383056640625, 7.422119140625, 7.7059326171875, 7.98974609375, 8.2735595703125, 8.557373046875, 8.8411865234375, 9.125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 0.0, 3.0, 2.0, 6.0, 5.0, 7.0, 8.0, 12.0, 12.0, 11.0, 17.0, 14.0, 28.0, 29.0, 26.0, 24.0, 49.0, 47.0, 36.0, 50.0, 42.0, 47.0, 47.0, 52.0, 49.0, 47.0, 38.0, 41.0, 44.0, 45.0, 30.0, 21.0, 23.0, 19.0, 17.0, 14.0, 13.0, 9.0, 4.0, 7.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-22.742523193359375, -22.0609073638916, -21.379291534423828, -20.697677612304688, -20.016061782836914, -19.33444595336914, -18.652830123901367, -17.971214294433594, -17.289600372314453, -16.60798454284668, -15.926369667053223, -15.24475383758545, -14.563138961791992, -13.881523132324219, -13.199907302856445, -12.518291473388672, -11.836675643920898, -11.155059814453125, -10.473444938659668, -9.791829109191895, -9.110214233398438, -8.428598403930664, -7.746982574462891, -7.065367221832275, -6.38375186920166, -5.702136516571045, -5.02052116394043, -4.338905334472656, -3.657289981842041, -2.975674629211426, -2.2940587997436523, -1.612443447113037, -0.9308280944824219, -0.2492126226425171, 0.4324028491973877, 1.114018440246582, 1.7956337928771973, 2.4772491455078125, 3.158864974975586, 3.840480327606201, 4.522095680236816, 5.203711032867432, 5.885326385498047, 6.56694221496582, 7.2485575675964355, 7.930172920227051, 8.611788749694824, 9.293403625488281, 9.975019454956055, 10.656635284423828, 11.338250160217285, 12.019865989685059, 12.701480865478516, 13.383096694946289, 14.064712524414062, 14.746328353881836, 15.427943229675293, 16.10955810546875, 16.791173934936523, 17.472789764404297, 18.15440559387207, 18.836021423339844, 19.517635345458984, 20.199251174926758, 20.88086700439453]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 9.0, 7.0, 12.0, 13.0, 14.0, 18.0, 14.0, 17.0, 34.0, 35.0, 28.0, 29.0, 40.0, 33.0, 34.0, 53.0, 52.0, 36.0, 55.0, 45.0, 45.0, 36.0, 42.0, 39.0, 30.0, 23.0, 25.0, 29.0, 21.0, 31.0, 18.0, 19.0, 11.0, 13.0, 8.0, 8.0, 5.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-29.241161346435547, -28.385631561279297, -27.53010368347168, -26.67457389831543, -25.819046020507812, -24.963516235351562, -24.107986450195312, -23.252456665039062, -22.396928787231445, -21.541399002075195, -20.685871124267578, -19.830341339111328, -18.974811553955078, -18.11928367614746, -17.26375389099121, -16.408226013183594, -15.552696228027344, -14.69716739654541, -13.841638565063477, -12.986108779907227, -12.130579948425293, -11.27505111694336, -10.41952133178711, -9.563992500305176, -8.708463668823242, -7.852934837341309, -6.997405529022217, -6.141876220703125, -5.286347389221191, -4.430818557739258, -3.575289249420166, -2.719759941101074, -1.8642330169677734, -1.0087039470672607, -0.15317487716674805, 0.7023541927337646, 1.5578832626342773, 2.413412094116211, 3.2689414024353027, 4.1244707107543945, 4.979999542236328, 5.835528373718262, 6.6910576820373535, 7.546586990356445, 8.402115821838379, 9.257644653320312, 10.113174438476562, 10.968703269958496, 11.82423210144043, 12.679760932922363, 13.535289764404297, 14.390819549560547, 15.24634838104248, 16.101877212524414, 16.957406997680664, 17.81293487548828, 18.66846466064453, 19.52399444580078, 20.3795223236084, 21.23505210876465, 22.090579986572266, 22.946109771728516, 23.801639556884766, 24.657169342041016, 25.512697219848633]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 7.0, 11.0, 11.0, 30.0, 55.0, 73.0, 116.0, 161.0, 270.0, 451.0, 666.0, 1073.0, 1733.0, 2832.0, 4536.0, 7109.0, 10669.0, 16288.0, 24399.0, 34992.0, 48569.0, 64713.0, 81251.0, 95707.0, 105051.0, 106837.0, 100725.0, 88261.0, 72285.0, 55323.0, 40344.0, 28668.0, 19475.0, 12961.0, 8371.0, 5362.0, 3436.0, 2162.0, 1331.0, 831.0, 488.0, 349.0, 217.0, 128.0, 86.0, 50.0, 29.0, 26.0, 13.0, 13.0, 7.0, 7.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.77734375, -6.57330322265625, -6.3692626953125, -6.16522216796875, -5.961181640625, -5.75714111328125, -5.5531005859375, -5.34906005859375, -5.14501953125, -4.94097900390625, -4.7369384765625, -4.53289794921875, -4.328857421875, -4.12481689453125, -3.9207763671875, -3.71673583984375, -3.5126953125, -3.30865478515625, -3.1046142578125, -2.90057373046875, -2.696533203125, -2.49249267578125, -2.2884521484375, -2.08441162109375, -1.88037109375, -1.67633056640625, -1.4722900390625, -1.26824951171875, -1.064208984375, -0.86016845703125, -0.6561279296875, -0.45208740234375, -0.248046875, -0.04400634765625, 0.1600341796875, 0.36407470703125, 0.568115234375, 0.77215576171875, 0.9761962890625, 1.18023681640625, 1.38427734375, 1.58831787109375, 1.7923583984375, 1.99639892578125, 2.200439453125, 2.40447998046875, 2.6085205078125, 2.81256103515625, 3.0166015625, 3.22064208984375, 3.4246826171875, 3.62872314453125, 3.832763671875, 4.03680419921875, 4.2408447265625, 4.44488525390625, 4.64892578125, 4.85296630859375, 5.0570068359375, 5.26104736328125, 5.465087890625, 5.66912841796875, 5.8731689453125, 6.07720947265625, 6.28125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 8.0, 8.0, 7.0, 13.0, 13.0, 14.0, 18.0, 14.0, 17.0, 36.0, 32.0, 28.0, 30.0, 39.0, 35.0, 37.0, 50.0, 52.0, 34.0, 55.0, 49.0, 42.0, 38.0, 41.0, 36.0, 30.0, 24.0, 28.0, 28.0, 21.0, 30.0, 18.0, 18.0, 10.0, 14.0, 8.0, 7.0, 7.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-29.28125, -28.422607421875, -27.56396484375, -26.705322265625, -25.8466796875, -24.988037109375, -24.12939453125, -23.270751953125, -22.412109375, -21.553466796875, -20.69482421875, -19.836181640625, -18.9775390625, -18.118896484375, -17.26025390625, -16.401611328125, -15.54296875, -14.684326171875, -13.82568359375, -12.967041015625, -12.1083984375, -11.249755859375, -10.39111328125, -9.532470703125, -8.673828125, -7.815185546875, -6.95654296875, -6.097900390625, -5.2392578125, -4.380615234375, -3.52197265625, -2.663330078125, -1.8046875, -0.946044921875, -0.08740234375, 0.771240234375, 1.6298828125, 2.488525390625, 3.34716796875, 4.205810546875, 5.064453125, 5.923095703125, 6.78173828125, 7.640380859375, 8.4990234375, 9.357666015625, 10.21630859375, 11.074951171875, 11.93359375, 12.792236328125, 13.65087890625, 14.509521484375, 15.3681640625, 16.226806640625, 17.08544921875, 17.944091796875, 18.802734375, 19.661376953125, 20.52001953125, 21.378662109375, 22.2373046875, 23.095947265625, 23.95458984375, 24.813232421875, 25.671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 6.0, 12.0, 13.0, 25.0, 33.0, 55.0, 76.0, 92.0, 125.0, 199.0, 323.0, 413.0, 581.0, 880.0, 1178.0, 1743.0, 2420.0, 3474.0, 4957.0, 7170.0, 10539.0, 15341.0, 23957.0, 72017.0, 791145.0, 43839.0, 21858.0, 14218.0, 9737.0, 6546.0, 4638.0, 3288.0, 2251.0, 1667.0, 1100.0, 791.0, 514.0, 412.0, 254.0, 207.0, 147.0, 94.0, 62.0, 56.0, 29.0, 22.0, 19.0, 10.0, 9.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-16.78125, -16.246826171875, -15.71240234375, -15.177978515625, -14.6435546875, -14.109130859375, -13.57470703125, -13.040283203125, -12.505859375, -11.971435546875, -11.43701171875, -10.902587890625, -10.3681640625, -9.833740234375, -9.29931640625, -8.764892578125, -8.23046875, -7.696044921875, -7.16162109375, -6.627197265625, -6.0927734375, -5.558349609375, -5.02392578125, -4.489501953125, -3.955078125, -3.420654296875, -2.88623046875, -2.351806640625, -1.8173828125, -1.282958984375, -0.74853515625, -0.214111328125, 0.3203125, 0.854736328125, 1.38916015625, 1.923583984375, 2.4580078125, 2.992431640625, 3.52685546875, 4.061279296875, 4.595703125, 5.130126953125, 5.66455078125, 6.198974609375, 6.7333984375, 7.267822265625, 7.80224609375, 8.336669921875, 8.87109375, 9.405517578125, 9.93994140625, 10.474365234375, 11.0087890625, 11.543212890625, 12.07763671875, 12.612060546875, 13.146484375, 13.680908203125, 14.21533203125, 14.749755859375, 15.2841796875, 15.818603515625, 16.35302734375, 16.887451171875, 17.421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 3.0, 4.0, 7.0, 3.0, 8.0, 13.0, 12.0, 10.0, 16.0, 14.0, 20.0, 29.0, 20.0, 23.0, 25.0, 37.0, 29.0, 37.0, 34.0, 33.0, 40.0, 31.0, 36.0, 22.0, 29.0, 41.0, 36.0, 36.0, 40.0, 43.0, 42.0, 24.0, 30.0, 22.0, 30.0, 20.0, 17.0, 16.0, 9.0, 16.0, 2.0, 6.0, 11.0, 3.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-18.625, -18.047607421875, -17.47021484375, -16.892822265625, -16.3154296875, -15.738037109375, -15.16064453125, -14.583251953125, -14.005859375, -13.428466796875, -12.85107421875, -12.273681640625, -11.6962890625, -11.118896484375, -10.54150390625, -9.964111328125, -9.38671875, -8.809326171875, -8.23193359375, -7.654541015625, -7.0771484375, -6.499755859375, -5.92236328125, -5.344970703125, -4.767578125, -4.190185546875, -3.61279296875, -3.035400390625, -2.4580078125, -1.880615234375, -1.30322265625, -0.725830078125, -0.1484375, 0.428955078125, 1.00634765625, 1.583740234375, 2.1611328125, 2.738525390625, 3.31591796875, 3.893310546875, 4.470703125, 5.048095703125, 5.62548828125, 6.202880859375, 6.7802734375, 7.357666015625, 7.93505859375, 8.512451171875, 9.08984375, 9.667236328125, 10.24462890625, 10.822021484375, 11.3994140625, 11.976806640625, 12.55419921875, 13.131591796875, 13.708984375, 14.286376953125, 14.86376953125, 15.441162109375, 16.0185546875, 16.595947265625, 17.17333984375, 17.750732421875, 18.328125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 9.0, 8.0, 10.0, 15.0, 23.0, 29.0, 48.0, 43.0, 89.0, 117.0, 165.0, 254.0, 270.0, 447.0, 610.0, 900.0, 1401.0, 2001.0, 2975.0, 4404.0, 6789.0, 10519.0, 17349.0, 31972.0, 374481.0, 508555.0, 34189.0, 18125.0, 11092.0, 7085.0, 4490.0, 3195.0, 2104.0, 1495.0, 1019.0, 698.0, 456.0, 309.0, 256.0, 176.0, 110.0, 83.0, 57.0, 48.0, 25.0, 24.0, 13.0, 13.0, 7.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6259765625, -1.5718536376953125, -1.517730712890625, -1.4636077880859375, -1.40948486328125, -1.3553619384765625, -1.301239013671875, -1.2471160888671875, -1.1929931640625, -1.1388702392578125, -1.084747314453125, -1.0306243896484375, -0.97650146484375, -0.9223785400390625, -0.868255615234375, -0.8141326904296875, -0.760009765625, -0.7058868408203125, -0.651763916015625, -0.5976409912109375, -0.54351806640625, -0.4893951416015625, -0.435272216796875, -0.3811492919921875, -0.3270263671875, -0.2729034423828125, -0.218780517578125, -0.1646575927734375, -0.11053466796875, -0.0564117431640625, -0.002288818359375, 0.0518341064453125, 0.10595703125, 0.1600799560546875, 0.214202880859375, 0.2683258056640625, 0.32244873046875, 0.3765716552734375, 0.430694580078125, 0.4848175048828125, 0.5389404296875, 0.5930633544921875, 0.647186279296875, 0.7013092041015625, 0.75543212890625, 0.8095550537109375, 0.863677978515625, 0.9178009033203125, 0.971923828125, 1.0260467529296875, 1.080169677734375, 1.1342926025390625, 1.18841552734375, 1.2425384521484375, 1.296661376953125, 1.3507843017578125, 1.4049072265625, 1.4590301513671875, 1.513153076171875, 1.5672760009765625, 1.62139892578125, 1.6755218505859375, 1.729644775390625, 1.7837677001953125, 1.837890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 3.0, 6.0, 8.0, 4.0, 3.0, 10.0, 13.0, 11.0, 19.0, 20.0, 30.0, 36.0, 25.0, 37.0, 34.0, 42.0, 37.0, 52.0, 57.0, 56.0, 47.0, 50.0, 44.0, 49.0, 31.0, 30.0, 31.0, 33.0, 21.0, 21.0, 27.0, 14.0, 13.0, 20.0, 12.0, 7.0, 6.0, 10.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.00017571449279785156, -0.0001703798770904541, -0.00016504526138305664, -0.00015971064567565918, -0.00015437602996826172, -0.00014904141426086426, -0.0001437067985534668, -0.00013837218284606934, -0.00013303756713867188, -0.00012770295143127441, -0.00012236833572387695, -0.00011703372001647949, -0.00011169910430908203, -0.00010636448860168457, -0.00010102987289428711, -9.569525718688965e-05, -9.036064147949219e-05, -8.502602577209473e-05, -7.969141006469727e-05, -7.43567943572998e-05, -6.902217864990234e-05, -6.368756294250488e-05, -5.835294723510742e-05, -5.301833152770996e-05, -4.76837158203125e-05, -4.234910011291504e-05, -3.701448440551758e-05, -3.167986869812012e-05, -2.6345252990722656e-05, -2.1010637283325195e-05, -1.5676021575927734e-05, -1.0341405868530273e-05, -5.0067901611328125e-06, 3.2782554626464844e-07, 5.662441253662109e-06, 1.099705696105957e-05, 1.633167266845703e-05, 2.1666288375854492e-05, 2.7000904083251953e-05, 3.2335519790649414e-05, 3.7670135498046875e-05, 4.3004751205444336e-05, 4.83393669128418e-05, 5.367398262023926e-05, 5.900859832763672e-05, 6.434321403503418e-05, 6.967782974243164e-05, 7.50124454498291e-05, 8.034706115722656e-05, 8.568167686462402e-05, 9.101629257202148e-05, 9.635090827941895e-05, 0.0001016855239868164, 0.00010702013969421387, 0.00011235475540161133, 0.00011768937110900879, 0.00012302398681640625, 0.0001283586025238037, 0.00013369321823120117, 0.00013902783393859863, 0.0001443624496459961, 0.00014969706535339355, 0.00015503168106079102, 0.00016036629676818848, 0.00016570091247558594]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 9.0, 9.0, 17.0, 24.0, 52.0, 82.0, 126.0, 231.0, 356.0, 656.0, 1149.0, 1875.0, 3328.0, 5765.0, 9910.0, 17863.0, 30345.0, 50366.0, 78575.0, 112557.0, 141888.0, 152496.0, 139837.0, 109583.0, 75255.0, 47863.0, 28828.0, 16665.0, 9697.0, 5599.0, 3136.0, 1856.0, 1070.0, 597.0, 366.0, 211.0, 141.0, 65.0, 42.0, 31.0, 14.0, 7.0, 6.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96142578125, -0.9276351928710938, -0.8938446044921875, -0.8600540161132812, -0.826263427734375, -0.7924728393554688, -0.7586822509765625, -0.7248916625976562, -0.69110107421875, -0.6573104858398438, -0.6235198974609375, -0.5897293090820312, -0.555938720703125, -0.5221481323242188, -0.4883575439453125, -0.45456695556640625, -0.4207763671875, -0.38698577880859375, -0.3531951904296875, -0.31940460205078125, -0.285614013671875, -0.25182342529296875, -0.2180328369140625, -0.18424224853515625, -0.15045166015625, -0.11666107177734375, -0.0828704833984375, -0.04907989501953125, -0.015289306640625, 0.01850128173828125, 0.0522918701171875, 0.08608245849609375, 0.119873046875, 0.15366363525390625, 0.1874542236328125, 0.22124481201171875, 0.255035400390625, 0.28882598876953125, 0.3226165771484375, 0.35640716552734375, 0.39019775390625, 0.42398834228515625, 0.4577789306640625, 0.49156951904296875, 0.525360107421875, 0.5591506958007812, 0.5929412841796875, 0.6267318725585938, 0.6605224609375, 0.6943130493164062, 0.7281036376953125, 0.7618942260742188, 0.795684814453125, 0.8294754028320312, 0.8632659912109375, 0.8970565795898438, 0.93084716796875, 0.9646377563476562, 0.9984283447265625, 1.0322189331054688, 1.066009521484375, 1.0998001098632812, 1.1335906982421875, 1.1673812866210938, 1.201171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 9.0, 11.0, 13.0, 17.0, 23.0, 28.0, 27.0, 36.0, 35.0, 40.0, 29.0, 51.0, 47.0, 45.0, 48.0, 48.0, 51.0, 49.0, 45.0, 41.0, 36.0, 40.0, 34.0, 35.0, 30.0, 34.0, 15.0, 19.0, 9.0, 15.0, 5.0, 9.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.56103515625, -0.542022705078125, -0.52301025390625, -0.503997802734375, -0.4849853515625, -0.465972900390625, -0.44696044921875, -0.427947998046875, -0.408935546875, -0.389923095703125, -0.37091064453125, -0.351898193359375, -0.3328857421875, -0.313873291015625, -0.29486083984375, -0.275848388671875, -0.2568359375, -0.237823486328125, -0.21881103515625, -0.199798583984375, -0.1807861328125, -0.161773681640625, -0.14276123046875, -0.123748779296875, -0.104736328125, -0.085723876953125, -0.06671142578125, -0.047698974609375, -0.0286865234375, -0.009674072265625, 0.00933837890625, 0.028350830078125, 0.04736328125, 0.066375732421875, 0.08538818359375, 0.104400634765625, 0.1234130859375, 0.142425537109375, 0.16143798828125, 0.180450439453125, 0.199462890625, 0.218475341796875, 0.23748779296875, 0.256500244140625, 0.2755126953125, 0.294525146484375, 0.31353759765625, 0.332550048828125, 0.3515625, 0.370574951171875, 0.38958740234375, 0.408599853515625, 0.4276123046875, 0.446624755859375, 0.46563720703125, 0.484649658203125, 0.503662109375, 0.522674560546875, 0.54168701171875, 0.560699462890625, 0.5797119140625, 0.598724365234375, 0.61773681640625, 0.636749267578125, 0.65576171875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 6.0, 5.0, 6.0, 13.0, 12.0, 6.0, 15.0, 30.0, 18.0, 28.0, 27.0, 40.0, 38.0, 38.0, 44.0, 52.0, 56.0, 40.0, 51.0, 62.0, 44.0, 44.0, 41.0, 45.0, 40.0, 46.0, 28.0, 22.0, 19.0, 17.0, 11.0, 15.0, 12.0, 9.0, 6.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-23.965473175048828, -23.244504928588867, -22.523534774780273, -21.802566528320312, -21.08159637451172, -20.360628128051758, -19.639659881591797, -18.918689727783203, -18.19771957397461, -17.47675132751465, -16.755781173706055, -16.034812927246094, -15.3138427734375, -14.592874526977539, -13.871905326843262, -13.150936126708984, -12.429967880249023, -11.708998680114746, -10.988029479980469, -10.267061233520508, -9.546091079711914, -8.825122833251953, -8.104153633117676, -7.383184432983398, -6.662215232849121, -5.941246032714844, -5.220276832580566, -4.499308109283447, -3.77833890914917, -3.0573697090148926, -2.3364009857177734, -1.615431785583496, -0.8944625854492188, -0.17349350452423096, 0.5474755764007568, 1.268444538116455, 1.9894137382507324, 2.7103829383850098, 3.431351661682129, 4.152320861816406, 4.873290061950684, 5.594259262084961, 6.315228462219238, 7.036197185516357, 7.757166385650635, 8.47813606262207, 9.199104309082031, 9.920073509216309, 10.641042709350586, 11.362011909484863, 12.08298110961914, 12.803949356079102, 13.524919509887695, 14.245887756347656, 14.966856956481934, 15.687826156616211, 16.408794403076172, 17.129762649536133, 17.850732803344727, 18.571701049804688, 19.29267120361328, 20.013639450073242, 20.734607696533203, 21.455577850341797, 22.17654800415039]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 8.0, 6.0, 8.0, 14.0, 15.0, 14.0, 18.0, 16.0, 25.0, 33.0, 34.0, 27.0, 36.0, 35.0, 38.0, 40.0, 46.0, 55.0, 49.0, 45.0, 47.0, 53.0, 30.0, 35.0, 40.0, 23.0, 28.0, 25.0, 30.0, 26.0, 22.0, 14.0, 14.0, 9.0, 11.0, 9.0, 8.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-29.733400344848633, -28.845291137695312, -27.957181930541992, -27.069072723388672, -26.18096160888672, -25.2928524017334, -24.404743194580078, -23.516633987426758, -22.628524780273438, -21.740415573120117, -20.852306365966797, -19.964195251464844, -19.076086044311523, -18.187976837158203, -17.299867630004883, -16.411758422851562, -15.523648262023926, -14.635539054870605, -13.747428894042969, -12.859319686889648, -11.971210479736328, -11.083101272583008, -10.194991111755371, -9.30688190460205, -8.418771743774414, -7.5306620597839355, -6.642552852630615, -5.754443168640137, -4.866333961486816, -3.978224277496338, -3.0901145935058594, -2.202005386352539, -1.3138961791992188, -0.42578667402267456, 0.46232283115386963, 1.3504323959350586, 2.238541841506958, 3.1266512870788574, 4.014760971069336, 4.902870178222656, 5.790979862213135, 6.679089546203613, 7.567198753356934, 8.45530891418457, 9.34341812133789, 10.231527328491211, 11.119636535644531, 12.007745742797852, 12.895855903625488, 13.783965110778809, 14.672075271606445, 15.560184478759766, 16.448293685913086, 17.336402893066406, 18.22451400756836, 19.112621307373047, 20.000732421875, 20.88884162902832, 21.77695083618164, 22.665061950683594, 23.553171157836914, 24.441280364990234, 25.329389572143555, 26.217498779296875, 27.105607986450195]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 13.0, 26.0, 44.0, 92.0, 120.0, 211.0, 358.0, 644.0, 1127.0, 2010.0, 3580.0, 6134.0, 10847.0, 17695.0, 29098.0, 44984.0, 64941.0, 87491.0, 109050.0, 122389.0, 125089.0, 114394.0, 95731.0, 73598.0, 52141.0, 34024.0, 21819.0, 13181.0, 7569.0, 4360.0, 2535.0, 1394.0, 760.0, 484.0, 261.0, 151.0, 87.0, 47.0, 27.0, 22.0, 15.0, 8.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.109375, -16.523193359375, -15.93701171875, -15.350830078125, -14.7646484375, -14.178466796875, -13.59228515625, -13.006103515625, -12.419921875, -11.833740234375, -11.24755859375, -10.661376953125, -10.0751953125, -9.489013671875, -8.90283203125, -8.316650390625, -7.73046875, -7.144287109375, -6.55810546875, -5.971923828125, -5.3857421875, -4.799560546875, -4.21337890625, -3.627197265625, -3.041015625, -2.454833984375, -1.86865234375, -1.282470703125, -0.6962890625, -0.110107421875, 0.47607421875, 1.062255859375, 1.6484375, 2.234619140625, 2.82080078125, 3.406982421875, 3.9931640625, 4.579345703125, 5.16552734375, 5.751708984375, 6.337890625, 6.924072265625, 7.51025390625, 8.096435546875, 8.6826171875, 9.268798828125, 9.85498046875, 10.441162109375, 11.02734375, 11.613525390625, 12.19970703125, 12.785888671875, 13.3720703125, 13.958251953125, 14.54443359375, 15.130615234375, 15.716796875, 16.302978515625, 16.88916015625, 17.475341796875, 18.0615234375, 18.647705078125, 19.23388671875, 19.820068359375, 20.40625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 10.0, 6.0, 6.0, 16.0, 13.0, 14.0, 20.0, 14.0, 26.0, 31.0, 33.0, 30.0, 34.0, 38.0, 33.0, 41.0, 51.0, 57.0, 45.0, 47.0, 51.0, 46.0, 32.0, 35.0, 38.0, 25.0, 27.0, 28.0, 28.0, 22.0, 29.0, 11.0, 12.0, 11.0, 11.0, 9.0, 8.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-28.765625, -27.90625, -27.046875, -26.1875, -25.328125, -24.46875, -23.609375, -22.75, -21.890625, -21.03125, -20.171875, -19.3125, -18.453125, -17.59375, -16.734375, -15.875, -15.015625, -14.15625, -13.296875, -12.4375, -11.578125, -10.71875, -9.859375, -9.0, -8.140625, -7.28125, -6.421875, -5.5625, -4.703125, -3.84375, -2.984375, -2.125, -1.265625, -0.40625, 0.453125, 1.3125, 2.171875, 3.03125, 3.890625, 4.75, 5.609375, 6.46875, 7.328125, 8.1875, 9.046875, 9.90625, 10.765625, 11.625, 12.484375, 13.34375, 14.203125, 15.0625, 15.921875, 16.78125, 17.640625, 18.5, 19.359375, 20.21875, 21.078125, 21.9375, 22.796875, 23.65625, 24.515625, 25.375, 26.234375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 7.0, 14.0, 17.0, 30.0, 55.0, 59.0, 96.0, 179.0, 271.0, 493.0, 834.0, 1472.0, 2665.0, 4633.0, 8152.0, 14532.0, 25308.0, 41815.0, 65828.0, 94852.0, 123617.0, 142179.0, 142252.0, 122757.0, 93888.0, 64000.0, 40842.0, 24664.0, 14299.0, 8123.0, 4552.0, 2516.0, 1430.0, 861.0, 511.0, 298.0, 154.0, 97.0, 67.0, 52.0, 27.0, 14.0, 17.0, 9.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-22.96875, -22.25048828125, -21.5322265625, -20.81396484375, -20.095703125, -19.37744140625, -18.6591796875, -17.94091796875, -17.22265625, -16.50439453125, -15.7861328125, -15.06787109375, -14.349609375, -13.63134765625, -12.9130859375, -12.19482421875, -11.4765625, -10.75830078125, -10.0400390625, -9.32177734375, -8.603515625, -7.88525390625, -7.1669921875, -6.44873046875, -5.73046875, -5.01220703125, -4.2939453125, -3.57568359375, -2.857421875, -2.13916015625, -1.4208984375, -0.70263671875, 0.015625, 0.73388671875, 1.4521484375, 2.17041015625, 2.888671875, 3.60693359375, 4.3251953125, 5.04345703125, 5.76171875, 6.47998046875, 7.1982421875, 7.91650390625, 8.634765625, 9.35302734375, 10.0712890625, 10.78955078125, 11.5078125, 12.22607421875, 12.9443359375, 13.66259765625, 14.380859375, 15.09912109375, 15.8173828125, 16.53564453125, 17.25390625, 17.97216796875, 18.6904296875, 19.40869140625, 20.126953125, 20.84521484375, 21.5634765625, 22.28173828125, 23.0]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 3.0, 8.0, 7.0, 8.0, 9.0, 9.0, 11.0, 14.0, 19.0, 34.0, 30.0, 29.0, 25.0, 27.0, 49.0, 39.0, 38.0, 44.0, 32.0, 51.0, 44.0, 43.0, 42.0, 45.0, 35.0, 46.0, 31.0, 29.0, 15.0, 29.0, 24.0, 29.0, 17.0, 10.0, 12.0, 16.0, 6.0, 8.0, 9.0, 5.0, 6.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.921875, -17.401611328125, -16.88134765625, -16.361083984375, -15.8408203125, -15.320556640625, -14.80029296875, -14.280029296875, -13.759765625, -13.239501953125, -12.71923828125, -12.198974609375, -11.6787109375, -11.158447265625, -10.63818359375, -10.117919921875, -9.59765625, -9.077392578125, -8.55712890625, -8.036865234375, -7.5166015625, -6.996337890625, -6.47607421875, -5.955810546875, -5.435546875, -4.915283203125, -4.39501953125, -3.874755859375, -3.3544921875, -2.834228515625, -2.31396484375, -1.793701171875, -1.2734375, -0.753173828125, -0.23291015625, 0.287353515625, 0.8076171875, 1.327880859375, 1.84814453125, 2.368408203125, 2.888671875, 3.408935546875, 3.92919921875, 4.449462890625, 4.9697265625, 5.489990234375, 6.01025390625, 6.530517578125, 7.05078125, 7.571044921875, 8.09130859375, 8.611572265625, 9.1318359375, 9.652099609375, 10.17236328125, 10.692626953125, 11.212890625, 11.733154296875, 12.25341796875, 12.773681640625, 13.2939453125, 13.814208984375, 14.33447265625, 14.854736328125, 15.375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 12.0, 6.0, 5.0, 17.0, 20.0, 29.0, 40.0, 68.0, 119.0, 152.0, 259.0, 366.0, 584.0, 893.0, 1333.0, 2137.0, 3504.0, 5636.0, 9085.0, 15023.0, 24132.0, 38511.0, 58642.0, 84949.0, 112001.0, 131945.0, 136911.0, 123614.0, 98773.0, 71274.0, 47742.0, 30795.0, 19158.0, 11736.0, 7081.0, 4503.0, 2695.0, 1707.0, 1060.0, 693.0, 458.0, 315.0, 170.0, 137.0, 89.0, 61.0, 41.0, 34.0, 25.0, 12.0, 2.0, 2.0, 8.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.33203125, -7.097412109375, -6.86279296875, -6.628173828125, -6.3935546875, -6.158935546875, -5.92431640625, -5.689697265625, -5.455078125, -5.220458984375, -4.98583984375, -4.751220703125, -4.5166015625, -4.281982421875, -4.04736328125, -3.812744140625, -3.578125, -3.343505859375, -3.10888671875, -2.874267578125, -2.6396484375, -2.405029296875, -2.17041015625, -1.935791015625, -1.701171875, -1.466552734375, -1.23193359375, -0.997314453125, -0.7626953125, -0.528076171875, -0.29345703125, -0.058837890625, 0.17578125, 0.410400390625, 0.64501953125, 0.879638671875, 1.1142578125, 1.348876953125, 1.58349609375, 1.818115234375, 2.052734375, 2.287353515625, 2.52197265625, 2.756591796875, 2.9912109375, 3.225830078125, 3.46044921875, 3.695068359375, 3.9296875, 4.164306640625, 4.39892578125, 4.633544921875, 4.8681640625, 5.102783203125, 5.33740234375, 5.572021484375, 5.806640625, 6.041259765625, 6.27587890625, 6.510498046875, 6.7451171875, 6.979736328125, 7.21435546875, 7.448974609375, 7.68359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 4.0, 3.0, 5.0, 7.0, 9.0, 9.0, 10.0, 17.0, 13.0, 22.0, 19.0, 29.0, 34.0, 46.0, 37.0, 44.0, 48.0, 44.0, 52.0, 50.0, 59.0, 54.0, 49.0, 43.0, 60.0, 41.0, 32.0, 24.0, 26.0, 14.0, 19.0, 20.0, 19.0, 11.0, 10.0, 7.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009107589721679688, -0.0008830726146697998, -0.0008553862571716309, -0.0008276998996734619, -0.000800013542175293, -0.000772327184677124, -0.0007446408271789551, -0.0007169544696807861, -0.0006892681121826172, -0.0006615817546844482, -0.0006338953971862793, -0.0006062090396881104, -0.0005785226821899414, -0.0005508363246917725, -0.0005231499671936035, -0.0004954636096954346, -0.0004677772521972656, -0.0004400908946990967, -0.00041240453720092773, -0.0003847181797027588, -0.00035703182220458984, -0.0003293454647064209, -0.00030165910720825195, -0.000273972749710083, -0.00024628639221191406, -0.00021860003471374512, -0.00019091367721557617, -0.00016322731971740723, -0.00013554096221923828, -0.00010785460472106934, -8.016824722290039e-05, -5.2481889724731445e-05, -2.47955322265625e-05, 2.8908252716064453e-06, 3.057718276977539e-05, 5.8263540267944336e-05, 8.594989776611328e-05, 0.00011363625526428223, 0.00014132261276245117, 0.00016900897026062012, 0.00019669532775878906, 0.000224381685256958, 0.00025206804275512695, 0.0002797544002532959, 0.00030744075775146484, 0.0003351271152496338, 0.00036281347274780273, 0.0003904998302459717, 0.0004181861877441406, 0.00044587254524230957, 0.0004735589027404785, 0.0005012452602386475, 0.0005289316177368164, 0.0005566179752349854, 0.0005843043327331543, 0.0006119906902313232, 0.0006396770477294922, 0.0006673634052276611, 0.0006950497627258301, 0.000722736120223999, 0.000750422477722168, 0.0007781088352203369, 0.0008057951927185059, 0.0008334815502166748, 0.0008611679077148438]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 0.0, 2.0, 3.0, 1.0, 4.0, 7.0, 13.0, 24.0, 27.0, 44.0, 60.0, 100.0, 144.0, 257.0, 417.0, 649.0, 1077.0, 1604.0, 2817.0, 4480.0, 7232.0, 11972.0, 19660.0, 30466.0, 47033.0, 68285.0, 91847.0, 113273.0, 126907.0, 125652.0, 112263.0, 90078.0, 66655.0, 45833.0, 30159.0, 19252.0, 11649.0, 7254.0, 4308.0, 2625.0, 1658.0, 1004.0, 620.0, 399.0, 261.0, 159.0, 118.0, 82.0, 38.0, 26.0, 26.0, 9.0, 12.0, 6.0, 8.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-7.06640625, -6.84539794921875, -6.6243896484375, -6.40338134765625, -6.182373046875, -5.96136474609375, -5.7403564453125, -5.51934814453125, -5.29833984375, -5.07733154296875, -4.8563232421875, -4.63531494140625, -4.414306640625, -4.19329833984375, -3.9722900390625, -3.75128173828125, -3.5302734375, -3.30926513671875, -3.0882568359375, -2.86724853515625, -2.646240234375, -2.42523193359375, -2.2042236328125, -1.98321533203125, -1.76220703125, -1.54119873046875, -1.3201904296875, -1.09918212890625, -0.878173828125, -0.65716552734375, -0.4361572265625, -0.21514892578125, 0.005859375, 0.22686767578125, 0.4478759765625, 0.66888427734375, 0.889892578125, 1.11090087890625, 1.3319091796875, 1.55291748046875, 1.77392578125, 1.99493408203125, 2.2159423828125, 2.43695068359375, 2.657958984375, 2.87896728515625, 3.0999755859375, 3.32098388671875, 3.5419921875, 3.76300048828125, 3.9840087890625, 4.20501708984375, 4.426025390625, 4.64703369140625, 4.8680419921875, 5.08905029296875, 5.31005859375, 5.53106689453125, 5.7520751953125, 5.97308349609375, 6.194091796875, 6.41510009765625, 6.6361083984375, 6.85711669921875, 7.078125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 6.0, 6.0, 7.0, 9.0, 12.0, 17.0, 15.0, 14.0, 21.0, 28.0, 32.0, 34.0, 43.0, 41.0, 49.0, 64.0, 43.0, 58.0, 56.0, 71.0, 61.0, 43.0, 42.0, 44.0, 37.0, 29.0, 24.0, 24.0, 16.0, 15.0, 11.0, 12.0, 5.0, 8.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.921875, -4.790557861328125, -4.65924072265625, -4.527923583984375, -4.3966064453125, -4.265289306640625, -4.13397216796875, -4.002655029296875, -3.871337890625, -3.740020751953125, -3.60870361328125, -3.477386474609375, -3.3460693359375, -3.214752197265625, -3.08343505859375, -2.952117919921875, -2.82080078125, -2.689483642578125, -2.55816650390625, -2.426849365234375, -2.2955322265625, -2.164215087890625, -2.03289794921875, -1.901580810546875, -1.770263671875, -1.638946533203125, -1.50762939453125, -1.376312255859375, -1.2449951171875, -1.113677978515625, -0.98236083984375, -0.851043701171875, -0.7197265625, -0.588409423828125, -0.45709228515625, -0.325775146484375, -0.1944580078125, -0.063140869140625, 0.06817626953125, 0.199493408203125, 0.330810546875, 0.462127685546875, 0.59344482421875, 0.724761962890625, 0.8560791015625, 0.987396240234375, 1.11871337890625, 1.250030517578125, 1.38134765625, 1.512664794921875, 1.64398193359375, 1.775299072265625, 1.9066162109375, 2.037933349609375, 2.16925048828125, 2.300567626953125, 2.431884765625, 2.563201904296875, 2.69451904296875, 2.825836181640625, 2.9571533203125, 3.088470458984375, 3.21978759765625, 3.351104736328125, 3.482421875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 3.0, 4.0, 7.0, 6.0, 5.0, 5.0, 9.0, 8.0, 29.0, 13.0, 23.0, 21.0, 36.0, 16.0, 29.0, 37.0, 31.0, 38.0, 49.0, 46.0, 46.0, 49.0, 45.0, 55.0, 36.0, 43.0, 51.0, 36.0, 35.0, 32.0, 22.0, 35.0, 20.0, 17.0, 11.0, 8.0, 5.0, 8.0, 12.0, 6.0, 3.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.66183090209961, -20.00617790222168, -19.35052490234375, -18.694869995117188, -18.039216995239258, -17.383563995361328, -16.7279109954834, -16.07225799560547, -15.416603088378906, -14.760950088500977, -14.10529613494873, -13.4496431350708, -12.793989181518555, -12.138336181640625, -11.482683181762695, -10.82702922821045, -10.17137622833252, -9.51572322845459, -8.860069274902344, -8.204416275024414, -7.548762321472168, -6.893109321594238, -6.23745584487915, -5.5818023681640625, -4.926148891448975, -4.270495414733887, -3.614841938018799, -2.95918869972229, -2.303535223007202, -1.6478817462921143, -0.9922285079956055, -0.3365750312805176, 0.3190784454345703, 0.9747318625450134, 1.6303852796554565, 2.286038637161255, 2.9416921138763428, 3.5973455905914307, 4.2529988288879395, 4.908652305603027, 5.564305782318115, 6.219959259033203, 6.875612735748291, 7.531266212463379, 8.186919212341309, 8.842573165893555, 9.498226165771484, 10.153879165649414, 10.80953311920166, 11.46518611907959, 12.120840072631836, 12.776493072509766, 13.432147026062012, 14.087800025939941, 14.743453979492188, 15.399106979370117, 16.054759979248047, 16.710412979125977, 17.366065979003906, 18.02172088623047, 18.6773738861084, 19.333026885986328, 19.988679885864258, 20.644332885742188, 21.29998779296875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 10.0, 6.0, 12.0, 10.0, 9.0, 12.0, 12.0, 20.0, 26.0, 32.0, 21.0, 40.0, 50.0, 36.0, 34.0, 45.0, 45.0, 49.0, 52.0, 34.0, 48.0, 45.0, 54.0, 36.0, 36.0, 17.0, 32.0, 33.0, 22.0, 33.0, 19.0, 14.0, 12.0, 5.0, 8.0, 10.0, 2.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.90433120727539, -29.00824546813965, -28.112157821655273, -27.21607208251953, -26.319984436035156, -25.423898696899414, -24.52781105041504, -23.631725311279297, -22.735637664794922, -21.83955192565918, -20.943464279174805, -20.047378540039062, -19.151290893554688, -18.255205154418945, -17.35911750793457, -16.463031768798828, -15.56694507598877, -14.670858383178711, -13.774771690368652, -12.878684997558594, -11.982598304748535, -11.086511611938477, -10.190425872802734, -9.29433822631836, -8.398252487182617, -7.502165794372559, -6.6060791015625, -5.709992408752441, -4.813905715942383, -3.9178194999694824, -3.021732807159424, -2.1256461143493652, -1.2295589447021484, -0.3334723114967346, 0.5626143217086792, 1.4587008953094482, 2.354787588119507, 3.2508740425109863, 4.146960735321045, 5.0430474281311035, 5.939134120941162, 6.835220813751221, 7.731307506561279, 8.62739372253418, 9.523480415344238, 10.419567108154297, 11.315653800964355, 12.211740493774414, 13.107827186584473, 14.003913879394531, 14.90000057220459, 15.796087265014648, 16.69217300415039, 17.588260650634766, 18.484346389770508, 19.380434036254883, 20.276519775390625, 21.172605514526367, 22.068693161010742, 22.964778900146484, 23.86086654663086, 24.7569522857666, 25.653039932250977, 26.54912567138672, 27.445213317871094]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 10.0, 18.0, 34.0, 54.0, 96.0, 135.0, 236.0, 450.0, 741.0, 1359.0, 2231.0, 3943.0, 6656.0, 11347.0, 19155.0, 31680.0, 52310.0, 84024.0, 128421.0, 189968.0, 267361.0, 349687.0, 424798.0, 472224.0, 476267.0, 437715.0, 366938.0, 284537.0, 206579.0, 140709.0, 90785.0, 57360.0, 35557.0, 21076.0, 12433.0, 7349.0, 4222.0, 2443.0, 1430.0, 796.0, 472.0, 238.0, 182.0, 98.0, 63.0, 37.0, 24.0, 17.0, 11.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-15.25, -14.789306640625, -14.32861328125, -13.867919921875, -13.4072265625, -12.946533203125, -12.48583984375, -12.025146484375, -11.564453125, -11.103759765625, -10.64306640625, -10.182373046875, -9.7216796875, -9.260986328125, -8.80029296875, -8.339599609375, -7.87890625, -7.418212890625, -6.95751953125, -6.496826171875, -6.0361328125, -5.575439453125, -5.11474609375, -4.654052734375, -4.193359375, -3.732666015625, -3.27197265625, -2.811279296875, -2.3505859375, -1.889892578125, -1.42919921875, -0.968505859375, -0.5078125, -0.047119140625, 0.41357421875, 0.874267578125, 1.3349609375, 1.795654296875, 2.25634765625, 2.717041015625, 3.177734375, 3.638427734375, 4.09912109375, 4.559814453125, 5.0205078125, 5.481201171875, 5.94189453125, 6.402587890625, 6.86328125, 7.323974609375, 7.78466796875, 8.245361328125, 8.7060546875, 9.166748046875, 9.62744140625, 10.088134765625, 10.548828125, 11.009521484375, 11.47021484375, 11.930908203125, 12.3916015625, 12.852294921875, 13.31298828125, 13.773681640625, 14.234375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 12.0, 10.0, 8.0, 12.0, 13.0, 11.0, 23.0, 31.0, 25.0, 33.0, 40.0, 44.0, 35.0, 38.0, 48.0, 48.0, 51.0, 39.0, 48.0, 39.0, 55.0, 38.0, 44.0, 26.0, 24.0, 28.0, 34.0, 22.0, 27.0, 18.0, 13.0, 10.0, 4.0, 10.0, 8.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.8125, -26.025146484375, -25.23779296875, -24.450439453125, -23.6630859375, -22.875732421875, -22.08837890625, -21.301025390625, -20.513671875, -19.726318359375, -18.93896484375, -18.151611328125, -17.3642578125, -16.576904296875, -15.78955078125, -15.002197265625, -14.21484375, -13.427490234375, -12.64013671875, -11.852783203125, -11.0654296875, -10.278076171875, -9.49072265625, -8.703369140625, -7.916015625, -7.128662109375, -6.34130859375, -5.553955078125, -4.7666015625, -3.979248046875, -3.19189453125, -2.404541015625, -1.6171875, -0.829833984375, -0.04248046875, 0.744873046875, 1.5322265625, 2.319580078125, 3.10693359375, 3.894287109375, 4.681640625, 5.468994140625, 6.25634765625, 7.043701171875, 7.8310546875, 8.618408203125, 9.40576171875, 10.193115234375, 10.98046875, 11.767822265625, 12.55517578125, 13.342529296875, 14.1298828125, 14.917236328125, 15.70458984375, 16.491943359375, 17.279296875, 18.066650390625, 18.85400390625, 19.641357421875, 20.4287109375, 21.216064453125, 22.00341796875, 22.790771484375, 23.578125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 3.0, 10.0, 11.0, 41.0, 50.0, 69.0, 127.0, 204.0, 400.0, 641.0, 1035.0, 1627.0, 2782.0, 4716.0, 7703.0, 12612.0, 20542.0, 31683.0, 49293.0, 74771.0, 108111.0, 152729.0, 207191.0, 264061.0, 322915.0, 370021.0, 399105.0, 402118.0, 381863.0, 338299.0, 284052.0, 223419.0, 170022.0, 121869.0, 84997.0, 57069.0, 36938.0, 23518.0, 14812.0, 9196.0, 5376.0, 3285.0, 2014.0, 1187.0, 717.0, 453.0, 229.0, 146.0, 94.0, 63.0, 34.0, 28.0, 15.0, 14.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.2734375, -12.8333740234375, -12.393310546875, -11.9532470703125, -11.51318359375, -11.0731201171875, -10.633056640625, -10.1929931640625, -9.7529296875, -9.3128662109375, -8.872802734375, -8.4327392578125, -7.99267578125, -7.5526123046875, -7.112548828125, -6.6724853515625, -6.232421875, -5.7923583984375, -5.352294921875, -4.9122314453125, -4.47216796875, -4.0321044921875, -3.592041015625, -3.1519775390625, -2.7119140625, -2.2718505859375, -1.831787109375, -1.3917236328125, -0.95166015625, -0.5115966796875, -0.071533203125, 0.3685302734375, 0.80859375, 1.2486572265625, 1.688720703125, 2.1287841796875, 2.56884765625, 3.0089111328125, 3.448974609375, 3.8890380859375, 4.3291015625, 4.7691650390625, 5.209228515625, 5.6492919921875, 6.08935546875, 6.5294189453125, 6.969482421875, 7.4095458984375, 7.849609375, 8.2896728515625, 8.729736328125, 9.1697998046875, 9.60986328125, 10.0499267578125, 10.489990234375, 10.9300537109375, 11.3701171875, 11.8101806640625, 12.250244140625, 12.6903076171875, 13.13037109375, 13.5704345703125, 14.010498046875, 14.4505615234375, 14.890625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 7.0, 8.0, 8.0, 16.0, 17.0, 23.0, 26.0, 33.0, 47.0, 47.0, 65.0, 89.0, 94.0, 139.0, 131.0, 179.0, 160.0, 187.0, 215.0, 213.0, 218.0, 239.0, 215.0, 205.0, 199.0, 186.0, 171.0, 160.0, 128.0, 130.0, 100.0, 73.0, 88.0, 71.0, 54.0, 26.0, 23.0, 25.0, 22.0, 10.0, 10.0, 10.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1875, -8.880615234375, -8.57373046875, -8.266845703125, -7.9599609375, -7.653076171875, -7.34619140625, -7.039306640625, -6.732421875, -6.425537109375, -6.11865234375, -5.811767578125, -5.5048828125, -5.197998046875, -4.89111328125, -4.584228515625, -4.27734375, -3.970458984375, -3.66357421875, -3.356689453125, -3.0498046875, -2.742919921875, -2.43603515625, -2.129150390625, -1.822265625, -1.515380859375, -1.20849609375, -0.901611328125, -0.5947265625, -0.287841796875, 0.01904296875, 0.325927734375, 0.6328125, 0.939697265625, 1.24658203125, 1.553466796875, 1.8603515625, 2.167236328125, 2.47412109375, 2.781005859375, 3.087890625, 3.394775390625, 3.70166015625, 4.008544921875, 4.3154296875, 4.622314453125, 4.92919921875, 5.236083984375, 5.54296875, 5.849853515625, 6.15673828125, 6.463623046875, 6.7705078125, 7.077392578125, 7.38427734375, 7.691162109375, 7.998046875, 8.304931640625, 8.61181640625, 8.918701171875, 9.2255859375, 9.532470703125, 9.83935546875, 10.146240234375, 10.453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 8.0, 7.0, 2.0, 6.0, 7.0, 4.0, 6.0, 9.0, 7.0, 9.0, 13.0, 10.0, 19.0, 20.0, 23.0, 26.0, 32.0, 27.0, 32.0, 41.0, 41.0, 44.0, 52.0, 39.0, 41.0, 53.0, 39.0, 42.0, 32.0, 37.0, 42.0, 29.0, 32.0, 24.0, 26.0, 29.0, 15.0, 13.0, 13.0, 8.0, 10.0, 12.0, 9.0, 5.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-18.765586853027344, -18.15207862854004, -17.538570404052734, -16.925060272216797, -16.311552047729492, -15.698043823242188, -15.084534645080566, -14.471025466918945, -13.85751724243164, -13.244009017944336, -12.630499839782715, -12.016990661621094, -11.403482437133789, -10.789974212646484, -10.176465034484863, -9.562955856323242, -8.949447631835938, -8.335939407348633, -7.722430229187012, -7.108921527862549, -6.495412826538086, -5.881904125213623, -5.26839542388916, -4.654886722564697, -4.041378021240234, -3.4278693199157715, -2.8143606185913086, -2.2008519172668457, -1.5873432159423828, -0.9738345146179199, -0.36032581329345703, 0.25318288803100586, 0.8666896820068359, 1.4801983833312988, 2.0937070846557617, 2.7072157859802246, 3.3207244873046875, 3.9342331886291504, 4.547741889953613, 5.161250591278076, 5.774759292602539, 6.388267993927002, 7.001776695251465, 7.615285396575928, 8.22879409790039, 8.842302322387695, 9.455811500549316, 10.069320678710938, 10.682828903198242, 11.296337127685547, 11.909846305847168, 12.523355484008789, 13.136863708496094, 13.750371932983398, 14.36388111114502, 14.97739028930664, 15.590898513793945, 16.20440673828125, 16.817916870117188, 17.431425094604492, 18.044933319091797, 18.6584415435791, 19.271949768066406, 19.885459899902344, 20.49896812438965]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 3.0, 7.0, 5.0, 14.0, 10.0, 16.0, 15.0, 26.0, 21.0, 26.0, 29.0, 29.0, 28.0, 44.0, 49.0, 53.0, 46.0, 41.0, 42.0, 60.0, 40.0, 46.0, 37.0, 46.0, 36.0, 36.0, 39.0, 18.0, 22.0, 21.0, 22.0, 18.0, 12.0, 8.0, 7.0, 7.0, 11.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.990938186645508, -29.099899291992188, -28.208860397338867, -27.31782341003418, -26.42678451538086, -25.53574562072754, -24.64470672607422, -23.75366973876953, -22.86263084411621, -21.97159194946289, -21.08055305480957, -20.189516067504883, -19.298477172851562, -18.407438278198242, -17.516399383544922, -16.625362396240234, -15.734322547912598, -14.843283653259277, -13.952245712280273, -13.061206817626953, -12.17016887664795, -11.279129981994629, -10.388092041015625, -9.497053146362305, -8.606014251708984, -7.714975833892822, -6.82393741607666, -5.93289852142334, -5.041860580444336, -4.150821685791016, -3.2597832679748535, -2.3687448501586914, -1.4777069091796875, -0.5866684317588806, 0.30437004566192627, 1.195408582687378, 2.08644700050354, 2.9774856567382812, 3.8685240745544434, 4.7595624923706055, 5.650600910186768, 6.54163932800293, 7.432677745819092, 8.323716163635254, 9.214755058288574, 10.105792999267578, 10.996831893920898, 11.887870788574219, 12.778908729553223, 13.669947624206543, 14.560985565185547, 15.452024459838867, 16.343063354492188, 17.234100341796875, 18.125139236450195, 19.016178131103516, 19.907217025756836, 20.798255920410156, 21.689294815063477, 22.580331802368164, 23.471370697021484, 24.362409591674805, 25.253448486328125, 26.144485473632812, 27.035524368286133]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 10.0, 5.0, 13.0, 31.0, 34.0, 55.0, 134.0, 218.0, 346.0, 588.0, 1011.0, 1778.0, 3048.0, 5495.0, 8977.0, 15406.0, 25139.0, 40088.0, 60288.0, 85819.0, 111582.0, 130812.0, 134317.0, 122191.0, 98876.0, 72317.0, 49783.0, 31870.0, 19791.0, 11930.0, 6918.0, 4119.0, 2391.0, 1365.0, 743.0, 416.0, 292.0, 154.0, 80.0, 45.0, 30.0, 25.0, 9.0, 7.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-7.17578125, -6.9599609375, -6.744140625, -6.5283203125, -6.3125, -6.0966796875, -5.880859375, -5.6650390625, -5.44921875, -5.2333984375, -5.017578125, -4.8017578125, -4.5859375, -4.3701171875, -4.154296875, -3.9384765625, -3.72265625, -3.5068359375, -3.291015625, -3.0751953125, -2.859375, -2.6435546875, -2.427734375, -2.2119140625, -1.99609375, -1.7802734375, -1.564453125, -1.3486328125, -1.1328125, -0.9169921875, -0.701171875, -0.4853515625, -0.26953125, -0.0537109375, 0.162109375, 0.3779296875, 0.59375, 0.8095703125, 1.025390625, 1.2412109375, 1.45703125, 1.6728515625, 1.888671875, 2.1044921875, 2.3203125, 2.5361328125, 2.751953125, 2.9677734375, 3.18359375, 3.3994140625, 3.615234375, 3.8310546875, 4.046875, 4.2626953125, 4.478515625, 4.6943359375, 4.91015625, 5.1259765625, 5.341796875, 5.5576171875, 5.7734375, 5.9892578125, 6.205078125, 6.4208984375, 6.63671875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 4.0, 5.0, 3.0, 8.0, 4.0, 15.0, 8.0, 16.0, 15.0, 27.0, 21.0, 22.0, 30.0, 34.0, 25.0, 43.0, 50.0, 53.0, 45.0, 41.0, 43.0, 59.0, 38.0, 48.0, 36.0, 45.0, 38.0, 37.0, 37.0, 21.0, 21.0, 23.0, 21.0, 17.0, 13.0, 8.0, 7.0, 7.0, 10.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.078125, -29.185791015625, -28.29345703125, -27.401123046875, -26.5087890625, -25.616455078125, -24.72412109375, -23.831787109375, -22.939453125, -22.047119140625, -21.15478515625, -20.262451171875, -19.3701171875, -18.477783203125, -17.58544921875, -16.693115234375, -15.80078125, -14.908447265625, -14.01611328125, -13.123779296875, -12.2314453125, -11.339111328125, -10.44677734375, -9.554443359375, -8.662109375, -7.769775390625, -6.87744140625, -5.985107421875, -5.0927734375, -4.200439453125, -3.30810546875, -2.415771484375, -1.5234375, -0.631103515625, 0.26123046875, 1.153564453125, 2.0458984375, 2.938232421875, 3.83056640625, 4.722900390625, 5.615234375, 6.507568359375, 7.39990234375, 8.292236328125, 9.1845703125, 10.076904296875, 10.96923828125, 11.861572265625, 12.75390625, 13.646240234375, 14.53857421875, 15.430908203125, 16.3232421875, 17.215576171875, 18.10791015625, 19.000244140625, 19.892578125, 20.784912109375, 21.67724609375, 22.569580078125, 23.4619140625, 24.354248046875, 25.24658203125, 26.138916015625, 27.03125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 13.0, 13.0, 19.0, 28.0, 30.0, 40.0, 64.0, 99.0, 140.0, 200.0, 268.0, 366.0, 528.0, 744.0, 1003.0, 1512.0, 2093.0, 3193.0, 4570.0, 6887.0, 10181.0, 15854.0, 25584.0, 110996.0, 766973.0, 37130.0, 20469.0, 12832.0, 8370.0, 5591.0, 3942.0, 2575.0, 1856.0, 1350.0, 893.0, 608.0, 456.0, 349.0, 231.0, 161.0, 96.0, 69.0, 56.0, 35.0, 34.0, 17.0, 8.0, 7.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.3125, -15.773681640625, -15.23486328125, -14.696044921875, -14.1572265625, -13.618408203125, -13.07958984375, -12.540771484375, -12.001953125, -11.463134765625, -10.92431640625, -10.385498046875, -9.8466796875, -9.307861328125, -8.76904296875, -8.230224609375, -7.69140625, -7.152587890625, -6.61376953125, -6.074951171875, -5.5361328125, -4.997314453125, -4.45849609375, -3.919677734375, -3.380859375, -2.842041015625, -2.30322265625, -1.764404296875, -1.2255859375, -0.686767578125, -0.14794921875, 0.390869140625, 0.9296875, 1.468505859375, 2.00732421875, 2.546142578125, 3.0849609375, 3.623779296875, 4.16259765625, 4.701416015625, 5.240234375, 5.779052734375, 6.31787109375, 6.856689453125, 7.3955078125, 7.934326171875, 8.47314453125, 9.011962890625, 9.55078125, 10.089599609375, 10.62841796875, 11.167236328125, 11.7060546875, 12.244873046875, 12.78369140625, 13.322509765625, 13.861328125, 14.400146484375, 14.93896484375, 15.477783203125, 16.0166015625, 16.555419921875, 17.09423828125, 17.633056640625, 18.171875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 2.0, 2.0, 7.0, 3.0, 6.0, 8.0, 14.0, 7.0, 17.0, 21.0, 14.0, 18.0, 21.0, 27.0, 24.0, 25.0, 28.0, 29.0, 28.0, 32.0, 30.0, 43.0, 34.0, 37.0, 43.0, 32.0, 48.0, 36.0, 36.0, 36.0, 32.0, 34.0, 39.0, 27.0, 22.0, 26.0, 19.0, 17.0, 12.0, 12.0, 9.0, 8.0, 8.0, 12.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-18.5625, -17.99951171875, -17.4365234375, -16.87353515625, -16.310546875, -15.74755859375, -15.1845703125, -14.62158203125, -14.05859375, -13.49560546875, -12.9326171875, -12.36962890625, -11.806640625, -11.24365234375, -10.6806640625, -10.11767578125, -9.5546875, -8.99169921875, -8.4287109375, -7.86572265625, -7.302734375, -6.73974609375, -6.1767578125, -5.61376953125, -5.05078125, -4.48779296875, -3.9248046875, -3.36181640625, -2.798828125, -2.23583984375, -1.6728515625, -1.10986328125, -0.546875, 0.01611328125, 0.5791015625, 1.14208984375, 1.705078125, 2.26806640625, 2.8310546875, 3.39404296875, 3.95703125, 4.52001953125, 5.0830078125, 5.64599609375, 6.208984375, 6.77197265625, 7.3349609375, 7.89794921875, 8.4609375, 9.02392578125, 9.5869140625, 10.14990234375, 10.712890625, 11.27587890625, 11.8388671875, 12.40185546875, 12.96484375, 13.52783203125, 14.0908203125, 14.65380859375, 15.216796875, 15.77978515625, 16.3427734375, 16.90576171875, 17.46875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 10.0, 8.0, 9.0, 14.0, 21.0, 23.0, 46.0, 47.0, 78.0, 106.0, 146.0, 187.0, 299.0, 438.0, 666.0, 1036.0, 1531.0, 2435.0, 3829.0, 6460.0, 11270.0, 21027.0, 52958.0, 829930.0, 63849.0, 22067.0, 11887.0, 6748.0, 4082.0, 2488.0, 1645.0, 1003.0, 670.0, 461.0, 342.0, 215.0, 143.0, 100.0, 79.0, 58.0, 38.0, 26.0, 16.0, 15.0, 11.0, 12.0, 8.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0], "bins": [-1.7275390625, -1.6760406494140625, -1.624542236328125, -1.5730438232421875, -1.52154541015625, -1.4700469970703125, -1.418548583984375, -1.3670501708984375, -1.3155517578125, -1.2640533447265625, -1.212554931640625, -1.1610565185546875, -1.10955810546875, -1.0580596923828125, -1.006561279296875, -0.9550628662109375, -0.903564453125, -0.8520660400390625, -0.800567626953125, -0.7490692138671875, -0.69757080078125, -0.6460723876953125, -0.594573974609375, -0.5430755615234375, -0.4915771484375, -0.4400787353515625, -0.388580322265625, -0.3370819091796875, -0.28558349609375, -0.2340850830078125, -0.182586669921875, -0.1310882568359375, -0.07958984375, -0.0280914306640625, 0.023406982421875, 0.0749053955078125, 0.12640380859375, 0.1779022216796875, 0.229400634765625, 0.2808990478515625, 0.3323974609375, 0.3838958740234375, 0.435394287109375, 0.4868927001953125, 0.53839111328125, 0.5898895263671875, 0.641387939453125, 0.6928863525390625, 0.744384765625, 0.7958831787109375, 0.847381591796875, 0.8988800048828125, 0.95037841796875, 1.0018768310546875, 1.053375244140625, 1.1048736572265625, 1.1563720703125, 1.2078704833984375, 1.259368896484375, 1.3108673095703125, 1.36236572265625, 1.4138641357421875, 1.465362548828125, 1.5168609619140625, 1.568359375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 0.0, 6.0, 3.0, 2.0, 2.0, 11.0, 11.0, 16.0, 15.0, 16.0, 14.0, 32.0, 42.0, 45.0, 50.0, 68.0, 58.0, 68.0, 62.0, 69.0, 68.0, 64.0, 34.0, 48.0, 42.0, 29.0, 21.0, 23.0, 15.0, 17.0, 14.0, 10.0, 9.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011360645294189453, -0.0001100003719329834, -0.00010639429092407227, -0.00010278820991516113, -9.918212890625e-05, -9.557604789733887e-05, -9.196996688842773e-05, -8.83638858795166e-05, -8.475780487060547e-05, -8.115172386169434e-05, -7.75456428527832e-05, -7.393956184387207e-05, -7.033348083496094e-05, -6.67273998260498e-05, -6.312131881713867e-05, -5.951523780822754e-05, -5.5909156799316406e-05, -5.2303075790405273e-05, -4.869699478149414e-05, -4.509091377258301e-05, -4.1484832763671875e-05, -3.787875175476074e-05, -3.427267074584961e-05, -3.0666589736938477e-05, -2.7060508728027344e-05, -2.345442771911621e-05, -1.9848346710205078e-05, -1.6242265701293945e-05, -1.2636184692382812e-05, -9.03010368347168e-06, -5.424022674560547e-06, -1.817941665649414e-06, 1.7881393432617188e-06, 5.3942203521728516e-06, 9.000301361083984e-06, 1.2606382369995117e-05, 1.621246337890625e-05, 1.9818544387817383e-05, 2.3424625396728516e-05, 2.703070640563965e-05, 3.063678741455078e-05, 3.4242868423461914e-05, 3.784894943237305e-05, 4.145503044128418e-05, 4.506111145019531e-05, 4.8667192459106445e-05, 5.227327346801758e-05, 5.587935447692871e-05, 5.9485435485839844e-05, 6.309151649475098e-05, 6.669759750366211e-05, 7.030367851257324e-05, 7.390975952148438e-05, 7.751584053039551e-05, 8.112192153930664e-05, 8.472800254821777e-05, 8.83340835571289e-05, 9.194016456604004e-05, 9.554624557495117e-05, 9.91523265838623e-05, 0.00010275840759277344, 0.00010636448860168457, 0.0001099705696105957, 0.00011357665061950684, 0.00011718273162841797]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 11.0, 7.0, 9.0, 23.0, 57.0, 43.0, 98.0, 106.0, 172.0, 301.0, 402.0, 627.0, 953.0, 1423.0, 2266.0, 3627.0, 5666.0, 9026.0, 14383.0, 22976.0, 35794.0, 53584.0, 76732.0, 101318.0, 123044.0, 131446.0, 123387.0, 103693.0, 79451.0, 56379.0, 36728.0, 23725.0, 15005.0, 9511.0, 6065.0, 3781.0, 2315.0, 1525.0, 983.0, 612.0, 448.0, 295.0, 169.0, 136.0, 85.0, 53.0, 37.0, 23.0, 15.0, 12.0, 15.0, 9.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.85107421875, -0.8240966796875, -0.797119140625, -0.7701416015625, -0.7431640625, -0.7161865234375, -0.689208984375, -0.6622314453125, -0.63525390625, -0.6082763671875, -0.581298828125, -0.5543212890625, -0.52734375, -0.5003662109375, -0.473388671875, -0.4464111328125, -0.41943359375, -0.3924560546875, -0.365478515625, -0.3385009765625, -0.3115234375, -0.2845458984375, -0.257568359375, -0.2305908203125, -0.20361328125, -0.1766357421875, -0.149658203125, -0.1226806640625, -0.095703125, -0.0687255859375, -0.041748046875, -0.0147705078125, 0.01220703125, 0.0391845703125, 0.066162109375, 0.0931396484375, 0.1201171875, 0.1470947265625, 0.174072265625, 0.2010498046875, 0.22802734375, 0.2550048828125, 0.281982421875, 0.3089599609375, 0.3359375, 0.3629150390625, 0.389892578125, 0.4168701171875, 0.44384765625, 0.4708251953125, 0.497802734375, 0.5247802734375, 0.5517578125, 0.5787353515625, 0.605712890625, 0.6326904296875, 0.65966796875, 0.6866455078125, 0.713623046875, 0.7406005859375, 0.767578125, 0.7945556640625, 0.821533203125, 0.8485107421875, 0.87548828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 9.0, 6.0, 6.0, 13.0, 7.0, 18.0, 16.0, 13.0, 17.0, 18.0, 21.0, 34.0, 33.0, 29.0, 32.0, 28.0, 32.0, 41.0, 32.0, 36.0, 39.0, 33.0, 37.0, 37.0, 39.0, 33.0, 29.0, 36.0, 34.0, 29.0, 27.0, 36.0, 25.0, 14.0, 22.0, 14.0, 13.0, 16.0, 14.0, 5.0, 7.0, 6.0, 5.0, 2.0, 5.0, 1.0, 2.0, 5.0, 4.0], "bins": [-0.491455078125, -0.4779319763183594, -0.46440887451171875, -0.4508857727050781, -0.4373626708984375, -0.4238395690917969, -0.41031646728515625, -0.3967933654785156, -0.383270263671875, -0.3697471618652344, -0.35622406005859375, -0.3427009582519531, -0.3291778564453125, -0.3156547546386719, -0.30213165283203125, -0.2886085510253906, -0.27508544921875, -0.2615623474121094, -0.24803924560546875, -0.23451614379882812, -0.2209930419921875, -0.20746994018554688, -0.19394683837890625, -0.18042373657226562, -0.166900634765625, -0.15337753295898438, -0.13985443115234375, -0.12633132934570312, -0.1128082275390625, -0.09928512573242188, -0.08576202392578125, -0.07223892211914062, -0.0587158203125, -0.045192718505859375, -0.03166961669921875, -0.018146514892578125, -0.0046234130859375, 0.008899688720703125, 0.02242279052734375, 0.035945892333984375, 0.049468994140625, 0.06299209594726562, 0.07651519775390625, 0.09003829956054688, 0.1035614013671875, 0.11708450317382812, 0.13060760498046875, 0.14413070678710938, 0.15765380859375, 0.17117691040039062, 0.18470001220703125, 0.19822311401367188, 0.2117462158203125, 0.22526931762695312, 0.23879241943359375, 0.2523155212402344, 0.265838623046875, 0.2793617248535156, 0.29288482666015625, 0.3064079284667969, 0.3199310302734375, 0.3334541320800781, 0.34697723388671875, 0.3605003356933594, 0.3740234375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 3.0, 6.0, 8.0, 7.0, 9.0, 11.0, 13.0, 13.0, 12.0, 30.0, 10.0, 25.0, 32.0, 34.0, 38.0, 41.0, 40.0, 37.0, 50.0, 44.0, 60.0, 39.0, 46.0, 41.0, 36.0, 42.0, 32.0, 33.0, 23.0, 29.0, 26.0, 25.0, 17.0, 13.0, 8.0, 10.0, 11.0, 8.0, 10.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.259614944458008, -18.628694534301758, -17.99777603149414, -17.36685562133789, -16.735937118530273, -16.105016708374023, -15.474098205566406, -14.843177795410156, -14.212259292602539, -13.581339836120605, -12.950420379638672, -12.319500923156738, -11.688581466674805, -11.057662010192871, -10.426742553710938, -9.795822143554688, -9.164902687072754, -8.53398323059082, -7.903063774108887, -7.272144317626953, -6.6412248611450195, -6.010305404663086, -5.379385471343994, -4.7484660148620605, -4.117546558380127, -3.4866271018981934, -2.8557076454162598, -2.224787950515747, -1.5938684940338135, -0.9629490375518799, -0.3320293426513672, 0.2988901138305664, 0.9298095703125, 1.5607290267944336, 2.191648483276367, 2.82256817817688, 3.4534876346588135, 4.084406852722168, 4.71532678604126, 5.346246242523193, 5.977165699005127, 6.6080851554870605, 7.239004611968994, 7.869924545288086, 8.50084400177002, 9.131763458251953, 9.762682914733887, 10.39360237121582, 11.024521827697754, 11.655441284179688, 12.286360740661621, 12.917280197143555, 13.548199653625488, 14.179119110107422, 14.810039520263672, 15.440958023071289, 16.07187843322754, 16.70279884338379, 17.333717346191406, 17.964637756347656, 18.595556259155273, 19.226476669311523, 19.85739517211914, 20.48831558227539, 21.119234085083008]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 2.0, 3.0, 10.0, 10.0, 14.0, 12.0, 14.0, 22.0, 16.0, 25.0, 36.0, 29.0, 21.0, 35.0, 50.0, 50.0, 48.0, 46.0, 48.0, 41.0, 50.0, 46.0, 47.0, 35.0, 47.0, 29.0, 38.0, 28.0, 24.0, 18.0, 22.0, 20.0, 18.0, 11.0, 6.0, 7.0, 8.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-30.513530731201172, -29.620023727416992, -28.726516723632812, -27.833009719848633, -26.939502716064453, -26.04599380493164, -25.15248680114746, -24.25897979736328, -23.3654727935791, -22.471965789794922, -21.578458786010742, -20.684951782226562, -19.79144287109375, -18.897937774658203, -18.00442886352539, -17.11092185974121, -16.21741485595703, -15.323907852172852, -14.430400848388672, -13.536892890930176, -12.643385887145996, -11.749878883361816, -10.85637092590332, -9.96286392211914, -9.069356918334961, -8.175849914550781, -7.282342433929443, -6.3888349533081055, -5.495327949523926, -4.601820945739746, -3.708313465118408, -2.8148059844970703, -1.9212989807128906, -1.0277917385101318, -0.13428449630737305, 0.7592227458953857, 1.6527299880981445, 2.546236991882324, 3.439744472503662, 4.333251953125, 5.22675895690918, 6.120265960693359, 7.013773441314697, 7.907280921936035, 8.800787925720215, 9.694294929504395, 10.58780288696289, 11.48130989074707, 12.37481689453125, 13.26832389831543, 14.16183090209961, 15.055338859558105, 15.948845863342285, 16.84235382080078, 17.73586082458496, 18.62936782836914, 19.52287483215332, 20.4163818359375, 21.30988883972168, 22.20339584350586, 23.096904754638672, 23.99040985107422, 24.88391876220703, 25.77742576599121, 26.67093276977539]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 8.0, 10.0, 17.0, 13.0, 18.0, 30.0, 69.0, 87.0, 170.0, 233.0, 402.0, 575.0, 956.0, 1619.0, 2645.0, 4372.0, 7254.0, 11592.0, 18425.0, 28183.0, 41667.0, 58578.0, 77708.0, 96028.0, 111235.0, 115865.0, 110045.0, 98131.0, 79727.0, 60108.0, 43019.0, 29422.0, 19148.0, 12040.0, 7483.0, 4706.0, 2774.0, 1660.0, 955.0, 593.0, 332.0, 226.0, 161.0, 95.0, 56.0, 44.0, 35.0, 14.0, 9.0, 7.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.6875, -16.158447265625, -15.62939453125, -15.100341796875, -14.5712890625, -14.042236328125, -13.51318359375, -12.984130859375, -12.455078125, -11.926025390625, -11.39697265625, -10.867919921875, -10.3388671875, -9.809814453125, -9.28076171875, -8.751708984375, -8.22265625, -7.693603515625, -7.16455078125, -6.635498046875, -6.1064453125, -5.577392578125, -5.04833984375, -4.519287109375, -3.990234375, -3.461181640625, -2.93212890625, -2.403076171875, -1.8740234375, -1.344970703125, -0.81591796875, -0.286865234375, 0.2421875, 0.771240234375, 1.30029296875, 1.829345703125, 2.3583984375, 2.887451171875, 3.41650390625, 3.945556640625, 4.474609375, 5.003662109375, 5.53271484375, 6.061767578125, 6.5908203125, 7.119873046875, 7.64892578125, 8.177978515625, 8.70703125, 9.236083984375, 9.76513671875, 10.294189453125, 10.8232421875, 11.352294921875, 11.88134765625, 12.410400390625, 12.939453125, 13.468505859375, 13.99755859375, 14.526611328125, 15.0556640625, 15.584716796875, 16.11376953125, 16.642822265625, 17.171875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 2.0, 2.0, 10.0, 10.0, 13.0, 12.0, 14.0, 21.0, 15.0, 26.0, 31.0, 33.0, 25.0, 27.0, 53.0, 51.0, 48.0, 46.0, 50.0, 39.0, 52.0, 43.0, 53.0, 31.0, 51.0, 29.0, 37.0, 32.0, 20.0, 20.0, 24.0, 17.0, 16.0, 11.0, 6.0, 9.0, 11.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-29.765625, -28.8955078125, -28.025390625, -27.1552734375, -26.28515625, -25.4150390625, -24.544921875, -23.6748046875, -22.8046875, -21.9345703125, -21.064453125, -20.1943359375, -19.32421875, -18.4541015625, -17.583984375, -16.7138671875, -15.84375, -14.9736328125, -14.103515625, -13.2333984375, -12.36328125, -11.4931640625, -10.623046875, -9.7529296875, -8.8828125, -8.0126953125, -7.142578125, -6.2724609375, -5.40234375, -4.5322265625, -3.662109375, -2.7919921875, -1.921875, -1.0517578125, -0.181640625, 0.6884765625, 1.55859375, 2.4287109375, 3.298828125, 4.1689453125, 5.0390625, 5.9091796875, 6.779296875, 7.6494140625, 8.51953125, 9.3896484375, 10.259765625, 11.1298828125, 12.0, 12.8701171875, 13.740234375, 14.6103515625, 15.48046875, 16.3505859375, 17.220703125, 18.0908203125, 18.9609375, 19.8310546875, 20.701171875, 21.5712890625, 22.44140625, 23.3115234375, 24.181640625, 25.0517578125, 25.921875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 12.0, 8.0, 14.0, 15.0, 38.0, 52.0, 104.0, 168.0, 259.0, 375.0, 616.0, 1021.0, 1687.0, 2603.0, 4365.0, 6952.0, 10962.0, 17091.0, 25865.0, 37844.0, 53336.0, 71389.0, 89526.0, 103736.0, 111801.0, 109689.0, 100802.0, 84161.0, 66313.0, 49230.0, 34236.0, 23302.0, 15067.0, 9638.0, 6126.0, 3935.0, 2368.0, 1431.0, 890.0, 591.0, 360.0, 215.0, 135.0, 87.0, 59.0, 43.0, 24.0, 13.0, 9.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.375, -15.844482421875, -15.31396484375, -14.783447265625, -14.2529296875, -13.722412109375, -13.19189453125, -12.661376953125, -12.130859375, -11.600341796875, -11.06982421875, -10.539306640625, -10.0087890625, -9.478271484375, -8.94775390625, -8.417236328125, -7.88671875, -7.356201171875, -6.82568359375, -6.295166015625, -5.7646484375, -5.234130859375, -4.70361328125, -4.173095703125, -3.642578125, -3.112060546875, -2.58154296875, -2.051025390625, -1.5205078125, -0.989990234375, -0.45947265625, 0.071044921875, 0.6015625, 1.132080078125, 1.66259765625, 2.193115234375, 2.7236328125, 3.254150390625, 3.78466796875, 4.315185546875, 4.845703125, 5.376220703125, 5.90673828125, 6.437255859375, 6.9677734375, 7.498291015625, 8.02880859375, 8.559326171875, 9.08984375, 9.620361328125, 10.15087890625, 10.681396484375, 11.2119140625, 11.742431640625, 12.27294921875, 12.803466796875, 13.333984375, 13.864501953125, 14.39501953125, 14.925537109375, 15.4560546875, 15.986572265625, 16.51708984375, 17.047607421875, 17.578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 7.0, 3.0, 5.0, 7.0, 11.0, 6.0, 17.0, 9.0, 13.0, 7.0, 18.0, 20.0, 21.0, 32.0, 22.0, 28.0, 26.0, 34.0, 38.0, 44.0, 40.0, 44.0, 39.0, 42.0, 49.0, 41.0, 35.0, 38.0, 45.0, 33.0, 38.0, 32.0, 19.0, 28.0, 24.0, 15.0, 19.0, 19.0, 2.0, 7.0, 4.0, 7.0, 5.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 4.0], "bins": [-18.265625, -17.760498046875, -17.25537109375, -16.750244140625, -16.2451171875, -15.739990234375, -15.23486328125, -14.729736328125, -14.224609375, -13.719482421875, -13.21435546875, -12.709228515625, -12.2041015625, -11.698974609375, -11.19384765625, -10.688720703125, -10.18359375, -9.678466796875, -9.17333984375, -8.668212890625, -8.1630859375, -7.657958984375, -7.15283203125, -6.647705078125, -6.142578125, -5.637451171875, -5.13232421875, -4.627197265625, -4.1220703125, -3.616943359375, -3.11181640625, -2.606689453125, -2.1015625, -1.596435546875, -1.09130859375, -0.586181640625, -0.0810546875, 0.424072265625, 0.92919921875, 1.434326171875, 1.939453125, 2.444580078125, 2.94970703125, 3.454833984375, 3.9599609375, 4.465087890625, 4.97021484375, 5.475341796875, 5.98046875, 6.485595703125, 6.99072265625, 7.495849609375, 8.0009765625, 8.506103515625, 9.01123046875, 9.516357421875, 10.021484375, 10.526611328125, 11.03173828125, 11.536865234375, 12.0419921875, 12.547119140625, 13.05224609375, 13.557373046875, 14.0625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 7.0, 11.0, 12.0, 24.0, 24.0, 50.0, 77.0, 137.0, 236.0, 375.0, 609.0, 975.0, 1750.0, 2822.0, 4926.0, 8162.0, 13985.0, 23920.0, 39138.0, 62073.0, 92140.0, 122569.0, 143209.0, 144439.0, 125035.0, 94773.0, 64657.0, 41356.0, 24908.0, 14946.0, 8678.0, 5132.0, 2966.0, 1692.0, 1104.0, 615.0, 375.0, 242.0, 146.0, 110.0, 51.0, 41.0, 27.0, 7.0, 12.0, 9.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-8.3984375, -8.1279296875, -7.857421875, -7.5869140625, -7.31640625, -7.0458984375, -6.775390625, -6.5048828125, -6.234375, -5.9638671875, -5.693359375, -5.4228515625, -5.15234375, -4.8818359375, -4.611328125, -4.3408203125, -4.0703125, -3.7998046875, -3.529296875, -3.2587890625, -2.98828125, -2.7177734375, -2.447265625, -2.1767578125, -1.90625, -1.6357421875, -1.365234375, -1.0947265625, -0.82421875, -0.5537109375, -0.283203125, -0.0126953125, 0.2578125, 0.5283203125, 0.798828125, 1.0693359375, 1.33984375, 1.6103515625, 1.880859375, 2.1513671875, 2.421875, 2.6923828125, 2.962890625, 3.2333984375, 3.50390625, 3.7744140625, 4.044921875, 4.3154296875, 4.5859375, 4.8564453125, 5.126953125, 5.3974609375, 5.66796875, 5.9384765625, 6.208984375, 6.4794921875, 6.75, 7.0205078125, 7.291015625, 7.5615234375, 7.83203125, 8.1025390625, 8.373046875, 8.6435546875, 8.9140625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 3.0, 5.0, 7.0, 7.0, 14.0, 15.0, 15.0, 15.0, 23.0, 38.0, 39.0, 28.0, 37.0, 50.0, 43.0, 42.0, 42.0, 48.0, 57.0, 55.0, 51.0, 39.0, 46.0, 47.0, 35.0, 31.0, 26.0, 16.0, 23.0, 15.0, 14.0, 13.0, 13.0, 10.0, 4.0, 10.0, 2.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0008306503295898438, -0.0008050352334976196, -0.0007794201374053955, -0.0007538050413131714, -0.0007281899452209473, -0.0007025748491287231, -0.000676959753036499, -0.0006513446569442749, -0.0006257295608520508, -0.0006001144647598267, -0.0005744993686676025, -0.0005488842725753784, -0.0005232691764831543, -0.0004976540803909302, -0.00047203898429870605, -0.00044642388820648193, -0.0004208087921142578, -0.0003951936960220337, -0.00036957859992980957, -0.00034396350383758545, -0.00031834840774536133, -0.0002927333116531372, -0.0002671182155609131, -0.00024150311946868896, -0.00021588802337646484, -0.00019027292728424072, -0.0001646578311920166, -0.00013904273509979248, -0.00011342763900756836, -8.781254291534424e-05, -6.219744682312012e-05, -3.6582350730895996e-05, -1.0967254638671875e-05, 1.4647841453552246e-05, 4.026293754577637e-05, 6.587803363800049e-05, 9.149312973022461e-05, 0.00011710822582244873, 0.00014272332191467285, 0.00016833841800689697, 0.0001939535140991211, 0.00021956861019134521, 0.00024518370628356934, 0.00027079880237579346, 0.0002964138984680176, 0.0003220289945602417, 0.0003476440906524658, 0.00037325918674468994, 0.00039887428283691406, 0.0004244893789291382, 0.0004501044750213623, 0.0004757195711135864, 0.0005013346672058105, 0.0005269497632980347, 0.0005525648593902588, 0.0005781799554824829, 0.000603795051574707, 0.0006294101476669312, 0.0006550252437591553, 0.0006806403398513794, 0.0007062554359436035, 0.0007318705320358276, 0.0007574856281280518, 0.0007831007242202759, 0.0008087158203125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 5.0, 18.0, 19.0, 45.0, 47.0, 61.0, 116.0, 153.0, 263.0, 421.0, 616.0, 990.0, 1550.0, 2143.0, 3439.0, 5265.0, 7895.0, 12255.0, 18513.0, 27581.0, 40139.0, 56043.0, 75132.0, 94100.0, 108216.0, 114758.0, 111318.0, 97258.0, 79207.0, 59866.0, 42957.0, 29648.0, 20165.0, 13337.0, 8724.0, 5605.0, 3712.0, 2412.0, 1586.0, 1046.0, 695.0, 412.0, 286.0, 193.0, 111.0, 80.0, 56.0, 40.0, 19.0, 21.0, 8.0, 5.0, 3.0, 2.0, 2.0, 2.0], "bins": [-7.140625, -6.9281005859375, -6.715576171875, -6.5030517578125, -6.29052734375, -6.0780029296875, -5.865478515625, -5.6529541015625, -5.4404296875, -5.2279052734375, -5.015380859375, -4.8028564453125, -4.59033203125, -4.3778076171875, -4.165283203125, -3.9527587890625, -3.740234375, -3.5277099609375, -3.315185546875, -3.1026611328125, -2.89013671875, -2.6776123046875, -2.465087890625, -2.2525634765625, -2.0400390625, -1.8275146484375, -1.614990234375, -1.4024658203125, -1.18994140625, -0.9774169921875, -0.764892578125, -0.5523681640625, -0.33984375, -0.1273193359375, 0.085205078125, 0.2977294921875, 0.51025390625, 0.7227783203125, 0.935302734375, 1.1478271484375, 1.3603515625, 1.5728759765625, 1.785400390625, 1.9979248046875, 2.21044921875, 2.4229736328125, 2.635498046875, 2.8480224609375, 3.060546875, 3.2730712890625, 3.485595703125, 3.6981201171875, 3.91064453125, 4.1231689453125, 4.335693359375, 4.5482177734375, 4.7607421875, 4.9732666015625, 5.185791015625, 5.3983154296875, 5.61083984375, 5.8233642578125, 6.035888671875, 6.2484130859375, 6.4609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 10.0, 7.0, 9.0, 13.0, 15.0, 20.0, 23.0, 25.0, 20.0, 39.0, 42.0, 51.0, 51.0, 48.0, 48.0, 64.0, 47.0, 65.0, 57.0, 48.0, 39.0, 43.0, 35.0, 31.0, 31.0, 25.0, 16.0, 16.0, 14.0, 8.0, 7.0, 7.0, 6.0, 2.0, 0.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.9453125, -4.80438232421875, -4.6634521484375, -4.52252197265625, -4.381591796875, -4.24066162109375, -4.0997314453125, -3.95880126953125, -3.81787109375, -3.67694091796875, -3.5360107421875, -3.39508056640625, -3.254150390625, -3.11322021484375, -2.9722900390625, -2.83135986328125, -2.6904296875, -2.54949951171875, -2.4085693359375, -2.26763916015625, -2.126708984375, -1.98577880859375, -1.8448486328125, -1.70391845703125, -1.56298828125, -1.42205810546875, -1.2811279296875, -1.14019775390625, -0.999267578125, -0.85833740234375, -0.7174072265625, -0.57647705078125, -0.435546875, -0.29461669921875, -0.1536865234375, -0.01275634765625, 0.128173828125, 0.26910400390625, 0.4100341796875, 0.55096435546875, 0.69189453125, 0.83282470703125, 0.9737548828125, 1.11468505859375, 1.255615234375, 1.39654541015625, 1.5374755859375, 1.67840576171875, 1.8193359375, 1.96026611328125, 2.1011962890625, 2.24212646484375, 2.383056640625, 2.52398681640625, 2.6649169921875, 2.80584716796875, 2.94677734375, 3.08770751953125, 3.2286376953125, 3.36956787109375, 3.510498046875, 3.65142822265625, 3.7923583984375, 3.93328857421875, 4.07421875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 6.0, 5.0, 6.0, 1.0, 6.0, 9.0, 4.0, 14.0, 12.0, 19.0, 22.0, 26.0, 20.0, 29.0, 28.0, 28.0, 34.0, 33.0, 40.0, 43.0, 34.0, 46.0, 45.0, 32.0, 42.0, 37.0, 50.0, 47.0, 33.0, 32.0, 36.0, 26.0, 25.0, 15.0, 24.0, 12.0, 23.0, 12.0, 11.0, 6.0, 5.0, 8.0, 5.0, 5.0, 1.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-20.437000274658203, -19.82698631286621, -19.21697425842285, -18.60696029663086, -17.996946334838867, -17.386932373046875, -16.776920318603516, -16.166906356811523, -15.556893348693848, -14.946880340576172, -14.33686637878418, -13.726853370666504, -13.116840362548828, -12.506826400756836, -11.89681339263916, -11.286800384521484, -10.676786422729492, -10.066773414611816, -9.456759452819824, -8.846746444702148, -8.236732482910156, -7.6267194747924805, -7.016706466674805, -6.406692981719971, -5.796679496765137, -5.186666011810303, -4.576652526855469, -3.966639518737793, -3.356626033782959, -2.746612548828125, -2.13659930229187, -1.5265860557556152, -0.9165744781494141, -0.30656111240386963, 0.3034522533416748, 0.9134656190872192, 1.5234789848327637, 2.1334924697875977, 2.7435057163238525, 3.3535189628601074, 3.9635324478149414, 4.573545932769775, 5.183559417724609, 5.793572425842285, 6.403585910797119, 7.013599395751953, 7.623612403869629, 8.233625411987305, 8.843639373779297, 9.453652381896973, 10.063666343688965, 10.67367935180664, 11.283693313598633, 11.893706321716309, 12.503719329833984, 13.113733291625977, 13.723746299743652, 14.333759307861328, 14.94377326965332, 15.553786277770996, 16.163799285888672, 16.773813247680664, 17.383827209472656, 17.993839263916016, 18.603853225708008]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 9.0, 5.0, 6.0, 11.0, 19.0, 10.0, 11.0, 9.0, 22.0, 21.0, 25.0, 36.0, 25.0, 30.0, 34.0, 36.0, 33.0, 50.0, 67.0, 38.0, 34.0, 37.0, 38.0, 47.0, 41.0, 41.0, 22.0, 32.0, 35.0, 31.0, 21.0, 24.0, 14.0, 10.0, 14.0, 11.0, 13.0, 11.0, 9.0, 5.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-27.638744354248047, -26.830415725708008, -26.022085189819336, -25.213756561279297, -24.405427932739258, -23.59709930419922, -22.788768768310547, -21.980440139770508, -21.17211151123047, -20.36378288269043, -19.555452346801758, -18.74712371826172, -17.93879508972168, -17.13046646118164, -16.32213592529297, -15.51380729675293, -14.705476760864258, -13.897147178649902, -13.088818550109863, -12.280488967895508, -11.472160339355469, -10.663830757141113, -9.855501174926758, -9.047172546386719, -8.238842964172363, -7.430513858795166, -6.622184753417969, -5.813855171203613, -5.005526065826416, -4.197196960449219, -3.3888673782348633, -2.580538272857666, -1.772207260131836, -0.9638780355453491, -0.1555488109588623, 0.6527805328369141, 1.4611096382141113, 2.2694387435913086, 3.077768325805664, 3.8860974311828613, 4.694426536560059, 5.502755641937256, 6.311084747314453, 7.119414329528809, 7.927743434906006, 8.736072540283203, 9.544402122497559, 10.352731704711914, 11.161060333251953, 11.969389915466309, 12.777718544006348, 13.586048126220703, 14.394376754760742, 15.202706336975098, 16.011035919189453, 16.819364547729492, 17.62769317626953, 18.43602180480957, 19.244352340698242, 20.05268096923828, 20.86100959777832, 21.66933822631836, 22.47766876220703, 23.28599739074707, 24.094327926635742]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 10.0, 21.0, 46.0, 52.0, 83.0, 135.0, 240.0, 397.0, 693.0, 1085.0, 1987.0, 3202.0, 5453.0, 8796.0, 14396.0, 23456.0, 37164.0, 57944.0, 88338.0, 129710.0, 184262.0, 247015.0, 315683.0, 379618.0, 422236.0, 434941.0, 415831.0, 367444.0, 302986.0, 233780.0, 171461.0, 120677.0, 81660.0, 53417.0, 34520.0, 21774.0, 13499.0, 8045.0, 4951.0, 3027.0, 1766.0, 987.0, 636.0, 362.0, 197.0, 137.0, 77.0, 35.0, 22.0, 15.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.3828125, -12.9566650390625, -12.530517578125, -12.1043701171875, -11.67822265625, -11.2520751953125, -10.825927734375, -10.3997802734375, -9.9736328125, -9.5474853515625, -9.121337890625, -8.6951904296875, -8.26904296875, -7.8428955078125, -7.416748046875, -6.9906005859375, -6.564453125, -6.1383056640625, -5.712158203125, -5.2860107421875, -4.85986328125, -4.4337158203125, -4.007568359375, -3.5814208984375, -3.1552734375, -2.7291259765625, -2.302978515625, -1.8768310546875, -1.45068359375, -1.0245361328125, -0.598388671875, -0.1722412109375, 0.25390625, 0.6800537109375, 1.106201171875, 1.5323486328125, 1.95849609375, 2.3846435546875, 2.810791015625, 3.2369384765625, 3.6630859375, 4.0892333984375, 4.515380859375, 4.9415283203125, 5.36767578125, 5.7938232421875, 6.219970703125, 6.6461181640625, 7.072265625, 7.4984130859375, 7.924560546875, 8.3507080078125, 8.77685546875, 9.2030029296875, 9.629150390625, 10.0552978515625, 10.4814453125, 10.9075927734375, 11.333740234375, 11.7598876953125, 12.18603515625, 12.6121826171875, 13.038330078125, 13.4644775390625, 13.890625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 6.0, 6.0, 8.0, 7.0, 9.0, 15.0, 10.0, 13.0, 18.0, 15.0, 21.0, 27.0, 39.0, 20.0, 34.0, 38.0, 32.0, 36.0, 51.0, 64.0, 42.0, 36.0, 41.0, 45.0, 35.0, 41.0, 40.0, 25.0, 27.0, 36.0, 28.0, 27.0, 20.0, 11.0, 12.0, 17.0, 5.0, 13.0, 10.0, 10.0, 3.0, 7.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-24.734375, -24.011962890625, -23.28955078125, -22.567138671875, -21.8447265625, -21.122314453125, -20.39990234375, -19.677490234375, -18.955078125, -18.232666015625, -17.51025390625, -16.787841796875, -16.0654296875, -15.343017578125, -14.62060546875, -13.898193359375, -13.17578125, -12.453369140625, -11.73095703125, -11.008544921875, -10.2861328125, -9.563720703125, -8.84130859375, -8.118896484375, -7.396484375, -6.674072265625, -5.95166015625, -5.229248046875, -4.5068359375, -3.784423828125, -3.06201171875, -2.339599609375, -1.6171875, -0.894775390625, -0.17236328125, 0.550048828125, 1.2724609375, 1.994873046875, 2.71728515625, 3.439697265625, 4.162109375, 4.884521484375, 5.60693359375, 6.329345703125, 7.0517578125, 7.774169921875, 8.49658203125, 9.218994140625, 9.94140625, 10.663818359375, 11.38623046875, 12.108642578125, 12.8310546875, 13.553466796875, 14.27587890625, 14.998291015625, 15.720703125, 16.443115234375, 17.16552734375, 17.887939453125, 18.6103515625, 19.332763671875, 20.05517578125, 20.777587890625, 21.5]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 11.0, 15.0, 28.0, 32.0, 99.0, 153.0, 273.0, 484.0, 899.0, 1589.0, 2762.0, 5057.0, 9045.0, 15568.0, 26440.0, 44478.0, 70765.0, 110975.0, 162042.0, 228026.0, 300352.0, 371103.0, 424860.0, 448806.0, 439365.0, 396029.0, 332672.0, 258691.0, 190339.0, 131584.0, 87080.0, 54970.0, 33666.0, 19894.0, 11402.0, 6409.0, 3678.0, 2054.0, 1154.0, 655.0, 322.0, 212.0, 89.0, 77.0, 37.0, 19.0, 12.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-16.140625, -15.6473388671875, -15.154052734375, -14.6607666015625, -14.16748046875, -13.6741943359375, -13.180908203125, -12.6876220703125, -12.1943359375, -11.7010498046875, -11.207763671875, -10.7144775390625, -10.22119140625, -9.7279052734375, -9.234619140625, -8.7413330078125, -8.248046875, -7.7547607421875, -7.261474609375, -6.7681884765625, -6.27490234375, -5.7816162109375, -5.288330078125, -4.7950439453125, -4.3017578125, -3.8084716796875, -3.315185546875, -2.8218994140625, -2.32861328125, -1.8353271484375, -1.342041015625, -0.8487548828125, -0.35546875, 0.1378173828125, 0.631103515625, 1.1243896484375, 1.61767578125, 2.1109619140625, 2.604248046875, 3.0975341796875, 3.5908203125, 4.0841064453125, 4.577392578125, 5.0706787109375, 5.56396484375, 6.0572509765625, 6.550537109375, 7.0438232421875, 7.537109375, 8.0303955078125, 8.523681640625, 9.0169677734375, 9.51025390625, 10.0035400390625, 10.496826171875, 10.9901123046875, 11.4833984375, 11.9766845703125, 12.469970703125, 12.9632568359375, 13.45654296875, 13.9498291015625, 14.443115234375, 14.9364013671875, 15.4296875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 0.0, 6.0, 2.0, 6.0, 11.0, 15.0, 19.0, 25.0, 32.0, 41.0, 51.0, 75.0, 83.0, 101.0, 91.0, 133.0, 137.0, 163.0, 162.0, 184.0, 178.0, 207.0, 221.0, 192.0, 184.0, 199.0, 188.0, 175.0, 213.0, 155.0, 153.0, 108.0, 108.0, 81.0, 70.0, 68.0, 48.0, 51.0, 42.0, 22.0, 30.0, 11.0, 16.0, 8.0, 7.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.66796875, -7.38140869140625, -7.0948486328125, -6.80828857421875, -6.521728515625, -6.23516845703125, -5.9486083984375, -5.66204833984375, -5.37548828125, -5.08892822265625, -4.8023681640625, -4.51580810546875, -4.229248046875, -3.94268798828125, -3.6561279296875, -3.36956787109375, -3.0830078125, -2.79644775390625, -2.5098876953125, -2.22332763671875, -1.936767578125, -1.65020751953125, -1.3636474609375, -1.07708740234375, -0.79052734375, -0.50396728515625, -0.2174072265625, 0.06915283203125, 0.355712890625, 0.64227294921875, 0.9288330078125, 1.21539306640625, 1.501953125, 1.78851318359375, 2.0750732421875, 2.36163330078125, 2.648193359375, 2.93475341796875, 3.2213134765625, 3.50787353515625, 3.79443359375, 4.08099365234375, 4.3675537109375, 4.65411376953125, 4.940673828125, 5.22723388671875, 5.5137939453125, 5.80035400390625, 6.0869140625, 6.37347412109375, 6.6600341796875, 6.94659423828125, 7.233154296875, 7.51971435546875, 7.8062744140625, 8.09283447265625, 8.37939453125, 8.66595458984375, 8.9525146484375, 9.23907470703125, 9.525634765625, 9.81219482421875, 10.0987548828125, 10.38531494140625, 10.671875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 7.0, 11.0, 15.0, 10.0, 10.0, 15.0, 22.0, 16.0, 22.0, 23.0, 32.0, 29.0, 30.0, 42.0, 47.0, 35.0, 46.0, 51.0, 52.0, 41.0, 48.0, 47.0, 54.0, 38.0, 29.0, 31.0, 26.0, 33.0, 30.0, 18.0, 9.0, 10.0, 9.0, 11.0, 13.0, 5.0, 9.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.877586364746094, -20.215364456176758, -19.553144454956055, -18.89092254638672, -18.228700637817383, -17.566478729248047, -16.904258728027344, -16.242036819458008, -15.579815864562988, -14.917594909667969, -14.255373001098633, -13.593152046203613, -12.930931091308594, -12.268709182739258, -11.606488227844238, -10.944267272949219, -10.282045364379883, -9.619824409484863, -8.957602500915527, -8.295381546020508, -7.63316011428833, -6.970938682556152, -6.308717727661133, -5.646496295928955, -4.984274864196777, -4.3220534324646, -3.659832239151001, -2.9976110458374023, -2.3353896141052246, -1.6731681823730469, -1.0109469890594482, -0.3487257957458496, 0.31349754333496094, 0.9757188558578491, 1.6379401683807373, 2.300161361694336, 2.9623827934265137, 3.6246042251586914, 4.286825180053711, 4.949046611785889, 5.611268043518066, 6.273489475250244, 6.935710906982422, 7.597931861877441, 8.260152816772461, 8.922374725341797, 9.584595680236816, 10.246816635131836, 10.909038543701172, 11.571259498596191, 12.233481407165527, 12.895702362060547, 13.557924270629883, 14.220145225524902, 14.882366180419922, 15.544588088989258, 16.206809997558594, 16.86903190612793, 17.531251907348633, 18.19347381591797, 18.855695724487305, 19.51791763305664, 20.180137634277344, 20.84235954284668, 21.504579544067383]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 5.0, 6.0, 8.0, 7.0, 7.0, 13.0, 10.0, 7.0, 11.0, 13.0, 20.0, 25.0, 26.0, 26.0, 32.0, 39.0, 39.0, 36.0, 43.0, 44.0, 34.0, 41.0, 41.0, 47.0, 35.0, 46.0, 28.0, 38.0, 39.0, 33.0, 22.0, 24.0, 30.0, 21.0, 18.0, 18.0, 10.0, 14.0, 13.0, 9.0, 9.0, 5.0, 6.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0], "bins": [-27.612220764160156, -26.8282413482666, -26.044261932373047, -25.260284423828125, -24.47630500793457, -23.692325592041016, -22.908348083496094, -22.12436866760254, -21.340389251708984, -20.55640983581543, -19.772430419921875, -18.988452911376953, -18.2044734954834, -17.420494079589844, -16.636516571044922, -15.852537155151367, -15.068557739257812, -14.284578323364258, -13.50059986114502, -12.716621398925781, -11.932641983032227, -11.148662567138672, -10.364684104919434, -9.580705642700195, -8.79672622680664, -8.012746810913086, -7.228768348693848, -6.444789409637451, -5.660810470581055, -4.876831531524658, -4.092852592468262, -3.3088736534118652, -2.5248947143554688, -1.7409157752990723, -0.9569368362426758, -0.1729578971862793, 0.6110210418701172, 1.3949999809265137, 2.17897891998291, 2.9629578590393066, 3.746936798095703, 4.5309157371521, 5.314894676208496, 6.098873615264893, 6.882852554321289, 7.6668314933776855, 8.450810432434082, 9.23478889465332, 10.018768310546875, 10.80274772644043, 11.586726188659668, 12.370704650878906, 13.154684066772461, 13.938663482666016, 14.722641944885254, 15.506620407104492, 16.290599822998047, 17.0745792388916, 17.858558654785156, 18.642536163330078, 19.426515579223633, 20.210494995117188, 20.99447250366211, 21.778451919555664, 22.56243133544922]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 15.0, 21.0, 32.0, 44.0, 67.0, 91.0, 157.0, 225.0, 410.0, 649.0, 1074.0, 1710.0, 2652.0, 4112.0, 6441.0, 9778.0, 14841.0, 22603.0, 32961.0, 47592.0, 64925.0, 84531.0, 102666.0, 115416.0, 116052.0, 105725.0, 88392.0, 68464.0, 50415.0, 35806.0, 24363.0, 16340.0, 10747.0, 6984.0, 4507.0, 2907.0, 1787.0, 1146.0, 735.0, 441.0, 276.0, 182.0, 102.0, 63.0, 43.0, 22.0, 18.0, 14.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.578125, -4.430908203125, -4.28369140625, -4.136474609375, -3.9892578125, -3.842041015625, -3.69482421875, -3.547607421875, -3.400390625, -3.253173828125, -3.10595703125, -2.958740234375, -2.8115234375, -2.664306640625, -2.51708984375, -2.369873046875, -2.22265625, -2.075439453125, -1.92822265625, -1.781005859375, -1.6337890625, -1.486572265625, -1.33935546875, -1.192138671875, -1.044921875, -0.897705078125, -0.75048828125, -0.603271484375, -0.4560546875, -0.308837890625, -0.16162109375, -0.014404296875, 0.1328125, 0.280029296875, 0.42724609375, 0.574462890625, 0.7216796875, 0.868896484375, 1.01611328125, 1.163330078125, 1.310546875, 1.457763671875, 1.60498046875, 1.752197265625, 1.8994140625, 2.046630859375, 2.19384765625, 2.341064453125, 2.48828125, 2.635498046875, 2.78271484375, 2.929931640625, 3.0771484375, 3.224365234375, 3.37158203125, 3.518798828125, 3.666015625, 3.813232421875, 3.96044921875, 4.107666015625, 4.2548828125, 4.402099609375, 4.54931640625, 4.696533203125, 4.84375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 5.0, 6.0, 8.0, 7.0, 7.0, 13.0, 11.0, 8.0, 9.0, 13.0, 20.0, 26.0, 27.0, 25.0, 34.0, 37.0, 38.0, 37.0, 42.0, 49.0, 31.0, 43.0, 41.0, 46.0, 36.0, 41.0, 30.0, 38.0, 39.0, 34.0, 23.0, 20.0, 33.0, 19.0, 21.0, 16.0, 11.0, 13.0, 12.0, 9.0, 10.0, 5.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0], "bins": [-27.703125, -26.917236328125, -26.13134765625, -25.345458984375, -24.5595703125, -23.773681640625, -22.98779296875, -22.201904296875, -21.416015625, -20.630126953125, -19.84423828125, -19.058349609375, -18.2724609375, -17.486572265625, -16.70068359375, -15.914794921875, -15.12890625, -14.343017578125, -13.55712890625, -12.771240234375, -11.9853515625, -11.199462890625, -10.41357421875, -9.627685546875, -8.841796875, -8.055908203125, -7.27001953125, -6.484130859375, -5.6982421875, -4.912353515625, -4.12646484375, -3.340576171875, -2.5546875, -1.768798828125, -0.98291015625, -0.197021484375, 0.5888671875, 1.374755859375, 2.16064453125, 2.946533203125, 3.732421875, 4.518310546875, 5.30419921875, 6.090087890625, 6.8759765625, 7.661865234375, 8.44775390625, 9.233642578125, 10.01953125, 10.805419921875, 11.59130859375, 12.377197265625, 13.1630859375, 13.948974609375, 14.73486328125, 15.520751953125, 16.306640625, 17.092529296875, 17.87841796875, 18.664306640625, 19.4501953125, 20.236083984375, 21.02197265625, 21.807861328125, 22.59375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 2.0, 6.0, 7.0, 17.0, 14.0, 18.0, 30.0, 41.0, 75.0, 70.0, 114.0, 173.0, 275.0, 320.0, 514.0, 712.0, 1127.0, 1630.0, 2414.0, 3884.0, 5748.0, 9196.0, 14802.0, 25303.0, 95020.0, 795717.0, 37454.0, 19993.0, 11903.0, 7724.0, 4739.0, 3152.0, 2102.0, 1363.0, 863.0, 624.0, 422.0, 282.0, 195.0, 138.0, 109.0, 84.0, 45.0, 45.0, 35.0, 17.0, 15.0, 7.0, 10.0, 4.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-17.46875, -16.94384765625, -16.4189453125, -15.89404296875, -15.369140625, -14.84423828125, -14.3193359375, -13.79443359375, -13.26953125, -12.74462890625, -12.2197265625, -11.69482421875, -11.169921875, -10.64501953125, -10.1201171875, -9.59521484375, -9.0703125, -8.54541015625, -8.0205078125, -7.49560546875, -6.970703125, -6.44580078125, -5.9208984375, -5.39599609375, -4.87109375, -4.34619140625, -3.8212890625, -3.29638671875, -2.771484375, -2.24658203125, -1.7216796875, -1.19677734375, -0.671875, -0.14697265625, 0.3779296875, 0.90283203125, 1.427734375, 1.95263671875, 2.4775390625, 3.00244140625, 3.52734375, 4.05224609375, 4.5771484375, 5.10205078125, 5.626953125, 6.15185546875, 6.6767578125, 7.20166015625, 7.7265625, 8.25146484375, 8.7763671875, 9.30126953125, 9.826171875, 10.35107421875, 10.8759765625, 11.40087890625, 11.92578125, 12.45068359375, 12.9755859375, 13.50048828125, 14.025390625, 14.55029296875, 15.0751953125, 15.60009765625, 16.125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 0.0, 4.0, 7.0, 6.0, 9.0, 6.0, 15.0, 15.0, 22.0, 13.0, 25.0, 29.0, 29.0, 21.0, 35.0, 29.0, 40.0, 34.0, 42.0, 50.0, 48.0, 26.0, 38.0, 41.0, 29.0, 50.0, 32.0, 37.0, 45.0, 35.0, 31.0, 23.0, 21.0, 21.0, 7.0, 16.0, 14.0, 13.0, 7.0, 12.0, 3.0, 3.0, 7.0, 2.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.8125, -17.21337890625, -16.6142578125, -16.01513671875, -15.416015625, -14.81689453125, -14.2177734375, -13.61865234375, -13.01953125, -12.42041015625, -11.8212890625, -11.22216796875, -10.623046875, -10.02392578125, -9.4248046875, -8.82568359375, -8.2265625, -7.62744140625, -7.0283203125, -6.42919921875, -5.830078125, -5.23095703125, -4.6318359375, -4.03271484375, -3.43359375, -2.83447265625, -2.2353515625, -1.63623046875, -1.037109375, -0.43798828125, 0.1611328125, 0.76025390625, 1.359375, 1.95849609375, 2.5576171875, 3.15673828125, 3.755859375, 4.35498046875, 4.9541015625, 5.55322265625, 6.15234375, 6.75146484375, 7.3505859375, 7.94970703125, 8.548828125, 9.14794921875, 9.7470703125, 10.34619140625, 10.9453125, 11.54443359375, 12.1435546875, 12.74267578125, 13.341796875, 13.94091796875, 14.5400390625, 15.13916015625, 15.73828125, 16.33740234375, 16.9365234375, 17.53564453125, 18.134765625, 18.73388671875, 19.3330078125, 19.93212890625, 20.53125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 8.0, 3.0, 6.0, 8.0, 6.0, 13.0, 12.0, 24.0, 38.0, 43.0, 62.0, 79.0, 108.0, 155.0, 196.0, 297.0, 461.0, 669.0, 1025.0, 1741.0, 2812.0, 4929.0, 9103.0, 17335.0, 40837.0, 838116.0, 79821.0, 23633.0, 11283.0, 6279.0, 3487.0, 2075.0, 1320.0, 837.0, 520.0, 334.0, 239.0, 202.0, 139.0, 73.0, 59.0, 52.0, 29.0, 22.0, 22.0, 14.0, 8.0, 11.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.0625, -2.00128173828125, -1.9400634765625, -1.87884521484375, -1.817626953125, -1.75640869140625, -1.6951904296875, -1.63397216796875, -1.57275390625, -1.51153564453125, -1.4503173828125, -1.38909912109375, -1.327880859375, -1.26666259765625, -1.2054443359375, -1.14422607421875, -1.0830078125, -1.02178955078125, -0.9605712890625, -0.89935302734375, -0.838134765625, -0.77691650390625, -0.7156982421875, -0.65447998046875, -0.59326171875, -0.53204345703125, -0.4708251953125, -0.40960693359375, -0.348388671875, -0.28717041015625, -0.2259521484375, -0.16473388671875, -0.103515625, -0.04229736328125, 0.0189208984375, 0.08013916015625, 0.141357421875, 0.20257568359375, 0.2637939453125, 0.32501220703125, 0.38623046875, 0.44744873046875, 0.5086669921875, 0.56988525390625, 0.631103515625, 0.69232177734375, 0.7535400390625, 0.81475830078125, 0.8759765625, 0.93719482421875, 0.9984130859375, 1.05963134765625, 1.120849609375, 1.18206787109375, 1.2432861328125, 1.30450439453125, 1.36572265625, 1.42694091796875, 1.4881591796875, 1.54937744140625, 1.610595703125, 1.67181396484375, 1.7330322265625, 1.79425048828125, 1.85546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 5.0, 7.0, 5.0, 6.0, 5.0, 15.0, 12.0, 11.0, 21.0, 33.0, 22.0, 37.0, 45.0, 49.0, 65.0, 64.0, 75.0, 65.0, 54.0, 57.0, 60.0, 56.0, 34.0, 37.0, 31.0, 22.0, 11.0, 19.0, 13.0, 11.0, 11.0, 6.0, 5.0, 7.0, 6.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.383657455444336e-05, -6.181001663208008e-05, -5.97834587097168e-05, -5.7756900787353516e-05, -5.5730342864990234e-05, -5.370378494262695e-05, -5.167722702026367e-05, -4.965066909790039e-05, -4.762411117553711e-05, -4.559755325317383e-05, -4.357099533081055e-05, -4.1544437408447266e-05, -3.9517879486083984e-05, -3.74913215637207e-05, -3.546476364135742e-05, -3.343820571899414e-05, -3.141164779663086e-05, -2.9385089874267578e-05, -2.7358531951904297e-05, -2.5331974029541016e-05, -2.3305416107177734e-05, -2.1278858184814453e-05, -1.9252300262451172e-05, -1.722574234008789e-05, -1.519918441772461e-05, -1.3172626495361328e-05, -1.1146068572998047e-05, -9.119510650634766e-06, -7.092952728271484e-06, -5.066394805908203e-06, -3.039836883544922e-06, -1.0132789611816406e-06, 1.0132789611816406e-06, 3.039836883544922e-06, 5.066394805908203e-06, 7.092952728271484e-06, 9.119510650634766e-06, 1.1146068572998047e-05, 1.3172626495361328e-05, 1.519918441772461e-05, 1.722574234008789e-05, 1.9252300262451172e-05, 2.1278858184814453e-05, 2.3305416107177734e-05, 2.5331974029541016e-05, 2.7358531951904297e-05, 2.9385089874267578e-05, 3.141164779663086e-05, 3.343820571899414e-05, 3.546476364135742e-05, 3.74913215637207e-05, 3.9517879486083984e-05, 4.1544437408447266e-05, 4.357099533081055e-05, 4.559755325317383e-05, 4.762411117553711e-05, 4.965066909790039e-05, 5.167722702026367e-05, 5.370378494262695e-05, 5.5730342864990234e-05, 5.7756900787353516e-05, 5.97834587097168e-05, 6.181001663208008e-05, 6.383657455444336e-05, 6.586313247680664e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 16.0, 15.0, 33.0, 66.0, 127.0, 144.0, 309.0, 533.0, 941.0, 1508.0, 2725.0, 4915.0, 8262.0, 15006.0, 27069.0, 47578.0, 79669.0, 124658.0, 169471.0, 181221.0, 145509.0, 98511.0, 60040.0, 34831.0, 19724.0, 11029.0, 6389.0, 3585.0, 1999.0, 1106.0, 658.0, 374.0, 222.0, 127.0, 66.0, 47.0, 23.0, 14.0, 9.0, 5.0, 5.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.41796875, -1.3752899169921875, -1.332611083984375, -1.2899322509765625, -1.24725341796875, -1.2045745849609375, -1.161895751953125, -1.1192169189453125, -1.0765380859375, -1.0338592529296875, -0.991180419921875, -0.9485015869140625, -0.90582275390625, -0.8631439208984375, -0.820465087890625, -0.7777862548828125, -0.735107421875, -0.6924285888671875, -0.649749755859375, -0.6070709228515625, -0.56439208984375, -0.5217132568359375, -0.479034423828125, -0.4363555908203125, -0.3936767578125, -0.3509979248046875, -0.308319091796875, -0.2656402587890625, -0.22296142578125, -0.1802825927734375, -0.137603759765625, -0.0949249267578125, -0.05224609375, -0.0095672607421875, 0.033111572265625, 0.0757904052734375, 0.11846923828125, 0.1611480712890625, 0.203826904296875, 0.2465057373046875, 0.2891845703125, 0.3318634033203125, 0.374542236328125, 0.4172210693359375, 0.45989990234375, 0.5025787353515625, 0.545257568359375, 0.5879364013671875, 0.630615234375, 0.6732940673828125, 0.715972900390625, 0.7586517333984375, 0.80133056640625, 0.8440093994140625, 0.886688232421875, 0.9293670654296875, 0.9720458984375, 1.0147247314453125, 1.057403564453125, 1.1000823974609375, 1.14276123046875, 1.1854400634765625, 1.228118896484375, 1.2707977294921875, 1.3134765625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 5.0, 7.0, 6.0, 3.0, 9.0, 8.0, 15.0, 12.0, 22.0, 26.0, 24.0, 25.0, 34.0, 40.0, 31.0, 38.0, 26.0, 31.0, 47.0, 30.0, 34.0, 29.0, 42.0, 46.0, 38.0, 44.0, 33.0, 24.0, 36.0, 39.0, 24.0, 24.0, 29.0, 26.0, 13.0, 17.0, 11.0, 14.0, 11.0, 7.0, 5.0, 9.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.84814453125, -0.8243179321289062, -0.8004913330078125, -0.7766647338867188, -0.752838134765625, -0.7290115356445312, -0.7051849365234375, -0.6813583374023438, -0.65753173828125, -0.6337051391601562, -0.6098785400390625, -0.5860519409179688, -0.562225341796875, -0.5383987426757812, -0.5145721435546875, -0.49074554443359375, -0.4669189453125, -0.44309234619140625, -0.4192657470703125, -0.39543914794921875, -0.371612548828125, -0.34778594970703125, -0.3239593505859375, -0.30013275146484375, -0.27630615234375, -0.25247955322265625, -0.2286529541015625, -0.20482635498046875, -0.180999755859375, -0.15717315673828125, -0.1333465576171875, -0.10951995849609375, -0.085693359375, -0.06186676025390625, -0.0380401611328125, -0.01421356201171875, 0.009613037109375, 0.03343963623046875, 0.0572662353515625, 0.08109283447265625, 0.10491943359375, 0.12874603271484375, 0.1525726318359375, 0.17639923095703125, 0.200225830078125, 0.22405242919921875, 0.2478790283203125, 0.27170562744140625, 0.2955322265625, 0.31935882568359375, 0.3431854248046875, 0.36701202392578125, 0.390838623046875, 0.41466522216796875, 0.4384918212890625, 0.46231842041015625, 0.48614501953125, 0.5099716186523438, 0.5337982177734375, 0.5576248168945312, 0.581451416015625, 0.6052780151367188, 0.6291046142578125, 0.6529312133789062, 0.6767578125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 9.0, 9.0, 15.0, 16.0, 14.0, 19.0, 14.0, 17.0, 28.0, 31.0, 34.0, 26.0, 48.0, 41.0, 41.0, 36.0, 54.0, 51.0, 50.0, 42.0, 42.0, 48.0, 46.0, 35.0, 28.0, 28.0, 33.0, 29.0, 18.0, 12.0, 12.0, 8.0, 11.0, 12.0, 7.0, 5.0, 10.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.410541534423828, -19.74461555480957, -19.07868766784668, -18.412761688232422, -17.746835708618164, -17.080909729003906, -16.414981842041016, -15.749055862426758, -15.083128929138184, -14.41720199584961, -13.751276016235352, -13.085349082946777, -12.419422149658203, -11.753496170043945, -11.087569236755371, -10.421642303466797, -9.755716323852539, -9.089789390563965, -8.423863410949707, -7.757936477661133, -7.092010021209717, -6.426083564758301, -5.760156631469727, -5.0942301750183105, -4.4283037185668945, -3.7623772621154785, -3.0964505672454834, -2.4305238723754883, -1.7645974159240723, -1.0986709594726562, -0.43274426460266113, 0.23318243026733398, 0.8991107940673828, 1.5650373697280884, 2.230963945388794, 2.896890640258789, 3.562817096710205, 4.228743553161621, 4.894670486450195, 5.560596942901611, 6.226523399353027, 6.892449855804443, 7.558376312255859, 8.224303245544434, 8.890230178833008, 9.556156158447266, 10.22208309173584, 10.888010025024414, 11.553936004638672, 12.219862937927246, 12.885788917541504, 13.551715850830078, 14.217641830444336, 14.88356876373291, 15.549495697021484, 16.215421676635742, 16.88134765625, 17.547273635864258, 18.21320152282715, 18.879127502441406, 19.545053482055664, 20.210979461669922, 20.876907348632812, 21.54283332824707, 22.20876121520996]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 6.0, 10.0, 8.0, 9.0, 10.0, 10.0, 11.0, 15.0, 18.0, 18.0, 30.0, 38.0, 28.0, 40.0, 41.0, 34.0, 35.0, 39.0, 52.0, 32.0, 49.0, 41.0, 38.0, 43.0, 40.0, 39.0, 34.0, 23.0, 32.0, 29.0, 23.0, 16.0, 18.0, 19.0, 10.0, 13.0, 13.0, 13.0, 6.0, 4.0, 8.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-28.654403686523438, -27.840696334838867, -27.026988983154297, -26.213281631469727, -25.399574279785156, -24.585865020751953, -23.772157669067383, -22.958450317382812, -22.144742965698242, -21.331035614013672, -20.5173282623291, -19.70362091064453, -18.889911651611328, -18.07620620727539, -17.262496948242188, -16.448789596557617, -15.635082244873047, -14.821374893188477, -14.007667541503906, -13.19395923614502, -12.38025188446045, -11.566544532775879, -10.752836227416992, -9.939128875732422, -9.125421524047852, -8.311714172363281, -7.498006343841553, -6.684298515319824, -5.870591163635254, -5.056883811950684, -4.243175983428955, -3.4294681549072266, -2.6157588958740234, -1.802051305770874, -0.9883437156677246, -0.1746361255645752, 0.6390714645385742, 1.4527788162231445, 2.266486644744873, 3.0801944732666016, 3.893901824951172, 4.707609176635742, 5.521317005157471, 6.335024833679199, 7.1487321853637695, 7.96243953704834, 8.776147842407227, 9.589855194091797, 10.403562545776367, 11.217269897460938, 12.030977249145508, 12.844685554504395, 13.658392906188965, 14.472100257873535, 15.285808563232422, 16.099515914916992, 16.913223266601562, 17.726930618286133, 18.540637969970703, 19.354345321655273, 20.168052673339844, 20.981761932373047, 21.795469284057617, 22.609176635742188, 23.422883987426758]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 13.0, 12.0, 20.0, 22.0, 55.0, 82.0, 147.0, 213.0, 351.0, 622.0, 1028.0, 1665.0, 2863.0, 4745.0, 7970.0, 12919.0, 20010.0, 30449.0, 43945.0, 60943.0, 79134.0, 96096.0, 108060.0, 112361.0, 107599.0, 94932.0, 77987.0, 60152.0, 43193.0, 29784.0, 19491.0, 12372.0, 7691.0, 4669.0, 2827.0, 1655.0, 997.0, 550.0, 360.0, 226.0, 131.0, 70.0, 48.0, 34.0, 20.0, 9.0, 8.0, 8.0, 3.0, 7.0, 1.0, 3.0, 2.0, 1.0, 3.0], "bins": [-15.6171875, -15.13623046875, -14.6552734375, -14.17431640625, -13.693359375, -13.21240234375, -12.7314453125, -12.25048828125, -11.76953125, -11.28857421875, -10.8076171875, -10.32666015625, -9.845703125, -9.36474609375, -8.8837890625, -8.40283203125, -7.921875, -7.44091796875, -6.9599609375, -6.47900390625, -5.998046875, -5.51708984375, -5.0361328125, -4.55517578125, -4.07421875, -3.59326171875, -3.1123046875, -2.63134765625, -2.150390625, -1.66943359375, -1.1884765625, -0.70751953125, -0.2265625, 0.25439453125, 0.7353515625, 1.21630859375, 1.697265625, 2.17822265625, 2.6591796875, 3.14013671875, 3.62109375, 4.10205078125, 4.5830078125, 5.06396484375, 5.544921875, 6.02587890625, 6.5068359375, 6.98779296875, 7.46875, 7.94970703125, 8.4306640625, 8.91162109375, 9.392578125, 9.87353515625, 10.3544921875, 10.83544921875, 11.31640625, 11.79736328125, 12.2783203125, 12.75927734375, 13.240234375, 13.72119140625, 14.2021484375, 14.68310546875, 15.1640625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 10.0, 10.0, 8.0, 9.0, 11.0, 10.0, 15.0, 17.0, 20.0, 31.0, 33.0, 33.0, 33.0, 42.0, 31.0, 42.0, 39.0, 48.0, 35.0, 47.0, 42.0, 36.0, 47.0, 37.0, 42.0, 32.0, 24.0, 31.0, 28.0, 27.0, 19.0, 12.0, 22.0, 11.0, 11.0, 15.0, 9.0, 9.0, 6.0, 6.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-27.953125, -27.161376953125, -26.36962890625, -25.577880859375, -24.7861328125, -23.994384765625, -23.20263671875, -22.410888671875, -21.619140625, -20.827392578125, -20.03564453125, -19.243896484375, -18.4521484375, -17.660400390625, -16.86865234375, -16.076904296875, -15.28515625, -14.493408203125, -13.70166015625, -12.909912109375, -12.1181640625, -11.326416015625, -10.53466796875, -9.742919921875, -8.951171875, -8.159423828125, -7.36767578125, -6.575927734375, -5.7841796875, -4.992431640625, -4.20068359375, -3.408935546875, -2.6171875, -1.825439453125, -1.03369140625, -0.241943359375, 0.5498046875, 1.341552734375, 2.13330078125, 2.925048828125, 3.716796875, 4.508544921875, 5.30029296875, 6.092041015625, 6.8837890625, 7.675537109375, 8.46728515625, 9.259033203125, 10.05078125, 10.842529296875, 11.63427734375, 12.426025390625, 13.2177734375, 14.009521484375, 14.80126953125, 15.593017578125, 16.384765625, 17.176513671875, 17.96826171875, 18.760009765625, 19.5517578125, 20.343505859375, 21.13525390625, 21.927001953125, 22.71875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 2.0, 14.0, 26.0, 46.0, 70.0, 112.0, 215.0, 325.0, 608.0, 1142.0, 1962.0, 3576.0, 6466.0, 11177.0, 19131.0, 31555.0, 49000.0, 71530.0, 96586.0, 118691.0, 130893.0, 128902.0, 113146.0, 89906.0, 65021.0, 42891.0, 27171.0, 16587.0, 9485.0, 5529.0, 3071.0, 1642.0, 928.0, 500.0, 256.0, 180.0, 92.0, 49.0, 30.0, 13.0, 13.0, 6.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.328125, -17.770263671875, -17.21240234375, -16.654541015625, -16.0966796875, -15.538818359375, -14.98095703125, -14.423095703125, -13.865234375, -13.307373046875, -12.74951171875, -12.191650390625, -11.6337890625, -11.075927734375, -10.51806640625, -9.960205078125, -9.40234375, -8.844482421875, -8.28662109375, -7.728759765625, -7.1708984375, -6.613037109375, -6.05517578125, -5.497314453125, -4.939453125, -4.381591796875, -3.82373046875, -3.265869140625, -2.7080078125, -2.150146484375, -1.59228515625, -1.034423828125, -0.4765625, 0.081298828125, 0.63916015625, 1.197021484375, 1.7548828125, 2.312744140625, 2.87060546875, 3.428466796875, 3.986328125, 4.544189453125, 5.10205078125, 5.659912109375, 6.2177734375, 6.775634765625, 7.33349609375, 7.891357421875, 8.44921875, 9.007080078125, 9.56494140625, 10.122802734375, 10.6806640625, 11.238525390625, 11.79638671875, 12.354248046875, 12.912109375, 13.469970703125, 14.02783203125, 14.585693359375, 15.1435546875, 15.701416015625, 16.25927734375, 16.817138671875, 17.375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 9.0, 9.0, 8.0, 15.0, 10.0, 15.0, 17.0, 19.0, 26.0, 40.0, 29.0, 29.0, 31.0, 52.0, 43.0, 50.0, 49.0, 43.0, 51.0, 45.0, 46.0, 34.0, 38.0, 39.0, 41.0, 43.0, 30.0, 32.0, 17.0, 14.0, 13.0, 14.0, 7.0, 10.0, 10.0, 10.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.328125, -15.77294921875, -15.2177734375, -14.66259765625, -14.107421875, -13.55224609375, -12.9970703125, -12.44189453125, -11.88671875, -11.33154296875, -10.7763671875, -10.22119140625, -9.666015625, -9.11083984375, -8.5556640625, -8.00048828125, -7.4453125, -6.89013671875, -6.3349609375, -5.77978515625, -5.224609375, -4.66943359375, -4.1142578125, -3.55908203125, -3.00390625, -2.44873046875, -1.8935546875, -1.33837890625, -0.783203125, -0.22802734375, 0.3271484375, 0.88232421875, 1.4375, 1.99267578125, 2.5478515625, 3.10302734375, 3.658203125, 4.21337890625, 4.7685546875, 5.32373046875, 5.87890625, 6.43408203125, 6.9892578125, 7.54443359375, 8.099609375, 8.65478515625, 9.2099609375, 9.76513671875, 10.3203125, 10.87548828125, 11.4306640625, 11.98583984375, 12.541015625, 13.09619140625, 13.6513671875, 14.20654296875, 14.76171875, 15.31689453125, 15.8720703125, 16.42724609375, 16.982421875, 17.53759765625, 18.0927734375, 18.64794921875, 19.203125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 4.0, 0.0, 6.0, 6.0, 9.0, 8.0, 8.0, 21.0, 37.0, 38.0, 85.0, 150.0, 227.0, 373.0, 649.0, 993.0, 1721.0, 2818.0, 4792.0, 7858.0, 13265.0, 20994.0, 32432.0, 49094.0, 69497.0, 91427.0, 111919.0, 123342.0, 122368.0, 109497.0, 89471.0, 67174.0, 46712.0, 30861.0, 19907.0, 12008.0, 7467.0, 4518.0, 2733.0, 1610.0, 956.0, 538.0, 370.0, 239.0, 141.0, 71.0, 45.0, 40.0, 16.0, 17.0, 12.0, 8.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.2109375, -6.01019287109375, -5.8094482421875, -5.60870361328125, -5.407958984375, -5.20721435546875, -5.0064697265625, -4.80572509765625, -4.60498046875, -4.40423583984375, -4.2034912109375, -4.00274658203125, -3.802001953125, -3.60125732421875, -3.4005126953125, -3.19976806640625, -2.9990234375, -2.79827880859375, -2.5975341796875, -2.39678955078125, -2.196044921875, -1.99530029296875, -1.7945556640625, -1.59381103515625, -1.39306640625, -1.19232177734375, -0.9915771484375, -0.79083251953125, -0.590087890625, -0.38934326171875, -0.1885986328125, 0.01214599609375, 0.212890625, 0.41363525390625, 0.6143798828125, 0.81512451171875, 1.015869140625, 1.21661376953125, 1.4173583984375, 1.61810302734375, 1.81884765625, 2.01959228515625, 2.2203369140625, 2.42108154296875, 2.621826171875, 2.82257080078125, 3.0233154296875, 3.22406005859375, 3.4248046875, 3.62554931640625, 3.8262939453125, 4.02703857421875, 4.227783203125, 4.42852783203125, 4.6292724609375, 4.83001708984375, 5.03076171875, 5.23150634765625, 5.4322509765625, 5.63299560546875, 5.833740234375, 6.03448486328125, 6.2352294921875, 6.43597412109375, 6.63671875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 7.0, 14.0, 11.0, 21.0, 16.0, 22.0, 21.0, 22.0, 32.0, 26.0, 45.0, 42.0, 42.0, 31.0, 45.0, 35.0, 36.0, 51.0, 42.0, 37.0, 46.0, 42.0, 39.0, 38.0, 42.0, 22.0, 13.0, 25.0, 19.0, 22.0, 15.0, 15.0, 12.0, 11.0, 10.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0006957054138183594, -0.0006732791662216187, -0.0006508529186248779, -0.0006284266710281372, -0.0006060004234313965, -0.0005835741758346558, -0.000561147928237915, -0.0005387216806411743, -0.0005162954330444336, -0.0004938691854476929, -0.00047144293785095215, -0.0004490166902542114, -0.0004265904426574707, -0.00040416419506073, -0.00038173794746398926, -0.00035931169986724854, -0.0003368854522705078, -0.0003144592046737671, -0.00029203295707702637, -0.00026960670948028564, -0.0002471804618835449, -0.0002247542142868042, -0.00020232796669006348, -0.00017990171909332275, -0.00015747547149658203, -0.0001350492238998413, -0.00011262297630310059, -9.019672870635986e-05, -6.777048110961914e-05, -4.534423351287842e-05, -2.2917985916137695e-05, -4.917383193969727e-07, 2.193450927734375e-05, 4.436075687408447e-05, 6.67870044708252e-05, 8.921325206756592e-05, 0.00011163949966430664, 0.00013406574726104736, 0.00015649199485778809, 0.0001789182424545288, 0.00020134449005126953, 0.00022377073764801025, 0.000246196985244751, 0.0002686232328414917, 0.0002910494804382324, 0.00031347572803497314, 0.00033590197563171387, 0.0003583282232284546, 0.0003807544708251953, 0.00040318071842193604, 0.00042560696601867676, 0.0004480332136154175, 0.0004704594612121582, 0.0004928857088088989, 0.0005153119564056396, 0.0005377382040023804, 0.0005601644515991211, 0.0005825906991958618, 0.0006050169467926025, 0.0006274431943893433, 0.000649869441986084, 0.0006722956895828247, 0.0006947219371795654, 0.0007171481847763062, 0.0007395744323730469]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 11.0, 14.0, 17.0, 27.0, 56.0, 93.0, 137.0, 211.0, 380.0, 592.0, 989.0, 1581.0, 2532.0, 4350.0, 7277.0, 11774.0, 18848.0, 29574.0, 44515.0, 64020.0, 86104.0, 105925.0, 120436.0, 122364.0, 112817.0, 94505.0, 72774.0, 52204.0, 35186.0, 22657.0, 14100.0, 8931.0, 5321.0, 3248.0, 1949.0, 1188.0, 733.0, 432.0, 250.0, 157.0, 99.0, 74.0, 48.0, 21.0, 18.0, 3.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5625, -6.34521484375, -6.1279296875, -5.91064453125, -5.693359375, -5.47607421875, -5.2587890625, -5.04150390625, -4.82421875, -4.60693359375, -4.3896484375, -4.17236328125, -3.955078125, -3.73779296875, -3.5205078125, -3.30322265625, -3.0859375, -2.86865234375, -2.6513671875, -2.43408203125, -2.216796875, -1.99951171875, -1.7822265625, -1.56494140625, -1.34765625, -1.13037109375, -0.9130859375, -0.69580078125, -0.478515625, -0.26123046875, -0.0439453125, 0.17333984375, 0.390625, 0.60791015625, 0.8251953125, 1.04248046875, 1.259765625, 1.47705078125, 1.6943359375, 1.91162109375, 2.12890625, 2.34619140625, 2.5634765625, 2.78076171875, 2.998046875, 3.21533203125, 3.4326171875, 3.64990234375, 3.8671875, 4.08447265625, 4.3017578125, 4.51904296875, 4.736328125, 4.95361328125, 5.1708984375, 5.38818359375, 5.60546875, 5.82275390625, 6.0400390625, 6.25732421875, 6.474609375, 6.69189453125, 6.9091796875, 7.12646484375, 7.34375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 6.0, 8.0, 7.0, 12.0, 18.0, 11.0, 17.0, 22.0, 24.0, 34.0, 37.0, 42.0, 43.0, 39.0, 60.0, 63.0, 55.0, 40.0, 50.0, 62.0, 50.0, 44.0, 36.0, 39.0, 24.0, 22.0, 26.0, 21.0, 18.0, 12.0, 17.0, 8.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-4.04296875, -3.9202880859375, -3.797607421875, -3.6749267578125, -3.55224609375, -3.4295654296875, -3.306884765625, -3.1842041015625, -3.0615234375, -2.9388427734375, -2.816162109375, -2.6934814453125, -2.57080078125, -2.4481201171875, -2.325439453125, -2.2027587890625, -2.080078125, -1.9573974609375, -1.834716796875, -1.7120361328125, -1.58935546875, -1.4666748046875, -1.343994140625, -1.2213134765625, -1.0986328125, -0.9759521484375, -0.853271484375, -0.7305908203125, -0.60791015625, -0.4852294921875, -0.362548828125, -0.2398681640625, -0.1171875, 0.0054931640625, 0.128173828125, 0.2508544921875, 0.37353515625, 0.4962158203125, 0.618896484375, 0.7415771484375, 0.8642578125, 0.9869384765625, 1.109619140625, 1.2322998046875, 1.35498046875, 1.4776611328125, 1.600341796875, 1.7230224609375, 1.845703125, 1.9683837890625, 2.091064453125, 2.2137451171875, 2.33642578125, 2.4591064453125, 2.581787109375, 2.7044677734375, 2.8271484375, 2.9498291015625, 3.072509765625, 3.1951904296875, 3.31787109375, 3.4405517578125, 3.563232421875, 3.6859130859375, 3.80859375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 6.0, 8.0, 15.0, 10.0, 17.0, 13.0, 20.0, 21.0, 25.0, 22.0, 33.0, 30.0, 33.0, 27.0, 45.0, 61.0, 54.0, 38.0, 46.0, 48.0, 49.0, 39.0, 32.0, 38.0, 35.0, 24.0, 33.0, 24.0, 26.0, 14.0, 22.0, 15.0, 13.0, 12.0, 8.0, 8.0, 7.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-21.618755340576172, -20.986303329467773, -20.353851318359375, -19.721399307250977, -19.088947296142578, -18.45649528503418, -17.82404327392578, -17.191591262817383, -16.559139251708984, -15.926687240600586, -15.294235229492188, -14.661783218383789, -14.02933120727539, -13.396879196166992, -12.764427185058594, -12.131975173950195, -11.499523162841797, -10.867071151733398, -10.234619140625, -9.602167129516602, -8.969715118408203, -8.337263107299805, -7.704811096191406, -7.072359085083008, -6.439907073974609, -5.807455062866211, -5.1750030517578125, -4.542551040649414, -3.9100990295410156, -3.277647018432617, -2.6451950073242188, -2.0127429962158203, -1.380289077758789, -0.7478370666503906, -0.11538505554199219, 0.5170669555664062, 1.1495189666748047, 1.7819709777832031, 2.4144229888916016, 3.046875, 3.6793270111083984, 4.311779022216797, 4.944231033325195, 5.576683044433594, 6.209135055541992, 6.841587066650391, 7.474039077758789, 8.106491088867188, 8.738943099975586, 9.371395111083984, 10.003847122192383, 10.636299133300781, 11.26875114440918, 11.901203155517578, 12.533655166625977, 13.166107177734375, 13.798559188842773, 14.431011199951172, 15.06346321105957, 15.695915222167969, 16.328367233276367, 16.960819244384766, 17.593271255493164, 18.225723266601562, 18.85817527770996]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 7.0, 7.0, 9.0, 10.0, 19.0, 6.0, 15.0, 15.0, 31.0, 26.0, 32.0, 28.0, 22.0, 40.0, 48.0, 41.0, 38.0, 42.0, 30.0, 38.0, 48.0, 39.0, 30.0, 42.0, 41.0, 30.0, 33.0, 26.0, 25.0, 23.0, 24.0, 19.0, 19.0, 19.0, 13.0, 11.0, 10.0, 9.0, 6.0, 11.0, 4.0, 2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-25.190431594848633, -24.427213668823242, -23.66399383544922, -22.900775909423828, -22.137557983398438, -21.374340057373047, -20.611120223999023, -19.847902297973633, -19.08468246459961, -18.32146453857422, -17.558244705200195, -16.795026779174805, -16.031808853149414, -15.268589973449707, -14.50537109375, -13.74215316772461, -12.978935241699219, -12.215716361999512, -11.452498435974121, -10.689279556274414, -9.926061630249023, -9.162842750549316, -8.39962387084961, -7.6364054679870605, -6.873187065124512, -6.109968662261963, -5.346750259399414, -4.583531379699707, -3.820312976837158, -3.0570945739746094, -2.2938756942749023, -1.5306572914123535, -0.7674369812011719, -0.004218459129333496, 0.7590000629425049, 1.5222187042236328, 2.2854371070861816, 3.0486555099487305, 3.8118743896484375, 4.575092792510986, 5.338311195373535, 6.101529598236084, 6.864748001098633, 7.62796688079834, 8.391185760498047, 9.154403686523438, 9.917622566223145, 10.680841445922852, 11.444059371948242, 12.20727825164795, 12.97049617767334, 13.733715057373047, 14.496932983398438, 15.260151863098145, 16.02337074279785, 16.786588668823242, 17.549808502197266, 18.313026428222656, 19.07624626159668, 19.83946418762207, 20.60268211364746, 21.365901947021484, 22.129119873046875, 22.892337799072266, 23.655555725097656]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 4.0, 7.0, 31.0, 21.0, 61.0, 85.0, 142.0, 228.0, 353.0, 644.0, 1042.0, 1658.0, 2710.0, 4302.0, 6959.0, 11181.0, 17296.0, 26961.0, 41349.0, 61128.0, 90708.0, 129032.0, 176210.0, 231476.0, 291191.0, 343034.0, 384167.0, 402981.0, 393433.0, 361796.0, 312103.0, 254044.0, 196676.0, 144760.0, 103517.0, 70398.0, 48036.0, 31209.0, 19831.0, 12878.0, 8011.0, 4979.0, 2992.0, 1825.0, 1096.0, 667.0, 434.0, 251.0, 168.0, 91.0, 62.0, 26.0, 18.0, 12.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-13.046875, -12.635009765625, -12.22314453125, -11.811279296875, -11.3994140625, -10.987548828125, -10.57568359375, -10.163818359375, -9.751953125, -9.340087890625, -8.92822265625, -8.516357421875, -8.1044921875, -7.692626953125, -7.28076171875, -6.868896484375, -6.45703125, -6.045166015625, -5.63330078125, -5.221435546875, -4.8095703125, -4.397705078125, -3.98583984375, -3.573974609375, -3.162109375, -2.750244140625, -2.33837890625, -1.926513671875, -1.5146484375, -1.102783203125, -0.69091796875, -0.279052734375, 0.1328125, 0.544677734375, 0.95654296875, 1.368408203125, 1.7802734375, 2.192138671875, 2.60400390625, 3.015869140625, 3.427734375, 3.839599609375, 4.25146484375, 4.663330078125, 5.0751953125, 5.487060546875, 5.89892578125, 6.310791015625, 6.72265625, 7.134521484375, 7.54638671875, 7.958251953125, 8.3701171875, 8.781982421875, 9.19384765625, 9.605712890625, 10.017578125, 10.429443359375, 10.84130859375, 11.253173828125, 11.6650390625, 12.076904296875, 12.48876953125, 12.900634765625, 13.3125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 8.0, 8.0, 7.0, 15.0, 8.0, 16.0, 18.0, 21.0, 28.0, 24.0, 34.0, 30.0, 34.0, 41.0, 47.0, 37.0, 37.0, 40.0, 36.0, 44.0, 43.0, 37.0, 39.0, 40.0, 26.0, 42.0, 29.0, 18.0, 26.0, 27.0, 18.0, 20.0, 15.0, 17.0, 9.0, 9.0, 13.0, 7.0, 10.0, 5.0, 0.0, 2.0, 0.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-22.71875, -22.031005859375, -21.34326171875, -20.655517578125, -19.9677734375, -19.280029296875, -18.59228515625, -17.904541015625, -17.216796875, -16.529052734375, -15.84130859375, -15.153564453125, -14.4658203125, -13.778076171875, -13.09033203125, -12.402587890625, -11.71484375, -11.027099609375, -10.33935546875, -9.651611328125, -8.9638671875, -8.276123046875, -7.58837890625, -6.900634765625, -6.212890625, -5.525146484375, -4.83740234375, -4.149658203125, -3.4619140625, -2.774169921875, -2.08642578125, -1.398681640625, -0.7109375, -0.023193359375, 0.66455078125, 1.352294921875, 2.0400390625, 2.727783203125, 3.41552734375, 4.103271484375, 4.791015625, 5.478759765625, 6.16650390625, 6.854248046875, 7.5419921875, 8.229736328125, 8.91748046875, 9.605224609375, 10.29296875, 10.980712890625, 11.66845703125, 12.356201171875, 13.0439453125, 13.731689453125, 14.41943359375, 15.107177734375, 15.794921875, 16.482666015625, 17.17041015625, 17.858154296875, 18.5458984375, 19.233642578125, 19.92138671875, 20.609130859375, 21.296875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 11.0, 15.0, 15.0, 47.0, 71.0, 119.0, 173.0, 369.0, 617.0, 1083.0, 1862.0, 2960.0, 5008.0, 8556.0, 13873.0, 21743.0, 34835.0, 52879.0, 78890.0, 113076.0, 156074.0, 208702.0, 262228.0, 315647.0, 359570.0, 386152.0, 389678.0, 371798.0, 333156.0, 282246.0, 229168.0, 174152.0, 129182.0, 90187.0, 61244.0, 41139.0, 25938.0, 16465.0, 10183.0, 6189.0, 3688.0, 2184.0, 1272.0, 748.0, 456.0, 275.0, 142.0, 101.0, 39.0, 32.0, 19.0, 13.0, 5.0, 5.0, 1.0, 1.0, 3.0, 4.0], "bins": [-14.171875, -13.7315673828125, -13.291259765625, -12.8509521484375, -12.41064453125, -11.9703369140625, -11.530029296875, -11.0897216796875, -10.6494140625, -10.2091064453125, -9.768798828125, -9.3284912109375, -8.88818359375, -8.4478759765625, -8.007568359375, -7.5672607421875, -7.126953125, -6.6866455078125, -6.246337890625, -5.8060302734375, -5.36572265625, -4.9254150390625, -4.485107421875, -4.0447998046875, -3.6044921875, -3.1641845703125, -2.723876953125, -2.2835693359375, -1.84326171875, -1.4029541015625, -0.962646484375, -0.5223388671875, -0.08203125, 0.3582763671875, 0.798583984375, 1.2388916015625, 1.67919921875, 2.1195068359375, 2.559814453125, 3.0001220703125, 3.4404296875, 3.8807373046875, 4.321044921875, 4.7613525390625, 5.20166015625, 5.6419677734375, 6.082275390625, 6.5225830078125, 6.962890625, 7.4031982421875, 7.843505859375, 8.2838134765625, 8.72412109375, 9.1644287109375, 9.604736328125, 10.0450439453125, 10.4853515625, 10.9256591796875, 11.365966796875, 11.8062744140625, 12.24658203125, 12.6868896484375, 13.127197265625, 13.5675048828125, 14.0078125]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 8.0, 5.0, 14.0, 19.0, 25.0, 35.0, 38.0, 29.0, 40.0, 57.0, 72.0, 92.0, 124.0, 130.0, 144.0, 154.0, 176.0, 164.0, 168.0, 213.0, 192.0, 185.0, 222.0, 210.0, 221.0, 199.0, 174.0, 152.0, 124.0, 129.0, 100.0, 97.0, 91.0, 59.0, 56.0, 37.0, 29.0, 24.0, 11.0, 15.0, 11.0, 13.0, 11.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.515625, -9.2138671875, -8.912109375, -8.6103515625, -8.30859375, -8.0068359375, -7.705078125, -7.4033203125, -7.1015625, -6.7998046875, -6.498046875, -6.1962890625, -5.89453125, -5.5927734375, -5.291015625, -4.9892578125, -4.6875, -4.3857421875, -4.083984375, -3.7822265625, -3.48046875, -3.1787109375, -2.876953125, -2.5751953125, -2.2734375, -1.9716796875, -1.669921875, -1.3681640625, -1.06640625, -0.7646484375, -0.462890625, -0.1611328125, 0.140625, 0.4423828125, 0.744140625, 1.0458984375, 1.34765625, 1.6494140625, 1.951171875, 2.2529296875, 2.5546875, 2.8564453125, 3.158203125, 3.4599609375, 3.76171875, 4.0634765625, 4.365234375, 4.6669921875, 4.96875, 5.2705078125, 5.572265625, 5.8740234375, 6.17578125, 6.4775390625, 6.779296875, 7.0810546875, 7.3828125, 7.6845703125, 7.986328125, 8.2880859375, 8.58984375, 8.8916015625, 9.193359375, 9.4951171875, 9.796875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 0.0, 4.0, 4.0, 4.0, 8.0, 7.0, 11.0, 22.0, 22.0, 24.0, 25.0, 31.0, 35.0, 30.0, 48.0, 46.0, 45.0, 54.0, 53.0, 47.0, 72.0, 47.0, 52.0, 50.0, 45.0, 33.0, 39.0, 32.0, 25.0, 20.0, 22.0, 13.0, 12.0, 8.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.32076644897461, -25.528947830200195, -24.73712921142578, -23.945308685302734, -23.15349006652832, -22.361671447753906, -21.569852828979492, -20.778034210205078, -19.986215591430664, -19.19439697265625, -18.402578353881836, -17.610759735107422, -16.818939208984375, -16.02712059020996, -15.235301971435547, -14.443483352661133, -13.651663780212402, -12.859845161437988, -12.068025588989258, -11.276206970214844, -10.48438835144043, -9.692569732666016, -8.900750160217285, -8.108931541442871, -7.317112445831299, -6.525293350219727, -5.7334747314453125, -4.94165563583374, -4.149836540222168, -3.358017921447754, -2.5661988258361816, -1.7743802070617676, -0.9825611114501953, -0.19074219465255737, 0.6010767221450806, 1.3928956985473633, 2.1847145557403564, 2.9765334129333496, 3.768352508544922, 4.560171127319336, 5.351990222930908, 6.1438093185424805, 6.9356279373168945, 7.727447032928467, 8.519266128540039, 9.311084747314453, 10.102903366088867, 10.894721984863281, 11.686541557312012, 12.478360176086426, 13.270179748535156, 14.06199836730957, 14.853816986083984, 15.645635604858398, 16.437454223632812, 17.22927474975586, 18.021093368530273, 18.812911987304688, 19.6047306060791, 20.396549224853516, 21.188369750976562, 21.980188369750977, 22.77200698852539, 23.563825607299805, 24.35564422607422]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 7.0, 7.0, 5.0, 14.0, 9.0, 15.0, 15.0, 14.0, 20.0, 26.0, 23.0, 34.0, 25.0, 37.0, 36.0, 37.0, 33.0, 39.0, 44.0, 36.0, 41.0, 39.0, 41.0, 40.0, 37.0, 35.0, 28.0, 24.0, 34.0, 24.0, 32.0, 18.0, 18.0, 21.0, 15.0, 10.0, 8.0, 10.0, 11.0, 12.0, 9.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-24.675251007080078, -23.92003059387207, -23.16480827331543, -22.409587860107422, -21.654367446899414, -20.899145126342773, -20.143924713134766, -19.388702392578125, -18.633481979370117, -17.87826156616211, -17.12303924560547, -16.36781883239746, -15.612597465515137, -14.857376098632812, -14.102155685424805, -13.34693431854248, -12.591713905334473, -11.836492538452148, -11.08127212524414, -10.326050758361816, -9.570829391479492, -8.815608978271484, -8.06038761138916, -7.305166244506836, -6.54994535446167, -5.794724464416504, -5.03950309753418, -4.284282207489014, -3.5290610790252686, -2.7738399505615234, -2.0186190605163574, -1.2633976936340332, -0.5081768035888672, 0.24704426527023315, 1.0022653341293335, 1.757486343383789, 2.512707471847534, 3.2679286003112793, 4.023149490356445, 4.7783708572387695, 5.5335917472839355, 6.288812637329102, 7.044034004211426, 7.799254894256592, 8.554475784301758, 9.309697151184082, 10.064918518066406, 10.820138931274414, 11.575360298156738, 12.330581665039062, 13.08580207824707, 13.841023445129395, 14.596244812011719, 15.351465225219727, 16.106685638427734, 16.861907958984375, 17.617128372192383, 18.37234878540039, 19.12757110595703, 19.88279151916504, 20.638011932373047, 21.393234252929688, 22.148454666137695, 22.903675079345703, 23.658897399902344]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 9.0, 11.0, 16.0, 12.0, 26.0, 40.0, 65.0, 114.0, 174.0, 276.0, 485.0, 770.0, 1385.0, 2225.0, 3771.0, 6413.0, 10698.0, 18061.0, 29735.0, 46864.0, 70950.0, 99597.0, 126292.0, 141608.0, 136004.0, 113960.0, 85470.0, 58525.0, 37568.0, 23181.0, 13974.0, 8221.0, 4926.0, 2838.0, 1677.0, 988.0, 636.0, 370.0, 243.0, 145.0, 81.0, 54.0, 35.0, 21.0, 9.0, 15.0, 8.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.59765625, -4.457275390625, -4.31689453125, -4.176513671875, -4.0361328125, -3.895751953125, -3.75537109375, -3.614990234375, -3.474609375, -3.334228515625, -3.19384765625, -3.053466796875, -2.9130859375, -2.772705078125, -2.63232421875, -2.491943359375, -2.3515625, -2.211181640625, -2.07080078125, -1.930419921875, -1.7900390625, -1.649658203125, -1.50927734375, -1.368896484375, -1.228515625, -1.088134765625, -0.94775390625, -0.807373046875, -0.6669921875, -0.526611328125, -0.38623046875, -0.245849609375, -0.10546875, 0.034912109375, 0.17529296875, 0.315673828125, 0.4560546875, 0.596435546875, 0.73681640625, 0.877197265625, 1.017578125, 1.157958984375, 1.29833984375, 1.438720703125, 1.5791015625, 1.719482421875, 1.85986328125, 2.000244140625, 2.140625, 2.281005859375, 2.42138671875, 2.561767578125, 2.7021484375, 2.842529296875, 2.98291015625, 3.123291015625, 3.263671875, 3.404052734375, 3.54443359375, 3.684814453125, 3.8251953125, 3.965576171875, 4.10595703125, 4.246337890625, 4.38671875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 7.0, 7.0, 2.0, 17.0, 8.0, 15.0, 17.0, 12.0, 21.0, 24.0, 23.0, 34.0, 23.0, 40.0, 36.0, 34.0, 35.0, 40.0, 41.0, 37.0, 40.0, 42.0, 39.0, 40.0, 36.0, 34.0, 33.0, 21.0, 34.0, 25.0, 30.0, 21.0, 15.0, 25.0, 14.0, 10.0, 8.0, 9.0, 11.0, 13.0, 8.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-24.796875, -24.04150390625, -23.2861328125, -22.53076171875, -21.775390625, -21.02001953125, -20.2646484375, -19.50927734375, -18.75390625, -17.99853515625, -17.2431640625, -16.48779296875, -15.732421875, -14.97705078125, -14.2216796875, -13.46630859375, -12.7109375, -11.95556640625, -11.2001953125, -10.44482421875, -9.689453125, -8.93408203125, -8.1787109375, -7.42333984375, -6.66796875, -5.91259765625, -5.1572265625, -4.40185546875, -3.646484375, -2.89111328125, -2.1357421875, -1.38037109375, -0.625, 0.13037109375, 0.8857421875, 1.64111328125, 2.396484375, 3.15185546875, 3.9072265625, 4.66259765625, 5.41796875, 6.17333984375, 6.9287109375, 7.68408203125, 8.439453125, 9.19482421875, 9.9501953125, 10.70556640625, 11.4609375, 12.21630859375, 12.9716796875, 13.72705078125, 14.482421875, 15.23779296875, 15.9931640625, 16.74853515625, 17.50390625, 18.25927734375, 19.0146484375, 19.77001953125, 20.525390625, 21.28076171875, 22.0361328125, 22.79150390625, 23.546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 10.0, 19.0, 26.0, 26.0, 41.0, 46.0, 102.0, 129.0, 181.0, 298.0, 429.0, 669.0, 1015.0, 1534.0, 2488.0, 3896.0, 6401.0, 10604.0, 18689.0, 37141.0, 794051.0, 109087.0, 25792.0, 13946.0, 8249.0, 5012.0, 3058.0, 2028.0, 1187.0, 817.0, 510.0, 336.0, 224.0, 169.0, 104.0, 77.0, 43.0, 39.0, 20.0, 19.0, 16.0, 12.0, 7.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.734375, -13.3018798828125, -12.869384765625, -12.4368896484375, -12.00439453125, -11.5718994140625, -11.139404296875, -10.7069091796875, -10.2744140625, -9.8419189453125, -9.409423828125, -8.9769287109375, -8.54443359375, -8.1119384765625, -7.679443359375, -7.2469482421875, -6.814453125, -6.3819580078125, -5.949462890625, -5.5169677734375, -5.08447265625, -4.6519775390625, -4.219482421875, -3.7869873046875, -3.3544921875, -2.9219970703125, -2.489501953125, -2.0570068359375, -1.62451171875, -1.1920166015625, -0.759521484375, -0.3270263671875, 0.10546875, 0.5379638671875, 0.970458984375, 1.4029541015625, 1.83544921875, 2.2679443359375, 2.700439453125, 3.1329345703125, 3.5654296875, 3.9979248046875, 4.430419921875, 4.8629150390625, 5.29541015625, 5.7279052734375, 6.160400390625, 6.5928955078125, 7.025390625, 7.4578857421875, 7.890380859375, 8.3228759765625, 8.75537109375, 9.1878662109375, 9.620361328125, 10.0528564453125, 10.4853515625, 10.9178466796875, 11.350341796875, 11.7828369140625, 12.21533203125, 12.6478271484375, 13.080322265625, 13.5128173828125, 13.9453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 3.0, 9.0, 7.0, 12.0, 11.0, 16.0, 19.0, 11.0, 19.0, 30.0, 32.0, 18.0, 35.0, 33.0, 43.0, 55.0, 41.0, 40.0, 35.0, 39.0, 53.0, 29.0, 45.0, 45.0, 34.0, 44.0, 32.0, 25.0, 26.0, 24.0, 26.0, 12.0, 20.0, 18.0, 12.0, 8.0, 10.0, 10.0, 3.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.15625, -16.58251953125, -16.0087890625, -15.43505859375, -14.861328125, -14.28759765625, -13.7138671875, -13.14013671875, -12.56640625, -11.99267578125, -11.4189453125, -10.84521484375, -10.271484375, -9.69775390625, -9.1240234375, -8.55029296875, -7.9765625, -7.40283203125, -6.8291015625, -6.25537109375, -5.681640625, -5.10791015625, -4.5341796875, -3.96044921875, -3.38671875, -2.81298828125, -2.2392578125, -1.66552734375, -1.091796875, -0.51806640625, 0.0556640625, 0.62939453125, 1.203125, 1.77685546875, 2.3505859375, 2.92431640625, 3.498046875, 4.07177734375, 4.6455078125, 5.21923828125, 5.79296875, 6.36669921875, 6.9404296875, 7.51416015625, 8.087890625, 8.66162109375, 9.2353515625, 9.80908203125, 10.3828125, 10.95654296875, 11.5302734375, 12.10400390625, 12.677734375, 13.25146484375, 13.8251953125, 14.39892578125, 14.97265625, 15.54638671875, 16.1201171875, 16.69384765625, 17.267578125, 17.84130859375, 18.4150390625, 18.98876953125, 19.5625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 7.0, 8.0, 7.0, 13.0, 21.0, 16.0, 32.0, 55.0, 75.0, 122.0, 178.0, 248.0, 408.0, 678.0, 1107.0, 1932.0, 3465.0, 6566.0, 13133.0, 28115.0, 242455.0, 685664.0, 32820.0, 14857.0, 7465.0, 3862.0, 2114.0, 1164.0, 687.0, 458.0, 287.0, 185.0, 121.0, 70.0, 47.0, 40.0, 25.0, 15.0, 17.0, 5.0, 8.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.517578125, -1.467132568359375, -1.41668701171875, -1.366241455078125, -1.3157958984375, -1.265350341796875, -1.21490478515625, -1.164459228515625, -1.114013671875, -1.063568115234375, -1.01312255859375, -0.962677001953125, -0.9122314453125, -0.861785888671875, -0.81134033203125, -0.760894775390625, -0.71044921875, -0.660003662109375, -0.60955810546875, -0.559112548828125, -0.5086669921875, -0.458221435546875, -0.40777587890625, -0.357330322265625, -0.306884765625, -0.256439208984375, -0.20599365234375, -0.155548095703125, -0.1051025390625, -0.054656982421875, -0.00421142578125, 0.046234130859375, 0.0966796875, 0.147125244140625, 0.19757080078125, 0.248016357421875, 0.2984619140625, 0.348907470703125, 0.39935302734375, 0.449798583984375, 0.500244140625, 0.550689697265625, 0.60113525390625, 0.651580810546875, 0.7020263671875, 0.752471923828125, 0.80291748046875, 0.853363037109375, 0.90380859375, 0.954254150390625, 1.00469970703125, 1.055145263671875, 1.1055908203125, 1.156036376953125, 1.20648193359375, 1.256927490234375, 1.307373046875, 1.357818603515625, 1.40826416015625, 1.458709716796875, 1.5091552734375, 1.559600830078125, 1.61004638671875, 1.660491943359375, 1.7109375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 5.0, 8.0, 6.0, 12.0, 14.0, 12.0, 22.0, 20.0, 25.0, 34.0, 33.0, 36.0, 51.0, 45.0, 44.0, 39.0, 41.0, 58.0, 53.0, 44.0, 48.0, 38.0, 53.0, 45.0, 35.0, 37.0, 26.0, 19.0, 16.0, 15.0, 15.0, 9.0, 5.0, 7.0, 7.0, 5.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.9385089874267578e-05, -2.8381124138832092e-05, -2.7377158403396606e-05, -2.637319266796112e-05, -2.5369226932525635e-05, -2.436526119709015e-05, -2.3361295461654663e-05, -2.2357329726219177e-05, -2.135336399078369e-05, -2.0349398255348206e-05, -1.934543251991272e-05, -1.8341466784477234e-05, -1.7337501049041748e-05, -1.6333535313606262e-05, -1.5329569578170776e-05, -1.432560384273529e-05, -1.3321638107299805e-05, -1.2317672371864319e-05, -1.1313706636428833e-05, -1.0309740900993347e-05, -9.305775165557861e-06, -8.301809430122375e-06, -7.29784369468689e-06, -6.293877959251404e-06, -5.289912223815918e-06, -4.285946488380432e-06, -3.2819807529449463e-06, -2.2780150175094604e-06, -1.2740492820739746e-06, -2.7008354663848877e-07, 7.338821887969971e-07, 1.737847924232483e-06, 2.7418136596679688e-06, 3.7457793951034546e-06, 4.7497451305389404e-06, 5.753710865974426e-06, 6.757676601409912e-06, 7.761642336845398e-06, 8.765608072280884e-06, 9.76957380771637e-06, 1.0773539543151855e-05, 1.1777505278587341e-05, 1.2781471014022827e-05, 1.3785436749458313e-05, 1.4789402484893799e-05, 1.5793368220329285e-05, 1.679733395576477e-05, 1.7801299691200256e-05, 1.8805265426635742e-05, 1.9809231162071228e-05, 2.0813196897506714e-05, 2.18171626329422e-05, 2.2821128368377686e-05, 2.382509410381317e-05, 2.4829059839248657e-05, 2.5833025574684143e-05, 2.683699131011963e-05, 2.7840957045555115e-05, 2.88449227809906e-05, 2.9848888516426086e-05, 3.085285425186157e-05, 3.185681998729706e-05, 3.2860785722732544e-05, 3.386475145816803e-05, 3.4868717193603516e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 5.0, 3.0, 5.0, 3.0, 13.0, 13.0, 14.0, 29.0, 38.0, 37.0, 72.0, 121.0, 156.0, 269.0, 338.0, 615.0, 987.0, 1607.0, 2740.0, 4473.0, 7510.0, 12393.0, 20622.0, 32625.0, 51278.0, 76328.0, 106867.0, 136796.0, 149678.0, 134740.0, 104270.0, 73395.0, 49464.0, 31468.0, 19605.0, 11807.0, 7204.0, 4237.0, 2607.0, 1553.0, 944.0, 600.0, 335.0, 199.0, 172.0, 84.0, 73.0, 57.0, 24.0, 27.0, 20.0, 15.0, 9.0, 6.0, 5.0, 4.0, 4.0, 3.0, 3.0, 4.0], "bins": [-0.94189453125, -0.912872314453125, -0.88385009765625, -0.854827880859375, -0.8258056640625, -0.796783447265625, -0.76776123046875, -0.738739013671875, -0.709716796875, -0.680694580078125, -0.65167236328125, -0.622650146484375, -0.5936279296875, -0.564605712890625, -0.53558349609375, -0.506561279296875, -0.4775390625, -0.448516845703125, -0.41949462890625, -0.390472412109375, -0.3614501953125, -0.332427978515625, -0.30340576171875, -0.274383544921875, -0.245361328125, -0.216339111328125, -0.18731689453125, -0.158294677734375, -0.1292724609375, -0.100250244140625, -0.07122802734375, -0.042205810546875, -0.01318359375, 0.015838623046875, 0.04486083984375, 0.073883056640625, 0.1029052734375, 0.131927490234375, 0.16094970703125, 0.189971923828125, 0.218994140625, 0.248016357421875, 0.27703857421875, 0.306060791015625, 0.3350830078125, 0.364105224609375, 0.39312744140625, 0.422149658203125, 0.451171875, 0.480194091796875, 0.50921630859375, 0.538238525390625, 0.5672607421875, 0.596282958984375, 0.62530517578125, 0.654327392578125, 0.683349609375, 0.712371826171875, 0.74139404296875, 0.770416259765625, 0.7994384765625, 0.828460693359375, 0.85748291015625, 0.886505126953125, 0.91552734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 7.0, 2.0, 6.0, 8.0, 6.0, 11.0, 9.0, 16.0, 14.0, 22.0, 19.0, 37.0, 36.0, 52.0, 41.0, 51.0, 41.0, 40.0, 48.0, 51.0, 45.0, 37.0, 55.0, 55.0, 41.0, 42.0, 29.0, 36.0, 22.0, 22.0, 14.0, 16.0, 14.0, 12.0, 11.0, 11.0, 11.0, 2.0, 1.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.69091796875, -0.6702346801757812, -0.6495513916015625, -0.6288681030273438, -0.608184814453125, -0.5875015258789062, -0.5668182373046875, -0.5461349487304688, -0.52545166015625, -0.5047683715820312, -0.4840850830078125, -0.46340179443359375, -0.442718505859375, -0.42203521728515625, -0.4013519287109375, -0.38066864013671875, -0.3599853515625, -0.33930206298828125, -0.3186187744140625, -0.29793548583984375, -0.277252197265625, -0.25656890869140625, -0.2358856201171875, -0.21520233154296875, -0.19451904296875, -0.17383575439453125, -0.1531524658203125, -0.13246917724609375, -0.111785888671875, -0.09110260009765625, -0.0704193115234375, -0.04973602294921875, -0.029052734375, -0.00836944580078125, 0.0123138427734375, 0.03299713134765625, 0.053680419921875, 0.07436370849609375, 0.0950469970703125, 0.11573028564453125, 0.13641357421875, 0.15709686279296875, 0.1777801513671875, 0.19846343994140625, 0.219146728515625, 0.23983001708984375, 0.2605133056640625, 0.28119659423828125, 0.3018798828125, 0.32256317138671875, 0.3432464599609375, 0.36392974853515625, 0.384613037109375, 0.40529632568359375, 0.4259796142578125, 0.44666290283203125, 0.46734619140625, 0.48802947998046875, 0.5087127685546875, 0.5293960571289062, 0.550079345703125, 0.5707626342773438, 0.5914459228515625, 0.6121292114257812, 0.6328125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 3.0, 9.0, 6.0, 15.0, 17.0, 17.0, 26.0, 26.0, 30.0, 37.0, 29.0, 42.0, 44.0, 49.0, 44.0, 52.0, 49.0, 59.0, 63.0, 58.0, 43.0, 50.0, 37.0, 32.0, 33.0, 22.0, 34.0, 14.0, 14.0, 16.0, 7.0, 9.0, 6.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.272634506225586, -25.488723754882812, -24.704811096191406, -23.920900344848633, -23.13698959350586, -22.353078842163086, -21.569168090820312, -20.785255432128906, -20.001344680786133, -19.21743392944336, -18.433521270751953, -17.64961051940918, -16.865699768066406, -16.081789016723633, -15.297877311706543, -14.513965606689453, -13.73005485534668, -12.946144104003906, -12.162232398986816, -11.378320693969727, -10.594409942626953, -9.81049919128418, -9.02658748626709, -8.24267578125, -7.458765029907227, -6.674853801727295, -5.890942573547363, -5.107031345367432, -4.3231201171875, -3.5392088890075684, -2.7552976608276367, -1.971386432647705, -1.1874732971191406, -0.403562068939209, 0.38034915924072266, 1.1642603874206543, 1.948171615600586, 2.7320828437805176, 3.515994071960449, 4.299905300140381, 5.0838165283203125, 5.867727756500244, 6.651638984680176, 7.435550212860107, 8.219461441040039, 9.003372192382812, 9.787283897399902, 10.571195602416992, 11.355106353759766, 12.139017105102539, 12.922928810119629, 13.706840515136719, 14.490751266479492, 15.274662017822266, 16.058574676513672, 16.842485427856445, 17.62639617919922, 18.410306930541992, 19.194217681884766, 19.978130340576172, 20.762041091918945, 21.54595184326172, 22.329864501953125, 23.1137752532959, 23.897686004638672]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 10.0, 5.0, 7.0, 13.0, 10.0, 17.0, 13.0, 16.0, 22.0, 20.0, 28.0, 28.0, 27.0, 37.0, 29.0, 41.0, 36.0, 40.0, 35.0, 39.0, 39.0, 41.0, 38.0, 38.0, 32.0, 41.0, 34.0, 25.0, 25.0, 25.0, 24.0, 28.0, 20.0, 17.0, 22.0, 11.0, 6.0, 10.0, 9.0, 11.0, 10.0, 7.0, 9.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-24.575664520263672, -23.827972412109375, -23.080278396606445, -22.33258628845215, -21.58489418029785, -20.837200164794922, -20.089508056640625, -19.341815948486328, -18.59412384033203, -17.846431732177734, -17.098737716674805, -16.351045608520508, -15.603353500366211, -14.855660438537598, -14.107967376708984, -13.360275268554688, -12.612581253051758, -11.864888191223145, -11.117196083068848, -10.369503021240234, -9.621810913085938, -8.874117851257324, -8.126424789428711, -7.378732204437256, -6.631039619445801, -5.883347034454346, -5.135654449462891, -4.387961387634277, -3.6402688026428223, -2.892576217651367, -2.144883155822754, -1.3971905708312988, -0.6494960784912109, 0.09819662570953369, 0.8458893299102783, 1.5935821533203125, 2.3412747383117676, 3.0889673233032227, 3.836660385131836, 4.584352970123291, 5.332045555114746, 6.079738140106201, 6.827430725097656, 7.5751237869262695, 8.322816848754883, 9.07050895690918, 9.818202018737793, 10.565895080566406, 11.313587188720703, 12.061280250549316, 12.808972358703613, 13.556665420532227, 14.304357528686523, 15.052050590515137, 15.79974365234375, 16.547435760498047, 17.295127868652344, 18.04281997680664, 18.79051399230957, 19.538206100463867, 20.285898208618164, 21.033592224121094, 21.78128433227539, 22.528976440429688, 23.276670455932617]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 19.0, 25.0, 28.0, 46.0, 93.0, 123.0, 216.0, 417.0, 657.0, 1045.0, 1749.0, 2834.0, 4802.0, 7479.0, 11819.0, 17623.0, 26216.0, 36605.0, 49956.0, 64662.0, 79599.0, 91809.0, 99639.0, 101683.0, 96095.0, 85833.0, 72473.0, 58061.0, 43162.0, 31595.0, 22183.0, 14711.0, 9619.0, 5977.0, 3848.0, 2300.0, 1450.0, 850.0, 524.0, 294.0, 170.0, 97.0, 57.0, 43.0, 28.0, 16.0, 7.0, 6.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-13.4296875, -13.0260009765625, -12.622314453125, -12.2186279296875, -11.81494140625, -11.4112548828125, -11.007568359375, -10.6038818359375, -10.2001953125, -9.7965087890625, -9.392822265625, -8.9891357421875, -8.58544921875, -8.1817626953125, -7.778076171875, -7.3743896484375, -6.970703125, -6.5670166015625, -6.163330078125, -5.7596435546875, -5.35595703125, -4.9522705078125, -4.548583984375, -4.1448974609375, -3.7412109375, -3.3375244140625, -2.933837890625, -2.5301513671875, -2.12646484375, -1.7227783203125, -1.319091796875, -0.9154052734375, -0.51171875, -0.1080322265625, 0.295654296875, 0.6993408203125, 1.10302734375, 1.5067138671875, 1.910400390625, 2.3140869140625, 2.7177734375, 3.1214599609375, 3.525146484375, 3.9288330078125, 4.33251953125, 4.7362060546875, 5.139892578125, 5.5435791015625, 5.947265625, 6.3509521484375, 6.754638671875, 7.1583251953125, 7.56201171875, 7.9656982421875, 8.369384765625, 8.7730712890625, 9.1767578125, 9.5804443359375, 9.984130859375, 10.3878173828125, 10.79150390625, 11.1951904296875, 11.598876953125, 12.0025634765625, 12.40625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 9.0, 4.0, 10.0, 13.0, 8.0, 16.0, 14.0, 15.0, 23.0, 20.0, 30.0, 26.0, 27.0, 38.0, 29.0, 41.0, 33.0, 42.0, 36.0, 37.0, 40.0, 40.0, 40.0, 37.0, 28.0, 41.0, 37.0, 24.0, 28.0, 22.0, 25.0, 30.0, 15.0, 20.0, 19.0, 15.0, 5.0, 10.0, 10.0, 11.0, 10.0, 7.0, 6.0, 6.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-23.921875, -23.194580078125, -22.46728515625, -21.739990234375, -21.0126953125, -20.285400390625, -19.55810546875, -18.830810546875, -18.103515625, -17.376220703125, -16.64892578125, -15.921630859375, -15.1943359375, -14.467041015625, -13.73974609375, -13.012451171875, -12.28515625, -11.557861328125, -10.83056640625, -10.103271484375, -9.3759765625, -8.648681640625, -7.92138671875, -7.194091796875, -6.466796875, -5.739501953125, -5.01220703125, -4.284912109375, -3.5576171875, -2.830322265625, -2.10302734375, -1.375732421875, -0.6484375, 0.078857421875, 0.80615234375, 1.533447265625, 2.2607421875, 2.988037109375, 3.71533203125, 4.442626953125, 5.169921875, 5.897216796875, 6.62451171875, 7.351806640625, 8.0791015625, 8.806396484375, 9.53369140625, 10.260986328125, 10.98828125, 11.715576171875, 12.44287109375, 13.170166015625, 13.8974609375, 14.624755859375, 15.35205078125, 16.079345703125, 16.806640625, 17.533935546875, 18.26123046875, 18.988525390625, 19.7158203125, 20.443115234375, 21.17041015625, 21.897705078125, 22.625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 9.0, 11.0, 25.0, 23.0, 51.0, 60.0, 115.0, 180.0, 332.0, 450.0, 750.0, 1113.0, 1795.0, 2805.0, 4326.0, 6696.0, 10042.0, 14738.0, 21644.0, 30672.0, 41433.0, 54253.0, 68217.0, 81353.0, 92190.0, 97368.0, 96464.0, 90509.0, 79654.0, 66950.0, 52781.0, 40232.0, 29166.0, 20679.0, 14304.0, 9495.0, 6324.0, 4109.0, 2657.0, 1667.0, 1033.0, 706.0, 445.0, 276.0, 165.0, 125.0, 59.0, 44.0, 27.0, 18.0, 9.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-12.171875, -11.790771484375, -11.40966796875, -11.028564453125, -10.6474609375, -10.266357421875, -9.88525390625, -9.504150390625, -9.123046875, -8.741943359375, -8.36083984375, -7.979736328125, -7.5986328125, -7.217529296875, -6.83642578125, -6.455322265625, -6.07421875, -5.693115234375, -5.31201171875, -4.930908203125, -4.5498046875, -4.168701171875, -3.78759765625, -3.406494140625, -3.025390625, -2.644287109375, -2.26318359375, -1.882080078125, -1.5009765625, -1.119873046875, -0.73876953125, -0.357666015625, 0.0234375, 0.404541015625, 0.78564453125, 1.166748046875, 1.5478515625, 1.928955078125, 2.31005859375, 2.691162109375, 3.072265625, 3.453369140625, 3.83447265625, 4.215576171875, 4.5966796875, 4.977783203125, 5.35888671875, 5.739990234375, 6.12109375, 6.502197265625, 6.88330078125, 7.264404296875, 7.6455078125, 8.026611328125, 8.40771484375, 8.788818359375, 9.169921875, 9.551025390625, 9.93212890625, 10.313232421875, 10.6943359375, 11.075439453125, 11.45654296875, 11.837646484375, 12.21875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 1.0, 3.0, 9.0, 15.0, 5.0, 6.0, 14.0, 16.0, 18.0, 15.0, 24.0, 19.0, 33.0, 30.0, 34.0, 37.0, 41.0, 53.0, 35.0, 48.0, 52.0, 42.0, 47.0, 34.0, 31.0, 47.0, 34.0, 38.0, 30.0, 26.0, 21.0, 23.0, 14.0, 17.0, 23.0, 10.0, 9.0, 8.0, 7.0, 9.0, 7.0, 4.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.96875, -14.462890625, -13.95703125, -13.451171875, -12.9453125, -12.439453125, -11.93359375, -11.427734375, -10.921875, -10.416015625, -9.91015625, -9.404296875, -8.8984375, -8.392578125, -7.88671875, -7.380859375, -6.875, -6.369140625, -5.86328125, -5.357421875, -4.8515625, -4.345703125, -3.83984375, -3.333984375, -2.828125, -2.322265625, -1.81640625, -1.310546875, -0.8046875, -0.298828125, 0.20703125, 0.712890625, 1.21875, 1.724609375, 2.23046875, 2.736328125, 3.2421875, 3.748046875, 4.25390625, 4.759765625, 5.265625, 5.771484375, 6.27734375, 6.783203125, 7.2890625, 7.794921875, 8.30078125, 8.806640625, 9.3125, 9.818359375, 10.32421875, 10.830078125, 11.3359375, 11.841796875, 12.34765625, 12.853515625, 13.359375, 13.865234375, 14.37109375, 14.876953125, 15.3828125, 15.888671875, 16.39453125, 16.900390625, 17.40625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 3.0, 14.0, 20.0, 18.0, 28.0, 38.0, 71.0, 108.0, 148.0, 220.0, 327.0, 548.0, 832.0, 1393.0, 1980.0, 3254.0, 4924.0, 7463.0, 11667.0, 17146.0, 25610.0, 36712.0, 49967.0, 65300.0, 80957.0, 93493.0, 102166.0, 103445.0, 97614.0, 86133.0, 71163.0, 55685.0, 41417.0, 29495.0, 20443.0, 13535.0, 9111.0, 5664.0, 3689.0, 2458.0, 1525.0, 949.0, 642.0, 399.0, 247.0, 192.0, 108.0, 89.0, 45.0, 41.0, 27.0, 18.0, 10.0, 9.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.34765625, -5.17620849609375, -5.0047607421875, -4.83331298828125, -4.661865234375, -4.49041748046875, -4.3189697265625, -4.14752197265625, -3.97607421875, -3.80462646484375, -3.6331787109375, -3.46173095703125, -3.290283203125, -3.11883544921875, -2.9473876953125, -2.77593994140625, -2.6044921875, -2.43304443359375, -2.2615966796875, -2.09014892578125, -1.918701171875, -1.74725341796875, -1.5758056640625, -1.40435791015625, -1.23291015625, -1.06146240234375, -0.8900146484375, -0.71856689453125, -0.547119140625, -0.37567138671875, -0.2042236328125, -0.03277587890625, 0.138671875, 0.31011962890625, 0.4815673828125, 0.65301513671875, 0.824462890625, 0.99591064453125, 1.1673583984375, 1.33880615234375, 1.51025390625, 1.68170166015625, 1.8531494140625, 2.02459716796875, 2.196044921875, 2.36749267578125, 2.5389404296875, 2.71038818359375, 2.8818359375, 3.05328369140625, 3.2247314453125, 3.39617919921875, 3.567626953125, 3.73907470703125, 3.9105224609375, 4.08197021484375, 4.25341796875, 4.42486572265625, 4.5963134765625, 4.76776123046875, 4.939208984375, 5.11065673828125, 5.2821044921875, 5.45355224609375, 5.625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 3.0, 5.0, 5.0, 7.0, 17.0, 13.0, 20.0, 13.0, 20.0, 21.0, 18.0, 37.0, 43.0, 42.0, 34.0, 28.0, 37.0, 41.0, 36.0, 44.0, 42.0, 57.0, 31.0, 44.0, 33.0, 34.0, 21.0, 35.0, 32.0, 28.0, 30.0, 24.0, 14.0, 18.0, 12.0, 14.0, 12.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006504058837890625, -0.000629521906375885, -0.0006086379289627075, -0.00058775395154953, -0.0005668699741363525, -0.000545985996723175, -0.0005251020193099976, -0.0005042180418968201, -0.0004833340644836426, -0.0004624500870704651, -0.0004415661096572876, -0.0004206821322441101, -0.0003997981548309326, -0.0003789141774177551, -0.00035803020000457764, -0.00033714622259140015, -0.00031626224517822266, -0.00029537826776504517, -0.0002744942903518677, -0.0002536103129386902, -0.0002327263355255127, -0.0002118423581123352, -0.00019095838069915771, -0.00017007440328598022, -0.00014919042587280273, -0.00012830644845962524, -0.00010742247104644775, -8.653849363327026e-05, -6.565451622009277e-05, -4.477053880691528e-05, -2.3886561393737793e-05, -3.0025839805603027e-06, 1.7881393432617188e-05, 3.876537084579468e-05, 5.964934825897217e-05, 8.053332567214966e-05, 0.00010141730308532715, 0.00012230128049850464, 0.00014318525791168213, 0.00016406923532485962, 0.0001849532127380371, 0.0002058371901512146, 0.0002267211675643921, 0.0002476051449775696, 0.00026848912239074707, 0.00028937309980392456, 0.00031025707721710205, 0.00033114105463027954, 0.00035202503204345703, 0.0003729090094566345, 0.000393792986869812, 0.0004146769642829895, 0.000435560941696167, 0.0004564449191093445, 0.00047732889652252197, 0.0004982128739356995, 0.000519096851348877, 0.0005399808287620544, 0.0005608648061752319, 0.0005817487835884094, 0.0006026327610015869, 0.0006235167384147644, 0.0006444007158279419, 0.0006652846932411194, 0.0006861686706542969]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 14.0, 14.0, 19.0, 24.0, 62.0, 80.0, 104.0, 159.0, 235.0, 374.0, 582.0, 834.0, 1352.0, 2194.0, 3340.0, 5327.0, 8556.0, 13229.0, 20220.0, 30305.0, 43626.0, 59863.0, 77936.0, 94676.0, 106872.0, 110748.0, 106583.0, 94388.0, 77428.0, 59521.0, 43071.0, 30499.0, 20142.0, 13244.0, 8523.0, 5256.0, 3222.0, 2165.0, 1335.0, 901.0, 505.0, 351.0, 231.0, 165.0, 88.0, 61.0, 48.0, 31.0, 17.0, 16.0, 7.0, 10.0, 3.0, 4.0, 0.0, 2.0, 3.0, 1.0], "bins": [-6.39453125, -6.19146728515625, -5.9884033203125, -5.78533935546875, -5.582275390625, -5.37921142578125, -5.1761474609375, -4.97308349609375, -4.77001953125, -4.56695556640625, -4.3638916015625, -4.16082763671875, -3.957763671875, -3.75469970703125, -3.5516357421875, -3.34857177734375, -3.1455078125, -2.94244384765625, -2.7393798828125, -2.53631591796875, -2.333251953125, -2.13018798828125, -1.9271240234375, -1.72406005859375, -1.52099609375, -1.31793212890625, -1.1148681640625, -0.91180419921875, -0.708740234375, -0.50567626953125, -0.3026123046875, -0.09954833984375, 0.103515625, 0.30657958984375, 0.5096435546875, 0.71270751953125, 0.915771484375, 1.11883544921875, 1.3218994140625, 1.52496337890625, 1.72802734375, 1.93109130859375, 2.1341552734375, 2.33721923828125, 2.540283203125, 2.74334716796875, 2.9464111328125, 3.14947509765625, 3.3525390625, 3.55560302734375, 3.7586669921875, 3.96173095703125, 4.164794921875, 4.36785888671875, 4.5709228515625, 4.77398681640625, 4.97705078125, 5.18011474609375, 5.3831787109375, 5.58624267578125, 5.789306640625, 5.99237060546875, 6.1954345703125, 6.39849853515625, 6.6015625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 4.0, 7.0, 1.0, 6.0, 8.0, 10.0, 17.0, 14.0, 14.0, 21.0, 19.0, 24.0, 25.0, 41.0, 25.0, 29.0, 32.0, 41.0, 45.0, 44.0, 46.0, 49.0, 42.0, 33.0, 32.0, 48.0, 41.0, 40.0, 29.0, 31.0, 21.0, 29.0, 23.0, 16.0, 8.0, 21.0, 6.0, 11.0, 13.0, 15.0, 3.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0], "bins": [-3.55078125, -3.44512939453125, -3.3394775390625, -3.23382568359375, -3.128173828125, -3.02252197265625, -2.9168701171875, -2.81121826171875, -2.70556640625, -2.59991455078125, -2.4942626953125, -2.38861083984375, -2.282958984375, -2.17730712890625, -2.0716552734375, -1.96600341796875, -1.8603515625, -1.75469970703125, -1.6490478515625, -1.54339599609375, -1.437744140625, -1.33209228515625, -1.2264404296875, -1.12078857421875, -1.01513671875, -0.90948486328125, -0.8038330078125, -0.69818115234375, -0.592529296875, -0.48687744140625, -0.3812255859375, -0.27557373046875, -0.169921875, -0.06427001953125, 0.0413818359375, 0.14703369140625, 0.252685546875, 0.35833740234375, 0.4639892578125, 0.56964111328125, 0.67529296875, 0.78094482421875, 0.8865966796875, 0.99224853515625, 1.097900390625, 1.20355224609375, 1.3092041015625, 1.41485595703125, 1.5205078125, 1.62615966796875, 1.7318115234375, 1.83746337890625, 1.943115234375, 2.04876708984375, 2.1544189453125, 2.26007080078125, 2.36572265625, 2.47137451171875, 2.5770263671875, 2.68267822265625, 2.788330078125, 2.89398193359375, 2.9996337890625, 3.10528564453125, 3.2109375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 7.0, 4.0, 4.0, 6.0, 6.0, 8.0, 17.0, 17.0, 16.0, 26.0, 19.0, 34.0, 33.0, 31.0, 39.0, 36.0, 36.0, 44.0, 51.0, 45.0, 39.0, 46.0, 58.0, 49.0, 41.0, 39.0, 38.0, 30.0, 37.0, 27.0, 18.0, 24.0, 17.0, 10.0, 12.0, 12.0, 9.0, 4.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.13426399230957, -20.455615997314453, -19.776968002319336, -19.09832000732422, -18.419673919677734, -17.741025924682617, -17.0623779296875, -16.383729934692383, -15.705081939697266, -15.026433944702148, -14.347785949707031, -13.66913890838623, -12.990490913391113, -12.311842918395996, -11.633195877075195, -10.954547882080078, -10.275899887084961, -9.597251892089844, -8.918603897094727, -8.239956855773926, -7.561308860778809, -6.882660865783691, -6.204013347625732, -5.525365829467773, -4.846717834472656, -4.168069839477539, -3.48942232131958, -2.810774564743042, -2.132126808166504, -1.4534790515899658, -0.7748312950134277, -0.09618377685546875, 0.5824642181396484, 1.2611119747161865, 1.9397597312927246, 2.6184074878692627, 3.297055244445801, 3.975703001022339, 4.654350757598877, 5.332998275756836, 6.011646270751953, 6.69029426574707, 7.368941783905029, 8.047589302062988, 8.726237297058105, 9.404885292053223, 10.083532333374023, 10.76218032836914, 11.440828323364258, 12.119476318359375, 12.798124313354492, 13.476771354675293, 14.15541934967041, 14.834067344665527, 15.512714385986328, 16.191362380981445, 16.870010375976562, 17.54865837097168, 18.227306365966797, 18.905954360961914, 19.58460235595703, 20.263248443603516, 20.941896438598633, 21.62054443359375, 22.299192428588867]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 7.0, 8.0, 15.0, 11.0, 15.0, 13.0, 26.0, 27.0, 15.0, 28.0, 34.0, 33.0, 40.0, 41.0, 33.0, 49.0, 44.0, 58.0, 44.0, 36.0, 42.0, 33.0, 41.0, 37.0, 40.0, 23.0, 29.0, 27.0, 23.0, 15.0, 22.0, 15.0, 15.0, 10.0, 4.0, 9.0, 9.0, 6.0, 5.0, 5.0, 4.0, 6.0, 2.0, 3.0, 0.0, 2.0], "bins": [-30.095386505126953, -29.267641067504883, -28.439897537231445, -27.612152099609375, -26.784408569335938, -25.956663131713867, -25.12891960144043, -24.30117416381836, -23.473430633544922, -22.64568519592285, -21.817941665649414, -20.990196228027344, -20.162452697753906, -19.334707260131836, -18.5069637298584, -17.679218292236328, -16.85147476196289, -16.02372932434082, -15.195985794067383, -14.368241310119629, -13.540496826171875, -12.712751388549805, -11.885007858276367, -11.057262420654297, -10.229516983032227, -9.401772499084473, -8.574028015136719, -7.746283531188965, -6.918539047241211, -6.090794086456299, -5.263049602508545, -4.435305118560791, -3.6075611114501953, -2.7798166275024414, -1.952072024345398, -1.1243274211883545, -0.2965829372406006, 0.5311617851257324, 1.3589062690734863, 2.1866507530212402, 3.014395236968994, 3.842139720916748, 4.669884204864502, 5.497629165649414, 6.325373649597168, 7.153118133544922, 7.980862617492676, 8.80860710144043, 9.636351585388184, 10.464096069335938, 11.291840553283691, 12.119585037231445, 12.9473295211792, 13.775074005126953, 14.602819442749023, 15.430562973022461, 16.25830841064453, 17.0860538482666, 17.91379737854004, 18.74154281616211, 19.569286346435547, 20.397031784057617, 21.224775314331055, 22.052520751953125, 22.880264282226562]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [4.0, 4.0, 3.0, 18.0, 14.0, 23.0, 39.0, 41.0, 78.0, 143.0, 187.0, 329.0, 534.0, 885.0, 1441.0, 2200.0, 3594.0, 5581.0, 8740.0, 13477.0, 20385.0, 30743.0, 45777.0, 66198.0, 93350.0, 127923.0, 170969.0, 219453.0, 267506.0, 313540.0, 349910.0, 367714.0, 368037.0, 346662.0, 310019.0, 265036.0, 215048.0, 167496.0, 125936.0, 91286.0, 64397.0, 44358.0, 30007.0, 19606.0, 12920.0, 8256.0, 5497.0, 3460.0, 2087.0, 1328.0, 833.0, 476.0, 314.0, 160.0, 102.0, 65.0, 47.0, 35.0, 14.0, 3.0, 7.0, 3.0, 5.0, 1.0], "bins": [-12.671875, -12.275390625, -11.87890625, -11.482421875, -11.0859375, -10.689453125, -10.29296875, -9.896484375, -9.5, -9.103515625, -8.70703125, -8.310546875, -7.9140625, -7.517578125, -7.12109375, -6.724609375, -6.328125, -5.931640625, -5.53515625, -5.138671875, -4.7421875, -4.345703125, -3.94921875, -3.552734375, -3.15625, -2.759765625, -2.36328125, -1.966796875, -1.5703125, -1.173828125, -0.77734375, -0.380859375, 0.015625, 0.412109375, 0.80859375, 1.205078125, 1.6015625, 1.998046875, 2.39453125, 2.791015625, 3.1875, 3.583984375, 3.98046875, 4.376953125, 4.7734375, 5.169921875, 5.56640625, 5.962890625, 6.359375, 6.755859375, 7.15234375, 7.548828125, 7.9453125, 8.341796875, 8.73828125, 9.134765625, 9.53125, 9.927734375, 10.32421875, 10.720703125, 11.1171875, 11.513671875, 11.91015625, 12.306640625, 12.703125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 11.0, 10.0, 11.0, 13.0, 16.0, 24.0, 24.0, 15.0, 25.0, 37.0, 35.0, 32.0, 41.0, 35.0, 48.0, 45.0, 48.0, 57.0, 42.0, 32.0, 40.0, 34.0, 47.0, 35.0, 26.0, 33.0, 21.0, 26.0, 19.0, 15.0, 21.0, 15.0, 12.0, 4.0, 9.0, 5.0, 11.0, 4.0, 6.0, 3.0, 7.0, 1.0, 2.0, 2.0, 2.0], "bins": [-27.453125, -26.70458984375, -25.9560546875, -25.20751953125, -24.458984375, -23.71044921875, -22.9619140625, -22.21337890625, -21.46484375, -20.71630859375, -19.9677734375, -19.21923828125, -18.470703125, -17.72216796875, -16.9736328125, -16.22509765625, -15.4765625, -14.72802734375, -13.9794921875, -13.23095703125, -12.482421875, -11.73388671875, -10.9853515625, -10.23681640625, -9.48828125, -8.73974609375, -7.9912109375, -7.24267578125, -6.494140625, -5.74560546875, -4.9970703125, -4.24853515625, -3.5, -2.75146484375, -2.0029296875, -1.25439453125, -0.505859375, 0.24267578125, 0.9912109375, 1.73974609375, 2.48828125, 3.23681640625, 3.9853515625, 4.73388671875, 5.482421875, 6.23095703125, 6.9794921875, 7.72802734375, 8.4765625, 9.22509765625, 9.9736328125, 10.72216796875, 11.470703125, 12.21923828125, 12.9677734375, 13.71630859375, 14.46484375, 15.21337890625, 15.9619140625, 16.71044921875, 17.458984375, 18.20751953125, 18.9560546875, 19.70458984375, 20.453125]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 17.0, 26.0, 28.0, 65.0, 76.0, 174.0, 273.0, 467.0, 780.0, 1249.0, 2147.0, 3579.0, 5739.0, 9304.0, 15002.0, 23298.0, 35579.0, 52768.0, 76759.0, 107199.0, 145364.0, 188854.0, 238290.0, 284830.0, 324919.0, 352753.0, 364421.0, 357773.0, 333913.0, 295765.0, 248480.0, 201439.0, 155719.0, 116318.0, 83437.0, 57841.0, 39643.0, 26011.0, 16898.0, 10527.0, 6637.0, 3954.0, 2485.0, 1459.0, 844.0, 485.0, 285.0, 176.0, 88.0, 64.0, 46.0, 24.0, 8.0, 8.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.671875, -13.2528076171875, -12.833740234375, -12.4146728515625, -11.99560546875, -11.5765380859375, -11.157470703125, -10.7384033203125, -10.3193359375, -9.9002685546875, -9.481201171875, -9.0621337890625, -8.64306640625, -8.2239990234375, -7.804931640625, -7.3858642578125, -6.966796875, -6.5477294921875, -6.128662109375, -5.7095947265625, -5.29052734375, -4.8714599609375, -4.452392578125, -4.0333251953125, -3.6142578125, -3.1951904296875, -2.776123046875, -2.3570556640625, -1.93798828125, -1.5189208984375, -1.099853515625, -0.6807861328125, -0.26171875, 0.1573486328125, 0.576416015625, 0.9954833984375, 1.41455078125, 1.8336181640625, 2.252685546875, 2.6717529296875, 3.0908203125, 3.5098876953125, 3.928955078125, 4.3480224609375, 4.76708984375, 5.1861572265625, 5.605224609375, 6.0242919921875, 6.443359375, 6.8624267578125, 7.281494140625, 7.7005615234375, 8.11962890625, 8.5386962890625, 8.957763671875, 9.3768310546875, 9.7958984375, 10.2149658203125, 10.634033203125, 11.0531005859375, 11.47216796875, 11.8912353515625, 12.310302734375, 12.7293701171875, 13.1484375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 7.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 11.0, 15.0, 13.0, 20.0, 44.0, 43.0, 41.0, 54.0, 51.0, 82.0, 94.0, 100.0, 116.0, 127.0, 143.0, 138.0, 157.0, 159.0, 181.0, 171.0, 193.0, 182.0, 210.0, 171.0, 176.0, 157.0, 158.0, 137.0, 129.0, 133.0, 117.0, 114.0, 64.0, 69.0, 66.0, 42.0, 40.0, 34.0, 23.0, 15.0, 14.0, 11.0, 6.0, 8.0, 4.0, 4.0, 9.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0], "bins": [-8.9921875, -8.71728515625, -8.4423828125, -8.16748046875, -7.892578125, -7.61767578125, -7.3427734375, -7.06787109375, -6.79296875, -6.51806640625, -6.2431640625, -5.96826171875, -5.693359375, -5.41845703125, -5.1435546875, -4.86865234375, -4.59375, -4.31884765625, -4.0439453125, -3.76904296875, -3.494140625, -3.21923828125, -2.9443359375, -2.66943359375, -2.39453125, -2.11962890625, -1.8447265625, -1.56982421875, -1.294921875, -1.02001953125, -0.7451171875, -0.47021484375, -0.1953125, 0.07958984375, 0.3544921875, 0.62939453125, 0.904296875, 1.17919921875, 1.4541015625, 1.72900390625, 2.00390625, 2.27880859375, 2.5537109375, 2.82861328125, 3.103515625, 3.37841796875, 3.6533203125, 3.92822265625, 4.203125, 4.47802734375, 4.7529296875, 5.02783203125, 5.302734375, 5.57763671875, 5.8525390625, 6.12744140625, 6.40234375, 6.67724609375, 6.9521484375, 7.22705078125, 7.501953125, 7.77685546875, 8.0517578125, 8.32666015625, 8.6015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 8.0, 7.0, 12.0, 6.0, 11.0, 15.0, 20.0, 15.0, 24.0, 45.0, 34.0, 39.0, 42.0, 38.0, 41.0, 58.0, 56.0, 52.0, 55.0, 53.0, 54.0, 52.0, 49.0, 42.0, 41.0, 35.0, 18.0, 21.0, 16.0, 11.0, 14.0, 1.0, 6.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.67163848876953, -30.846296310424805, -30.02095603942871, -29.195613861083984, -28.37027359008789, -27.544931411743164, -26.719589233398438, -25.894248962402344, -25.06890869140625, -24.243566513061523, -23.41822624206543, -22.592884063720703, -21.76754379272461, -20.942201614379883, -20.116859436035156, -19.291519165039062, -18.466176986694336, -17.64083480834961, -16.815494537353516, -15.990152359008789, -15.164812088012695, -14.339469909667969, -13.514128684997559, -12.688787460327148, -11.863446235656738, -11.038105010986328, -10.212763786315918, -9.387422561645508, -8.562080383300781, -7.736739635467529, -6.911397933959961, -6.086056709289551, -5.260717391967773, -4.435376167297363, -3.610034704208374, -2.7846932411193848, -1.9593520164489746, -1.1340107917785645, -0.3086690902709961, 0.5166721343994141, 1.3420133590698242, 2.1673545837402344, 2.9926960468292236, 3.818037509918213, 4.643378734588623, 5.468719959259033, 6.294061660766602, 7.119402885437012, 7.944744110107422, 8.770085334777832, 9.595426559448242, 10.420768737792969, 11.246109008789062, 12.071451187133789, 12.8967924118042, 13.72213363647461, 14.54747486114502, 15.37281608581543, 16.198158264160156, 17.02349853515625, 17.848840713500977, 18.67418098449707, 19.499523162841797, 20.32486343383789, 21.150205612182617]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 2.0, 2.0, 3.0, 5.0, 9.0, 6.0, 15.0, 12.0, 21.0, 21.0, 21.0, 27.0, 30.0, 32.0, 43.0, 32.0, 47.0, 28.0, 46.0, 50.0, 37.0, 37.0, 51.0, 44.0, 57.0, 42.0, 32.0, 30.0, 29.0, 24.0, 24.0, 18.0, 18.0, 21.0, 12.0, 14.0, 13.0, 8.0, 6.0, 7.0, 6.0, 4.0, 3.0, 7.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-29.759483337402344, -28.911277770996094, -28.063072204589844, -27.214866638183594, -26.366661071777344, -25.518455505371094, -24.670249938964844, -23.822044372558594, -22.973838806152344, -22.125633239746094, -21.277427673339844, -20.429222106933594, -19.581016540527344, -18.732810974121094, -17.884605407714844, -17.036399841308594, -16.188194274902344, -15.339988708496094, -14.491783142089844, -13.643577575683594, -12.795372009277344, -11.947166442871094, -11.098960876464844, -10.250755310058594, -9.402551651000977, -8.554346084594727, -7.706140518188477, -6.857934951782227, -6.009729385375977, -5.161524295806885, -4.313318729400635, -3.4651131629943848, -2.6169071197509766, -1.7687015533447266, -0.9204961061477661, -0.07229065895080566, 0.7759149074554443, 1.6241202354431152, 2.4723258018493652, 3.3205313682556152, 4.168736934661865, 5.016942501068115, 5.865148067474365, 6.713353157043457, 7.561558723449707, 8.409764289855957, 9.257969856262207, 10.106175422668457, 10.954380989074707, 11.802586555480957, 12.650792121887207, 13.498997688293457, 14.347203254699707, 15.19540786743164, 16.04361343383789, 16.89181900024414, 17.74002456665039, 18.58823013305664, 19.43643569946289, 20.28464126586914, 21.13284683227539, 21.98105239868164, 22.82925796508789, 23.67746353149414, 24.52566909790039]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 5.0, 3.0, 5.0, 10.0, 29.0, 51.0, 85.0, 156.0, 301.0, 507.0, 916.0, 1746.0, 3075.0, 5635.0, 10417.0, 18494.0, 32070.0, 53804.0, 83806.0, 120794.0, 151172.0, 159092.0, 137958.0, 103164.0, 68038.0, 41699.0, 24636.0, 13851.0, 7675.0, 4198.0, 2315.0, 1295.0, 647.0, 385.0, 217.0, 144.0, 60.0, 44.0, 21.0, 17.0, 10.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.80859375, -4.668212890625, -4.52783203125, -4.387451171875, -4.2470703125, -4.106689453125, -3.96630859375, -3.825927734375, -3.685546875, -3.545166015625, -3.40478515625, -3.264404296875, -3.1240234375, -2.983642578125, -2.84326171875, -2.702880859375, -2.5625, -2.422119140625, -2.28173828125, -2.141357421875, -2.0009765625, -1.860595703125, -1.72021484375, -1.579833984375, -1.439453125, -1.299072265625, -1.15869140625, -1.018310546875, -0.8779296875, -0.737548828125, -0.59716796875, -0.456787109375, -0.31640625, -0.176025390625, -0.03564453125, 0.104736328125, 0.2451171875, 0.385498046875, 0.52587890625, 0.666259765625, 0.806640625, 0.947021484375, 1.08740234375, 1.227783203125, 1.3681640625, 1.508544921875, 1.64892578125, 1.789306640625, 1.9296875, 2.070068359375, 2.21044921875, 2.350830078125, 2.4912109375, 2.631591796875, 2.77197265625, 2.912353515625, 3.052734375, 3.193115234375, 3.33349609375, 3.473876953125, 3.6142578125, 3.754638671875, 3.89501953125, 4.035400390625, 4.17578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 2.0, 2.0, 3.0, 5.0, 9.0, 6.0, 15.0, 14.0, 20.0, 21.0, 21.0, 26.0, 30.0, 32.0, 44.0, 29.0, 47.0, 31.0, 42.0, 49.0, 39.0, 39.0, 46.0, 49.0, 53.0, 41.0, 35.0, 30.0, 29.0, 25.0, 24.0, 19.0, 17.0, 18.0, 13.0, 14.0, 14.0, 9.0, 7.0, 7.0, 6.0, 4.0, 3.0, 6.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-29.796875, -28.951904296875, -28.10693359375, -27.261962890625, -26.4169921875, -25.572021484375, -24.72705078125, -23.882080078125, -23.037109375, -22.192138671875, -21.34716796875, -20.502197265625, -19.6572265625, -18.812255859375, -17.96728515625, -17.122314453125, -16.27734375, -15.432373046875, -14.58740234375, -13.742431640625, -12.8974609375, -12.052490234375, -11.20751953125, -10.362548828125, -9.517578125, -8.672607421875, -7.82763671875, -6.982666015625, -6.1376953125, -5.292724609375, -4.44775390625, -3.602783203125, -2.7578125, -1.912841796875, -1.06787109375, -0.222900390625, 0.6220703125, 1.467041015625, 2.31201171875, 3.156982421875, 4.001953125, 4.846923828125, 5.69189453125, 6.536865234375, 7.3818359375, 8.226806640625, 9.07177734375, 9.916748046875, 10.76171875, 11.606689453125, 12.45166015625, 13.296630859375, 14.1416015625, 14.986572265625, 15.83154296875, 16.676513671875, 17.521484375, 18.366455078125, 19.21142578125, 20.056396484375, 20.9013671875, 21.746337890625, 22.59130859375, 23.436279296875, 24.28125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 7.0, 6.0, 15.0, 26.0, 34.0, 50.0, 93.0, 175.0, 225.0, 393.0, 572.0, 961.0, 1586.0, 2481.0, 4190.0, 6901.0, 11671.0, 19988.0, 43408.0, 820059.0, 77359.0, 24302.0, 13545.0, 7967.0, 4827.0, 2917.0, 1762.0, 1162.0, 713.0, 413.0, 262.0, 181.0, 102.0, 73.0, 44.0, 35.0, 25.0, 13.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1328125, -10.781005859375, -10.42919921875, -10.077392578125, -9.7255859375, -9.373779296875, -9.02197265625, -8.670166015625, -8.318359375, -7.966552734375, -7.61474609375, -7.262939453125, -6.9111328125, -6.559326171875, -6.20751953125, -5.855712890625, -5.50390625, -5.152099609375, -4.80029296875, -4.448486328125, -4.0966796875, -3.744873046875, -3.39306640625, -3.041259765625, -2.689453125, -2.337646484375, -1.98583984375, -1.634033203125, -1.2822265625, -0.930419921875, -0.57861328125, -0.226806640625, 0.125, 0.476806640625, 0.82861328125, 1.180419921875, 1.5322265625, 1.884033203125, 2.23583984375, 2.587646484375, 2.939453125, 3.291259765625, 3.64306640625, 3.994873046875, 4.3466796875, 4.698486328125, 5.05029296875, 5.402099609375, 5.75390625, 6.105712890625, 6.45751953125, 6.809326171875, 7.1611328125, 7.512939453125, 7.86474609375, 8.216552734375, 8.568359375, 8.920166015625, 9.27197265625, 9.623779296875, 9.9755859375, 10.327392578125, 10.67919921875, 11.031005859375, 11.3828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 8.0, 5.0, 7.0, 6.0, 12.0, 13.0, 13.0, 15.0, 14.0, 23.0, 26.0, 22.0, 33.0, 30.0, 33.0, 39.0, 29.0, 39.0, 51.0, 35.0, 32.0, 44.0, 48.0, 26.0, 39.0, 34.0, 28.0, 27.0, 29.0, 31.0, 20.0, 26.0, 26.0, 22.0, 19.0, 24.0, 11.0, 14.0, 14.0, 12.0, 7.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0], "bins": [-18.84375, -18.2763671875, -17.708984375, -17.1416015625, -16.57421875, -16.0068359375, -15.439453125, -14.8720703125, -14.3046875, -13.7373046875, -13.169921875, -12.6025390625, -12.03515625, -11.4677734375, -10.900390625, -10.3330078125, -9.765625, -9.1982421875, -8.630859375, -8.0634765625, -7.49609375, -6.9287109375, -6.361328125, -5.7939453125, -5.2265625, -4.6591796875, -4.091796875, -3.5244140625, -2.95703125, -2.3896484375, -1.822265625, -1.2548828125, -0.6875, -0.1201171875, 0.447265625, 1.0146484375, 1.58203125, 2.1494140625, 2.716796875, 3.2841796875, 3.8515625, 4.4189453125, 4.986328125, 5.5537109375, 6.12109375, 6.6884765625, 7.255859375, 7.8232421875, 8.390625, 8.9580078125, 9.525390625, 10.0927734375, 10.66015625, 11.2275390625, 11.794921875, 12.3623046875, 12.9296875, 13.4970703125, 14.064453125, 14.6318359375, 15.19921875, 15.7666015625, 16.333984375, 16.9013671875, 17.46875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 10.0, 13.0, 19.0, 33.0, 36.0, 48.0, 64.0, 78.0, 105.0, 205.0, 247.0, 371.0, 564.0, 802.0, 1142.0, 1893.0, 2960.0, 4600.0, 7877.0, 13295.0, 23218.0, 57340.0, 833142.0, 46928.0, 21405.0, 12321.0, 7134.0, 4516.0, 2777.0, 1749.0, 1164.0, 769.0, 529.0, 356.0, 258.0, 174.0, 118.0, 89.0, 63.0, 39.0, 30.0, 18.0, 13.0, 14.0, 9.0, 5.0, 3.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1240234375, -1.08709716796875, -1.0501708984375, -1.01324462890625, -0.976318359375, -0.93939208984375, -0.9024658203125, -0.86553955078125, -0.82861328125, -0.79168701171875, -0.7547607421875, -0.71783447265625, -0.680908203125, -0.64398193359375, -0.6070556640625, -0.57012939453125, -0.533203125, -0.49627685546875, -0.4593505859375, -0.42242431640625, -0.385498046875, -0.34857177734375, -0.3116455078125, -0.27471923828125, -0.23779296875, -0.20086669921875, -0.1639404296875, -0.12701416015625, -0.090087890625, -0.05316162109375, -0.0162353515625, 0.02069091796875, 0.0576171875, 0.09454345703125, 0.1314697265625, 0.16839599609375, 0.205322265625, 0.24224853515625, 0.2791748046875, 0.31610107421875, 0.35302734375, 0.38995361328125, 0.4268798828125, 0.46380615234375, 0.500732421875, 0.53765869140625, 0.5745849609375, 0.61151123046875, 0.6484375, 0.68536376953125, 0.7222900390625, 0.75921630859375, 0.796142578125, 0.83306884765625, 0.8699951171875, 0.90692138671875, 0.94384765625, 0.98077392578125, 1.0177001953125, 1.05462646484375, 1.091552734375, 1.12847900390625, 1.1654052734375, 1.20233154296875, 1.2392578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 10.0, 5.0, 4.0, 12.0, 20.0, 25.0, 24.0, 29.0, 28.0, 22.0, 40.0, 49.0, 51.0, 52.0, 38.0, 59.0, 57.0, 47.0, 65.0, 51.0, 60.0, 44.0, 37.0, 32.0, 27.0, 17.0, 22.0, 9.0, 15.0, 6.0, 6.0, 6.0, 2.0, 9.0, 4.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7060508728027344e-05, -2.612639218568802e-05, -2.5192275643348694e-05, -2.425815910100937e-05, -2.3324042558670044e-05, -2.238992601633072e-05, -2.1455809473991394e-05, -2.052169293165207e-05, -1.9587576389312744e-05, -1.865345984697342e-05, -1.7719343304634094e-05, -1.678522676229477e-05, -1.5851110219955444e-05, -1.491699367761612e-05, -1.3982877135276794e-05, -1.304876059293747e-05, -1.2114644050598145e-05, -1.118052750825882e-05, -1.0246410965919495e-05, -9.31229442358017e-06, -8.378177881240845e-06, -7.44406133890152e-06, -6.509944796562195e-06, -5.57582825422287e-06, -4.641711711883545e-06, -3.70759516954422e-06, -2.773478627204895e-06, -1.83936208486557e-06, -9.052455425262451e-07, 2.8870999813079834e-08, 9.629875421524048e-07, 1.8971040844917297e-06, 2.8312206268310547e-06, 3.7653371691703796e-06, 4.699453711509705e-06, 5.6335702538490295e-06, 6.5676867961883545e-06, 7.5018033385276794e-06, 8.435919880867004e-06, 9.37003642320633e-06, 1.0304152965545654e-05, 1.123826950788498e-05, 1.2172386050224304e-05, 1.3106502592563629e-05, 1.4040619134902954e-05, 1.4974735677242279e-05, 1.5908852219581604e-05, 1.684296876192093e-05, 1.7777085304260254e-05, 1.871120184659958e-05, 1.9645318388938904e-05, 2.057943493127823e-05, 2.1513551473617554e-05, 2.244766801595688e-05, 2.3381784558296204e-05, 2.431590110063553e-05, 2.5250017642974854e-05, 2.618413418531418e-05, 2.7118250727653503e-05, 2.805236726999283e-05, 2.8986483812332153e-05, 2.9920600354671478e-05, 3.08547168970108e-05, 3.178883343935013e-05, 3.272294998168945e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 7.0, 12.0, 9.0, 31.0, 43.0, 66.0, 96.0, 138.0, 220.0, 325.0, 522.0, 864.0, 1348.0, 2221.0, 3470.0, 5555.0, 8603.0, 13886.0, 22243.0, 34645.0, 52970.0, 79510.0, 113176.0, 147085.0, 155454.0, 129778.0, 94888.0, 64919.0, 42305.0, 27370.0, 17481.0, 10844.0, 6753.0, 4295.0, 2813.0, 1613.0, 1116.0, 666.0, 456.0, 279.0, 170.0, 109.0, 73.0, 49.0, 27.0, 20.0, 13.0, 16.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.845703125, -0.8177337646484375, -0.789764404296875, -0.7617950439453125, -0.73382568359375, -0.7058563232421875, -0.677886962890625, -0.6499176025390625, -0.6219482421875, -0.5939788818359375, -0.566009521484375, -0.5380401611328125, -0.51007080078125, -0.4821014404296875, -0.454132080078125, -0.4261627197265625, -0.398193359375, -0.3702239990234375, -0.342254638671875, -0.3142852783203125, -0.28631591796875, -0.2583465576171875, -0.230377197265625, -0.2024078369140625, -0.1744384765625, -0.1464691162109375, -0.118499755859375, -0.0905303955078125, -0.06256103515625, -0.0345916748046875, -0.006622314453125, 0.0213470458984375, 0.04931640625, 0.0772857666015625, 0.105255126953125, 0.1332244873046875, 0.16119384765625, 0.1891632080078125, 0.217132568359375, 0.2451019287109375, 0.2730712890625, 0.3010406494140625, 0.329010009765625, 0.3569793701171875, 0.38494873046875, 0.4129180908203125, 0.440887451171875, 0.4688568115234375, 0.496826171875, 0.5247955322265625, 0.552764892578125, 0.5807342529296875, 0.60870361328125, 0.6366729736328125, 0.664642333984375, 0.6926116943359375, 0.7205810546875, 0.7485504150390625, 0.776519775390625, 0.8044891357421875, 0.83245849609375, 0.8604278564453125, 0.888397216796875, 0.9163665771484375, 0.9443359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 5.0, 2.0, 6.0, 2.0, 7.0, 5.0, 4.0, 9.0, 14.0, 9.0, 18.0, 19.0, 33.0, 26.0, 33.0, 29.0, 54.0, 42.0, 45.0, 51.0, 53.0, 55.0, 56.0, 56.0, 65.0, 46.0, 41.0, 34.0, 34.0, 24.0, 19.0, 12.0, 12.0, 19.0, 11.0, 8.0, 11.0, 9.0, 4.0, 6.0, 7.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.728515625, -0.7067108154296875, -0.684906005859375, -0.6631011962890625, -0.64129638671875, -0.6194915771484375, -0.597686767578125, -0.5758819580078125, -0.5540771484375, -0.5322723388671875, -0.510467529296875, -0.4886627197265625, -0.46685791015625, -0.4450531005859375, -0.423248291015625, -0.4014434814453125, -0.379638671875, -0.3578338623046875, -0.336029052734375, -0.3142242431640625, -0.29241943359375, -0.2706146240234375, -0.248809814453125, -0.2270050048828125, -0.2052001953125, -0.1833953857421875, -0.161590576171875, -0.1397857666015625, -0.11798095703125, -0.0961761474609375, -0.074371337890625, -0.0525665283203125, -0.03076171875, -0.0089569091796875, 0.012847900390625, 0.0346527099609375, 0.05645751953125, 0.0782623291015625, 0.100067138671875, 0.1218719482421875, 0.1436767578125, 0.1654815673828125, 0.187286376953125, 0.2090911865234375, 0.23089599609375, 0.2527008056640625, 0.274505615234375, 0.2963104248046875, 0.318115234375, 0.3399200439453125, 0.361724853515625, 0.3835296630859375, 0.40533447265625, 0.4271392822265625, 0.448944091796875, 0.4707489013671875, 0.4925537109375, 0.5143585205078125, 0.536163330078125, 0.5579681396484375, 0.57977294921875, 0.6015777587890625, 0.623382568359375, 0.6451873779296875, 0.6669921875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 7.0, 12.0, 8.0, 8.0, 11.0, 19.0, 19.0, 16.0, 37.0, 32.0, 36.0, 53.0, 37.0, 41.0, 44.0, 59.0, 56.0, 57.0, 48.0, 70.0, 52.0, 44.0, 51.0, 42.0, 32.0, 28.0, 16.0, 19.0, 16.0, 6.0, 11.0, 3.0, 9.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.688480377197266, -31.84552001953125, -31.002561569213867, -30.15960121154785, -29.316640853881836, -28.473682403564453, -27.630722045898438, -26.787761688232422, -25.944801330566406, -25.10184097290039, -24.258882522583008, -23.415922164916992, -22.572961807250977, -21.730003356933594, -20.887042999267578, -20.044082641601562, -19.20112419128418, -18.358163833618164, -17.51520538330078, -16.672245025634766, -15.82928466796875, -14.98632526397705, -14.143365859985352, -13.300405502319336, -12.457446098327637, -11.614486694335938, -10.771526336669922, -9.928566932678223, -9.085607528686523, -8.242647171020508, -7.399687767028809, -6.556727886199951, -5.713768005371094, -4.870808124542236, -4.027848243713379, -3.1848888397216797, -2.3419289588928223, -1.4989690780639648, -0.6560096740722656, 0.1869502067565918, 1.0299100875854492, 1.872869849205017, 2.715829610824585, 3.5587892532348633, 4.401749134063721, 5.244709014892578, 6.087668418884277, 6.930628299713135, 7.773588180541992, 8.616547584533691, 9.459507942199707, 10.302467346191406, 11.145427703857422, 11.988387107849121, 12.83134651184082, 13.674306869506836, 14.517266273498535, 15.360225677490234, 16.20318603515625, 17.046146392822266, 17.88910484313965, 18.732065200805664, 19.575023651123047, 20.417984008789062, 21.260944366455078]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 6.0, 5.0, 9.0, 5.0, 13.0, 21.0, 13.0, 19.0, 23.0, 31.0, 28.0, 36.0, 34.0, 37.0, 40.0, 34.0, 38.0, 52.0, 33.0, 43.0, 44.0, 49.0, 48.0, 48.0, 32.0, 29.0, 31.0, 27.0, 23.0, 18.0, 18.0, 14.0, 17.0, 16.0, 12.0, 11.0, 9.0, 6.0, 6.0, 5.0, 3.0, 4.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0], "bins": [-29.457197189331055, -28.623476028442383, -27.789752960205078, -26.956031799316406, -26.122310638427734, -25.288589477539062, -24.454866409301758, -23.621145248413086, -22.787424087524414, -21.953702926635742, -21.119979858398438, -20.286258697509766, -19.452537536621094, -18.618816375732422, -17.785093307495117, -16.951372146606445, -16.11764907836914, -15.283926963806152, -14.45020580291748, -13.616483688354492, -12.78276252746582, -11.949040412902832, -11.115318298339844, -10.281597137451172, -9.4478759765625, -8.614153861999512, -7.78043270111084, -6.946710586547852, -6.11298942565918, -5.279267311096191, -4.445545673370361, -3.6118240356445312, -2.7781028747558594, -1.9443812370300293, -1.1106594800949097, -0.27693772315979004, 0.55678391456604, 1.3905057907104492, 2.2242274284362793, 3.0579490661621094, 3.8916707038879395, 4.7253923416137695, 5.5591139793396, 6.39283561706543, 7.226557731628418, 8.060279846191406, 8.894001007080078, 9.72772216796875, 10.561444282531738, 11.395166397094727, 12.228887557983398, 13.062609672546387, 13.896330833435059, 14.730052947998047, 15.563774108886719, 16.39749526977539, 17.231218338012695, 18.064939498901367, 18.898662567138672, 19.732383728027344, 20.566104888916016, 21.399826049804688, 22.233549118041992, 23.067270278930664, 23.900991439819336]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 4.0, 6.0, 6.0, 12.0, 20.0, 29.0, 61.0, 65.0, 122.0, 173.0, 327.0, 501.0, 739.0, 1178.0, 1822.0, 2842.0, 4149.0, 6339.0, 9527.0, 13647.0, 19626.0, 26892.0, 35706.0, 46812.0, 57628.0, 69520.0, 78422.0, 85613.0, 89148.0, 87537.0, 81865.0, 73462.0, 62476.0, 50956.0, 39529.0, 30313.0, 22448.0, 15881.0, 11150.0, 7558.0, 4979.0, 3336.0, 2225.0, 1419.0, 905.0, 596.0, 405.0, 232.0, 134.0, 92.0, 61.0, 30.0, 15.0, 11.0, 5.0, 5.0, 3.0, 2.0, 3.0], "bins": [-11.4453125, -11.105712890625, -10.76611328125, -10.426513671875, -10.0869140625, -9.747314453125, -9.40771484375, -9.068115234375, -8.728515625, -8.388916015625, -8.04931640625, -7.709716796875, -7.3701171875, -7.030517578125, -6.69091796875, -6.351318359375, -6.01171875, -5.672119140625, -5.33251953125, -4.992919921875, -4.6533203125, -4.313720703125, -3.97412109375, -3.634521484375, -3.294921875, -2.955322265625, -2.61572265625, -2.276123046875, -1.9365234375, -1.596923828125, -1.25732421875, -0.917724609375, -0.578125, -0.238525390625, 0.10107421875, 0.440673828125, 0.7802734375, 1.119873046875, 1.45947265625, 1.799072265625, 2.138671875, 2.478271484375, 2.81787109375, 3.157470703125, 3.4970703125, 3.836669921875, 4.17626953125, 4.515869140625, 4.85546875, 5.195068359375, 5.53466796875, 5.874267578125, 6.2138671875, 6.553466796875, 6.89306640625, 7.232666015625, 7.572265625, 7.911865234375, 8.25146484375, 8.591064453125, 8.9306640625, 9.270263671875, 9.60986328125, 9.949462890625, 10.2890625]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 3.0, 6.0, 8.0, 8.0, 11.0, 18.0, 14.0, 21.0, 23.0, 28.0, 30.0, 34.0, 41.0, 34.0, 33.0, 44.0, 38.0, 48.0, 31.0, 44.0, 42.0, 53.0, 48.0, 49.0, 30.0, 30.0, 34.0, 27.0, 21.0, 17.0, 19.0, 16.0, 14.0, 17.0, 11.0, 12.0, 8.0, 6.0, 6.0, 6.0, 3.0, 4.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0], "bins": [-29.046875, -28.225341796875, -27.40380859375, -26.582275390625, -25.7607421875, -24.939208984375, -24.11767578125, -23.296142578125, -22.474609375, -21.653076171875, -20.83154296875, -20.010009765625, -19.1884765625, -18.366943359375, -17.54541015625, -16.723876953125, -15.90234375, -15.080810546875, -14.25927734375, -13.437744140625, -12.6162109375, -11.794677734375, -10.97314453125, -10.151611328125, -9.330078125, -8.508544921875, -7.68701171875, -6.865478515625, -6.0439453125, -5.222412109375, -4.40087890625, -3.579345703125, -2.7578125, -1.936279296875, -1.11474609375, -0.293212890625, 0.5283203125, 1.349853515625, 2.17138671875, 2.992919921875, 3.814453125, 4.635986328125, 5.45751953125, 6.279052734375, 7.1005859375, 7.922119140625, 8.74365234375, 9.565185546875, 10.38671875, 11.208251953125, 12.02978515625, 12.851318359375, 13.6728515625, 14.494384765625, 15.31591796875, 16.137451171875, 16.958984375, 17.780517578125, 18.60205078125, 19.423583984375, 20.2451171875, 21.066650390625, 21.88818359375, 22.709716796875, 23.53125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 13.0, 16.0, 21.0, 40.0, 74.0, 145.0, 259.0, 421.0, 861.0, 1528.0, 2752.0, 5094.0, 8773.0, 15063.0, 24815.0, 38746.0, 57132.0, 79143.0, 101217.0, 118187.0, 123887.0, 119422.0, 103978.0, 82357.0, 60147.0, 40811.0, 26267.0, 16099.0, 9337.0, 5404.0, 2985.0, 1676.0, 836.0, 482.0, 251.0, 137.0, 75.0, 52.0, 19.0, 9.0, 8.0, 8.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-16.328125, -15.855712890625, -15.38330078125, -14.910888671875, -14.4384765625, -13.966064453125, -13.49365234375, -13.021240234375, -12.548828125, -12.076416015625, -11.60400390625, -11.131591796875, -10.6591796875, -10.186767578125, -9.71435546875, -9.241943359375, -8.76953125, -8.297119140625, -7.82470703125, -7.352294921875, -6.8798828125, -6.407470703125, -5.93505859375, -5.462646484375, -4.990234375, -4.517822265625, -4.04541015625, -3.572998046875, -3.1005859375, -2.628173828125, -2.15576171875, -1.683349609375, -1.2109375, -0.738525390625, -0.26611328125, 0.206298828125, 0.6787109375, 1.151123046875, 1.62353515625, 2.095947265625, 2.568359375, 3.040771484375, 3.51318359375, 3.985595703125, 4.4580078125, 4.930419921875, 5.40283203125, 5.875244140625, 6.34765625, 6.820068359375, 7.29248046875, 7.764892578125, 8.2373046875, 8.709716796875, 9.18212890625, 9.654541015625, 10.126953125, 10.599365234375, 11.07177734375, 11.544189453125, 12.0166015625, 12.489013671875, 12.96142578125, 13.433837890625, 13.90625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 6.0, 4.0, 5.0, 8.0, 12.0, 12.0, 12.0, 20.0, 23.0, 23.0, 26.0, 22.0, 36.0, 37.0, 32.0, 28.0, 43.0, 45.0, 45.0, 53.0, 50.0, 47.0, 42.0, 36.0, 36.0, 41.0, 44.0, 23.0, 24.0, 20.0, 23.0, 19.0, 23.0, 16.0, 12.0, 16.0, 10.0, 8.0, 4.0, 9.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8203125, -15.2576904296875, -14.695068359375, -14.1324462890625, -13.56982421875, -13.0072021484375, -12.444580078125, -11.8819580078125, -11.3193359375, -10.7567138671875, -10.194091796875, -9.6314697265625, -9.06884765625, -8.5062255859375, -7.943603515625, -7.3809814453125, -6.818359375, -6.2557373046875, -5.693115234375, -5.1304931640625, -4.56787109375, -4.0052490234375, -3.442626953125, -2.8800048828125, -2.3173828125, -1.7547607421875, -1.192138671875, -0.6295166015625, -0.06689453125, 0.4957275390625, 1.058349609375, 1.6209716796875, 2.18359375, 2.7462158203125, 3.308837890625, 3.8714599609375, 4.43408203125, 4.9967041015625, 5.559326171875, 6.1219482421875, 6.6845703125, 7.2471923828125, 7.809814453125, 8.3724365234375, 8.93505859375, 9.4976806640625, 10.060302734375, 10.6229248046875, 11.185546875, 11.7481689453125, 12.310791015625, 12.8734130859375, 13.43603515625, 13.9986572265625, 14.561279296875, 15.1239013671875, 15.6865234375, 16.2491455078125, 16.811767578125, 17.3743896484375, 17.93701171875, 18.4996337890625, 19.062255859375, 19.6248779296875, 20.1875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 0.0, 9.0, 17.0, 25.0, 43.0, 68.0, 93.0, 165.0, 316.0, 470.0, 915.0, 1617.0, 2768.0, 5082.0, 8561.0, 14725.0, 24542.0, 38461.0, 57427.0, 79816.0, 102364.0, 119490.0, 126032.0, 120203.0, 103989.0, 81415.0, 58881.0, 39562.0, 25196.0, 15354.0, 9045.0, 5096.0, 2940.0, 1625.0, 950.0, 535.0, 303.0, 196.0, 99.0, 65.0, 35.0, 21.0, 18.0, 7.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.18359375, -5.9810791015625, -5.778564453125, -5.5760498046875, -5.37353515625, -5.1710205078125, -4.968505859375, -4.7659912109375, -4.5634765625, -4.3609619140625, -4.158447265625, -3.9559326171875, -3.75341796875, -3.5509033203125, -3.348388671875, -3.1458740234375, -2.943359375, -2.7408447265625, -2.538330078125, -2.3358154296875, -2.13330078125, -1.9307861328125, -1.728271484375, -1.5257568359375, -1.3232421875, -1.1207275390625, -0.918212890625, -0.7156982421875, -0.51318359375, -0.3106689453125, -0.108154296875, 0.0943603515625, 0.296875, 0.4993896484375, 0.701904296875, 0.9044189453125, 1.10693359375, 1.3094482421875, 1.511962890625, 1.7144775390625, 1.9169921875, 2.1195068359375, 2.322021484375, 2.5245361328125, 2.72705078125, 2.9295654296875, 3.132080078125, 3.3345947265625, 3.537109375, 3.7396240234375, 3.942138671875, 4.1446533203125, 4.34716796875, 4.5496826171875, 4.752197265625, 4.9547119140625, 5.1572265625, 5.3597412109375, 5.562255859375, 5.7647705078125, 5.96728515625, 6.1697998046875, 6.372314453125, 6.5748291015625, 6.77734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 6.0, 2.0, 3.0, 3.0, 10.0, 9.0, 7.0, 16.0, 13.0, 17.0, 12.0, 17.0, 20.0, 26.0, 25.0, 24.0, 34.0, 34.0, 44.0, 27.0, 41.0, 46.0, 35.0, 45.0, 37.0, 51.0, 43.0, 33.0, 41.0, 32.0, 39.0, 25.0, 27.0, 24.0, 28.0, 24.0, 9.0, 20.0, 10.0, 6.0, 7.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.000667572021484375, -0.0006482750177383423, -0.0006289780139923096, -0.0006096810102462769, -0.0005903840065002441, -0.0005710870027542114, -0.0005517899990081787, -0.000532492995262146, -0.0005131959915161133, -0.0004938989877700806, -0.00047460198402404785, -0.00045530498027801514, -0.0004360079765319824, -0.0004167109727859497, -0.000397413969039917, -0.0003781169652938843, -0.00035881996154785156, -0.00033952295780181885, -0.00032022595405578613, -0.0003009289503097534, -0.0002816319465637207, -0.000262334942817688, -0.00024303793907165527, -0.00022374093532562256, -0.00020444393157958984, -0.00018514692783355713, -0.00016584992408752441, -0.0001465529203414917, -0.00012725591659545898, -0.00010795891284942627, -8.866190910339355e-05, -6.936490535736084e-05, -5.0067901611328125e-05, -3.077089786529541e-05, -1.1473894119262695e-05, 7.82310962677002e-06, 2.7120113372802734e-05, 4.641711711883545e-05, 6.571412086486816e-05, 8.501112461090088e-05, 0.0001043081283569336, 0.0001236051321029663, 0.00014290213584899902, 0.00016219913959503174, 0.00018149614334106445, 0.00020079314708709717, 0.00022009015083312988, 0.0002393871545791626, 0.0002586841583251953, 0.00027798116207122803, 0.00029727816581726074, 0.00031657516956329346, 0.00033587217330932617, 0.0003551691770553589, 0.0003744661808013916, 0.0003937631845474243, 0.00041306018829345703, 0.00043235719203948975, 0.00045165419578552246, 0.0004709511995315552, 0.0004902482032775879, 0.0005095452070236206, 0.0005288422107696533, 0.000548139214515686, 0.0005674362182617188]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 13.0, 17.0, 17.0, 30.0, 40.0, 52.0, 88.0, 129.0, 188.0, 327.0, 531.0, 842.0, 1209.0, 1958.0, 3076.0, 4862.0, 7583.0, 12114.0, 18733.0, 27800.0, 39977.0, 55769.0, 73331.0, 90317.0, 103012.0, 110397.0, 107323.0, 97524.0, 81593.0, 64256.0, 47604.0, 33684.0, 22919.0, 15032.0, 9522.0, 6187.0, 3859.0, 2389.0, 1564.0, 906.0, 620.0, 399.0, 264.0, 162.0, 114.0, 72.0, 45.0, 40.0, 26.0, 18.0, 6.0, 7.0, 8.0, 4.0, 3.0, 1.0, 3.0], "bins": [-6.5078125, -6.30908203125, -6.1103515625, -5.91162109375, -5.712890625, -5.51416015625, -5.3154296875, -5.11669921875, -4.91796875, -4.71923828125, -4.5205078125, -4.32177734375, -4.123046875, -3.92431640625, -3.7255859375, -3.52685546875, -3.328125, -3.12939453125, -2.9306640625, -2.73193359375, -2.533203125, -2.33447265625, -2.1357421875, -1.93701171875, -1.73828125, -1.53955078125, -1.3408203125, -1.14208984375, -0.943359375, -0.74462890625, -0.5458984375, -0.34716796875, -0.1484375, 0.05029296875, 0.2490234375, 0.44775390625, 0.646484375, 0.84521484375, 1.0439453125, 1.24267578125, 1.44140625, 1.64013671875, 1.8388671875, 2.03759765625, 2.236328125, 2.43505859375, 2.6337890625, 2.83251953125, 3.03125, 3.22998046875, 3.4287109375, 3.62744140625, 3.826171875, 4.02490234375, 4.2236328125, 4.42236328125, 4.62109375, 4.81982421875, 5.0185546875, 5.21728515625, 5.416015625, 5.61474609375, 5.8134765625, 6.01220703125, 6.2109375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 3.0, 4.0, 7.0, 4.0, 7.0, 8.0, 15.0, 23.0, 13.0, 25.0, 24.0, 21.0, 21.0, 38.0, 49.0, 49.0, 41.0, 39.0, 60.0, 53.0, 51.0, 48.0, 46.0, 51.0, 41.0, 44.0, 31.0, 41.0, 18.0, 29.0, 19.0, 13.0, 13.0, 10.0, 15.0, 5.0, 5.0, 9.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.119140625, -3.006683349609375, -2.89422607421875, -2.781768798828125, -2.6693115234375, -2.556854248046875, -2.44439697265625, -2.331939697265625, -2.219482421875, -2.107025146484375, -1.99456787109375, -1.882110595703125, -1.7696533203125, -1.657196044921875, -1.54473876953125, -1.432281494140625, -1.31982421875, -1.207366943359375, -1.09490966796875, -0.982452392578125, -0.8699951171875, -0.757537841796875, -0.64508056640625, -0.532623291015625, -0.420166015625, -0.307708740234375, -0.19525146484375, -0.082794189453125, 0.0296630859375, 0.142120361328125, 0.25457763671875, 0.367034912109375, 0.4794921875, 0.591949462890625, 0.70440673828125, 0.816864013671875, 0.9293212890625, 1.041778564453125, 1.15423583984375, 1.266693115234375, 1.379150390625, 1.491607666015625, 1.60406494140625, 1.716522216796875, 1.8289794921875, 1.941436767578125, 2.05389404296875, 2.166351318359375, 2.27880859375, 2.391265869140625, 2.50372314453125, 2.616180419921875, 2.7286376953125, 2.841094970703125, 2.95355224609375, 3.066009521484375, 3.178466796875, 3.290924072265625, 3.40338134765625, 3.515838623046875, 3.6282958984375, 3.740753173828125, 3.85321044921875, 3.965667724609375, 4.078125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 1.0, 9.0, 11.0, 11.0, 11.0, 16.0, 11.0, 32.0, 33.0, 28.0, 37.0, 35.0, 38.0, 43.0, 59.0, 51.0, 44.0, 49.0, 50.0, 59.0, 51.0, 54.0, 44.0, 43.0, 31.0, 34.0, 29.0, 15.0, 10.0, 13.0, 18.0, 8.0, 6.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.37105369567871, -29.57705307006836, -28.783052444458008, -27.989051818847656, -27.195051193237305, -26.401050567626953, -25.6070499420166, -24.81304931640625, -24.0190486907959, -23.225048065185547, -22.431047439575195, -21.637046813964844, -20.843046188354492, -20.04904556274414, -19.25504493713379, -18.461044311523438, -17.667041778564453, -16.8730411529541, -16.07904052734375, -15.285039901733398, -14.491039276123047, -13.697038650512695, -12.903038024902344, -12.109037399291992, -11.31503677368164, -10.521036148071289, -9.727035522460938, -8.933034896850586, -8.139034271240234, -7.345033645629883, -6.551032543182373, -5.7570319175720215, -4.963031768798828, -4.169031143188477, -3.375030517578125, -2.5810296535491943, -1.7870290279388428, -0.9930284023284912, -0.19902753829956055, 0.594973087310791, 1.3889737129211426, 2.182974338531494, 2.9769749641418457, 3.7709758281707764, 4.564976692199707, 5.358977317810059, 6.15297794342041, 6.946978569030762, 7.740979194641113, 8.534979820251465, 9.328980445861816, 10.122981071472168, 10.91698169708252, 11.710982322692871, 12.504983901977539, 13.29898452758789, 14.092985153198242, 14.886985778808594, 15.680986404418945, 16.474987030029297, 17.26898765563965, 18.06298828125, 18.85698890686035, 19.650989532470703, 20.444990158081055]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 2.0, 5.0, 9.0, 9.0, 16.0, 9.0, 17.0, 15.0, 18.0, 22.0, 31.0, 39.0, 32.0, 39.0, 36.0, 34.0, 54.0, 53.0, 48.0, 58.0, 51.0, 49.0, 40.0, 32.0, 40.0, 31.0, 36.0, 27.0, 21.0, 27.0, 17.0, 16.0, 20.0, 11.0, 7.0, 11.0, 4.0, 2.0, 8.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-33.63252639770508, -32.673912048339844, -31.715299606323242, -30.75668716430664, -29.798072814941406, -28.839458465576172, -27.88084602355957, -26.92223358154297, -25.963619232177734, -25.0050048828125, -24.0463924407959, -23.087779998779297, -22.129165649414062, -21.170551300048828, -20.211938858032227, -19.253326416015625, -18.29471206665039, -17.336097717285156, -16.377485275268555, -15.418871879577637, -14.460258483886719, -13.5016450881958, -12.543031692504883, -11.584418296813965, -10.625804901123047, -9.667191505432129, -8.708578109741211, -7.749964714050293, -6.791351318359375, -5.832737922668457, -4.874124526977539, -3.915511131286621, -2.9568958282470703, -1.9982824325561523, -1.0396690368652344, -0.0810556411743164, 0.8775577545166016, 1.8361711502075195, 2.7947845458984375, 3.7533979415893555, 4.712011337280273, 5.670624732971191, 6.629238128662109, 7.587851524353027, 8.546464920043945, 9.505078315734863, 10.463691711425781, 11.4223051071167, 12.380918502807617, 13.339531898498535, 14.298145294189453, 15.256758689880371, 16.21537208557129, 17.17398452758789, 18.132598876953125, 19.09121322631836, 20.04982566833496, 21.008438110351562, 21.967052459716797, 22.92566680908203, 23.884279251098633, 24.842891693115234, 25.80150604248047, 26.760120391845703, 27.718732833862305]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 7.0, 10.0, 21.0, 29.0, 49.0, 57.0, 106.0, 184.0, 325.0, 482.0, 830.0, 1367.0, 2284.0, 3742.0, 6165.0, 10213.0, 16305.0, 26020.0, 40748.0, 61857.0, 91893.0, 132532.0, 182532.0, 242086.0, 301214.0, 356437.0, 396210.0, 410323.0, 397796.0, 360678.0, 305243.0, 247658.0, 186915.0, 136397.0, 96538.0, 65332.0, 42524.0, 27319.0, 17249.0, 10397.0, 6468.0, 3954.0, 2458.0, 1388.0, 803.0, 443.0, 298.0, 148.0, 111.0, 58.0, 41.0, 25.0, 11.0, 5.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0], "bins": [-14.4375, -13.9798583984375, -13.522216796875, -13.0645751953125, -12.60693359375, -12.1492919921875, -11.691650390625, -11.2340087890625, -10.7763671875, -10.3187255859375, -9.861083984375, -9.4034423828125, -8.94580078125, -8.4881591796875, -8.030517578125, -7.5728759765625, -7.115234375, -6.6575927734375, -6.199951171875, -5.7423095703125, -5.28466796875, -4.8270263671875, -4.369384765625, -3.9117431640625, -3.4541015625, -2.9964599609375, -2.538818359375, -2.0811767578125, -1.62353515625, -1.1658935546875, -0.708251953125, -0.2506103515625, 0.20703125, 0.6646728515625, 1.122314453125, 1.5799560546875, 2.03759765625, 2.4952392578125, 2.952880859375, 3.4105224609375, 3.8681640625, 4.3258056640625, 4.783447265625, 5.2410888671875, 5.69873046875, 6.1563720703125, 6.614013671875, 7.0716552734375, 7.529296875, 7.9869384765625, 8.444580078125, 8.9022216796875, 9.35986328125, 9.8175048828125, 10.275146484375, 10.7327880859375, 11.1904296875, 11.6480712890625, 12.105712890625, 12.5633544921875, 13.02099609375, 13.4786376953125, 13.936279296875, 14.3939208984375, 14.8515625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 7.0, 9.0, 7.0, 14.0, 11.0, 18.0, 15.0, 17.0, 28.0, 30.0, 37.0, 36.0, 38.0, 31.0, 42.0, 56.0, 53.0, 55.0, 56.0, 46.0, 50.0, 36.0, 26.0, 43.0, 32.0, 39.0, 20.0, 26.0, 23.0, 18.0, 15.0, 22.0, 9.0, 4.0, 10.0, 6.0, 3.0, 7.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-30.6875, -29.81103515625, -28.9345703125, -28.05810546875, -27.181640625, -26.30517578125, -25.4287109375, -24.55224609375, -23.67578125, -22.79931640625, -21.9228515625, -21.04638671875, -20.169921875, -19.29345703125, -18.4169921875, -17.54052734375, -16.6640625, -15.78759765625, -14.9111328125, -14.03466796875, -13.158203125, -12.28173828125, -11.4052734375, -10.52880859375, -9.65234375, -8.77587890625, -7.8994140625, -7.02294921875, -6.146484375, -5.27001953125, -4.3935546875, -3.51708984375, -2.640625, -1.76416015625, -0.8876953125, -0.01123046875, 0.865234375, 1.74169921875, 2.6181640625, 3.49462890625, 4.37109375, 5.24755859375, 6.1240234375, 7.00048828125, 7.876953125, 8.75341796875, 9.6298828125, 10.50634765625, 11.3828125, 12.25927734375, 13.1357421875, 14.01220703125, 14.888671875, 15.76513671875, 16.6416015625, 17.51806640625, 18.39453125, 19.27099609375, 20.1474609375, 21.02392578125, 21.900390625, 22.77685546875, 23.6533203125, 24.52978515625, 25.40625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 4.0, 9.0, 18.0, 28.0, 53.0, 95.0, 151.0, 295.0, 527.0, 840.0, 1374.0, 2316.0, 3830.0, 6180.0, 10046.0, 15921.0, 24259.0, 36467.0, 53678.0, 77388.0, 106958.0, 145102.0, 186690.0, 232909.0, 277749.0, 315790.0, 344036.0, 355930.0, 351943.0, 329736.0, 295177.0, 252875.0, 206757.0, 161739.0, 123124.0, 89312.0, 62695.0, 43338.0, 28577.0, 18758.0, 12184.0, 7527.0, 4647.0, 2910.0, 1740.0, 1047.0, 643.0, 364.0, 230.0, 132.0, 75.0, 59.0, 24.0, 21.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0], "bins": [-13.3984375, -12.9759521484375, -12.553466796875, -12.1309814453125, -11.70849609375, -11.2860107421875, -10.863525390625, -10.4410400390625, -10.0185546875, -9.5960693359375, -9.173583984375, -8.7510986328125, -8.32861328125, -7.9061279296875, -7.483642578125, -7.0611572265625, -6.638671875, -6.2161865234375, -5.793701171875, -5.3712158203125, -4.94873046875, -4.5262451171875, -4.103759765625, -3.6812744140625, -3.2587890625, -2.8363037109375, -2.413818359375, -1.9913330078125, -1.56884765625, -1.1463623046875, -0.723876953125, -0.3013916015625, 0.12109375, 0.5435791015625, 0.966064453125, 1.3885498046875, 1.81103515625, 2.2335205078125, 2.656005859375, 3.0784912109375, 3.5009765625, 3.9234619140625, 4.345947265625, 4.7684326171875, 5.19091796875, 5.6134033203125, 6.035888671875, 6.4583740234375, 6.880859375, 7.3033447265625, 7.725830078125, 8.1483154296875, 8.57080078125, 8.9932861328125, 9.415771484375, 9.8382568359375, 10.2607421875, 10.6832275390625, 11.105712890625, 11.5281982421875, 11.95068359375, 12.3731689453125, 12.795654296875, 13.2181396484375, 13.640625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 8.0, 6.0, 6.0, 10.0, 9.0, 10.0, 21.0, 26.0, 33.0, 51.0, 64.0, 66.0, 68.0, 78.0, 101.0, 121.0, 161.0, 128.0, 159.0, 177.0, 204.0, 214.0, 205.0, 202.0, 197.0, 187.0, 180.0, 165.0, 180.0, 157.0, 140.0, 131.0, 106.0, 95.0, 95.0, 74.0, 62.0, 42.0, 40.0, 22.0, 22.0, 16.0, 10.0, 10.0, 10.0, 4.0, 2.0, 2.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.4453125, -10.118896484375, -9.79248046875, -9.466064453125, -9.1396484375, -8.813232421875, -8.48681640625, -8.160400390625, -7.833984375, -7.507568359375, -7.18115234375, -6.854736328125, -6.5283203125, -6.201904296875, -5.87548828125, -5.549072265625, -5.22265625, -4.896240234375, -4.56982421875, -4.243408203125, -3.9169921875, -3.590576171875, -3.26416015625, -2.937744140625, -2.611328125, -2.284912109375, -1.95849609375, -1.632080078125, -1.3056640625, -0.979248046875, -0.65283203125, -0.326416015625, 0.0, 0.326416015625, 0.65283203125, 0.979248046875, 1.3056640625, 1.632080078125, 1.95849609375, 2.284912109375, 2.611328125, 2.937744140625, 3.26416015625, 3.590576171875, 3.9169921875, 4.243408203125, 4.56982421875, 4.896240234375, 5.22265625, 5.549072265625, 5.87548828125, 6.201904296875, 6.5283203125, 6.854736328125, 7.18115234375, 7.507568359375, 7.833984375, 8.160400390625, 8.48681640625, 8.813232421875, 9.1396484375, 9.466064453125, 9.79248046875, 10.118896484375, 10.4453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 8.0, 10.0, 9.0, 14.0, 12.0, 23.0, 19.0, 11.0, 24.0, 18.0, 26.0, 36.0, 38.0, 27.0, 42.0, 31.0, 45.0, 46.0, 37.0, 48.0, 45.0, 40.0, 41.0, 32.0, 34.0, 41.0, 36.0, 34.0, 26.0, 25.0, 20.0, 26.0, 17.0, 10.0, 18.0, 4.0, 7.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.507322311401367, -19.853736877441406, -19.200149536132812, -18.54656410217285, -17.89297866821289, -17.239391326904297, -16.585805892944336, -15.932220458984375, -15.278634071350098, -14.62504768371582, -13.97146224975586, -13.317875862121582, -12.664289474487305, -12.010704040527344, -11.357117652893066, -10.703531265258789, -10.049945831298828, -9.39635944366455, -8.74277400970459, -8.089187622070312, -7.435601711273193, -6.782015800476074, -6.128429412841797, -5.474843502044678, -4.821257591247559, -4.1676716804504395, -3.514085531234741, -2.860499382019043, -2.206913471221924, -1.5533275604248047, -0.8997414112091064, -0.2461552619934082, 0.40743064880371094, 1.0610166788101196, 1.7146027088165283, 2.3681888580322266, 3.0217747688293457, 3.675360679626465, 4.328947067260742, 4.982532978057861, 5.6361188888549805, 6.2897047996521, 6.943290710449219, 7.596877098083496, 8.250463485717773, 8.904048919677734, 9.557635307312012, 10.211221694946289, 10.86480712890625, 11.518393516540527, 12.171978950500488, 12.825565338134766, 13.479150772094727, 14.132737159729004, 14.786323547363281, 15.439908981323242, 16.093494415283203, 16.747079849243164, 17.400667190551758, 18.05425262451172, 18.70783805847168, 19.36142349243164, 20.015010833740234, 20.668596267700195, 21.32218360900879]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 5.0, 7.0, 8.0, 6.0, 8.0, 11.0, 9.0, 21.0, 16.0, 24.0, 29.0, 40.0, 37.0, 32.0, 38.0, 44.0, 50.0, 56.0, 46.0, 48.0, 59.0, 32.0, 36.0, 37.0, 42.0, 46.0, 37.0, 22.0, 26.0, 21.0, 28.0, 29.0, 16.0, 8.0, 10.0, 9.0, 8.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0], "bins": [-38.89293670654297, -37.8299560546875, -36.76697540283203, -35.70399856567383, -34.64101791381836, -33.57803726196289, -32.51506042480469, -31.45207977294922, -30.38909912109375, -29.32611846923828, -28.263139724731445, -27.20016098022461, -26.13718032836914, -25.074199676513672, -24.011220932006836, -22.9482421875, -21.88526153564453, -20.822280883789062, -19.759302139282227, -18.69632339477539, -17.633342742919922, -16.570362091064453, -15.507383346557617, -14.444403648376465, -13.381423950195312, -12.31844425201416, -11.255464553833008, -10.192484855651855, -9.129505157470703, -8.06652545928955, -7.003545761108398, -5.940566062927246, -4.877590179443359, -3.814610481262207, -2.7516307830810547, -1.6886510848999023, -0.62567138671875, 0.43730831146240234, 1.5002880096435547, 2.563267707824707, 3.6262474060058594, 4.689227104187012, 5.752206802368164, 6.815186500549316, 7.878166198730469, 8.941145896911621, 10.004125595092773, 11.067105293273926, 12.130084991455078, 13.19306468963623, 14.256044387817383, 15.319024085998535, 16.382003784179688, 17.444984436035156, 18.507963180541992, 19.570941925048828, 20.633922576904297, 21.696903228759766, 22.7598819732666, 23.822860717773438, 24.885841369628906, 25.948822021484375, 27.01180076599121, 28.074779510498047, 29.137760162353516]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 12.0, 11.0, 14.0, 20.0, 45.0, 87.0, 165.0, 224.0, 385.0, 588.0, 1118.0, 1668.0, 2709.0, 4171.0, 6724.0, 10628.0, 16101.0, 24450.0, 36041.0, 50518.0, 68725.0, 89086.0, 106060.0, 115523.0, 114387.0, 102720.0, 85287.0, 65577.0, 47910.0, 33541.0, 22803.0, 14934.0, 9708.0, 6276.0, 3976.0, 2430.0, 1471.0, 951.0, 583.0, 369.0, 209.0, 144.0, 79.0, 45.0, 22.0, 35.0, 17.0, 10.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.142578125, -3.047088623046875, -2.95159912109375, -2.856109619140625, -2.7606201171875, -2.665130615234375, -2.56964111328125, -2.474151611328125, -2.378662109375, -2.283172607421875, -2.18768310546875, -2.092193603515625, -1.9967041015625, -1.901214599609375, -1.80572509765625, -1.710235595703125, -1.61474609375, -1.519256591796875, -1.42376708984375, -1.328277587890625, -1.2327880859375, -1.137298583984375, -1.04180908203125, -0.946319580078125, -0.850830078125, -0.755340576171875, -0.65985107421875, -0.564361572265625, -0.4688720703125, -0.373382568359375, -0.27789306640625, -0.182403564453125, -0.0869140625, 0.008575439453125, 0.10406494140625, 0.199554443359375, 0.2950439453125, 0.390533447265625, 0.48602294921875, 0.581512451171875, 0.677001953125, 0.772491455078125, 0.86798095703125, 0.963470458984375, 1.0589599609375, 1.154449462890625, 1.24993896484375, 1.345428466796875, 1.44091796875, 1.536407470703125, 1.63189697265625, 1.727386474609375, 1.8228759765625, 1.918365478515625, 2.01385498046875, 2.109344482421875, 2.204833984375, 2.300323486328125, 2.39581298828125, 2.491302490234375, 2.5867919921875, 2.682281494140625, 2.77777099609375, 2.873260498046875, 2.96875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 4.0, 7.0, 8.0, 6.0, 9.0, 10.0, 10.0, 20.0, 16.0, 23.0, 30.0, 42.0, 34.0, 33.0, 40.0, 43.0, 48.0, 57.0, 46.0, 48.0, 60.0, 31.0, 36.0, 38.0, 40.0, 47.0, 37.0, 22.0, 28.0, 19.0, 28.0, 29.0, 16.0, 9.0, 10.0, 8.0, 8.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0], "bins": [-38.9375, -37.87353515625, -36.8095703125, -35.74560546875, -34.681640625, -33.61767578125, -32.5537109375, -31.48974609375, -30.42578125, -29.36181640625, -28.2978515625, -27.23388671875, -26.169921875, -25.10595703125, -24.0419921875, -22.97802734375, -21.9140625, -20.85009765625, -19.7861328125, -18.72216796875, -17.658203125, -16.59423828125, -15.5302734375, -14.46630859375, -13.40234375, -12.33837890625, -11.2744140625, -10.21044921875, -9.146484375, -8.08251953125, -7.0185546875, -5.95458984375, -4.890625, -3.82666015625, -2.7626953125, -1.69873046875, -0.634765625, 0.42919921875, 1.4931640625, 2.55712890625, 3.62109375, 4.68505859375, 5.7490234375, 6.81298828125, 7.876953125, 8.94091796875, 10.0048828125, 11.06884765625, 12.1328125, 13.19677734375, 14.2607421875, 15.32470703125, 16.388671875, 17.45263671875, 18.5166015625, 19.58056640625, 20.64453125, 21.70849609375, 22.7724609375, 23.83642578125, 24.900390625, 25.96435546875, 27.0283203125, 28.09228515625, 29.15625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 7.0, 5.0, 7.0, 12.0, 17.0, 36.0, 34.0, 57.0, 96.0, 138.0, 174.0, 275.0, 360.0, 597.0, 815.0, 1181.0, 1629.0, 2472.0, 3504.0, 4873.0, 6982.0, 10328.0, 16082.0, 27057.0, 144152.0, 708875.0, 53526.0, 22297.0, 13500.0, 9015.0, 6119.0, 4341.0, 3036.0, 2160.0, 1485.0, 970.0, 747.0, 494.0, 339.0, 227.0, 166.0, 121.0, 91.0, 47.0, 38.0, 27.0, 21.0, 12.0, 9.0, 2.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.984375, -5.7652587890625, -5.546142578125, -5.3270263671875, -5.10791015625, -4.8887939453125, -4.669677734375, -4.4505615234375, -4.2314453125, -4.0123291015625, -3.793212890625, -3.5740966796875, -3.35498046875, -3.1358642578125, -2.916748046875, -2.6976318359375, -2.478515625, -2.2593994140625, -2.040283203125, -1.8211669921875, -1.60205078125, -1.3829345703125, -1.163818359375, -0.9447021484375, -0.7255859375, -0.5064697265625, -0.287353515625, -0.0682373046875, 0.15087890625, 0.3699951171875, 0.589111328125, 0.8082275390625, 1.02734375, 1.2464599609375, 1.465576171875, 1.6846923828125, 1.90380859375, 2.1229248046875, 2.342041015625, 2.5611572265625, 2.7802734375, 2.9993896484375, 3.218505859375, 3.4376220703125, 3.65673828125, 3.8758544921875, 4.094970703125, 4.3140869140625, 4.533203125, 4.7523193359375, 4.971435546875, 5.1905517578125, 5.40966796875, 5.6287841796875, 5.847900390625, 6.0670166015625, 6.2861328125, 6.5052490234375, 6.724365234375, 6.9434814453125, 7.16259765625, 7.3817138671875, 7.600830078125, 7.8199462890625, 8.0390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 4.0, 7.0, 4.0, 7.0, 8.0, 5.0, 11.0, 9.0, 17.0, 15.0, 14.0, 15.0, 27.0, 23.0, 29.0, 31.0, 35.0, 37.0, 33.0, 39.0, 41.0, 44.0, 34.0, 39.0, 29.0, 41.0, 40.0, 41.0, 38.0, 34.0, 27.0, 27.0, 22.0, 25.0, 32.0, 13.0, 18.0, 16.0, 18.0, 18.0, 10.0, 5.0, 10.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.078125, -21.361572265625, -20.64501953125, -19.928466796875, -19.2119140625, -18.495361328125, -17.77880859375, -17.062255859375, -16.345703125, -15.629150390625, -14.91259765625, -14.196044921875, -13.4794921875, -12.762939453125, -12.04638671875, -11.329833984375, -10.61328125, -9.896728515625, -9.18017578125, -8.463623046875, -7.7470703125, -7.030517578125, -6.31396484375, -5.597412109375, -4.880859375, -4.164306640625, -3.44775390625, -2.731201171875, -2.0146484375, -1.298095703125, -0.58154296875, 0.135009765625, 0.8515625, 1.568115234375, 2.28466796875, 3.001220703125, 3.7177734375, 4.434326171875, 5.15087890625, 5.867431640625, 6.583984375, 7.300537109375, 8.01708984375, 8.733642578125, 9.4501953125, 10.166748046875, 10.88330078125, 11.599853515625, 12.31640625, 13.032958984375, 13.74951171875, 14.466064453125, 15.1826171875, 15.899169921875, 16.61572265625, 17.332275390625, 18.048828125, 18.765380859375, 19.48193359375, 20.198486328125, 20.9150390625, 21.631591796875, 22.34814453125, 23.064697265625, 23.78125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 11.0, 10.0, 16.0, 15.0, 11.0, 42.0, 37.0, 51.0, 58.0, 83.0, 111.0, 145.0, 195.0, 274.0, 378.0, 521.0, 699.0, 1027.0, 1520.0, 2305.0, 3309.0, 5056.0, 8064.0, 12740.0, 21888.0, 49511.0, 822926.0, 56940.0, 22939.0, 13398.0, 8034.0, 5153.0, 3421.0, 2332.0, 1486.0, 1075.0, 742.0, 539.0, 402.0, 262.0, 224.0, 141.0, 126.0, 83.0, 72.0, 52.0, 38.0, 27.0, 11.0, 16.0, 16.0, 13.0, 4.0, 2.0, 0.0, 1.0, 4.0], "bins": [-1.1923828125, -1.156829833984375, -1.12127685546875, -1.085723876953125, -1.0501708984375, -1.014617919921875, -0.97906494140625, -0.943511962890625, -0.907958984375, -0.872406005859375, -0.83685302734375, -0.801300048828125, -0.7657470703125, -0.730194091796875, -0.69464111328125, -0.659088134765625, -0.62353515625, -0.587982177734375, -0.55242919921875, -0.516876220703125, -0.4813232421875, -0.445770263671875, -0.41021728515625, -0.374664306640625, -0.339111328125, -0.303558349609375, -0.26800537109375, -0.232452392578125, -0.1968994140625, -0.161346435546875, -0.12579345703125, -0.090240478515625, -0.0546875, -0.019134521484375, 0.01641845703125, 0.051971435546875, 0.0875244140625, 0.123077392578125, 0.15863037109375, 0.194183349609375, 0.229736328125, 0.265289306640625, 0.30084228515625, 0.336395263671875, 0.3719482421875, 0.407501220703125, 0.44305419921875, 0.478607177734375, 0.51416015625, 0.549713134765625, 0.58526611328125, 0.620819091796875, 0.6563720703125, 0.691925048828125, 0.72747802734375, 0.763031005859375, 0.798583984375, 0.834136962890625, 0.86968994140625, 0.905242919921875, 0.9407958984375, 0.976348876953125, 1.01190185546875, 1.047454833984375, 1.0830078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 7.0, 5.0, 1.0, 3.0, 6.0, 3.0, 8.0, 6.0, 8.0, 10.0, 12.0, 14.0, 18.0, 22.0, 31.0, 29.0, 32.0, 34.0, 39.0, 38.0, 46.0, 37.0, 45.0, 48.0, 51.0, 41.0, 45.0, 39.0, 35.0, 30.0, 37.0, 38.0, 35.0, 20.0, 24.0, 20.0, 15.0, 23.0, 10.0, 14.0, 9.0, 5.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.1636486053466797e-05, -2.0969659090042114e-05, -2.030283212661743e-05, -1.963600516319275e-05, -1.8969178199768066e-05, -1.8302351236343384e-05, -1.76355242729187e-05, -1.696869730949402e-05, -1.6301870346069336e-05, -1.5635043382644653e-05, -1.496821641921997e-05, -1.4301389455795288e-05, -1.3634562492370605e-05, -1.2967735528945923e-05, -1.230090856552124e-05, -1.1634081602096558e-05, -1.0967254638671875e-05, -1.0300427675247192e-05, -9.63360071182251e-06, -8.966773748397827e-06, -8.299946784973145e-06, -7.633119821548462e-06, -6.966292858123779e-06, -6.299465894699097e-06, -5.632638931274414e-06, -4.9658119678497314e-06, -4.298985004425049e-06, -3.632158041000366e-06, -2.9653310775756836e-06, -2.298504114151001e-06, -1.6316771507263184e-06, -9.648501873016357e-07, -2.980232238769531e-07, 3.688037395477295e-07, 1.0356307029724121e-06, 1.7024576663970947e-06, 2.3692846298217773e-06, 3.03611159324646e-06, 3.7029385566711426e-06, 4.369765520095825e-06, 5.036592483520508e-06, 5.7034194469451904e-06, 6.370246410369873e-06, 7.037073373794556e-06, 7.703900337219238e-06, 8.370727300643921e-06, 9.037554264068604e-06, 9.704381227493286e-06, 1.0371208190917969e-05, 1.1038035154342651e-05, 1.1704862117767334e-05, 1.2371689081192017e-05, 1.30385160446167e-05, 1.3705343008041382e-05, 1.4372169971466064e-05, 1.5038996934890747e-05, 1.570582389831543e-05, 1.6372650861740112e-05, 1.7039477825164795e-05, 1.7706304788589478e-05, 1.837313175201416e-05, 1.9039958715438843e-05, 1.9706785678863525e-05, 2.0373612642288208e-05, 2.104043960571289e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 9.0, 10.0, 16.0, 24.0, 36.0, 62.0, 84.0, 135.0, 189.0, 268.0, 379.0, 543.0, 808.0, 1234.0, 1812.0, 2649.0, 3814.0, 5745.0, 8630.0, 13214.0, 20122.0, 30754.0, 45911.0, 68629.0, 100827.0, 138694.0, 158532.0, 138188.0, 101183.0, 68848.0, 46469.0, 30622.0, 19971.0, 13417.0, 8786.0, 5874.0, 3926.0, 2616.0, 1759.0, 1250.0, 812.0, 556.0, 337.0, 252.0, 179.0, 121.0, 85.0, 58.0, 30.0, 30.0, 15.0, 9.0, 10.0, 11.0, 6.0, 5.0, 2.0, 2.0], "bins": [-0.89697265625, -0.8693771362304688, -0.8417816162109375, -0.8141860961914062, -0.786590576171875, -0.7589950561523438, -0.7313995361328125, -0.7038040161132812, -0.67620849609375, -0.6486129760742188, -0.6210174560546875, -0.5934219360351562, -0.565826416015625, -0.5382308959960938, -0.5106353759765625, -0.48303985595703125, -0.4554443359375, -0.42784881591796875, -0.4002532958984375, -0.37265777587890625, -0.345062255859375, -0.31746673583984375, -0.2898712158203125, -0.26227569580078125, -0.23468017578125, -0.20708465576171875, -0.1794891357421875, -0.15189361572265625, -0.124298095703125, -0.09670257568359375, -0.0691070556640625, -0.04151153564453125, -0.013916015625, 0.01367950439453125, 0.0412750244140625, 0.06887054443359375, 0.096466064453125, 0.12406158447265625, 0.1516571044921875, 0.17925262451171875, 0.20684814453125, 0.23444366455078125, 0.2620391845703125, 0.28963470458984375, 0.317230224609375, 0.34482574462890625, 0.3724212646484375, 0.40001678466796875, 0.4276123046875, 0.45520782470703125, 0.4828033447265625, 0.5103988647460938, 0.537994384765625, 0.5655899047851562, 0.5931854248046875, 0.6207809448242188, 0.64837646484375, 0.6759719848632812, 0.7035675048828125, 0.7311630249023438, 0.758758544921875, 0.7863540649414062, 0.8139495849609375, 0.8415451049804688, 0.869140625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 8.0, 5.0, 5.0, 12.0, 9.0, 7.0, 7.0, 11.0, 7.0, 11.0, 13.0, 24.0, 36.0, 31.0, 48.0, 33.0, 40.0, 35.0, 38.0, 41.0, 48.0, 58.0, 42.0, 60.0, 41.0, 39.0, 33.0, 37.0, 27.0, 40.0, 21.0, 24.0, 22.0, 13.0, 20.0, 13.0, 12.0, 4.0, 6.0, 8.0, 6.0, 4.0, 3.0, 0.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.990234375, -0.9612655639648438, -0.9322967529296875, -0.9033279418945312, -0.874359130859375, -0.8453903198242188, -0.8164215087890625, -0.7874526977539062, -0.75848388671875, -0.7295150756835938, -0.7005462646484375, -0.6715774536132812, -0.642608642578125, -0.6136398315429688, -0.5846710205078125, -0.5557022094726562, -0.5267333984375, -0.49776458740234375, -0.4687957763671875, -0.43982696533203125, -0.410858154296875, -0.38188934326171875, -0.3529205322265625, -0.32395172119140625, -0.29498291015625, -0.26601409912109375, -0.2370452880859375, -0.20807647705078125, -0.179107666015625, -0.15013885498046875, -0.1211700439453125, -0.09220123291015625, -0.063232421875, -0.03426361083984375, -0.0052947998046875, 0.02367401123046875, 0.052642822265625, 0.08161163330078125, 0.1105804443359375, 0.13954925537109375, 0.16851806640625, 0.19748687744140625, 0.2264556884765625, 0.25542449951171875, 0.284393310546875, 0.31336212158203125, 0.3423309326171875, 0.37129974365234375, 0.4002685546875, 0.42923736572265625, 0.4582061767578125, 0.48717498779296875, 0.516143798828125, 0.5451126098632812, 0.5740814208984375, 0.6030502319335938, 0.63201904296875, 0.6609878540039062, 0.6899566650390625, 0.7189254760742188, 0.747894287109375, 0.7768630981445312, 0.8058319091796875, 0.8348007202148438, 0.86376953125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 3.0, 9.0, 11.0, 9.0, 11.0, 12.0, 23.0, 21.0, 14.0, 21.0, 21.0, 26.0, 36.0, 25.0, 37.0, 39.0, 37.0, 35.0, 43.0, 42.0, 43.0, 44.0, 51.0, 37.0, 31.0, 45.0, 31.0, 39.0, 28.0, 28.0, 22.0, 23.0, 25.0, 18.0, 18.0, 13.0, 6.0, 5.0, 10.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.4130859375, -19.76155662536621, -19.110027313232422, -18.458498001098633, -17.806968688964844, -17.155439376831055, -16.503910064697266, -15.852381706237793, -15.200852394104004, -14.549323081970215, -13.897793769836426, -13.246264457702637, -12.594736099243164, -11.943206787109375, -11.291677474975586, -10.640148162841797, -9.988618850708008, -9.337089538574219, -8.68556022644043, -8.03403091430664, -7.38250207901001, -6.730972766876221, -6.07944393157959, -5.427914619445801, -4.776385307312012, -4.124855995178223, -3.4733269214630127, -2.8217978477478027, -2.1702685356140137, -1.5187392234802246, -0.8672101497650146, -0.2156810760498047, 0.4358501434326172, 1.0873793363571167, 1.7389085292816162, 2.390437602996826, 3.0419669151306152, 3.6934962272644043, 4.345025062561035, 4.996554374694824, 5.648083686828613, 6.299612998962402, 6.951142311096191, 7.602671146392822, 8.254199981689453, 8.905729293823242, 9.557258605957031, 10.20878791809082, 10.86031723022461, 11.511846542358398, 12.163375854492188, 12.814905166625977, 13.466434478759766, 14.117963790893555, 14.769492149353027, 15.421021461486816, 16.072551727294922, 16.72408103942871, 17.3756103515625, 18.02713966369629, 18.678668975830078, 19.330198287963867, 19.981727600097656, 20.633255004882812, 21.2847843170166]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 10.0, 8.0, 6.0, 8.0, 10.0, 11.0, 19.0, 18.0, 23.0, 32.0, 33.0, 40.0, 33.0, 46.0, 36.0, 54.0, 43.0, 57.0, 51.0, 46.0, 44.0, 37.0, 33.0, 39.0, 49.0, 33.0, 24.0, 23.0, 25.0, 30.0, 22.0, 19.0, 11.0, 10.0, 6.0, 9.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-38.49296569824219, -37.4401741027832, -36.387386322021484, -35.3345947265625, -34.28180694580078, -33.2290153503418, -32.17622756958008, -31.123435974121094, -30.070648193359375, -29.017858505249023, -27.965068817138672, -26.91227912902832, -25.85948944091797, -24.806699752807617, -23.753910064697266, -22.70111846923828, -21.64832878112793, -20.595539093017578, -19.542749404907227, -18.489959716796875, -17.437170028686523, -16.384380340576172, -15.331589698791504, -14.278800010681152, -13.2260103225708, -12.17322063446045, -11.120430946350098, -10.06764030456543, -9.014850616455078, -7.962061405181885, -6.909271240234375, -5.856481552124023, -4.803691864013672, -3.7509021759033203, -2.6981122493743896, -1.645322322845459, -0.5925326347351074, 0.46025705337524414, 1.513047218322754, 2.5658369064331055, 3.618626594543457, 4.671416282653809, 5.72420597076416, 6.77699613571167, 7.8297858238220215, 8.882575988769531, 9.935365676879883, 10.988155364990234, 12.040945053100586, 13.093734741210938, 14.146524429321289, 15.19931411743164, 16.252103805541992, 17.304893493652344, 18.357685089111328, 19.410472869873047, 20.46326446533203, 21.516054153442383, 22.568843841552734, 23.621633529663086, 24.674423217773438, 25.72721290588379, 26.78000259399414, 27.832794189453125, 28.885581970214844]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 8.0, 16.0, 19.0, 37.0, 36.0, 64.0, 113.0, 158.0, 287.0, 407.0, 727.0, 1152.0, 1778.0, 2827.0, 4417.0, 6682.0, 9925.0, 14485.0, 20731.0, 28913.0, 38795.0, 50093.0, 61786.0, 73414.0, 83316.0, 89585.0, 91048.0, 88703.0, 80786.0, 70861.0, 59635.0, 46858.0, 35922.0, 26578.0, 19260.0, 13366.0, 9051.0, 6074.0, 3941.0, 2489.0, 1555.0, 986.0, 641.0, 376.0, 241.0, 175.0, 90.0, 55.0, 34.0, 23.0, 22.0, 12.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-11.71875, -11.3568115234375, -10.994873046875, -10.6329345703125, -10.27099609375, -9.9090576171875, -9.547119140625, -9.1851806640625, -8.8232421875, -8.4613037109375, -8.099365234375, -7.7374267578125, -7.37548828125, -7.0135498046875, -6.651611328125, -6.2896728515625, -5.927734375, -5.5657958984375, -5.203857421875, -4.8419189453125, -4.47998046875, -4.1180419921875, -3.756103515625, -3.3941650390625, -3.0322265625, -2.6702880859375, -2.308349609375, -1.9464111328125, -1.58447265625, -1.2225341796875, -0.860595703125, -0.4986572265625, -0.13671875, 0.2252197265625, 0.587158203125, 0.9490966796875, 1.31103515625, 1.6729736328125, 2.034912109375, 2.3968505859375, 2.7587890625, 3.1207275390625, 3.482666015625, 3.8446044921875, 4.20654296875, 4.5684814453125, 4.930419921875, 5.2923583984375, 5.654296875, 6.0162353515625, 6.378173828125, 6.7401123046875, 7.10205078125, 7.4639892578125, 7.825927734375, 8.1878662109375, 8.5498046875, 8.9117431640625, 9.273681640625, 9.6356201171875, 9.99755859375, 10.3594970703125, 10.721435546875, 11.0833740234375, 11.4453125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 9.0, 8.0, 8.0, 7.0, 10.0, 10.0, 19.0, 20.0, 23.0, 34.0, 32.0, 41.0, 32.0, 43.0, 40.0, 55.0, 48.0, 54.0, 50.0, 49.0, 39.0, 37.0, 31.0, 47.0, 46.0, 31.0, 23.0, 22.0, 25.0, 32.0, 21.0, 15.0, 12.0, 11.0, 5.0, 8.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-37.625, -36.592529296875, -35.56005859375, -34.527587890625, -33.4951171875, -32.462646484375, -31.43017578125, -30.397705078125, -29.365234375, -28.332763671875, -27.30029296875, -26.267822265625, -25.2353515625, -24.202880859375, -23.17041015625, -22.137939453125, -21.10546875, -20.072998046875, -19.04052734375, -18.008056640625, -16.9755859375, -15.943115234375, -14.91064453125, -13.878173828125, -12.845703125, -11.813232421875, -10.78076171875, -9.748291015625, -8.7158203125, -7.683349609375, -6.65087890625, -5.618408203125, -4.5859375, -3.553466796875, -2.52099609375, -1.488525390625, -0.4560546875, 0.576416015625, 1.60888671875, 2.641357421875, 3.673828125, 4.706298828125, 5.73876953125, 6.771240234375, 7.8037109375, 8.836181640625, 9.86865234375, 10.901123046875, 11.93359375, 12.966064453125, 13.99853515625, 15.031005859375, 16.0634765625, 17.095947265625, 18.12841796875, 19.160888671875, 20.193359375, 21.225830078125, 22.25830078125, 23.290771484375, 24.3232421875, 25.355712890625, 26.38818359375, 27.420654296875, 28.453125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 6.0, 8.0, 11.0, 17.0, 42.0, 70.0, 73.0, 137.0, 189.0, 301.0, 470.0, 703.0, 1130.0, 1657.0, 2395.0, 3707.0, 5373.0, 7712.0, 11226.0, 15655.0, 21532.0, 29349.0, 38031.0, 48330.0, 58819.0, 69357.0, 77733.0, 83580.0, 85727.0, 83561.0, 78452.0, 70120.0, 59452.0, 49306.0, 39302.0, 30131.0, 22492.0, 16088.0, 11689.0, 8144.0, 5515.0, 3697.0, 2467.0, 1632.0, 1137.0, 737.0, 465.0, 313.0, 184.0, 132.0, 75.0, 50.0, 32.0, 15.0, 14.0, 8.0, 10.0, 3.0, 1.0, 3.0, 1.0], "bins": [-11.1015625, -10.7496337890625, -10.397705078125, -10.0457763671875, -9.69384765625, -9.3419189453125, -8.989990234375, -8.6380615234375, -8.2861328125, -7.9342041015625, -7.582275390625, -7.2303466796875, -6.87841796875, -6.5264892578125, -6.174560546875, -5.8226318359375, -5.470703125, -5.1187744140625, -4.766845703125, -4.4149169921875, -4.06298828125, -3.7110595703125, -3.359130859375, -3.0072021484375, -2.6552734375, -2.3033447265625, -1.951416015625, -1.5994873046875, -1.24755859375, -0.8956298828125, -0.543701171875, -0.1917724609375, 0.16015625, 0.5120849609375, 0.864013671875, 1.2159423828125, 1.56787109375, 1.9197998046875, 2.271728515625, 2.6236572265625, 2.9755859375, 3.3275146484375, 3.679443359375, 4.0313720703125, 4.38330078125, 4.7352294921875, 5.087158203125, 5.4390869140625, 5.791015625, 6.1429443359375, 6.494873046875, 6.8468017578125, 7.19873046875, 7.5506591796875, 7.902587890625, 8.2545166015625, 8.6064453125, 8.9583740234375, 9.310302734375, 9.6622314453125, 10.01416015625, 10.3660888671875, 10.718017578125, 11.0699462890625, 11.421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 8.0, 11.0, 11.0, 15.0, 12.0, 15.0, 15.0, 23.0, 25.0, 27.0, 31.0, 25.0, 47.0, 61.0, 48.0, 54.0, 61.0, 50.0, 41.0, 40.0, 52.0, 37.0, 41.0, 30.0, 39.0, 31.0, 33.0, 21.0, 16.0, 10.0, 18.0, 12.0, 12.0, 8.0, 4.0, 9.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.75, -19.0380859375, -18.326171875, -17.6142578125, -16.90234375, -16.1904296875, -15.478515625, -14.7666015625, -14.0546875, -13.3427734375, -12.630859375, -11.9189453125, -11.20703125, -10.4951171875, -9.783203125, -9.0712890625, -8.359375, -7.6474609375, -6.935546875, -6.2236328125, -5.51171875, -4.7998046875, -4.087890625, -3.3759765625, -2.6640625, -1.9521484375, -1.240234375, -0.5283203125, 0.18359375, 0.8955078125, 1.607421875, 2.3193359375, 3.03125, 3.7431640625, 4.455078125, 5.1669921875, 5.87890625, 6.5908203125, 7.302734375, 8.0146484375, 8.7265625, 9.4384765625, 10.150390625, 10.8623046875, 11.57421875, 12.2861328125, 12.998046875, 13.7099609375, 14.421875, 15.1337890625, 15.845703125, 16.5576171875, 17.26953125, 17.9814453125, 18.693359375, 19.4052734375, 20.1171875, 20.8291015625, 21.541015625, 22.2529296875, 22.96484375, 23.6767578125, 24.388671875, 25.1005859375, 25.8125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 2.0, 10.0, 18.0, 33.0, 34.0, 66.0, 100.0, 192.0, 304.0, 491.0, 804.0, 1377.0, 2181.0, 3534.0, 5559.0, 8489.0, 12690.0, 19117.0, 27301.0, 37262.0, 50088.0, 63251.0, 77676.0, 88944.0, 96425.0, 98330.0, 94150.0, 84445.0, 72154.0, 57627.0, 44604.0, 32495.0, 23233.0, 15927.0, 10667.0, 7072.0, 4424.0, 2843.0, 1845.0, 1120.0, 638.0, 430.0, 237.0, 147.0, 98.0, 42.0, 27.0, 18.0, 20.0, 10.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.70703125, -5.52459716796875, -5.3421630859375, -5.15972900390625, -4.977294921875, -4.79486083984375, -4.6124267578125, -4.42999267578125, -4.24755859375, -4.06512451171875, -3.8826904296875, -3.70025634765625, -3.517822265625, -3.33538818359375, -3.1529541015625, -2.97052001953125, -2.7880859375, -2.60565185546875, -2.4232177734375, -2.24078369140625, -2.058349609375, -1.87591552734375, -1.6934814453125, -1.51104736328125, -1.32861328125, -1.14617919921875, -0.9637451171875, -0.78131103515625, -0.598876953125, -0.41644287109375, -0.2340087890625, -0.05157470703125, 0.130859375, 0.31329345703125, 0.4957275390625, 0.67816162109375, 0.860595703125, 1.04302978515625, 1.2254638671875, 1.40789794921875, 1.59033203125, 1.77276611328125, 1.9552001953125, 2.13763427734375, 2.320068359375, 2.50250244140625, 2.6849365234375, 2.86737060546875, 3.0498046875, 3.23223876953125, 3.4146728515625, 3.59710693359375, 3.779541015625, 3.96197509765625, 4.1444091796875, 4.32684326171875, 4.50927734375, 4.69171142578125, 4.8741455078125, 5.05657958984375, 5.239013671875, 5.42144775390625, 5.6038818359375, 5.78631591796875, 5.96875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 5.0, 5.0, 6.0, 5.0, 12.0, 11.0, 22.0, 24.0, 24.0, 22.0, 31.0, 28.0, 29.0, 41.0, 31.0, 47.0, 43.0, 44.0, 43.0, 54.0, 41.0, 47.0, 45.0, 36.0, 40.0, 41.0, 30.0, 30.0, 33.0, 20.0, 16.0, 22.0, 17.0, 7.0, 14.0, 8.0, 5.0, 3.0, 7.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0006995201110839844, -0.000675298273563385, -0.0006510764360427856, -0.0006268545985221863, -0.0006026327610015869, -0.0005784109234809875, -0.0005541890859603882, -0.0005299672484397888, -0.0005057454109191895, -0.0004815235733985901, -0.0004573017358779907, -0.00043307989835739136, -0.000408858060836792, -0.0003846362233161926, -0.00036041438579559326, -0.0003361925482749939, -0.00031197071075439453, -0.00028774887323379517, -0.0002635270357131958, -0.00023930519819259644, -0.00021508336067199707, -0.0001908615231513977, -0.00016663968563079834, -0.00014241784811019897, -0.00011819601058959961, -9.397417306900024e-05, -6.975233554840088e-05, -4.5530498027801514e-05, -2.130866050720215e-05, 2.913177013397217e-06, 2.7135014533996582e-05, 5.135685205459595e-05, 7.557868957519531e-05, 9.980052709579468e-05, 0.00012402236461639404, 0.0001482442021369934, 0.00017246603965759277, 0.00019668787717819214, 0.0002209097146987915, 0.00024513155221939087, 0.00026935338973999023, 0.0002935752272605896, 0.00031779706478118896, 0.00034201890230178833, 0.0003662407398223877, 0.00039046257734298706, 0.0004146844148635864, 0.0004389062523841858, 0.00046312808990478516, 0.0004873499274253845, 0.0005115717649459839, 0.0005357936024665833, 0.0005600154399871826, 0.000584237277507782, 0.0006084591150283813, 0.0006326809525489807, 0.0006569027900695801, 0.0006811246275901794, 0.0007053464651107788, 0.0007295683026313782, 0.0007537901401519775, 0.0007780119776725769, 0.0008022338151931763, 0.0008264556527137756, 0.000850677490234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 19.0, 23.0, 45.0, 48.0, 96.0, 147.0, 243.0, 348.0, 542.0, 815.0, 1313.0, 2044.0, 3244.0, 4889.0, 7225.0, 10685.0, 15802.0, 22600.0, 30709.0, 40629.0, 52768.0, 65030.0, 76240.0, 85860.0, 91199.0, 91906.0, 87441.0, 79188.0, 68361.0, 56044.0, 43566.0, 33191.0, 23949.0, 17314.0, 11764.0, 8096.0, 5323.0, 3443.0, 2305.0, 1509.0, 921.0, 634.0, 383.0, 251.0, 145.0, 84.0, 63.0, 41.0, 34.0, 17.0, 6.0, 9.0, 4.0, 1.0, 1.0], "bins": [-6.4375, -6.24884033203125, -6.0601806640625, -5.87152099609375, -5.682861328125, -5.49420166015625, -5.3055419921875, -5.11688232421875, -4.92822265625, -4.73956298828125, -4.5509033203125, -4.36224365234375, -4.173583984375, -3.98492431640625, -3.7962646484375, -3.60760498046875, -3.4189453125, -3.23028564453125, -3.0416259765625, -2.85296630859375, -2.664306640625, -2.47564697265625, -2.2869873046875, -2.09832763671875, -1.90966796875, -1.72100830078125, -1.5323486328125, -1.34368896484375, -1.155029296875, -0.96636962890625, -0.7777099609375, -0.58905029296875, -0.400390625, -0.21173095703125, -0.0230712890625, 0.16558837890625, 0.354248046875, 0.54290771484375, 0.7315673828125, 0.92022705078125, 1.10888671875, 1.29754638671875, 1.4862060546875, 1.67486572265625, 1.863525390625, 2.05218505859375, 2.2408447265625, 2.42950439453125, 2.6181640625, 2.80682373046875, 2.9954833984375, 3.18414306640625, 3.372802734375, 3.56146240234375, 3.7501220703125, 3.93878173828125, 4.12744140625, 4.31610107421875, 4.5047607421875, 4.69342041015625, 4.882080078125, 5.07073974609375, 5.2593994140625, 5.44805908203125, 5.63671875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 6.0, 3.0, 5.0, 4.0, 3.0, 10.0, 6.0, 7.0, 15.0, 15.0, 17.0, 14.0, 24.0, 25.0, 33.0, 27.0, 34.0, 31.0, 31.0, 29.0, 37.0, 40.0, 50.0, 42.0, 29.0, 38.0, 40.0, 47.0, 40.0, 33.0, 39.0, 29.0, 28.0, 31.0, 18.0, 17.0, 12.0, 13.0, 12.0, 16.0, 14.0, 6.0, 6.0, 9.0, 3.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-3.615234375, -3.508026123046875, -3.40081787109375, -3.293609619140625, -3.1864013671875, -3.079193115234375, -2.97198486328125, -2.864776611328125, -2.757568359375, -2.650360107421875, -2.54315185546875, -2.435943603515625, -2.3287353515625, -2.221527099609375, -2.11431884765625, -2.007110595703125, -1.89990234375, -1.792694091796875, -1.68548583984375, -1.578277587890625, -1.4710693359375, -1.363861083984375, -1.25665283203125, -1.149444580078125, -1.042236328125, -0.935028076171875, -0.82781982421875, -0.720611572265625, -0.6134033203125, -0.506195068359375, -0.39898681640625, -0.291778564453125, -0.1845703125, -0.077362060546875, 0.02984619140625, 0.137054443359375, 0.2442626953125, 0.351470947265625, 0.45867919921875, 0.565887451171875, 0.673095703125, 0.780303955078125, 0.88751220703125, 0.994720458984375, 1.1019287109375, 1.209136962890625, 1.31634521484375, 1.423553466796875, 1.53076171875, 1.637969970703125, 1.74517822265625, 1.852386474609375, 1.9595947265625, 2.066802978515625, 2.17401123046875, 2.281219482421875, 2.388427734375, 2.495635986328125, 2.60284423828125, 2.710052490234375, 2.8172607421875, 2.924468994140625, 3.03167724609375, 3.138885498046875, 3.24609375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 4.0, 3.0, 5.0, 5.0, 11.0, 12.0, 14.0, 7.0, 19.0, 22.0, 25.0, 21.0, 27.0, 30.0, 32.0, 37.0, 51.0, 39.0, 44.0, 47.0, 46.0, 46.0, 37.0, 40.0, 25.0, 43.0, 42.0, 35.0, 40.0, 23.0, 33.0, 25.0, 27.0, 18.0, 14.0, 9.0, 15.0, 9.0, 5.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-23.804046630859375, -23.125524520874023, -22.447002410888672, -21.768478393554688, -21.089956283569336, -20.411434173583984, -19.732912063598633, -19.05438995361328, -18.375865936279297, -17.697343826293945, -17.018821716308594, -16.34029769897461, -15.661775588989258, -14.983253479003906, -14.304731369018555, -13.626208305358887, -12.947686195373535, -12.269164085388184, -11.590641021728516, -10.912118911743164, -10.233595848083496, -9.555073738098145, -8.876550674438477, -8.198028564453125, -7.519505977630615, -6.8409833908081055, -6.162460803985596, -5.483938217163086, -4.805416107177734, -4.126893043518066, -3.448370933532715, -2.769848346710205, -2.0913257598876953, -1.4128031730651855, -0.7342807054519653, -0.05575823783874512, 0.6227643489837646, 1.3012869358062744, 1.979809284210205, 2.658331871032715, 3.3368544578552246, 4.015377044677734, 4.693899631500244, 5.372422218322754, 6.0509443283081055, 6.729467391967773, 7.407989501953125, 8.086511611938477, 8.765034675598145, 9.443556785583496, 10.122079849243164, 10.800601959228516, 11.479125022888184, 12.157647132873535, 12.836170196533203, 13.514692306518555, 14.193214416503906, 14.871736526489258, 15.550259590148926, 16.228782653808594, 16.907304763793945, 17.585826873779297, 18.26434898376465, 18.94287109375, 19.621395111083984]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 1.0, 5.0, 11.0, 12.0, 13.0, 16.0, 15.0, 29.0, 33.0, 34.0, 37.0, 40.0, 37.0, 44.0, 50.0, 56.0, 62.0, 52.0, 45.0, 40.0, 38.0, 39.0, 44.0, 33.0, 39.0, 29.0, 28.0, 24.0, 23.0, 15.0, 10.0, 9.0, 8.0, 8.0, 5.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-44.31892776489258, -43.096038818359375, -41.87314987182617, -40.650264739990234, -39.42737579345703, -38.20448684692383, -36.981597900390625, -35.75870895385742, -34.53582000732422, -33.312931060791016, -32.09004211425781, -30.867155075073242, -29.644268035888672, -28.42137908935547, -27.198490142822266, -25.975601196289062, -24.752716064453125, -23.529827117919922, -22.30694007873535, -21.08405113220215, -19.861164093017578, -18.638275146484375, -17.415386199951172, -16.19249725341797, -14.969610214233398, -13.746722221374512, -12.523834228515625, -11.300945281982422, -10.078057289123535, -8.855169296264648, -7.6322808265686035, -6.409392356872559, -5.186504364013672, -3.963616132736206, -2.7407279014587402, -1.5178396701812744, -0.2949514389038086, 0.9279365539550781, 2.150825023651123, 3.373713493347168, 4.596601486206055, 5.819489479064941, 7.042377948760986, 8.265266418457031, 9.488154411315918, 10.711042404174805, 11.933931350708008, 13.156819343566895, 14.379707336425781, 15.602595329284668, 16.825483322143555, 18.048372268676758, 19.271259307861328, 20.49414825439453, 21.717037200927734, 22.939926147460938, 24.162813186645508, 25.38570213317871, 26.60858917236328, 27.831478118896484, 29.054367065429688, 30.277254104614258, 31.50014305114746, 32.72303009033203, 33.945919036865234]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 9.0, 8.0, 17.0, 21.0, 29.0, 56.0, 108.0, 155.0, 272.0, 483.0, 761.0, 1307.0, 2103.0, 3418.0, 5469.0, 8830.0, 13853.0, 22026.0, 34320.0, 51881.0, 77711.0, 112575.0, 157862.0, 211504.0, 270154.0, 328107.0, 376218.0, 402188.0, 403429.0, 377989.0, 332315.0, 274986.0, 215214.0, 161196.0, 116655.0, 80159.0, 54162.0, 35367.0, 23005.0, 14558.0, 9408.0, 5756.0, 3429.0, 2138.0, 1306.0, 740.0, 412.0, 268.0, 135.0, 91.0, 56.0, 39.0, 17.0, 10.0, 5.0, 3.0, 1.0, 2.0], "bins": [-16.296875, -15.818115234375, -15.33935546875, -14.860595703125, -14.3818359375, -13.903076171875, -13.42431640625, -12.945556640625, -12.466796875, -11.988037109375, -11.50927734375, -11.030517578125, -10.5517578125, -10.072998046875, -9.59423828125, -9.115478515625, -8.63671875, -8.157958984375, -7.67919921875, -7.200439453125, -6.7216796875, -6.242919921875, -5.76416015625, -5.285400390625, -4.806640625, -4.327880859375, -3.84912109375, -3.370361328125, -2.8916015625, -2.412841796875, -1.93408203125, -1.455322265625, -0.9765625, -0.497802734375, -0.01904296875, 0.459716796875, 0.9384765625, 1.417236328125, 1.89599609375, 2.374755859375, 2.853515625, 3.332275390625, 3.81103515625, 4.289794921875, 4.7685546875, 5.247314453125, 5.72607421875, 6.204833984375, 6.68359375, 7.162353515625, 7.64111328125, 8.119873046875, 8.5986328125, 9.077392578125, 9.55615234375, 10.034912109375, 10.513671875, 10.992431640625, 11.47119140625, 11.949951171875, 12.4287109375, 12.907470703125, 13.38623046875, 13.864990234375, 14.34375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 5.0, 6.0, 3.0, 3.0, 12.0, 11.0, 14.0, 14.0, 17.0, 28.0, 38.0, 31.0, 48.0, 32.0, 37.0, 43.0, 60.0, 52.0, 61.0, 57.0, 38.0, 42.0, 42.0, 36.0, 40.0, 35.0, 37.0, 32.0, 23.0, 25.0, 21.0, 12.0, 12.0, 8.0, 8.0, 7.0, 5.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-41.84375, -40.68408203125, -39.5244140625, -38.36474609375, -37.205078125, -36.04541015625, -34.8857421875, -33.72607421875, -32.56640625, -31.40673828125, -30.2470703125, -29.08740234375, -27.927734375, -26.76806640625, -25.6083984375, -24.44873046875, -23.2890625, -22.12939453125, -20.9697265625, -19.81005859375, -18.650390625, -17.49072265625, -16.3310546875, -15.17138671875, -14.01171875, -12.85205078125, -11.6923828125, -10.53271484375, -9.373046875, -8.21337890625, -7.0537109375, -5.89404296875, -4.734375, -3.57470703125, -2.4150390625, -1.25537109375, -0.095703125, 1.06396484375, 2.2236328125, 3.38330078125, 4.54296875, 5.70263671875, 6.8623046875, 8.02197265625, 9.181640625, 10.34130859375, 11.5009765625, 12.66064453125, 13.8203125, 14.97998046875, 16.1396484375, 17.29931640625, 18.458984375, 19.61865234375, 20.7783203125, 21.93798828125, 23.09765625, 24.25732421875, 25.4169921875, 26.57666015625, 27.736328125, 28.89599609375, 30.0556640625, 31.21533203125, 32.375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 4.0, 14.0, 19.0, 42.0, 48.0, 85.0, 153.0, 281.0, 399.0, 693.0, 1078.0, 1848.0, 3027.0, 4686.0, 7462.0, 11960.0, 17919.0, 27120.0, 39600.0, 56893.0, 79347.0, 108899.0, 142614.0, 181015.0, 222370.0, 261585.0, 296914.0, 322971.0, 336436.0, 334184.0, 319606.0, 291748.0, 256421.0, 214272.0, 174650.0, 136334.0, 103348.0, 75518.0, 53577.0, 37256.0, 25257.0, 16964.0, 11071.0, 7033.0, 4522.0, 2758.0, 1704.0, 1022.0, 659.0, 377.0, 224.0, 141.0, 66.0, 43.0, 32.0, 15.0, 5.0, 4.0, 1.0, 1.0, 1.0], "bins": [-13.5859375, -13.1602783203125, -12.734619140625, -12.3089599609375, -11.88330078125, -11.4576416015625, -11.031982421875, -10.6063232421875, -10.1806640625, -9.7550048828125, -9.329345703125, -8.9036865234375, -8.47802734375, -8.0523681640625, -7.626708984375, -7.2010498046875, -6.775390625, -6.3497314453125, -5.924072265625, -5.4984130859375, -5.07275390625, -4.6470947265625, -4.221435546875, -3.7957763671875, -3.3701171875, -2.9444580078125, -2.518798828125, -2.0931396484375, -1.66748046875, -1.2418212890625, -0.816162109375, -0.3905029296875, 0.03515625, 0.4608154296875, 0.886474609375, 1.3121337890625, 1.73779296875, 2.1634521484375, 2.589111328125, 3.0147705078125, 3.4404296875, 3.8660888671875, 4.291748046875, 4.7174072265625, 5.14306640625, 5.5687255859375, 5.994384765625, 6.4200439453125, 6.845703125, 7.2713623046875, 7.697021484375, 8.1226806640625, 8.54833984375, 8.9739990234375, 9.399658203125, 9.8253173828125, 10.2509765625, 10.6766357421875, 11.102294921875, 11.5279541015625, 11.95361328125, 12.3792724609375, 12.804931640625, 13.2305908203125, 13.65625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 8.0, 11.0, 13.0, 12.0, 17.0, 18.0, 26.0, 29.0, 36.0, 40.0, 60.0, 57.0, 89.0, 94.0, 95.0, 125.0, 126.0, 139.0, 140.0, 174.0, 169.0, 172.0, 168.0, 170.0, 188.0, 185.0, 181.0, 187.0, 159.0, 164.0, 126.0, 112.0, 116.0, 113.0, 69.0, 89.0, 88.0, 61.0, 53.0, 40.0, 39.0, 23.0, 26.0, 10.0, 18.0, 10.0, 10.0, 7.0, 4.0, 5.0, 6.0, 1.0, 0.0, 1.0], "bins": [-12.53125, -12.1793212890625, -11.827392578125, -11.4754638671875, -11.12353515625, -10.7716064453125, -10.419677734375, -10.0677490234375, -9.7158203125, -9.3638916015625, -9.011962890625, -8.6600341796875, -8.30810546875, -7.9561767578125, -7.604248046875, -7.2523193359375, -6.900390625, -6.5484619140625, -6.196533203125, -5.8446044921875, -5.49267578125, -5.1407470703125, -4.788818359375, -4.4368896484375, -4.0849609375, -3.7330322265625, -3.381103515625, -3.0291748046875, -2.67724609375, -2.3253173828125, -1.973388671875, -1.6214599609375, -1.26953125, -0.9176025390625, -0.565673828125, -0.2137451171875, 0.13818359375, 0.4901123046875, 0.842041015625, 1.1939697265625, 1.5458984375, 1.8978271484375, 2.249755859375, 2.6016845703125, 2.95361328125, 3.3055419921875, 3.657470703125, 4.0093994140625, 4.361328125, 4.7132568359375, 5.065185546875, 5.4171142578125, 5.76904296875, 6.1209716796875, 6.472900390625, 6.8248291015625, 7.1767578125, 7.5286865234375, 7.880615234375, 8.2325439453125, 8.58447265625, 8.9364013671875, 9.288330078125, 9.6402587890625, 9.9921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 9.0, 4.0, 10.0, 17.0, 16.0, 17.0, 18.0, 28.0, 30.0, 33.0, 32.0, 35.0, 45.0, 41.0, 56.0, 39.0, 42.0, 50.0, 48.0, 45.0, 48.0, 43.0, 38.0, 33.0, 35.0, 24.0, 32.0, 19.0, 16.0, 12.0, 15.0, 19.0, 11.0, 7.0, 5.0, 6.0, 7.0, 2.0, 6.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-28.121347427368164, -27.357515335083008, -26.593685150146484, -25.829853057861328, -25.066022872924805, -24.30219078063965, -23.538360595703125, -22.77452850341797, -22.010696411132812, -21.246864318847656, -20.483034133911133, -19.719202041625977, -18.955371856689453, -18.191539764404297, -17.42770767211914, -16.663877487182617, -15.900046348571777, -15.136215209960938, -14.372384071350098, -13.608552932739258, -12.844720840454102, -12.080889701843262, -11.317058563232422, -10.553226470947266, -9.789396286010742, -9.025565147399902, -8.261734008789062, -7.4979023933410645, -6.734070777893066, -5.970239639282227, -5.206408500671387, -4.442576885223389, -3.6787452697753906, -2.9149138927459717, -2.1510825157165527, -1.387251377105713, -0.623420000076294, 0.140411376953125, 0.9042425155639648, 1.668074131011963, 2.4319052696228027, 3.1957366466522217, 3.9595680236816406, 4.7233991622924805, 5.48723030090332, 6.251061916351318, 7.014893054962158, 7.778724670410156, 8.542555809020996, 9.306386947631836, 10.070218086242676, 10.834049224853516, 11.597881317138672, 12.361712455749512, 13.125543594360352, 13.889375686645508, 14.653205871582031, 15.417037010192871, 16.18086814880371, 16.944700241088867, 17.70853042602539, 18.472362518310547, 19.236194610595703, 20.000024795532227, 20.763856887817383]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 6.0, 5.0, 10.0, 16.0, 10.0, 16.0, 26.0, 24.0, 33.0, 49.0, 45.0, 46.0, 38.0, 49.0, 34.0, 41.0, 48.0, 59.0, 46.0, 52.0, 50.0, 45.0, 35.0, 29.0, 40.0, 26.0, 25.0, 13.0, 16.0, 16.0, 13.0, 9.0, 9.0, 9.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.807777404785156, -51.286956787109375, -49.76613235473633, -48.24531173706055, -46.724491119384766, -45.20366668701172, -43.68284606933594, -42.162025451660156, -40.641204833984375, -39.120384216308594, -37.59955978393555, -36.078739166259766, -34.557918548583984, -33.03709411621094, -31.516273498535156, -29.995452880859375, -28.474628448486328, -26.953805923461914, -25.432985305786133, -23.91216278076172, -22.391342163085938, -20.870519638061523, -19.34969711303711, -17.828876495361328, -16.308053970336914, -14.787232398986816, -13.266410827636719, -11.745588302612305, -10.224766731262207, -8.70394515991211, -7.183122634887695, -5.662301063537598, -4.141475677490234, -2.6206538677215576, -1.0998320579528809, 0.420989990234375, 1.9418115615844727, 3.4626331329345703, 4.983455657958984, 6.504277229309082, 8.02509880065918, 9.545920372009277, 11.066741943359375, 12.587564468383789, 14.108386039733887, 15.629207611083984, 17.1500301361084, 18.670852661132812, 20.191673278808594, 21.712495803833008, 23.23331642150879, 24.754138946533203, 26.274959564208984, 27.7957820892334, 29.316604614257812, 30.837425231933594, 32.358245849609375, 33.879066467285156, 35.3998908996582, 36.920711517333984, 38.441532135009766, 39.96235656738281, 41.483177185058594, 43.003997802734375, 44.52482223510742]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 6.0, 12.0, 19.0, 17.0, 49.0, 77.0, 124.0, 221.0, 322.0, 545.0, 1007.0, 1768.0, 2926.0, 5220.0, 8896.0, 14996.0, 25154.0, 41647.0, 65664.0, 96213.0, 127838.0, 147850.0, 145184.0, 121445.0, 89424.0, 59840.0, 37200.0, 22645.0, 13397.0, 7867.0, 4568.0, 2681.0, 1526.0, 883.0, 524.0, 287.0, 206.0, 120.0, 76.0, 51.0, 23.0, 19.0, 9.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.7890625, -4.634033203125, -4.47900390625, -4.323974609375, -4.1689453125, -4.013916015625, -3.85888671875, -3.703857421875, -3.548828125, -3.393798828125, -3.23876953125, -3.083740234375, -2.9287109375, -2.773681640625, -2.61865234375, -2.463623046875, -2.30859375, -2.153564453125, -1.99853515625, -1.843505859375, -1.6884765625, -1.533447265625, -1.37841796875, -1.223388671875, -1.068359375, -0.913330078125, -0.75830078125, -0.603271484375, -0.4482421875, -0.293212890625, -0.13818359375, 0.016845703125, 0.171875, 0.326904296875, 0.48193359375, 0.636962890625, 0.7919921875, 0.947021484375, 1.10205078125, 1.257080078125, 1.412109375, 1.567138671875, 1.72216796875, 1.877197265625, 2.0322265625, 2.187255859375, 2.34228515625, 2.497314453125, 2.65234375, 2.807373046875, 2.96240234375, 3.117431640625, 3.2724609375, 3.427490234375, 3.58251953125, 3.737548828125, 3.892578125, 4.047607421875, 4.20263671875, 4.357666015625, 4.5126953125, 4.667724609375, 4.82275390625, 4.977783203125, 5.1328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 6.0, 5.0, 10.0, 16.0, 11.0, 14.0, 26.0, 23.0, 32.0, 51.0, 45.0, 44.0, 42.0, 47.0, 33.0, 42.0, 47.0, 60.0, 46.0, 52.0, 51.0, 42.0, 38.0, 29.0, 38.0, 28.0, 23.0, 14.0, 17.0, 16.0, 13.0, 8.0, 10.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.75, -51.22607421875, -49.7021484375, -48.17822265625, -46.654296875, -45.13037109375, -43.6064453125, -42.08251953125, -40.55859375, -39.03466796875, -37.5107421875, -35.98681640625, -34.462890625, -32.93896484375, -31.4150390625, -29.89111328125, -28.3671875, -26.84326171875, -25.3193359375, -23.79541015625, -22.271484375, -20.74755859375, -19.2236328125, -17.69970703125, -16.17578125, -14.65185546875, -13.1279296875, -11.60400390625, -10.080078125, -8.55615234375, -7.0322265625, -5.50830078125, -3.984375, -2.46044921875, -0.9365234375, 0.58740234375, 2.111328125, 3.63525390625, 5.1591796875, 6.68310546875, 8.20703125, 9.73095703125, 11.2548828125, 12.77880859375, 14.302734375, 15.82666015625, 17.3505859375, 18.87451171875, 20.3984375, 21.92236328125, 23.4462890625, 24.97021484375, 26.494140625, 28.01806640625, 29.5419921875, 31.06591796875, 32.58984375, 34.11376953125, 35.6376953125, 37.16162109375, 38.685546875, 40.20947265625, 41.7333984375, 43.25732421875, 44.78125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 12.0, 11.0, 12.0, 24.0, 37.0, 50.0, 85.0, 110.0, 153.0, 220.0, 314.0, 450.0, 662.0, 940.0, 1311.0, 1783.0, 2485.0, 3804.0, 5133.0, 7570.0, 10970.0, 17077.0, 30265.0, 210952.0, 643947.0, 47368.0, 20931.0, 13092.0, 8558.0, 6023.0, 4226.0, 2925.0, 2071.0, 1457.0, 1006.0, 754.0, 528.0, 340.0, 287.0, 191.0, 119.0, 94.0, 72.0, 51.0, 27.0, 20.0, 14.0, 9.0, 3.0, 2.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.6328125, -8.356201171875, -8.07958984375, -7.802978515625, -7.5263671875, -7.249755859375, -6.97314453125, -6.696533203125, -6.419921875, -6.143310546875, -5.86669921875, -5.590087890625, -5.3134765625, -5.036865234375, -4.76025390625, -4.483642578125, -4.20703125, -3.930419921875, -3.65380859375, -3.377197265625, -3.1005859375, -2.823974609375, -2.54736328125, -2.270751953125, -1.994140625, -1.717529296875, -1.44091796875, -1.164306640625, -0.8876953125, -0.611083984375, -0.33447265625, -0.057861328125, 0.21875, 0.495361328125, 0.77197265625, 1.048583984375, 1.3251953125, 1.601806640625, 1.87841796875, 2.155029296875, 2.431640625, 2.708251953125, 2.98486328125, 3.261474609375, 3.5380859375, 3.814697265625, 4.09130859375, 4.367919921875, 4.64453125, 4.921142578125, 5.19775390625, 5.474365234375, 5.7509765625, 6.027587890625, 6.30419921875, 6.580810546875, 6.857421875, 7.134033203125, 7.41064453125, 7.687255859375, 7.9638671875, 8.240478515625, 8.51708984375, 8.793701171875, 9.0703125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 3.0, 11.0, 9.0, 4.0, 6.0, 19.0, 15.0, 21.0, 22.0, 28.0, 17.0, 42.0, 38.0, 32.0, 36.0, 27.0, 37.0, 49.0, 47.0, 50.0, 50.0, 52.0, 44.0, 36.0, 47.0, 28.0, 34.0, 28.0, 21.0, 26.0, 16.0, 14.0, 17.0, 16.0, 10.0, 11.0, 4.0, 5.0, 7.0, 6.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.0, -32.92138671875, -31.8427734375, -30.76416015625, -29.685546875, -28.60693359375, -27.5283203125, -26.44970703125, -25.37109375, -24.29248046875, -23.2138671875, -22.13525390625, -21.056640625, -19.97802734375, -18.8994140625, -17.82080078125, -16.7421875, -15.66357421875, -14.5849609375, -13.50634765625, -12.427734375, -11.34912109375, -10.2705078125, -9.19189453125, -8.11328125, -7.03466796875, -5.9560546875, -4.87744140625, -3.798828125, -2.72021484375, -1.6416015625, -0.56298828125, 0.515625, 1.59423828125, 2.6728515625, 3.75146484375, 4.830078125, 5.90869140625, 6.9873046875, 8.06591796875, 9.14453125, 10.22314453125, 11.3017578125, 12.38037109375, 13.458984375, 14.53759765625, 15.6162109375, 16.69482421875, 17.7734375, 18.85205078125, 19.9306640625, 21.00927734375, 22.087890625, 23.16650390625, 24.2451171875, 25.32373046875, 26.40234375, 27.48095703125, 28.5595703125, 29.63818359375, 30.716796875, 31.79541015625, 32.8740234375, 33.95263671875, 35.03125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 8.0, 10.0, 8.0, 16.0, 11.0, 23.0, 38.0, 52.0, 67.0, 93.0, 162.0, 222.0, 394.0, 597.0, 1014.0, 1632.0, 2817.0, 4786.0, 8663.0, 16152.0, 32562.0, 719503.0, 199812.0, 27750.0, 13952.0, 7623.0, 4243.0, 2467.0, 1517.0, 843.0, 529.0, 329.0, 202.0, 159.0, 91.0, 59.0, 37.0, 35.0, 21.0, 22.0, 12.0, 9.0, 3.0, 2.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0], "bins": [-2.1875, -2.1248016357421875, -2.062103271484375, -1.9994049072265625, -1.93670654296875, -1.8740081787109375, -1.811309814453125, -1.7486114501953125, -1.6859130859375, -1.6232147216796875, -1.560516357421875, -1.4978179931640625, -1.43511962890625, -1.3724212646484375, -1.309722900390625, -1.2470245361328125, -1.184326171875, -1.1216278076171875, -1.058929443359375, -0.9962310791015625, -0.93353271484375, -0.8708343505859375, -0.808135986328125, -0.7454376220703125, -0.6827392578125, -0.6200408935546875, -0.557342529296875, -0.4946441650390625, -0.43194580078125, -0.3692474365234375, -0.306549072265625, -0.2438507080078125, -0.18115234375, -0.1184539794921875, -0.055755615234375, 0.0069427490234375, 0.06964111328125, 0.1323394775390625, 0.195037841796875, 0.2577362060546875, 0.3204345703125, 0.3831329345703125, 0.445831298828125, 0.5085296630859375, 0.57122802734375, 0.6339263916015625, 0.696624755859375, 0.7593231201171875, 0.822021484375, 0.8847198486328125, 0.947418212890625, 1.0101165771484375, 1.07281494140625, 1.1355133056640625, 1.198211669921875, 1.2609100341796875, 1.3236083984375, 1.3863067626953125, 1.449005126953125, 1.5117034912109375, 1.57440185546875, 1.6371002197265625, 1.699798583984375, 1.7624969482421875, 1.8251953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 6.0, 10.0, 10.0, 10.0, 12.0, 22.0, 26.0, 24.0, 29.0, 33.0, 36.0, 42.0, 40.0, 37.0, 57.0, 49.0, 55.0, 48.0, 48.0, 41.0, 42.0, 31.0, 22.0, 45.0, 31.0, 29.0, 21.0, 29.0, 16.0, 17.0, 20.0, 12.0, 13.0, 6.0, 4.0, 4.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7835369110107422e-05, -2.692919224500656e-05, -2.60230153799057e-05, -2.511683851480484e-05, -2.421066164970398e-05, -2.330448478460312e-05, -2.2398307919502258e-05, -2.1492131054401398e-05, -2.0585954189300537e-05, -1.9679777324199677e-05, -1.8773600459098816e-05, -1.7867423593997955e-05, -1.6961246728897095e-05, -1.6055069863796234e-05, -1.5148892998695374e-05, -1.4242716133594513e-05, -1.3336539268493652e-05, -1.2430362403392792e-05, -1.1524185538291931e-05, -1.061800867319107e-05, -9.71183180809021e-06, -8.80565494298935e-06, -7.899478077888489e-06, -6.993301212787628e-06, -6.087124347686768e-06, -5.180947482585907e-06, -4.274770617485046e-06, -3.368593752384186e-06, -2.462416887283325e-06, -1.5562400221824646e-06, -6.50063157081604e-07, 2.561137080192566e-07, 1.1622905731201172e-06, 2.0684674382209778e-06, 2.9746443033218384e-06, 3.880821168422699e-06, 4.7869980335235596e-06, 5.69317489862442e-06, 6.599351763725281e-06, 7.505528628826141e-06, 8.411705493927002e-06, 9.317882359027863e-06, 1.0224059224128723e-05, 1.1130236089229584e-05, 1.2036412954330444e-05, 1.2942589819431305e-05, 1.3848766684532166e-05, 1.4754943549633026e-05, 1.5661120414733887e-05, 1.6567297279834747e-05, 1.7473474144935608e-05, 1.837965101003647e-05, 1.928582787513733e-05, 2.019200474023819e-05, 2.109818160533905e-05, 2.200435847043991e-05, 2.291053533554077e-05, 2.3816712200641632e-05, 2.4722889065742493e-05, 2.5629065930843353e-05, 2.6535242795944214e-05, 2.7441419661045074e-05, 2.8347596526145935e-05, 2.9253773391246796e-05, 3.0159950256347656e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 8.0, 15.0, 11.0, 19.0, 19.0, 31.0, 64.0, 100.0, 130.0, 198.0, 320.0, 517.0, 865.0, 1523.0, 2528.0, 4344.0, 7501.0, 13341.0, 23065.0, 40322.0, 69715.0, 119126.0, 185655.0, 209839.0, 152243.0, 91747.0, 53279.0, 30921.0, 17369.0, 9986.0, 5706.0, 3218.0, 1893.0, 1178.0, 650.0, 377.0, 262.0, 141.0, 121.0, 57.0, 43.0, 32.0, 32.0, 17.0, 9.0, 6.0, 5.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.5703125, -1.5216217041015625, -1.472930908203125, -1.4242401123046875, -1.37554931640625, -1.3268585205078125, -1.278167724609375, -1.2294769287109375, -1.1807861328125, -1.1320953369140625, -1.083404541015625, -1.0347137451171875, -0.98602294921875, -0.9373321533203125, -0.888641357421875, -0.8399505615234375, -0.791259765625, -0.7425689697265625, -0.693878173828125, -0.6451873779296875, -0.59649658203125, -0.5478057861328125, -0.499114990234375, -0.4504241943359375, -0.4017333984375, -0.3530426025390625, -0.304351806640625, -0.2556610107421875, -0.20697021484375, -0.1582794189453125, -0.109588623046875, -0.0608978271484375, -0.01220703125, 0.0364837646484375, 0.085174560546875, 0.1338653564453125, 0.18255615234375, 0.2312469482421875, 0.279937744140625, 0.3286285400390625, 0.3773193359375, 0.4260101318359375, 0.474700927734375, 0.5233917236328125, 0.57208251953125, 0.6207733154296875, 0.669464111328125, 0.7181549072265625, 0.766845703125, 0.8155364990234375, 0.864227294921875, 0.9129180908203125, 0.96160888671875, 1.0102996826171875, 1.058990478515625, 1.1076812744140625, 1.1563720703125, 1.2050628662109375, 1.253753662109375, 1.3024444580078125, 1.35113525390625, 1.3998260498046875, 1.448516845703125, 1.4972076416015625, 1.5458984375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 3.0, 6.0, 6.0, 5.0, 10.0, 20.0, 18.0, 24.0, 28.0, 33.0, 27.0, 31.0, 47.0, 54.0, 43.0, 67.0, 50.0, 44.0, 56.0, 52.0, 48.0, 56.0, 54.0, 34.0, 32.0, 26.0, 21.0, 29.0, 21.0, 19.0, 8.0, 6.0, 7.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7080078125, -1.657012939453125, -1.60601806640625, -1.555023193359375, -1.5040283203125, -1.453033447265625, -1.40203857421875, -1.351043701171875, -1.300048828125, -1.249053955078125, -1.19805908203125, -1.147064208984375, -1.0960693359375, -1.045074462890625, -0.99407958984375, -0.943084716796875, -0.89208984375, -0.841094970703125, -0.79010009765625, -0.739105224609375, -0.6881103515625, -0.637115478515625, -0.58612060546875, -0.535125732421875, -0.484130859375, -0.433135986328125, -0.38214111328125, -0.331146240234375, -0.2801513671875, -0.229156494140625, -0.17816162109375, -0.127166748046875, -0.076171875, -0.025177001953125, 0.02581787109375, 0.076812744140625, 0.1278076171875, 0.178802490234375, 0.22979736328125, 0.280792236328125, 0.331787109375, 0.382781982421875, 0.43377685546875, 0.484771728515625, 0.5357666015625, 0.586761474609375, 0.63775634765625, 0.688751220703125, 0.73974609375, 0.790740966796875, 0.84173583984375, 0.892730712890625, 0.9437255859375, 0.994720458984375, 1.04571533203125, 1.096710205078125, 1.147705078125, 1.198699951171875, 1.24969482421875, 1.300689697265625, 1.3516845703125, 1.402679443359375, 1.45367431640625, 1.504669189453125, 1.5556640625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 5.0, 5.0, 7.0, 12.0, 7.0, 14.0, 14.0, 16.0, 19.0, 23.0, 28.0, 35.0, 31.0, 37.0, 31.0, 41.0, 46.0, 52.0, 42.0, 44.0, 63.0, 32.0, 46.0, 44.0, 43.0, 31.0, 43.0, 24.0, 35.0, 19.0, 22.0, 11.0, 12.0, 20.0, 14.0, 6.0, 10.0, 8.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-27.45720100402832, -26.69425392150879, -25.931306838989258, -25.16836166381836, -24.405414581298828, -23.642467498779297, -22.879520416259766, -22.116573333740234, -21.353628158569336, -20.590681076049805, -19.827733993530273, -19.064788818359375, -18.301841735839844, -17.538894653320312, -16.77594757080078, -16.01300048828125, -15.250054359436035, -14.487107276916504, -13.724161148071289, -12.961214065551758, -12.198267936706543, -11.435320854187012, -10.672374725341797, -9.909427642822266, -9.146480560302734, -8.383533477783203, -7.620587348937988, -6.857640266418457, -6.094694137573242, -5.331747055053711, -4.568800449371338, -3.805853843688965, -3.04290771484375, -2.279961109161377, -1.5170143842697144, -0.7540676593780518, 0.008878946304321289, 0.7718255519866943, 1.5347723960876465, 2.2977190017700195, 3.0606656074523926, 3.8236122131347656, 4.586558818817139, 5.349505424499512, 6.112452507019043, 6.875398635864258, 7.638345718383789, 8.40129280090332, 9.164238929748535, 9.927186012268066, 10.690132141113281, 11.453079223632812, 12.216025352478027, 12.978972434997559, 13.741918563842773, 14.504865646362305, 15.267812728881836, 16.030759811401367, 16.7937068939209, 17.556652069091797, 18.319599151611328, 19.08254623413086, 19.84549331665039, 20.608440399169922, 21.37138557434082]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 7.0, 6.0, 10.0, 15.0, 8.0, 18.0, 21.0, 25.0, 33.0, 47.0, 45.0, 36.0, 48.0, 45.0, 35.0, 33.0, 53.0, 51.0, 55.0, 50.0, 44.0, 49.0, 42.0, 22.0, 37.0, 32.0, 24.0, 19.0, 16.0, 17.0, 8.0, 17.0, 5.0, 11.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.153324127197266, -50.65609359741211, -49.15886306762695, -47.6616325378418, -46.164405822753906, -44.66717529296875, -43.169944763183594, -41.67271423339844, -40.17548370361328, -38.678253173828125, -37.18102264404297, -35.68379211425781, -34.186561584472656, -32.689334869384766, -31.19210433959961, -29.694873809814453, -28.197643280029297, -26.70041275024414, -25.203182220458984, -23.70595359802246, -22.208723068237305, -20.71149253845215, -19.214263916015625, -17.71703338623047, -16.219802856445312, -14.722572326660156, -13.225342750549316, -11.728113174438477, -10.23088264465332, -8.733652114868164, -7.236422538757324, -5.739192962646484, -4.241962432861328, -2.74473237991333, -1.247502326965332, 0.24972772598266602, 1.746957778930664, 3.244187831878662, 4.74141788482666, 6.2386474609375, 7.735877990722656, 9.233108520507812, 10.730338096618652, 12.227567672729492, 13.724798202514648, 15.222028732299805, 16.719257354736328, 18.216487884521484, 19.71371841430664, 21.210948944091797, 22.708179473876953, 24.205408096313477, 25.702638626098633, 27.19986915588379, 28.697097778320312, 30.19432830810547, 31.691558837890625, 33.18878936767578, 34.68601989746094, 36.183250427246094, 37.68048095703125, 39.17770767211914, 40.6749382019043, 42.17216873168945, 43.66939926147461]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 3.0, 9.0, 14.0, 9.0, 30.0, 61.0, 81.0, 161.0, 249.0, 387.0, 596.0, 1012.0, 1598.0, 2653.0, 4027.0, 6169.0, 9468.0, 14263.0, 20972.0, 29735.0, 41111.0, 53637.0, 68173.0, 81063.0, 92356.0, 97925.0, 98374.0, 92031.0, 80435.0, 67483.0, 53876.0, 40528.0, 29549.0, 20557.0, 14076.0, 9292.0, 6051.0, 3938.0, 2520.0, 1537.0, 1034.0, 596.0, 342.0, 221.0, 138.0, 77.0, 48.0, 40.0, 23.0, 12.0, 8.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.875, -12.445556640625, -12.01611328125, -11.586669921875, -11.1572265625, -10.727783203125, -10.29833984375, -9.868896484375, -9.439453125, -9.010009765625, -8.58056640625, -8.151123046875, -7.7216796875, -7.292236328125, -6.86279296875, -6.433349609375, -6.00390625, -5.574462890625, -5.14501953125, -4.715576171875, -4.2861328125, -3.856689453125, -3.42724609375, -2.997802734375, -2.568359375, -2.138916015625, -1.70947265625, -1.280029296875, -0.8505859375, -0.421142578125, 0.00830078125, 0.437744140625, 0.8671875, 1.296630859375, 1.72607421875, 2.155517578125, 2.5849609375, 3.014404296875, 3.44384765625, 3.873291015625, 4.302734375, 4.732177734375, 5.16162109375, 5.591064453125, 6.0205078125, 6.449951171875, 6.87939453125, 7.308837890625, 7.73828125, 8.167724609375, 8.59716796875, 9.026611328125, 9.4560546875, 9.885498046875, 10.31494140625, 10.744384765625, 11.173828125, 11.603271484375, 12.03271484375, 12.462158203125, 12.8916015625, 13.321044921875, 13.75048828125, 14.179931640625, 14.609375]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 7.0, 6.0, 10.0, 14.0, 8.0, 19.0, 21.0, 24.0, 27.0, 51.0, 44.0, 37.0, 47.0, 46.0, 37.0, 33.0, 54.0, 49.0, 56.0, 51.0, 43.0, 48.0, 42.0, 24.0, 34.0, 34.0, 25.0, 19.0, 16.0, 15.0, 11.0, 15.0, 7.0, 10.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.90625, -50.41796875, -48.9296875, -47.44140625, -45.953125, -44.46484375, -42.9765625, -41.48828125, -40.0, -38.51171875, -37.0234375, -35.53515625, -34.046875, -32.55859375, -31.0703125, -29.58203125, -28.09375, -26.60546875, -25.1171875, -23.62890625, -22.140625, -20.65234375, -19.1640625, -17.67578125, -16.1875, -14.69921875, -13.2109375, -11.72265625, -10.234375, -8.74609375, -7.2578125, -5.76953125, -4.28125, -2.79296875, -1.3046875, 0.18359375, 1.671875, 3.16015625, 4.6484375, 6.13671875, 7.625, 9.11328125, 10.6015625, 12.08984375, 13.578125, 15.06640625, 16.5546875, 18.04296875, 19.53125, 21.01953125, 22.5078125, 23.99609375, 25.484375, 26.97265625, 28.4609375, 29.94921875, 31.4375, 32.92578125, 34.4140625, 35.90234375, 37.390625, 38.87890625, 40.3671875, 41.85546875, 43.34375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 8.0, 16.0, 33.0, 53.0, 55.0, 90.0, 163.0, 251.0, 491.0, 876.0, 1684.0, 3488.0, 6817.0, 13437.0, 26353.0, 49632.0, 87819.0, 135897.0, 174512.0, 179511.0, 147334.0, 99309.0, 57332.0, 30928.0, 15994.0, 7971.0, 4023.0, 2085.0, 1042.0, 573.0, 288.0, 195.0, 107.0, 62.0, 44.0, 25.0, 26.0, 11.0, 7.0, 8.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.1875, -34.21337890625, -33.2392578125, -32.26513671875, -31.291015625, -30.31689453125, -29.3427734375, -28.36865234375, -27.39453125, -26.42041015625, -25.4462890625, -24.47216796875, -23.498046875, -22.52392578125, -21.5498046875, -20.57568359375, -19.6015625, -18.62744140625, -17.6533203125, -16.67919921875, -15.705078125, -14.73095703125, -13.7568359375, -12.78271484375, -11.80859375, -10.83447265625, -9.8603515625, -8.88623046875, -7.912109375, -6.93798828125, -5.9638671875, -4.98974609375, -4.015625, -3.04150390625, -2.0673828125, -1.09326171875, -0.119140625, 0.85498046875, 1.8291015625, 2.80322265625, 3.77734375, 4.75146484375, 5.7255859375, 6.69970703125, 7.673828125, 8.64794921875, 9.6220703125, 10.59619140625, 11.5703125, 12.54443359375, 13.5185546875, 14.49267578125, 15.466796875, 16.44091796875, 17.4150390625, 18.38916015625, 19.36328125, 20.33740234375, 21.3115234375, 22.28564453125, 23.259765625, 24.23388671875, 25.2080078125, 26.18212890625, 27.15625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 6.0, 3.0, 7.0, 7.0, 9.0, 19.0, 14.0, 18.0, 19.0, 31.0, 27.0, 37.0, 44.0, 50.0, 60.0, 75.0, 68.0, 54.0, 52.0, 57.0, 47.0, 41.0, 39.0, 35.0, 39.0, 32.0, 27.0, 15.0, 22.0, 10.0, 12.0, 8.0, 7.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.28125, -40.0400390625, -38.798828125, -37.5576171875, -36.31640625, -35.0751953125, -33.833984375, -32.5927734375, -31.3515625, -30.1103515625, -28.869140625, -27.6279296875, -26.38671875, -25.1455078125, -23.904296875, -22.6630859375, -21.421875, -20.1806640625, -18.939453125, -17.6982421875, -16.45703125, -15.2158203125, -13.974609375, -12.7333984375, -11.4921875, -10.2509765625, -9.009765625, -7.7685546875, -6.52734375, -5.2861328125, -4.044921875, -2.8037109375, -1.5625, -0.3212890625, 0.919921875, 2.1611328125, 3.40234375, 4.6435546875, 5.884765625, 7.1259765625, 8.3671875, 9.6083984375, 10.849609375, 12.0908203125, 13.33203125, 14.5732421875, 15.814453125, 17.0556640625, 18.296875, 19.5380859375, 20.779296875, 22.0205078125, 23.26171875, 24.5029296875, 25.744140625, 26.9853515625, 28.2265625, 29.4677734375, 30.708984375, 31.9501953125, 33.19140625, 34.4326171875, 35.673828125, 36.9150390625, 38.15625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 8.0, 16.0, 26.0, 38.0, 46.0, 80.0, 124.0, 202.0, 315.0, 443.0, 751.0, 1215.0, 1944.0, 3029.0, 4579.0, 7220.0, 10944.0, 16245.0, 23602.0, 33267.0, 45420.0, 58418.0, 72876.0, 85837.0, 93979.0, 97800.0, 96177.0, 88645.0, 77068.0, 62786.0, 49145.0, 36786.0, 26417.0, 18318.0, 12293.0, 8157.0, 5150.0, 3390.0, 2124.0, 1375.0, 819.0, 559.0, 342.0, 217.0, 123.0, 85.0, 56.0, 41.0, 28.0, 14.0, 7.0, 8.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.78125, -5.59857177734375, -5.4158935546875, -5.23321533203125, -5.050537109375, -4.86785888671875, -4.6851806640625, -4.50250244140625, -4.31982421875, -4.13714599609375, -3.9544677734375, -3.77178955078125, -3.589111328125, -3.40643310546875, -3.2237548828125, -3.04107666015625, -2.8583984375, -2.67572021484375, -2.4930419921875, -2.31036376953125, -2.127685546875, -1.94500732421875, -1.7623291015625, -1.57965087890625, -1.39697265625, -1.21429443359375, -1.0316162109375, -0.84893798828125, -0.666259765625, -0.48358154296875, -0.3009033203125, -0.11822509765625, 0.064453125, 0.24713134765625, 0.4298095703125, 0.61248779296875, 0.795166015625, 0.97784423828125, 1.1605224609375, 1.34320068359375, 1.52587890625, 1.70855712890625, 1.8912353515625, 2.07391357421875, 2.256591796875, 2.43927001953125, 2.6219482421875, 2.80462646484375, 2.9873046875, 3.16998291015625, 3.3526611328125, 3.53533935546875, 3.718017578125, 3.90069580078125, 4.0833740234375, 4.26605224609375, 4.44873046875, 4.63140869140625, 4.8140869140625, 4.99676513671875, 5.179443359375, 5.36212158203125, 5.5447998046875, 5.72747802734375, 5.91015625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 7.0, 6.0, 11.0, 13.0, 12.0, 16.0, 14.0, 18.0, 21.0, 18.0, 28.0, 28.0, 46.0, 43.0, 43.0, 42.0, 53.0, 67.0, 46.0, 44.0, 48.0, 47.0, 51.0, 30.0, 38.0, 19.0, 34.0, 31.0, 21.0, 16.0, 10.0, 14.0, 14.0, 5.0, 10.0, 8.0, 10.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.0008497238159179688, -0.0008236095309257507, -0.0007974952459335327, -0.0007713809609413147, -0.0007452666759490967, -0.0007191523909568787, -0.0006930381059646606, -0.0006669238209724426, -0.0006408095359802246, -0.0006146952509880066, -0.0005885809659957886, -0.0005624666810035706, -0.0005363523960113525, -0.0005102381110191345, -0.0004841238260269165, -0.0004580095410346985, -0.00043189525604248047, -0.00040578097105026245, -0.00037966668605804443, -0.0003535524010658264, -0.0003274381160736084, -0.0003013238310813904, -0.00027520954608917236, -0.00024909526109695435, -0.00022298097610473633, -0.0001968666911125183, -0.0001707524061203003, -0.00014463812112808228, -0.00011852383613586426, -9.240955114364624e-05, -6.629526615142822e-05, -4.0180981159210205e-05, -1.4066696166992188e-05, 1.204758882522583e-05, 3.816187381744385e-05, 6.427615880966187e-05, 9.039044380187988e-05, 0.0001165047287940979, 0.00014261901378631592, 0.00016873329877853394, 0.00019484758377075195, 0.00022096186876296997, 0.000247076153755188, 0.000273190438747406, 0.000299304723739624, 0.00032541900873184204, 0.00035153329372406006, 0.0003776475787162781, 0.0004037618637084961, 0.0004298761487007141, 0.00045599043369293213, 0.00048210471868515015, 0.0005082190036773682, 0.0005343332886695862, 0.0005604475736618042, 0.0005865618586540222, 0.0006126761436462402, 0.0006387904286384583, 0.0006649047136306763, 0.0006910189986228943, 0.0007171332836151123, 0.0007432475686073303, 0.0007693618535995483, 0.0007954761385917664, 0.0008215904235839844]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 12.0, 9.0, 27.0, 36.0, 68.0, 86.0, 151.0, 214.0, 311.0, 554.0, 878.0, 1377.0, 2201.0, 3268.0, 5197.0, 7659.0, 11356.0, 16376.0, 23218.0, 31585.0, 41552.0, 52597.0, 64345.0, 75144.0, 82974.0, 88135.0, 88596.0, 86231.0, 77025.0, 68437.0, 56608.0, 45380.0, 34530.0, 25683.0, 18261.0, 13008.0, 8781.0, 5971.0, 3840.0, 2535.0, 1645.0, 983.0, 650.0, 372.0, 266.0, 147.0, 105.0, 76.0, 40.0, 31.0, 14.0, 10.0, 1.0, 3.0, 5.0], "bins": [-6.18359375, -6.00775146484375, -5.8319091796875, -5.65606689453125, -5.480224609375, -5.30438232421875, -5.1285400390625, -4.95269775390625, -4.77685546875, -4.60101318359375, -4.4251708984375, -4.24932861328125, -4.073486328125, -3.89764404296875, -3.7218017578125, -3.54595947265625, -3.3701171875, -3.19427490234375, -3.0184326171875, -2.84259033203125, -2.666748046875, -2.49090576171875, -2.3150634765625, -2.13922119140625, -1.96337890625, -1.78753662109375, -1.6116943359375, -1.43585205078125, -1.260009765625, -1.08416748046875, -0.9083251953125, -0.73248291015625, -0.556640625, -0.38079833984375, -0.2049560546875, -0.02911376953125, 0.146728515625, 0.32257080078125, 0.4984130859375, 0.67425537109375, 0.85009765625, 1.02593994140625, 1.2017822265625, 1.37762451171875, 1.553466796875, 1.72930908203125, 1.9051513671875, 2.08099365234375, 2.2568359375, 2.43267822265625, 2.6085205078125, 2.78436279296875, 2.960205078125, 3.13604736328125, 3.3118896484375, 3.48773193359375, 3.66357421875, 3.83941650390625, 4.0152587890625, 4.19110107421875, 4.366943359375, 4.54278564453125, 4.7186279296875, 4.89447021484375, 5.0703125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 6.0, 4.0, 4.0, 7.0, 8.0, 15.0, 11.0, 19.0, 16.0, 23.0, 27.0, 29.0, 25.0, 32.0, 41.0, 50.0, 50.0, 42.0, 54.0, 59.0, 55.0, 45.0, 55.0, 41.0, 49.0, 40.0, 32.0, 22.0, 33.0, 23.0, 21.0, 14.0, 12.0, 12.0, 9.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.59765625, -4.46563720703125, -4.3336181640625, -4.20159912109375, -4.069580078125, -3.93756103515625, -3.8055419921875, -3.67352294921875, -3.54150390625, -3.40948486328125, -3.2774658203125, -3.14544677734375, -3.013427734375, -2.88140869140625, -2.7493896484375, -2.61737060546875, -2.4853515625, -2.35333251953125, -2.2213134765625, -2.08929443359375, -1.957275390625, -1.82525634765625, -1.6932373046875, -1.56121826171875, -1.42919921875, -1.29718017578125, -1.1651611328125, -1.03314208984375, -0.901123046875, -0.76910400390625, -0.6370849609375, -0.50506591796875, -0.373046875, -0.24102783203125, -0.1090087890625, 0.02301025390625, 0.155029296875, 0.28704833984375, 0.4190673828125, 0.55108642578125, 0.68310546875, 0.81512451171875, 0.9471435546875, 1.07916259765625, 1.211181640625, 1.34320068359375, 1.4752197265625, 1.60723876953125, 1.7392578125, 1.87127685546875, 2.0032958984375, 2.13531494140625, 2.267333984375, 2.39935302734375, 2.5313720703125, 2.66339111328125, 2.79541015625, 2.92742919921875, 3.0594482421875, 3.19146728515625, 3.323486328125, 3.45550537109375, 3.5875244140625, 3.71954345703125, 3.8515625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 7.0, 9.0, 5.0, 16.0, 7.0, 18.0, 15.0, 14.0, 27.0, 28.0, 30.0, 32.0, 43.0, 34.0, 53.0, 35.0, 41.0, 39.0, 48.0, 40.0, 49.0, 36.0, 37.0, 43.0, 31.0, 39.0, 33.0, 23.0, 23.0, 31.0, 18.0, 14.0, 20.0, 10.0, 8.0, 6.0, 7.0, 13.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-27.508285522460938, -26.743144989013672, -25.97800636291504, -25.212865829467773, -24.447725296020508, -23.682586669921875, -22.91744613647461, -22.152305603027344, -21.387165069580078, -20.622024536132812, -19.85688591003418, -19.091745376586914, -18.32660484313965, -17.561466217041016, -16.79632568359375, -16.031185150146484, -15.266046524047852, -14.500906944274902, -13.735766410827637, -12.970626831054688, -12.205486297607422, -11.440346717834473, -10.675207138061523, -9.910066604614258, -9.144927024841309, -8.37978744506836, -7.614646911621094, -6.8495073318481445, -6.084367275238037, -5.31922721862793, -4.5540876388549805, -3.788947582244873, -3.0238094329833984, -2.258669376373291, -1.4935295581817627, -0.7283897399902344, 0.03675031661987305, 0.8018903732299805, 1.5670299530029297, 2.332170009613037, 3.0973100662231445, 3.862450122833252, 4.627590179443359, 5.392729759216309, 6.157869815826416, 6.923009872436523, 7.688149452209473, 8.453289031982422, 9.218429565429688, 9.983569145202637, 10.748709678649902, 11.513849258422852, 12.278989791870117, 13.044129371643066, 13.809268951416016, 14.574409484863281, 15.33954906463623, 16.10468864440918, 16.869829177856445, 17.634967803955078, 18.400108337402344, 19.16524887084961, 19.930389404296875, 20.695528030395508, 21.460668563842773]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 10.0, 8.0, 15.0, 17.0, 16.0, 27.0, 17.0, 29.0, 27.0, 41.0, 43.0, 38.0, 44.0, 44.0, 46.0, 44.0, 40.0, 49.0, 36.0, 48.0, 62.0, 48.0, 35.0, 34.0, 35.0, 27.0, 30.0, 19.0, 20.0, 15.0, 11.0, 10.0, 5.0, 3.0, 2.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.12012481689453, -66.9241714477539, -64.72821807861328, -62.53226089477539, -60.3363037109375, -58.140350341796875, -55.94439697265625, -53.74843978881836, -51.55248260498047, -49.356529235839844, -47.16057205200195, -44.96461868286133, -42.76866149902344, -40.57270812988281, -38.37675476074219, -36.1807975769043, -33.98484420776367, -31.788888931274414, -29.592933654785156, -27.39698028564453, -25.20102310180664, -23.005069732666016, -20.809114456176758, -18.6131591796875, -16.417203903198242, -14.221248626708984, -12.025293350219727, -9.829339027404785, -7.633383750915527, -5.4374284744262695, -3.241474151611328, -1.0455188751220703, 1.1504364013671875, 3.346391439437866, 5.542346477508545, 7.7383012771606445, 9.934256553649902, 12.13021183013916, 14.326166152954102, 16.52212142944336, 18.718076705932617, 20.914031982421875, 23.109987258911133, 25.30594253540039, 27.501895904541016, 29.697853088378906, 31.89380645751953, 34.089759826660156, 36.28571701049805, 38.48167037963867, 40.67762756347656, 42.87358093261719, 45.06953811645508, 47.2654914855957, 49.461448669433594, 51.65740203857422, 53.853355407714844, 56.04930877685547, 58.24526596069336, 60.441219329833984, 62.637176513671875, 64.8331298828125, 67.02908325195312, 69.22503662109375, 71.4209976196289]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 6.0, 3.0, 11.0, 7.0, 18.0, 35.0, 39.0, 53.0, 69.0, 108.0, 146.0, 194.0, 289.0, 408.0, 574.0, 822.0, 1076.0, 1566.0, 2082.0, 2685.0, 3317.0, 4244.0, 4979.0, 1003761.0, 5037.0, 4480.0, 3601.0, 2885.0, 2288.0, 1642.0, 1205.0, 853.0, 613.0, 446.0, 309.0, 198.0, 142.0, 102.0, 84.0, 59.0, 46.0, 34.0, 25.0, 17.0, 11.0, 8.0, 12.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-207.1431121826172, -200.37997436523438, -193.6168212890625, -186.8536834716797, -180.09054565429688, -173.327392578125, -166.5642547607422, -159.80111694335938, -153.0379638671875, -146.2748260498047, -139.5116729736328, -132.74853515625, -125.98538970947266, -119.22224426269531, -112.4591064453125, -105.69596099853516, -98.93281555175781, -92.16967010498047, -85.40652465820312, -78.64338684082031, -71.88024139404297, -65.11709594726562, -58.35395431518555, -51.59081268310547, -44.827667236328125, -38.06452178955078, -31.301380157470703, -24.538236618041992, -17.77509307861328, -11.011947631835938, -4.248805999755859, 2.5143356323242188, 9.277481079101562, 16.040624618530273, 22.803768157958984, 29.566911697387695, 36.330055236816406, 43.09320068359375, 49.85634231567383, 56.619483947753906, 63.38262939453125, 70.1457748413086, 76.90892028808594, 83.67205810546875, 90.4352035522461, 97.19834899902344, 103.96148681640625, 110.7246322631836, 117.48777770996094, 124.25092315673828, 131.01406860351562, 137.77720642089844, 144.54034423828125, 151.30349731445312, 158.06663513183594, 164.82977294921875, 171.59292602539062, 178.35606384277344, 185.1192169189453, 191.88235473632812, 198.6455078125, 205.4086456298828, 212.17178344726562, 218.9349365234375, 225.6980743408203]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 6.0, 6.0, 3.0, 11.0, 5.0, 14.0, 21.0, 30.0, 39.0, 42.0, 65.0, 93.0, 130.0, 226.0, 282.0, 413.0, 539.0, 772.0, 1073.0, 1574.0, 2199.0, 3050.0, 4428.0, 5970.0, 8916.0, 13447.0, 21888.0, 44510.0, 51263652.0, 37221.0, 20250.0, 12390.0, 8336.0, 5739.0, 3981.0, 2931.0, 2067.0, 1470.0, 1060.0, 734.0, 553.0, 344.0, 256.0, 181.0, 131.0, 85.0, 64.0, 45.0, 24.0, 28.0, 13.0, 15.0, 10.0, 4.0, 4.0, 9.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-154.3770294189453, -149.4623565673828, -144.54766845703125, -139.63299560546875, -134.7183074951172, -129.8036346435547, -124.88894653320312, -119.97427368164062, -115.05958557128906, -110.14490509033203, -105.230224609375, -100.31554412841797, -95.40086364746094, -90.4861831665039, -85.57150268554688, -80.65682983398438, -75.74214935302734, -70.82746887207031, -65.91278839111328, -60.99810791015625, -56.08342742919922, -51.16874694824219, -46.25407028198242, -41.33938980102539, -36.42470932006836, -31.510028839111328, -26.595348358154297, -21.6806697845459, -16.765989303588867, -11.851308822631836, -6.9366302490234375, -2.0219497680664062, 2.892730712890625, 7.807410717010498, 12.722090721130371, 17.636770248413086, 22.551450729370117, 27.46613121032715, 32.38080978393555, 37.29549026489258, 42.21017074584961, 47.12485122680664, 52.03953170776367, 56.95420837402344, 61.86888885498047, 66.7835693359375, 71.69824981689453, 76.61293029785156, 81.5276107788086, 86.44229125976562, 91.35697174072266, 96.27165222167969, 101.18633270263672, 106.10101318359375, 111.01568603515625, 115.93037414550781, 120.84504699707031, 125.75972747802734, 130.67440795898438, 135.58908081054688, 140.50376892089844, 145.41844177246094, 150.3331298828125, 155.247802734375, 160.16249084472656]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 6.0, 17.0, 18.0, 17.0, 40.0, 58.0, 87.0, 125.0, 171.0, 153.0, 111.0, 71.0, 56.0, 22.0, 22.0, 15.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-866.084716796875, -841.707275390625, -817.329833984375, -792.952392578125, -768.5748901367188, -744.1974487304688, -719.8200073242188, -695.4425659179688, -671.0650634765625, -646.6876220703125, -622.3101806640625, -597.9327392578125, -573.5552368164062, -549.1777954101562, -524.8003540039062, -500.42291259765625, -476.04547119140625, -451.66802978515625, -427.2905578613281, -402.9131164550781, -378.53564453125, -354.158203125, -329.78076171875, -305.4033203125, -281.0258483886719, -256.6484069824219, -232.27093505859375, -207.89349365234375, -183.5160369873047, -159.13858032226562, -134.76113891601562, -110.38368225097656, -86.00616455078125, -61.62871170043945, -37.251258850097656, -12.873809814453125, 11.503646850585938, 35.881103515625, 60.258544921875, 84.63600158691406, 109.01345825195312, 133.3909149169922, 157.76837158203125, 182.14581298828125, 206.5232696533203, 230.90072631835938, 255.27816772460938, 279.6556396484375, 304.0330810546875, 328.4105224609375, 352.7879943847656, 377.1654357910156, 401.54290771484375, 425.92034912109375, 450.29779052734375, 474.67523193359375, 499.0527038574219, 523.43017578125, 547.8076171875, 572.18505859375, 596.5625, 620.93994140625, 645.3173828125, 669.6948852539062, 694.0723266601562]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 5.0, 5.0, 6.0, 9.0, 8.0, 11.0, 13.0, 18.0, 17.0, 23.0, 25.0, 28.0, 38.0, 50.0, 49.0, 72.0, 81.0, 90.0, 87.0, 59.0, 44.0, 42.0, 40.0, 30.0, 35.0, 18.0, 24.0, 17.0, 11.0, 8.0, 9.0, 9.0, 9.0, 5.0, 6.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-619.3272094726562, -597.7445068359375, -576.1618041992188, -554.5791015625, -532.996337890625, -511.41363525390625, -489.8309326171875, -468.24822998046875, -446.6654968261719, -425.0827941894531, -403.50006103515625, -381.9173583984375, -360.33465576171875, -338.7519226074219, -317.1692199707031, -295.58648681640625, -274.0037841796875, -252.4210662841797, -230.83834838867188, -209.25564575195312, -187.6729278564453, -166.0902099609375, -144.50750732421875, -122.92478942871094, -101.34207153320312, -79.75935363769531, -58.17664337158203, -36.59393310546875, -15.011215209960938, 6.571502685546875, 28.154205322265625, 49.73692321777344, 71.319580078125, 92.90229797363281, 114.4850082397461, 136.06771850585938, 157.6504364013672, 179.233154296875, 200.81585693359375, 222.39857482910156, 243.98129272460938, 265.5639953613281, 287.146728515625, 308.72943115234375, 330.3121337890625, 351.8948669433594, 373.4775695800781, 395.060302734375, 416.64300537109375, 438.2257080078125, 459.8084411621094, 481.3911437988281, 502.973876953125, 524.5565795898438, 546.1392822265625, 567.7219848632812, 589.3046875, 610.8873901367188, 632.4700927734375, 654.0528564453125, 675.6355590820312, 697.21826171875, 718.8009643554688, 740.3836669921875, 761.9664306640625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 2.0, 2.0, 2.0, 6.0, 6.0, 6.0, 17.0, 15.0, 10.0, 37.0, 21.0, 36.0, 55.0, 71.0, 90.0, 114.0, 168.0, 290.0, 336.0, 503.0, 770.0, 1173.0, 1808.0, 2930.0, 4785.0, 8644.0, 17421.0, 41492.0, 119058.0, 493207.0, 3040321.0, 307157.0, 87234.0, 32884.0, 15013.0, 7660.0, 4302.0, 2537.0, 1438.0, 919.0, 617.0, 401.0, 233.0, 166.0, 97.0, 85.0, 47.0, 34.0, 24.0, 12.0, 14.0, 2.0, 6.0, 3.0, 2.0, 2.0, 3.0], "bins": [-20.890625, -20.3314208984375, -19.772216796875, -19.2130126953125, -18.65380859375, -18.0946044921875, -17.535400390625, -16.9761962890625, -16.4169921875, -15.8577880859375, -15.298583984375, -14.7393798828125, -14.18017578125, -13.6209716796875, -13.061767578125, -12.5025634765625, -11.943359375, -11.3841552734375, -10.824951171875, -10.2657470703125, -9.70654296875, -9.1473388671875, -8.588134765625, -8.0289306640625, -7.4697265625, -6.9105224609375, -6.351318359375, -5.7921142578125, -5.23291015625, -4.6737060546875, -4.114501953125, -3.5552978515625, -2.99609375, -2.4368896484375, -1.877685546875, -1.3184814453125, -0.75927734375, -0.2000732421875, 0.359130859375, 0.9183349609375, 1.4775390625, 2.0367431640625, 2.595947265625, 3.1551513671875, 3.71435546875, 4.2735595703125, 4.832763671875, 5.3919677734375, 5.951171875, 6.5103759765625, 7.069580078125, 7.6287841796875, 8.18798828125, 8.7471923828125, 9.306396484375, 9.8656005859375, 10.4248046875, 10.9840087890625, 11.543212890625, 12.1024169921875, 12.66162109375, 13.2208251953125, 13.780029296875, 14.3392333984375, 14.8984375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 3.0, 7.0, 10.0, 22.0, 22.0, 35.0, 58.0, 66.0, 93.0, 104.0, 113.0, 127.0, 96.0, 82.0, 47.0, 31.0, 26.0, 18.0, 8.0, 6.0, 7.0, 7.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.31396484375, -2.2470703125, -2.18017578125, -2.11328125, -2.04638671875, -1.9794921875, -1.91259765625, -1.845703125, -1.77880859375, -1.7119140625, -1.64501953125, -1.578125, -1.51123046875, -1.4443359375, -1.37744140625, -1.310546875, -1.24365234375, -1.1767578125, -1.10986328125, -1.04296875, -0.97607421875, -0.9091796875, -0.84228515625, -0.775390625, -0.70849609375, -0.6416015625, -0.57470703125, -0.5078125, -0.44091796875, -0.3740234375, -0.30712890625, -0.240234375, -0.17333984375, -0.1064453125, -0.03955078125, 0.02734375, 0.09423828125, 0.1611328125, 0.22802734375, 0.294921875, 0.36181640625, 0.4287109375, 0.49560546875, 0.5625, 0.62939453125, 0.6962890625, 0.76318359375, 0.830078125, 0.89697265625, 0.9638671875, 1.03076171875, 1.09765625, 1.16455078125, 1.2314453125, 1.29833984375, 1.365234375, 1.43212890625, 1.4990234375, 1.56591796875, 1.6328125, 1.69970703125, 1.7666015625, 1.83349609375, 1.900390625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 9.0, 3.0, 10.0, 17.0, 13.0, 21.0, 46.0, 74.0, 99.0, 183.0, 326.0, 569.0, 1276.0, 3056.0, 8397.0, 28137.0, 131057.0, 1177703.0, 2605136.0, 183358.0, 37105.0, 10643.0, 3779.0, 1541.0, 765.0, 354.0, 202.0, 131.0, 87.0, 54.0, 32.0, 35.0, 17.0, 17.0, 7.0, 11.0, 7.0, 6.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.0625, -15.44677734375, -14.8310546875, -14.21533203125, -13.599609375, -12.98388671875, -12.3681640625, -11.75244140625, -11.13671875, -10.52099609375, -9.9052734375, -9.28955078125, -8.673828125, -8.05810546875, -7.4423828125, -6.82666015625, -6.2109375, -5.59521484375, -4.9794921875, -4.36376953125, -3.748046875, -3.13232421875, -2.5166015625, -1.90087890625, -1.28515625, -0.66943359375, -0.0537109375, 0.56201171875, 1.177734375, 1.79345703125, 2.4091796875, 3.02490234375, 3.640625, 4.25634765625, 4.8720703125, 5.48779296875, 6.103515625, 6.71923828125, 7.3349609375, 7.95068359375, 8.56640625, 9.18212890625, 9.7978515625, 10.41357421875, 11.029296875, 11.64501953125, 12.2607421875, 12.87646484375, 13.4921875, 14.10791015625, 14.7236328125, 15.33935546875, 15.955078125, 16.57080078125, 17.1865234375, 17.80224609375, 18.41796875, 19.03369140625, 19.6494140625, 20.26513671875, 20.880859375, 21.49658203125, 22.1123046875, 22.72802734375, 23.34375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 4.0, 5.0, 11.0, 15.0, 6.0, 11.0, 17.0, 30.0, 38.0, 32.0, 62.0, 72.0, 76.0, 112.0, 173.0, 196.0, 260.0, 459.0, 1008.0, 406.0, 244.0, 163.0, 125.0, 103.0, 87.0, 73.0, 50.0, 55.0, 43.0, 35.0, 20.0, 23.0, 14.0, 10.0, 11.0, 7.0, 4.0, 5.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.822265625, -3.70428466796875, -3.5863037109375, -3.46832275390625, -3.350341796875, -3.23236083984375, -3.1143798828125, -2.99639892578125, -2.87841796875, -2.76043701171875, -2.6424560546875, -2.52447509765625, -2.406494140625, -2.28851318359375, -2.1705322265625, -2.05255126953125, -1.9345703125, -1.81658935546875, -1.6986083984375, -1.58062744140625, -1.462646484375, -1.34466552734375, -1.2266845703125, -1.10870361328125, -0.99072265625, -0.87274169921875, -0.7547607421875, -0.63677978515625, -0.518798828125, -0.40081787109375, -0.2828369140625, -0.16485595703125, -0.046875, 0.07110595703125, 0.1890869140625, 0.30706787109375, 0.425048828125, 0.54302978515625, 0.6610107421875, 0.77899169921875, 0.89697265625, 1.01495361328125, 1.1329345703125, 1.25091552734375, 1.368896484375, 1.48687744140625, 1.6048583984375, 1.72283935546875, 1.8408203125, 1.95880126953125, 2.0767822265625, 2.19476318359375, 2.312744140625, 2.43072509765625, 2.5487060546875, 2.66668701171875, 2.78466796875, 2.90264892578125, 3.0206298828125, 3.13861083984375, 3.256591796875, 3.37457275390625, 3.4925537109375, 3.61053466796875, 3.728515625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 8.0, 52.0, 164.0, 309.0, 288.0, 110.0, 50.0, 11.0, 8.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.61771583557129, -23.596031188964844, -20.57434844970703, -17.552663803100586, -14.530980110168457, -11.509296417236328, -8.487611770629883, -5.46592903137207, -2.444244384765625, 0.577439546585083, 3.599123477935791, 6.620807647705078, 9.642491340637207, 12.664175033569336, 15.685859680175781, 18.707542419433594, 21.72922706604004, 24.750911712646484, 27.772594451904297, 30.794279098510742, 33.81596374511719, 36.837646484375, 39.85932922363281, 42.881011962890625, 45.9026985168457, 48.924381256103516, 51.946067810058594, 54.967750549316406, 57.98943328857422, 61.01111602783203, 64.03280639648438, 67.05448913574219, 70.07616424560547, 73.09784698486328, 76.1195297241211, 79.14122009277344, 82.16290283203125, 85.18458557128906, 88.20626831054688, 91.22795104980469, 94.2496337890625, 97.27131652832031, 100.29299926757812, 103.31468200683594, 106.33637237548828, 109.3580551147461, 112.3797378540039, 115.40142059326172, 118.42311096191406, 121.44479370117188, 124.46647644042969, 127.4881591796875, 130.5098419189453, 133.53152465820312, 136.55322265625, 139.57489013671875, 142.59657287597656, 145.61825561523438, 148.6399383544922, 151.66162109375, 154.6833038330078, 157.70498657226562, 160.7266845703125, 163.74835205078125, 166.77005004882812]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 11.0, 24.0, 26.0, 31.0, 28.0, 25.0, 49.0, 55.0, 69.0, 64.0, 75.0, 77.0, 58.0, 71.0, 73.0, 60.0, 40.0, 40.0, 26.0, 22.0, 16.0, 15.0, 8.0, 9.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.414440155029297, -23.446041107177734, -22.47764015197754, -21.509241104125977, -20.54084014892578, -19.57244110107422, -18.604042053222656, -17.635643005371094, -16.6672420501709, -15.69884204864502, -14.73044204711914, -13.762042999267578, -12.7936429977417, -11.82524299621582, -10.856843948364258, -9.888443946838379, -8.9200439453125, -7.951643943786621, -6.9832444190979, -6.01484489440918, -5.046444892883301, -4.078044891357422, -3.109645366668701, -2.1412458419799805, -1.1728458404541016, -0.20444607734680176, 0.763953685760498, 1.7323534488677979, 2.7007532119750977, 3.6691532135009766, 4.637552738189697, 5.605952262878418, 6.574352264404297, 7.542752265930176, 8.511152267456055, 9.479551315307617, 10.447951316833496, 11.416351318359375, 12.384750366210938, 13.353150367736816, 14.321550369262695, 15.289950370788574, 16.258350372314453, 17.226749420166016, 18.195148468017578, 19.163549423217773, 20.131948471069336, 21.10034942626953, 22.068748474121094, 23.037147521972656, 24.00554847717285, 24.973947525024414, 25.94234848022461, 26.910747528076172, 27.879146575927734, 28.847545623779297, 29.815946578979492, 30.784345626831055, 31.75274658203125, 32.72114562988281, 33.689544677734375, 34.65794372558594, 35.626346588134766, 36.59474563598633, 37.56314468383789]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 12.0, 8.0, 21.0, 24.0, 37.0, 53.0, 68.0, 131.0, 160.0, 225.0, 378.0, 518.0, 840.0, 1354.0, 2224.0, 3530.0, 6036.0, 11561.0, 25127.0, 62139.0, 173899.0, 376898.0, 235857.0, 82906.0, 32229.0, 14251.0, 7107.0, 4051.0, 2485.0, 1533.0, 1009.0, 619.0, 409.0, 268.0, 193.0, 121.0, 90.0, 66.0, 33.0, 30.0, 20.0, 9.0, 9.0, 7.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.625, -13.2076416015625, -12.790283203125, -12.3729248046875, -11.95556640625, -11.5382080078125, -11.120849609375, -10.7034912109375, -10.2861328125, -9.8687744140625, -9.451416015625, -9.0340576171875, -8.61669921875, -8.1993408203125, -7.781982421875, -7.3646240234375, -6.947265625, -6.5299072265625, -6.112548828125, -5.6951904296875, -5.27783203125, -4.8604736328125, -4.443115234375, -4.0257568359375, -3.6083984375, -3.1910400390625, -2.773681640625, -2.3563232421875, -1.93896484375, -1.5216064453125, -1.104248046875, -0.6868896484375, -0.26953125, 0.1478271484375, 0.565185546875, 0.9825439453125, 1.39990234375, 1.8172607421875, 2.234619140625, 2.6519775390625, 3.0693359375, 3.4866943359375, 3.904052734375, 4.3214111328125, 4.73876953125, 5.1561279296875, 5.573486328125, 5.9908447265625, 6.408203125, 6.8255615234375, 7.242919921875, 7.6602783203125, 8.07763671875, 8.4949951171875, 8.912353515625, 9.3297119140625, 9.7470703125, 10.1644287109375, 10.581787109375, 10.9991455078125, 11.41650390625, 11.8338623046875, 12.251220703125, 12.6685791015625, 13.0859375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 1.0, 5.0, 2.0, 15.0, 11.0, 15.0, 19.0, 38.0, 42.0, 65.0, 67.0, 85.0, 93.0, 113.0, 87.0, 73.0, 71.0, 56.0, 33.0, 22.0, 27.0, 18.0, 5.0, 5.0, 8.0, 7.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.099609375, -2.03662109375, -1.9736328125, -1.91064453125, -1.84765625, -1.78466796875, -1.7216796875, -1.65869140625, -1.595703125, -1.53271484375, -1.4697265625, -1.40673828125, -1.34375, -1.28076171875, -1.2177734375, -1.15478515625, -1.091796875, -1.02880859375, -0.9658203125, -0.90283203125, -0.83984375, -0.77685546875, -0.7138671875, -0.65087890625, -0.587890625, -0.52490234375, -0.4619140625, -0.39892578125, -0.3359375, -0.27294921875, -0.2099609375, -0.14697265625, -0.083984375, -0.02099609375, 0.0419921875, 0.10498046875, 0.16796875, 0.23095703125, 0.2939453125, 0.35693359375, 0.419921875, 0.48291015625, 0.5458984375, 0.60888671875, 0.671875, 0.73486328125, 0.7978515625, 0.86083984375, 0.923828125, 0.98681640625, 1.0498046875, 1.11279296875, 1.17578125, 1.23876953125, 1.3017578125, 1.36474609375, 1.427734375, 1.49072265625, 1.5537109375, 1.61669921875, 1.6796875, 1.74267578125, 1.8056640625, 1.86865234375, 1.931640625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 7.0, 2.0, 3.0, 2.0, 6.0, 7.0, 12.0, 12.0, 16.0, 43.0, 47.0, 80.0, 142.0, 263.0, 477.0, 991.0, 1818.0, 3931.0, 8857.0, 23188.0, 97476.0, 572863.0, 267506.0, 44996.0, 14363.0, 5932.0, 2697.0, 1286.0, 707.0, 360.0, 198.0, 104.0, 67.0, 30.0, 24.0, 12.0, 5.0, 12.0, 5.0, 3.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.453125, -17.8720703125, -17.291015625, -16.7099609375, -16.12890625, -15.5478515625, -14.966796875, -14.3857421875, -13.8046875, -13.2236328125, -12.642578125, -12.0615234375, -11.48046875, -10.8994140625, -10.318359375, -9.7373046875, -9.15625, -8.5751953125, -7.994140625, -7.4130859375, -6.83203125, -6.2509765625, -5.669921875, -5.0888671875, -4.5078125, -3.9267578125, -3.345703125, -2.7646484375, -2.18359375, -1.6025390625, -1.021484375, -0.4404296875, 0.140625, 0.7216796875, 1.302734375, 1.8837890625, 2.46484375, 3.0458984375, 3.626953125, 4.2080078125, 4.7890625, 5.3701171875, 5.951171875, 6.5322265625, 7.11328125, 7.6943359375, 8.275390625, 8.8564453125, 9.4375, 10.0185546875, 10.599609375, 11.1806640625, 11.76171875, 12.3427734375, 12.923828125, 13.5048828125, 14.0859375, 14.6669921875, 15.248046875, 15.8291015625, 16.41015625, 16.9912109375, 17.572265625, 18.1533203125, 18.734375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 4.0, 9.0, 10.0, 9.0, 16.0, 11.0, 24.0, 26.0, 28.0, 33.0, 28.0, 23.0, 42.0, 46.0, 30.0, 37.0, 42.0, 49.0, 53.0, 52.0, 50.0, 50.0, 36.0, 43.0, 41.0, 42.0, 19.0, 35.0, 18.0, 16.0, 19.0, 10.0, 13.0, 7.0, 5.0, 4.0, 10.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.703125, -9.37841796875, -9.0537109375, -8.72900390625, -8.404296875, -8.07958984375, -7.7548828125, -7.43017578125, -7.10546875, -6.78076171875, -6.4560546875, -6.13134765625, -5.806640625, -5.48193359375, -5.1572265625, -4.83251953125, -4.5078125, -4.18310546875, -3.8583984375, -3.53369140625, -3.208984375, -2.88427734375, -2.5595703125, -2.23486328125, -1.91015625, -1.58544921875, -1.2607421875, -0.93603515625, -0.611328125, -0.28662109375, 0.0380859375, 0.36279296875, 0.6875, 1.01220703125, 1.3369140625, 1.66162109375, 1.986328125, 2.31103515625, 2.6357421875, 2.96044921875, 3.28515625, 3.60986328125, 3.9345703125, 4.25927734375, 4.583984375, 4.90869140625, 5.2333984375, 5.55810546875, 5.8828125, 6.20751953125, 6.5322265625, 6.85693359375, 7.181640625, 7.50634765625, 7.8310546875, 8.15576171875, 8.48046875, 8.80517578125, 9.1298828125, 9.45458984375, 9.779296875, 10.10400390625, 10.4287109375, 10.75341796875, 11.078125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 8.0, 7.0, 12.0, 12.0, 25.0, 24.0, 46.0, 64.0, 110.0, 152.0, 261.0, 403.0, 818.0, 1542.0, 3454.0, 8842.0, 30836.0, 257292.0, 659612.0, 61933.0, 13652.0, 4808.0, 2123.0, 1033.0, 582.0, 317.0, 187.0, 125.0, 69.0, 57.0, 38.0, 28.0, 17.0, 18.0, 10.0, 9.0, 4.0, 5.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.46875, -33.4306640625, -32.392578125, -31.3544921875, -30.31640625, -29.2783203125, -28.240234375, -27.2021484375, -26.1640625, -25.1259765625, -24.087890625, -23.0498046875, -22.01171875, -20.9736328125, -19.935546875, -18.8974609375, -17.859375, -16.8212890625, -15.783203125, -14.7451171875, -13.70703125, -12.6689453125, -11.630859375, -10.5927734375, -9.5546875, -8.5166015625, -7.478515625, -6.4404296875, -5.40234375, -4.3642578125, -3.326171875, -2.2880859375, -1.25, -0.2119140625, 0.826171875, 1.8642578125, 2.90234375, 3.9404296875, 4.978515625, 6.0166015625, 7.0546875, 8.0927734375, 9.130859375, 10.1689453125, 11.20703125, 12.2451171875, 13.283203125, 14.3212890625, 15.359375, 16.3974609375, 17.435546875, 18.4736328125, 19.51171875, 20.5498046875, 21.587890625, 22.6259765625, 23.6640625, 24.7021484375, 25.740234375, 26.7783203125, 27.81640625, 28.8544921875, 29.892578125, 30.9306640625, 31.96875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 3.0, 7.0, 12.0, 8.0, 16.0, 19.0, 25.0, 40.0, 46.0, 65.0, 114.0, 125.0, 127.0, 110.0, 81.0, 69.0, 32.0, 28.0, 21.0, 11.0, 9.0, 13.0, 7.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001255035400390625, -0.0011924505233764648, -0.0011298656463623047, -0.0010672807693481445, -0.0010046958923339844, -0.0009421110153198242, -0.0008795261383056641, -0.0008169412612915039, -0.0007543563842773438, -0.0006917715072631836, -0.0006291866302490234, -0.0005666017532348633, -0.0005040168762207031, -0.00044143199920654297, -0.0003788471221923828, -0.00031626224517822266, -0.0002536773681640625, -0.00019109249114990234, -0.0001285076141357422, -6.592273712158203e-05, -3.337860107421875e-06, 5.924701690673828e-05, 0.00012183189392089844, 0.0001844167709350586, 0.00024700164794921875, 0.0003095865249633789, 0.00037217140197753906, 0.0004347562789916992, 0.0004973411560058594, 0.0005599260330200195, 0.0006225109100341797, 0.0006850957870483398, 0.0007476806640625, 0.0008102655410766602, 0.0008728504180908203, 0.0009354352951049805, 0.0009980201721191406, 0.0010606050491333008, 0.001123189926147461, 0.001185774803161621, 0.0012483596801757812, 0.0013109445571899414, 0.0013735294342041016, 0.0014361143112182617, 0.0014986991882324219, 0.001561284065246582, 0.0016238689422607422, 0.0016864538192749023, 0.0017490386962890625, 0.0018116235733032227, 0.0018742084503173828, 0.001936793327331543, 0.001999378204345703, 0.0020619630813598633, 0.0021245479583740234, 0.0021871328353881836, 0.0022497177124023438, 0.002312302589416504, 0.002374887466430664, 0.0024374723434448242, 0.0025000572204589844, 0.0025626420974731445, 0.0026252269744873047, 0.002687811851501465, 0.002750396728515625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 9.0, 5.0, 16.0, 15.0, 32.0, 43.0, 41.0, 48.0, 89.0, 152.0, 194.0, 376.0, 611.0, 1079.0, 2217.0, 5675.0, 20123.0, 162161.0, 779778.0, 56915.0, 11299.0, 3859.0, 1679.0, 843.0, 435.0, 284.0, 187.0, 98.0, 96.0, 64.0, 30.0, 26.0, 17.0, 14.0, 8.0, 9.0, 8.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.25, -36.13134765625, -35.0126953125, -33.89404296875, -32.775390625, -31.65673828125, -30.5380859375, -29.41943359375, -28.30078125, -27.18212890625, -26.0634765625, -24.94482421875, -23.826171875, -22.70751953125, -21.5888671875, -20.47021484375, -19.3515625, -18.23291015625, -17.1142578125, -15.99560546875, -14.876953125, -13.75830078125, -12.6396484375, -11.52099609375, -10.40234375, -9.28369140625, -8.1650390625, -7.04638671875, -5.927734375, -4.80908203125, -3.6904296875, -2.57177734375, -1.453125, -0.33447265625, 0.7841796875, 1.90283203125, 3.021484375, 4.14013671875, 5.2587890625, 6.37744140625, 7.49609375, 8.61474609375, 9.7333984375, 10.85205078125, 11.970703125, 13.08935546875, 14.2080078125, 15.32666015625, 16.4453125, 17.56396484375, 18.6826171875, 19.80126953125, 20.919921875, 22.03857421875, 23.1572265625, 24.27587890625, 25.39453125, 26.51318359375, 27.6318359375, 28.75048828125, 29.869140625, 30.98779296875, 32.1064453125, 33.22509765625, 34.34375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 9.0, 7.0, 9.0, 4.0, 8.0, 15.0, 20.0, 24.0, 33.0, 53.0, 49.0, 75.0, 70.0, 100.0, 93.0, 84.0, 67.0, 59.0, 56.0, 32.0, 33.0, 29.0, 17.0, 11.0, 10.0, 9.0, 9.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4375, -9.050537109375, -8.66357421875, -8.276611328125, -7.8896484375, -7.502685546875, -7.11572265625, -6.728759765625, -6.341796875, -5.954833984375, -5.56787109375, -5.180908203125, -4.7939453125, -4.406982421875, -4.02001953125, -3.633056640625, -3.24609375, -2.859130859375, -2.47216796875, -2.085205078125, -1.6982421875, -1.311279296875, -0.92431640625, -0.537353515625, -0.150390625, 0.236572265625, 0.62353515625, 1.010498046875, 1.3974609375, 1.784423828125, 2.17138671875, 2.558349609375, 2.9453125, 3.332275390625, 3.71923828125, 4.106201171875, 4.4931640625, 4.880126953125, 5.26708984375, 5.654052734375, 6.041015625, 6.427978515625, 6.81494140625, 7.201904296875, 7.5888671875, 7.975830078125, 8.36279296875, 8.749755859375, 9.13671875, 9.523681640625, 9.91064453125, 10.297607421875, 10.6845703125, 11.071533203125, 11.45849609375, 11.845458984375, 12.232421875, 12.619384765625, 13.00634765625, 13.393310546875, 13.7802734375, 14.167236328125, 14.55419921875, 14.941162109375, 15.328125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 3.0, 7.0, 5.0, 15.0, 17.0, 31.0, 118.0, 359.0, 283.0, 95.0, 30.0, 20.0, 14.0, 1.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.93592834472656, -114.14376831054688, -102.35161590576172, -90.55945587158203, -78.76730346679688, -66.97514343261719, -55.1829833984375, -43.390830993652344, -31.598670959472656, -19.806514739990234, -8.01435661315918, 3.777801513671875, 15.569957733154297, 27.36211395263672, 39.154273986816406, 50.94642639160156, 62.73858642578125, 74.53074645996094, 86.3228988647461, 98.11505889892578, 109.90721130371094, 121.69937133789062, 133.4915313720703, 145.28369140625, 157.07583618164062, 168.8679962158203, 180.66015625, 192.45230102539062, 204.2444610595703, 216.03662109375, 227.8287811279297, 239.62094116210938, 251.41311645507812, 263.20526123046875, 274.9974365234375, 286.7895812988281, 298.5817565917969, 310.3739013671875, 322.16607666015625, 333.9582214355469, 345.7503662109375, 357.5425109863281, 369.3346862792969, 381.1268310546875, 392.91900634765625, 404.7111511230469, 416.5032958984375, 428.29547119140625, 440.087646484375, 451.8797912597656, 463.6719665527344, 475.464111328125, 487.25628662109375, 499.0484313964844, 510.840576171875, 522.6327514648438, 534.4248657226562, 546.217041015625, 558.0091552734375, 569.8013305664062, 581.593505859375, 593.3856201171875, 605.1777954101562, 616.969970703125, 628.7621459960938]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 6.0, 6.0, 3.0, 13.0, 10.0, 19.0, 21.0, 67.0, 72.0, 122.0, 134.0, 105.0, 138.0, 95.0, 56.0, 35.0, 27.0, 14.0, 6.0, 14.0, 7.0, 7.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-218.5006103515625, -212.1026611328125, -205.70469665527344, -199.30674743652344, -192.90878295898438, -186.51083374023438, -180.11288452148438, -173.71493530273438, -167.3169708251953, -160.9190216064453, -154.52105712890625, -148.12310791015625, -141.72515869140625, -135.3271942138672, -128.9292449951172, -122.53128814697266, -116.13333129882812, -109.7353744506836, -103.33741760253906, -96.93946838378906, -90.54151153564453, -84.1435546875, -77.74560546875, -71.34764862060547, -64.94969177246094, -58.551734924316406, -52.15378189086914, -45.755828857421875, -39.357872009277344, -32.95991516113281, -26.561962127685547, -20.16400909423828, -13.76605224609375, -7.368097305297852, -0.9701423645019531, 5.427812576293945, 11.825767517089844, 18.223722457885742, 24.62167739868164, 31.019630432128906, 37.41758728027344, 43.81554412841797, 50.213497161865234, 56.6114501953125, 63.00940704345703, 69.40736389160156, 75.80531311035156, 82.2032699584961, 88.60122680664062, 94.99918365478516, 101.39714050292969, 107.79508972167969, 114.19304656982422, 120.59100341796875, 126.98895263671875, 133.38690185546875, 139.7848663330078, 146.1828155517578, 152.58078002929688, 158.97872924804688, 165.37667846679688, 171.77464294433594, 178.17259216308594, 184.570556640625, 190.968505859375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 6.0, 4.0, 4.0, 6.0, 8.0, 3.0, 17.0, 29.0, 31.0, 47.0, 78.0, 120.0, 195.0, 302.0, 537.0, 956.0, 1896.0, 4145.0, 10607.0, 33826.0, 189882.0, 3704871.0, 193336.0, 34880.0, 10647.0, 4048.0, 1774.0, 879.0, 489.0, 258.0, 178.0, 77.0, 52.0, 34.0, 18.0, 14.0, 5.0, 12.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-57.28125, -55.75390625, -54.2265625, -52.69921875, -51.171875, -49.64453125, -48.1171875, -46.58984375, -45.0625, -43.53515625, -42.0078125, -40.48046875, -38.953125, -37.42578125, -35.8984375, -34.37109375, -32.84375, -31.31640625, -29.7890625, -28.26171875, -26.734375, -25.20703125, -23.6796875, -22.15234375, -20.625, -19.09765625, -17.5703125, -16.04296875, -14.515625, -12.98828125, -11.4609375, -9.93359375, -8.40625, -6.87890625, -5.3515625, -3.82421875, -2.296875, -0.76953125, 0.7578125, 2.28515625, 3.8125, 5.33984375, 6.8671875, 8.39453125, 9.921875, 11.44921875, 12.9765625, 14.50390625, 16.03125, 17.55859375, 19.0859375, 20.61328125, 22.140625, 23.66796875, 25.1953125, 26.72265625, 28.25, 29.77734375, 31.3046875, 32.83203125, 34.359375, 35.88671875, 37.4140625, 38.94140625, 40.46875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 4.0, 3.0, 4.0, 6.0, 15.0, 16.0, 17.0, 20.0, 34.0, 36.0, 47.0, 54.0, 60.0, 73.0, 84.0, 71.0, 79.0, 78.0, 58.0, 48.0, 38.0, 36.0, 23.0, 23.0, 20.0, 14.0, 11.0, 5.0, 7.0, 2.0, 6.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-2.169921875, -2.114776611328125, -2.05963134765625, -2.004486083984375, -1.9493408203125, -1.894195556640625, -1.83905029296875, -1.783905029296875, -1.728759765625, -1.673614501953125, -1.61846923828125, -1.563323974609375, -1.5081787109375, -1.453033447265625, -1.39788818359375, -1.342742919921875, -1.28759765625, -1.232452392578125, -1.17730712890625, -1.122161865234375, -1.0670166015625, -1.011871337890625, -0.95672607421875, -0.901580810546875, -0.846435546875, -0.791290283203125, -0.73614501953125, -0.680999755859375, -0.6258544921875, -0.570709228515625, -0.51556396484375, -0.460418701171875, -0.4052734375, -0.350128173828125, -0.29498291015625, -0.239837646484375, -0.1846923828125, -0.129547119140625, -0.07440185546875, -0.019256591796875, 0.035888671875, 0.091033935546875, 0.14617919921875, 0.201324462890625, 0.2564697265625, 0.311614990234375, 0.36676025390625, 0.421905517578125, 0.47705078125, 0.532196044921875, 0.58734130859375, 0.642486572265625, 0.6976318359375, 0.752777099609375, 0.80792236328125, 0.863067626953125, 0.918212890625, 0.973358154296875, 1.02850341796875, 1.083648681640625, 1.1387939453125, 1.193939208984375, 1.24908447265625, 1.304229736328125, 1.359375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 6.0, 12.0, 14.0, 16.0, 31.0, 35.0, 71.0, 79.0, 136.0, 265.0, 418.0, 777.0, 1414.0, 3007.0, 6864.0, 17909.0, 54965.0, 230775.0, 2733718.0, 948455.0, 135505.0, 36714.0, 12816.0, 5186.0, 2282.0, 1182.0, 618.0, 376.0, 231.0, 142.0, 78.0, 50.0, 42.0, 15.0, 23.0, 13.0, 9.0, 3.0, 9.0, 9.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-26.546875, -25.76220703125, -24.9775390625, -24.19287109375, -23.408203125, -22.62353515625, -21.8388671875, -21.05419921875, -20.26953125, -19.48486328125, -18.7001953125, -17.91552734375, -17.130859375, -16.34619140625, -15.5615234375, -14.77685546875, -13.9921875, -13.20751953125, -12.4228515625, -11.63818359375, -10.853515625, -10.06884765625, -9.2841796875, -8.49951171875, -7.71484375, -6.93017578125, -6.1455078125, -5.36083984375, -4.576171875, -3.79150390625, -3.0068359375, -2.22216796875, -1.4375, -0.65283203125, 0.1318359375, 0.91650390625, 1.701171875, 2.48583984375, 3.2705078125, 4.05517578125, 4.83984375, 5.62451171875, 6.4091796875, 7.19384765625, 7.978515625, 8.76318359375, 9.5478515625, 10.33251953125, 11.1171875, 11.90185546875, 12.6865234375, 13.47119140625, 14.255859375, 15.04052734375, 15.8251953125, 16.60986328125, 17.39453125, 18.17919921875, 18.9638671875, 19.74853515625, 20.533203125, 21.31787109375, 22.1025390625, 22.88720703125, 23.671875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 6.0, 7.0, 12.0, 11.0, 9.0, 24.0, 18.0, 38.0, 48.0, 51.0, 107.0, 124.0, 187.0, 299.0, 485.0, 1186.0, 541.0, 272.0, 208.0, 113.0, 82.0, 67.0, 40.0, 38.0, 23.0, 16.0, 21.0, 6.0, 6.0, 8.0, 4.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.435546875, -3.314727783203125, -3.19390869140625, -3.073089599609375, -2.9522705078125, -2.831451416015625, -2.71063232421875, -2.589813232421875, -2.468994140625, -2.348175048828125, -2.22735595703125, -2.106536865234375, -1.9857177734375, -1.864898681640625, -1.74407958984375, -1.623260498046875, -1.50244140625, -1.381622314453125, -1.26080322265625, -1.139984130859375, -1.0191650390625, -0.898345947265625, -0.77752685546875, -0.656707763671875, -0.535888671875, -0.415069580078125, -0.29425048828125, -0.173431396484375, -0.0526123046875, 0.068206787109375, 0.18902587890625, 0.309844970703125, 0.4306640625, 0.551483154296875, 0.67230224609375, 0.793121337890625, 0.9139404296875, 1.034759521484375, 1.15557861328125, 1.276397705078125, 1.397216796875, 1.518035888671875, 1.63885498046875, 1.759674072265625, 1.8804931640625, 2.001312255859375, 2.12213134765625, 2.242950439453125, 2.36376953125, 2.484588623046875, 2.60540771484375, 2.726226806640625, 2.8470458984375, 2.967864990234375, 3.08868408203125, 3.209503173828125, 3.330322265625, 3.451141357421875, 3.57196044921875, 3.692779541015625, 3.8135986328125, 3.934417724609375, 4.05523681640625, 4.176055908203125, 4.296875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 9.0, 15.0, 74.0, 243.0, 311.0, 190.0, 84.0, 39.0, 12.0, 7.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-69.55113220214844, -67.5250244140625, -65.4989242553711, -63.472816467285156, -61.44670867919922, -59.42060470581055, -57.394500732421875, -55.36839294433594, -53.34228515625, -51.31618118286133, -49.29007339477539, -47.26396942138672, -45.23786163330078, -43.21175765991211, -41.18565368652344, -39.1595458984375, -37.13344192504883, -35.107337951660156, -33.08123016357422, -31.055126190185547, -29.02901840209961, -27.002914428710938, -24.976808547973633, -22.950702667236328, -20.924596786499023, -18.89849090576172, -16.872385025024414, -14.846280097961426, -12.820174217224121, -10.794068336486816, -8.767963409423828, -6.741857528686523, -4.715755462646484, -2.689649820327759, -0.6635441780090332, 1.3625612258911133, 3.388667106628418, 5.414772987365723, 7.440877914428711, 9.466983795166016, 11.49308967590332, 13.519195556640625, 15.54530143737793, 17.571407318115234, 19.597511291503906, 21.623619079589844, 23.649723052978516, 25.67582893371582, 27.701934814453125, 29.72804069519043, 31.754146575927734, 33.780250549316406, 35.806358337402344, 37.832462310791016, 39.85856628417969, 41.884674072265625, 43.91078186035156, 45.936885833740234, 47.96299362182617, 49.989097595214844, 52.01520538330078, 54.04130935668945, 56.067413330078125, 58.09352111816406, 60.119625091552734]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 9.0, 14.0, 14.0, 23.0, 22.0, 26.0, 55.0, 50.0, 53.0, 87.0, 64.0, 79.0, 71.0, 78.0, 61.0, 58.0, 47.0, 56.0, 23.0, 26.0, 23.0, 12.0, 11.0, 14.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.699909210205078, -25.919652938842773, -25.1393985748291, -24.359142303466797, -23.578887939453125, -22.79863166809082, -22.018375396728516, -21.238121032714844, -20.45786476135254, -19.677608489990234, -18.897354125976562, -18.117097854614258, -17.336841583251953, -16.55658721923828, -15.776330947875977, -14.996075630187988, -14.2158203125, -13.435564994812012, -12.655309677124023, -11.875053405761719, -11.09479808807373, -10.314542770385742, -9.534286499023438, -8.75403118133545, -7.973775863647461, -7.193520545959473, -6.413264751434326, -5.63300895690918, -4.852753639221191, -4.072498321533203, -3.2922425270080566, -2.51198673248291, -1.7317333221435547, -0.9514777660369873, -0.17122220993041992, 0.6090333461761475, 1.3892889022827148, 2.1695444583892822, 2.9498000144958496, 3.730055809020996, 4.510311126708984, 5.290566444396973, 6.070822238922119, 6.851078033447266, 7.631333351135254, 8.411588668823242, 9.191844940185547, 9.972100257873535, 10.752355575561523, 11.532610893249512, 12.3128662109375, 13.093122482299805, 13.873377799987793, 14.653633117675781, 15.433889389038086, 16.21414566040039, 16.994400024414062, 17.774656295776367, 18.55491065979004, 19.335166931152344, 20.115421295166016, 20.89567756652832, 21.675933837890625, 22.456188201904297, 23.2364444732666]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 5.0, 6.0, 9.0, 13.0, 28.0, 34.0, 49.0, 103.0, 172.0, 293.0, 579.0, 1353.0, 2865.0, 7395.0, 20937.0, 70101.0, 264721.0, 458920.0, 155874.0, 42455.0, 13534.0, 4984.0, 2125.0, 938.0, 458.0, 251.0, 127.0, 71.0, 57.0, 26.0, 18.0, 9.0, 8.0, 6.0, 2.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.625, -17.079345703125, -16.53369140625, -15.988037109375, -15.4423828125, -14.896728515625, -14.35107421875, -13.805419921875, -13.259765625, -12.714111328125, -12.16845703125, -11.622802734375, -11.0771484375, -10.531494140625, -9.98583984375, -9.440185546875, -8.89453125, -8.348876953125, -7.80322265625, -7.257568359375, -6.7119140625, -6.166259765625, -5.62060546875, -5.074951171875, -4.529296875, -3.983642578125, -3.43798828125, -2.892333984375, -2.3466796875, -1.801025390625, -1.25537109375, -0.709716796875, -0.1640625, 0.381591796875, 0.92724609375, 1.472900390625, 2.0185546875, 2.564208984375, 3.10986328125, 3.655517578125, 4.201171875, 4.746826171875, 5.29248046875, 5.838134765625, 6.3837890625, 6.929443359375, 7.47509765625, 8.020751953125, 8.56640625, 9.112060546875, 9.65771484375, 10.203369140625, 10.7490234375, 11.294677734375, 11.84033203125, 12.385986328125, 12.931640625, 13.477294921875, 14.02294921875, 14.568603515625, 15.1142578125, 15.659912109375, 16.20556640625, 16.751220703125, 17.296875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 8.0, 2.0, 13.0, 12.0, 19.0, 27.0, 18.0, 31.0, 36.0, 48.0, 42.0, 38.0, 65.0, 56.0, 65.0, 56.0, 45.0, 55.0, 56.0, 47.0, 28.0, 38.0, 33.0, 30.0, 27.0, 14.0, 25.0, 13.0, 7.0, 14.0, 8.0, 5.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.45703125, -1.4146728515625, -1.372314453125, -1.3299560546875, -1.28759765625, -1.2452392578125, -1.202880859375, -1.1605224609375, -1.1181640625, -1.0758056640625, -1.033447265625, -0.9910888671875, -0.94873046875, -0.9063720703125, -0.864013671875, -0.8216552734375, -0.779296875, -0.7369384765625, -0.694580078125, -0.6522216796875, -0.60986328125, -0.5675048828125, -0.525146484375, -0.4827880859375, -0.4404296875, -0.3980712890625, -0.355712890625, -0.3133544921875, -0.27099609375, -0.2286376953125, -0.186279296875, -0.1439208984375, -0.1015625, -0.0592041015625, -0.016845703125, 0.0255126953125, 0.06787109375, 0.1102294921875, 0.152587890625, 0.1949462890625, 0.2373046875, 0.2796630859375, 0.322021484375, 0.3643798828125, 0.40673828125, 0.4490966796875, 0.491455078125, 0.5338134765625, 0.576171875, 0.6185302734375, 0.660888671875, 0.7032470703125, 0.74560546875, 0.7879638671875, 0.830322265625, 0.8726806640625, 0.9150390625, 0.9573974609375, 0.999755859375, 1.0421142578125, 1.08447265625, 1.1268310546875, 1.169189453125, 1.2115478515625, 1.25390625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 11.0, 22.0, 55.0, 75.0, 223.0, 554.0, 1724.0, 6776.0, 35182.0, 250275.0, 619505.0, 110503.0, 17957.0, 3833.0, 1147.0, 379.0, 157.0, 63.0, 44.0, 25.0, 12.0, 8.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.5625, -16.94189453125, -16.3212890625, -15.70068359375, -15.080078125, -14.45947265625, -13.8388671875, -13.21826171875, -12.59765625, -11.97705078125, -11.3564453125, -10.73583984375, -10.115234375, -9.49462890625, -8.8740234375, -8.25341796875, -7.6328125, -7.01220703125, -6.3916015625, -5.77099609375, -5.150390625, -4.52978515625, -3.9091796875, -3.28857421875, -2.66796875, -2.04736328125, -1.4267578125, -0.80615234375, -0.185546875, 0.43505859375, 1.0556640625, 1.67626953125, 2.296875, 2.91748046875, 3.5380859375, 4.15869140625, 4.779296875, 5.39990234375, 6.0205078125, 6.64111328125, 7.26171875, 7.88232421875, 8.5029296875, 9.12353515625, 9.744140625, 10.36474609375, 10.9853515625, 11.60595703125, 12.2265625, 12.84716796875, 13.4677734375, 14.08837890625, 14.708984375, 15.32958984375, 15.9501953125, 16.57080078125, 17.19140625, 17.81201171875, 18.4326171875, 19.05322265625, 19.673828125, 20.29443359375, 20.9150390625, 21.53564453125, 22.15625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 2.0, 6.0, 7.0, 1.0, 6.0, 10.0, 5.0, 12.0, 13.0, 13.0, 21.0, 20.0, 20.0, 23.0, 26.0, 29.0, 27.0, 33.0, 34.0, 37.0, 31.0, 39.0, 44.0, 47.0, 40.0, 61.0, 36.0, 31.0, 41.0, 31.0, 30.0, 34.0, 32.0, 26.0, 14.0, 19.0, 10.0, 10.0, 10.0, 12.0, 13.0, 12.0, 6.0, 8.0, 6.0, 9.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.00390625, -5.806640625, -5.609375, -5.412109375, -5.21484375, -5.017578125, -4.8203125, -4.623046875, -4.42578125, -4.228515625, -4.03125, -3.833984375, -3.63671875, -3.439453125, -3.2421875, -3.044921875, -2.84765625, -2.650390625, -2.453125, -2.255859375, -2.05859375, -1.861328125, -1.6640625, -1.466796875, -1.26953125, -1.072265625, -0.875, -0.677734375, -0.48046875, -0.283203125, -0.0859375, 0.111328125, 0.30859375, 0.505859375, 0.703125, 0.900390625, 1.09765625, 1.294921875, 1.4921875, 1.689453125, 1.88671875, 2.083984375, 2.28125, 2.478515625, 2.67578125, 2.873046875, 3.0703125, 3.267578125, 3.46484375, 3.662109375, 3.859375, 4.056640625, 4.25390625, 4.451171875, 4.6484375, 4.845703125, 5.04296875, 5.240234375, 5.4375, 5.634765625, 5.83203125, 6.029296875, 6.2265625, 6.423828125, 6.62109375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 0.0, 2.0, 6.0, 5.0, 10.0, 21.0, 43.0, 64.0, 131.0, 308.0, 751.0, 2337.0, 9951.0, 81196.0, 806443.0, 129615.0, 13215.0, 2873.0, 907.0, 332.0, 143.0, 68.0, 58.0, 20.0, 16.0, 10.0, 9.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.46875, -44.320068359375, -43.17138671875, -42.022705078125, -40.8740234375, -39.725341796875, -38.57666015625, -37.427978515625, -36.279296875, -35.130615234375, -33.98193359375, -32.833251953125, -31.6845703125, -30.535888671875, -29.38720703125, -28.238525390625, -27.08984375, -25.941162109375, -24.79248046875, -23.643798828125, -22.4951171875, -21.346435546875, -20.19775390625, -19.049072265625, -17.900390625, -16.751708984375, -15.60302734375, -14.454345703125, -13.3056640625, -12.156982421875, -11.00830078125, -9.859619140625, -8.7109375, -7.562255859375, -6.41357421875, -5.264892578125, -4.1162109375, -2.967529296875, -1.81884765625, -0.670166015625, 0.478515625, 1.627197265625, 2.77587890625, 3.924560546875, 5.0732421875, 6.221923828125, 7.37060546875, 8.519287109375, 9.66796875, 10.816650390625, 11.96533203125, 13.114013671875, 14.2626953125, 15.411376953125, 16.56005859375, 17.708740234375, 18.857421875, 20.006103515625, 21.15478515625, 22.303466796875, 23.4521484375, 24.600830078125, 25.74951171875, 26.898193359375, 28.046875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 7.0, 13.0, 13.0, 14.0, 30.0, 44.0, 43.0, 67.0, 85.0, 111.0, 123.0, 124.0, 85.0, 55.0, 53.0, 33.0, 25.0, 16.0, 14.0, 7.0, 7.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011472702026367188, -0.001117415726184845, -0.0010875612497329712, -0.0010577067732810974, -0.0010278522968292236, -0.0009979978203773499, -0.0009681433439254761, -0.0009382888674736023, -0.0009084343910217285, -0.0008785799145698547, -0.000848725438117981, -0.0008188709616661072, -0.0007890164852142334, -0.0007591620087623596, -0.0007293075323104858, -0.0006994530558586121, -0.0006695985794067383, -0.0006397441029548645, -0.0006098896265029907, -0.0005800351500511169, -0.0005501806735992432, -0.0005203261971473694, -0.0004904717206954956, -0.0004606172442436218, -0.00043076276779174805, -0.00040090829133987427, -0.0003710538148880005, -0.0003411993384361267, -0.00031134486198425293, -0.00028149038553237915, -0.00025163590908050537, -0.0002217814326286316, -0.0001919269561767578, -0.00016207247972488403, -0.00013221800327301025, -0.00010236352682113647, -7.25090503692627e-05, -4.2654573917388916e-05, -1.2800097465515137e-05, 1.7054378986358643e-05, 4.690885543823242e-05, 7.67633318901062e-05, 0.00010661780834197998, 0.00013647228479385376, 0.00016632676124572754, 0.00019618123769760132, 0.0002260357141494751, 0.0002558901906013489, 0.00028574466705322266, 0.00031559914350509644, 0.0003454536199569702, 0.000375308096408844, 0.0004051625728607178, 0.00043501704931259155, 0.00046487152576446533, 0.0004947260022163391, 0.0005245804786682129, 0.0005544349551200867, 0.0005842894315719604, 0.0006141439080238342, 0.000643998384475708, 0.0006738528609275818, 0.0007037073373794556, 0.0007335618138313293, 0.0007634162902832031]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 13.0, 9.0, 19.0, 16.0, 31.0, 56.0, 62.0, 106.0, 187.0, 301.0, 607.0, 1127.0, 2506.0, 6935.0, 23559.0, 105098.0, 552170.0, 283207.0, 50609.0, 13228.0, 4525.0, 1928.0, 934.0, 526.0, 273.0, 170.0, 115.0, 78.0, 45.0, 28.0, 28.0, 16.0, 5.0, 11.0, 10.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-24.59375, -23.90625, -23.21875, -22.53125, -21.84375, -21.15625, -20.46875, -19.78125, -19.09375, -18.40625, -17.71875, -17.03125, -16.34375, -15.65625, -14.96875, -14.28125, -13.59375, -12.90625, -12.21875, -11.53125, -10.84375, -10.15625, -9.46875, -8.78125, -8.09375, -7.40625, -6.71875, -6.03125, -5.34375, -4.65625, -3.96875, -3.28125, -2.59375, -1.90625, -1.21875, -0.53125, 0.15625, 0.84375, 1.53125, 2.21875, 2.90625, 3.59375, 4.28125, 4.96875, 5.65625, 6.34375, 7.03125, 7.71875, 8.40625, 9.09375, 9.78125, 10.46875, 11.15625, 11.84375, 12.53125, 13.21875, 13.90625, 14.59375, 15.28125, 15.96875, 16.65625, 17.34375, 18.03125, 18.71875, 19.40625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 9.0, 8.0, 15.0, 18.0, 19.0, 35.0, 34.0, 58.0, 67.0, 78.0, 103.0, 104.0, 90.0, 82.0, 67.0, 49.0, 40.0, 29.0, 31.0, 13.0, 13.0, 8.0, 9.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.71875, -7.377685546875, -7.03662109375, -6.695556640625, -6.3544921875, -6.013427734375, -5.67236328125, -5.331298828125, -4.990234375, -4.649169921875, -4.30810546875, -3.967041015625, -3.6259765625, -3.284912109375, -2.94384765625, -2.602783203125, -2.26171875, -1.920654296875, -1.57958984375, -1.238525390625, -0.8974609375, -0.556396484375, -0.21533203125, 0.125732421875, 0.466796875, 0.807861328125, 1.14892578125, 1.489990234375, 1.8310546875, 2.172119140625, 2.51318359375, 2.854248046875, 3.1953125, 3.536376953125, 3.87744140625, 4.218505859375, 4.5595703125, 4.900634765625, 5.24169921875, 5.582763671875, 5.923828125, 6.264892578125, 6.60595703125, 6.947021484375, 7.2880859375, 7.629150390625, 7.97021484375, 8.311279296875, 8.65234375, 8.993408203125, 9.33447265625, 9.675537109375, 10.0166015625, 10.357666015625, 10.69873046875, 11.039794921875, 11.380859375, 11.721923828125, 12.06298828125, 12.404052734375, 12.7451171875, 13.086181640625, 13.42724609375, 13.768310546875, 14.109375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 15.0, 36.0, 154.0, 407.0, 297.0, 69.0, 13.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-252.6759490966797, -244.7059326171875, -236.7359161376953, -228.76589965820312, -220.7958984375, -212.82586669921875, -204.85586547851562, -196.88584899902344, -188.91583251953125, -180.94581604003906, -172.97579956054688, -165.0057830810547, -157.0357666015625, -149.06576538085938, -141.0957489013672, -133.125732421875, -125.15571594238281, -117.18569946289062, -109.21568298339844, -101.24567413330078, -93.2756576538086, -85.3056411743164, -77.33563232421875, -69.36561584472656, -61.395599365234375, -53.42558288574219, -45.455570220947266, -37.485557556152344, -29.515541076660156, -21.54552459716797, -13.575511932373047, -5.605499267578125, 2.364501953125, 10.334516525268555, 18.30453109741211, 26.274545669555664, 34.24456024169922, 42.214576721191406, 50.18458938598633, 58.15460205078125, 66.12461853027344, 74.09463500976562, 82.06465148925781, 90.03466033935547, 98.00467681884766, 105.97469329833984, 113.9447021484375, 121.91471862792969, 129.88473510742188, 137.85475158691406, 145.82476806640625, 153.79478454589844, 161.76480102539062, 169.73480224609375, 177.70481872558594, 185.67483520507812, 193.6448516845703, 201.6148681640625, 209.5848846435547, 217.55490112304688, 225.52490234375, 233.49493408203125, 241.46493530273438, 249.43495178222656, 257.40496826171875]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 3.0, 8.0, 4.0, 6.0, 17.0, 25.0, 32.0, 41.0, 68.0, 85.0, 78.0, 85.0, 111.0, 111.0, 86.0, 63.0, 47.0, 27.0, 26.0, 19.0, 13.0, 7.0, 10.0, 6.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.87586212158203, -78.69412231445312, -75.51238250732422, -72.33064270019531, -69.14891052246094, -65.96717071533203, -62.785430908203125, -59.60369110107422, -56.42195129394531, -53.240211486816406, -50.0584716796875, -46.87673568725586, -43.69499588012695, -40.51325607299805, -37.331520080566406, -34.1497802734375, -30.968040466308594, -27.786300659179688, -24.604562759399414, -21.42282485961914, -18.241085052490234, -15.059346199035645, -11.877607345581055, -8.695869445800781, -5.514129638671875, -2.332390785217285, 0.8493480682373047, 4.0310869216918945, 7.212825775146484, 10.394564628601074, 13.576303482055664, 16.758041381835938, 19.939781188964844, 23.12152099609375, 26.303258895874023, 29.484996795654297, 32.6667366027832, 35.84847640991211, 39.03021240234375, 42.211952209472656, 45.39369201660156, 48.57543182373047, 51.757171630859375, 54.938907623291016, 58.12064743041992, 61.30238723754883, 64.48412322998047, 67.66586303710938, 70.84760284423828, 74.02934265136719, 77.2110824584961, 80.392822265625, 83.57455444335938, 86.75629425048828, 89.93803405761719, 93.1197738647461, 96.301513671875, 99.4832534790039, 102.66499328613281, 105.84673309326172, 109.02847290039062, 112.210205078125, 115.3919448852539, 118.57368469238281, 121.75542449951172]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 9.0, 6.0, 11.0, 10.0, 12.0, 19.0, 23.0, 37.0, 42.0, 71.0, 106.0, 135.0, 243.0, 430.0, 697.0, 1365.0, 3037.0, 6671.0, 16785.0, 56467.0, 841152.0, 3163915.0, 68548.0, 19601.0, 7678.0, 3492.0, 1721.0, 872.0, 473.0, 256.0, 164.0, 71.0, 67.0, 29.0, 24.0, 12.0, 13.0, 7.0, 6.0, 0.0, 1.0, 2.0, 2.0, 2.0], "bins": [-52.96875, -51.678955078125, -50.38916015625, -49.099365234375, -47.8095703125, -46.519775390625, -45.22998046875, -43.940185546875, -42.650390625, -41.360595703125, -40.07080078125, -38.781005859375, -37.4912109375, -36.201416015625, -34.91162109375, -33.621826171875, -32.33203125, -31.042236328125, -29.75244140625, -28.462646484375, -27.1728515625, -25.883056640625, -24.59326171875, -23.303466796875, -22.013671875, -20.723876953125, -19.43408203125, -18.144287109375, -16.8544921875, -15.564697265625, -14.27490234375, -12.985107421875, -11.6953125, -10.405517578125, -9.11572265625, -7.825927734375, -6.5361328125, -5.246337890625, -3.95654296875, -2.666748046875, -1.376953125, -0.087158203125, 1.20263671875, 2.492431640625, 3.7822265625, 5.072021484375, 6.36181640625, 7.651611328125, 8.94140625, 10.231201171875, 11.52099609375, 12.810791015625, 14.1005859375, 15.390380859375, 16.68017578125, 17.969970703125, 19.259765625, 20.549560546875, 21.83935546875, 23.129150390625, 24.4189453125, 25.708740234375, 26.99853515625, 28.288330078125, 29.578125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 2.0, 8.0, 17.0, 19.0, 22.0, 35.0, 55.0, 58.0, 57.0, 72.0, 71.0, 75.0, 80.0, 70.0, 68.0, 36.0, 61.0, 52.0, 27.0, 23.0, 18.0, 21.0, 15.0, 15.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.23828125, -2.1810760498046875, -2.123870849609375, -2.0666656494140625, -2.00946044921875, -1.9522552490234375, -1.895050048828125, -1.8378448486328125, -1.7806396484375, -1.7234344482421875, -1.666229248046875, -1.6090240478515625, -1.55181884765625, -1.4946136474609375, -1.437408447265625, -1.3802032470703125, -1.322998046875, -1.2657928466796875, -1.208587646484375, -1.1513824462890625, -1.09417724609375, -1.0369720458984375, -0.979766845703125, -0.9225616455078125, -0.8653564453125, -0.8081512451171875, -0.750946044921875, -0.6937408447265625, -0.63653564453125, -0.5793304443359375, -0.522125244140625, -0.4649200439453125, -0.40771484375, -0.3505096435546875, -0.293304443359375, -0.2360992431640625, -0.17889404296875, -0.1216888427734375, -0.064483642578125, -0.0072784423828125, 0.0499267578125, 0.1071319580078125, 0.164337158203125, 0.2215423583984375, 0.27874755859375, 0.3359527587890625, 0.393157958984375, 0.4503631591796875, 0.507568359375, 0.5647735595703125, 0.621978759765625, 0.6791839599609375, 0.73638916015625, 0.7935943603515625, 0.850799560546875, 0.9080047607421875, 0.9652099609375, 1.0224151611328125, 1.079620361328125, 1.1368255615234375, 1.19403076171875, 1.2512359619140625, 1.308441162109375, 1.3656463623046875, 1.4228515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 4.0, 4.0, 7.0, 8.0, 14.0, 22.0, 22.0, 44.0, 69.0, 116.0, 248.0, 512.0, 1249.0, 3162.0, 9698.0, 37125.0, 256687.0, 3615906.0, 220317.0, 34543.0, 9225.0, 3170.0, 1108.0, 497.0, 232.0, 123.0, 57.0, 26.0, 16.0, 16.0, 11.0, 9.0, 10.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-35.3125, -34.1904296875, -33.068359375, -31.9462890625, -30.82421875, -29.7021484375, -28.580078125, -27.4580078125, -26.3359375, -25.2138671875, -24.091796875, -22.9697265625, -21.84765625, -20.7255859375, -19.603515625, -18.4814453125, -17.359375, -16.2373046875, -15.115234375, -13.9931640625, -12.87109375, -11.7490234375, -10.626953125, -9.5048828125, -8.3828125, -7.2607421875, -6.138671875, -5.0166015625, -3.89453125, -2.7724609375, -1.650390625, -0.5283203125, 0.59375, 1.7158203125, 2.837890625, 3.9599609375, 5.08203125, 6.2041015625, 7.326171875, 8.4482421875, 9.5703125, 10.6923828125, 11.814453125, 12.9365234375, 14.05859375, 15.1806640625, 16.302734375, 17.4248046875, 18.546875, 19.6689453125, 20.791015625, 21.9130859375, 23.03515625, 24.1572265625, 25.279296875, 26.4013671875, 27.5234375, 28.6455078125, 29.767578125, 30.8896484375, 32.01171875, 33.1337890625, 34.255859375, 35.3779296875, 36.5]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 5.0, 6.0, 11.0, 10.0, 12.0, 18.0, 28.0, 39.0, 49.0, 68.0, 118.0, 164.0, 299.0, 700.0, 1430.0, 447.0, 204.0, 124.0, 74.0, 76.0, 40.0, 29.0, 22.0, 18.0, 14.0, 11.0, 13.0, 11.0, 2.0, 3.0, 5.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.59375, -3.47503662109375, -3.3563232421875, -3.23760986328125, -3.118896484375, -3.00018310546875, -2.8814697265625, -2.76275634765625, -2.64404296875, -2.52532958984375, -2.4066162109375, -2.28790283203125, -2.169189453125, -2.05047607421875, -1.9317626953125, -1.81304931640625, -1.6943359375, -1.57562255859375, -1.4569091796875, -1.33819580078125, -1.219482421875, -1.10076904296875, -0.9820556640625, -0.86334228515625, -0.74462890625, -0.62591552734375, -0.5072021484375, -0.38848876953125, -0.269775390625, -0.15106201171875, -0.0323486328125, 0.08636474609375, 0.205078125, 0.32379150390625, 0.4425048828125, 0.56121826171875, 0.679931640625, 0.79864501953125, 0.9173583984375, 1.03607177734375, 1.15478515625, 1.27349853515625, 1.3922119140625, 1.51092529296875, 1.629638671875, 1.74835205078125, 1.8670654296875, 1.98577880859375, 2.1044921875, 2.22320556640625, 2.3419189453125, 2.46063232421875, 2.579345703125, 2.69805908203125, 2.8167724609375, 2.93548583984375, 3.05419921875, 3.17291259765625, 3.2916259765625, 3.41033935546875, 3.529052734375, 3.64776611328125, 3.7664794921875, 3.88519287109375, 4.00390625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 11.0, 26.0, 64.0, 165.0, 270.0, 241.0, 129.0, 72.0, 11.0, 12.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.9666519165039, -65.14627838134766, -63.325904846191406, -61.505531311035156, -59.68516159057617, -57.86478805541992, -56.04441452026367, -54.22404098510742, -52.40367126464844, -50.58329772949219, -48.76292419433594, -46.94255065917969, -45.1221809387207, -43.30180740356445, -41.4814338684082, -39.66106033325195, -37.8406867980957, -36.02031326293945, -34.1999397277832, -32.37957000732422, -30.55919647216797, -28.73882293701172, -26.91844940185547, -25.09807586669922, -23.2777042388916, -21.45733070373535, -19.636959075927734, -17.816585540771484, -15.99621295928955, -14.175840377807617, -12.355466842651367, -10.535094261169434, -8.7147216796875, -6.894349098205566, -5.073976039886475, -3.253602981567383, -1.4332304000854492, 0.3871421813964844, 2.2075157165527344, 4.027888298034668, 5.848260879516602, 7.668633460998535, 9.489006042480469, 11.309379577636719, 13.129752159118652, 14.950124740600586, 16.770498275756836, 18.590869903564453, 20.411243438720703, 22.231616973876953, 24.05198860168457, 25.87236213684082, 27.692733764648438, 29.513107299804688, 31.333480834960938, 33.15385437011719, 34.97422790527344, 36.79460144042969, 38.61497497558594, 40.43534851074219, 42.25571823120117, 44.07609176635742, 45.89646530151367, 47.71683883666992, 49.537208557128906]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 6.0, 9.0, 10.0, 14.0, 17.0, 16.0, 26.0, 22.0, 28.0, 54.0, 46.0, 65.0, 57.0, 63.0, 57.0, 65.0, 70.0, 60.0, 49.0, 55.0, 45.0, 44.0, 25.0, 20.0, 19.0, 16.0, 9.0, 10.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.043865203857422, -16.433671951293945, -15.823478698730469, -15.213284492492676, -14.6030912399292, -13.992897987365723, -13.38270378112793, -12.772510528564453, -12.162317276000977, -11.5521240234375, -10.941930770874023, -10.33173656463623, -9.721543312072754, -9.111350059509277, -8.501155853271484, -7.890962600708008, -7.280769348144531, -6.670576095581055, -6.06038236618042, -5.450188636779785, -4.839995384216309, -4.229802131652832, -3.6196084022521973, -3.0094146728515625, -2.399221420288086, -1.7890279293060303, -1.1788344383239746, -0.568640947341919, 0.04155254364013672, 0.6517460346221924, 1.261939525604248, 1.8721332550048828, 2.4823246002197266, 3.0925180912017822, 3.702711582183838, 4.312905311584473, 4.923098564147949, 5.533291816711426, 6.1434855461120605, 6.753679275512695, 7.363872528076172, 7.974065780639648, 8.584259033203125, 9.194453239440918, 9.804646492004395, 10.414839744567871, 11.025033950805664, 11.63522720336914, 12.245420455932617, 12.855613708496094, 13.46580696105957, 14.076001167297363, 14.68619441986084, 15.296387672424316, 15.90658187866211, 16.516775131225586, 17.126968383789062, 17.73716163635254, 18.347354888916016, 18.957548141479492, 19.56774139404297, 20.177936553955078, 20.788129806518555, 21.39832305908203, 22.008516311645508]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 5.0, 10.0, 7.0, 11.0, 22.0, 21.0, 34.0, 49.0, 77.0, 137.0, 212.0, 442.0, 954.0, 2307.0, 6277.0, 21107.0, 84700.0, 333588.0, 428833.0, 125197.0, 30551.0, 8711.0, 2901.0, 1144.0, 565.0, 265.0, 151.0, 86.0, 59.0, 35.0, 31.0, 21.0, 9.0, 9.0, 11.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.0625, -21.4345703125, -20.806640625, -20.1787109375, -19.55078125, -18.9228515625, -18.294921875, -17.6669921875, -17.0390625, -16.4111328125, -15.783203125, -15.1552734375, -14.52734375, -13.8994140625, -13.271484375, -12.6435546875, -12.015625, -11.3876953125, -10.759765625, -10.1318359375, -9.50390625, -8.8759765625, -8.248046875, -7.6201171875, -6.9921875, -6.3642578125, -5.736328125, -5.1083984375, -4.48046875, -3.8525390625, -3.224609375, -2.5966796875, -1.96875, -1.3408203125, -0.712890625, -0.0849609375, 0.54296875, 1.1708984375, 1.798828125, 2.4267578125, 3.0546875, 3.6826171875, 4.310546875, 4.9384765625, 5.56640625, 6.1943359375, 6.822265625, 7.4501953125, 8.078125, 8.7060546875, 9.333984375, 9.9619140625, 10.58984375, 11.2177734375, 11.845703125, 12.4736328125, 13.1015625, 13.7294921875, 14.357421875, 14.9853515625, 15.61328125, 16.2412109375, 16.869140625, 17.4970703125, 18.125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 5.0, 3.0, 4.0, 9.0, 5.0, 16.0, 21.0, 33.0, 43.0, 41.0, 56.0, 63.0, 57.0, 59.0, 62.0, 55.0, 76.0, 69.0, 63.0, 50.0, 32.0, 30.0, 41.0, 26.0, 24.0, 19.0, 9.0, 11.0, 6.0, 4.0, 5.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.439453125, -1.388763427734375, -1.33807373046875, -1.287384033203125, -1.2366943359375, -1.186004638671875, -1.13531494140625, -1.084625244140625, -1.033935546875, -0.983245849609375, -0.93255615234375, -0.881866455078125, -0.8311767578125, -0.780487060546875, -0.72979736328125, -0.679107666015625, -0.62841796875, -0.577728271484375, -0.52703857421875, -0.476348876953125, -0.4256591796875, -0.374969482421875, -0.32427978515625, -0.273590087890625, -0.222900390625, -0.172210693359375, -0.12152099609375, -0.070831298828125, -0.0201416015625, 0.030548095703125, 0.08123779296875, 0.131927490234375, 0.1826171875, 0.233306884765625, 0.28399658203125, 0.334686279296875, 0.3853759765625, 0.436065673828125, 0.48675537109375, 0.537445068359375, 0.588134765625, 0.638824462890625, 0.68951416015625, 0.740203857421875, 0.7908935546875, 0.841583251953125, 0.89227294921875, 0.942962646484375, 0.99365234375, 1.044342041015625, 1.09503173828125, 1.145721435546875, 1.1964111328125, 1.247100830078125, 1.29779052734375, 1.348480224609375, 1.399169921875, 1.449859619140625, 1.50054931640625, 1.551239013671875, 1.6019287109375, 1.652618408203125, 1.70330810546875, 1.753997802734375, 1.8046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 5.0, 2.0, 8.0, 1.0, 8.0, 5.0, 11.0, 19.0, 30.0, 29.0, 37.0, 40.0, 62.0, 62.0, 98.0, 139.0, 194.0, 259.0, 369.0, 560.0, 1005.0, 1835.0, 3880.0, 8945.0, 24122.0, 69884.0, 200267.0, 375090.0, 230708.0, 82349.0, 28276.0, 10682.0, 4346.0, 1971.0, 1126.0, 655.0, 404.0, 269.0, 209.0, 162.0, 105.0, 98.0, 61.0, 49.0, 38.0, 15.0, 24.0, 17.0, 12.0, 8.0, 7.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.7109375, -13.2767333984375, -12.842529296875, -12.4083251953125, -11.97412109375, -11.5399169921875, -11.105712890625, -10.6715087890625, -10.2373046875, -9.8031005859375, -9.368896484375, -8.9346923828125, -8.50048828125, -8.0662841796875, -7.632080078125, -7.1978759765625, -6.763671875, -6.3294677734375, -5.895263671875, -5.4610595703125, -5.02685546875, -4.5926513671875, -4.158447265625, -3.7242431640625, -3.2900390625, -2.8558349609375, -2.421630859375, -1.9874267578125, -1.55322265625, -1.1190185546875, -0.684814453125, -0.2506103515625, 0.18359375, 0.6177978515625, 1.052001953125, 1.4862060546875, 1.92041015625, 2.3546142578125, 2.788818359375, 3.2230224609375, 3.6572265625, 4.0914306640625, 4.525634765625, 4.9598388671875, 5.39404296875, 5.8282470703125, 6.262451171875, 6.6966552734375, 7.130859375, 7.5650634765625, 7.999267578125, 8.4334716796875, 8.86767578125, 9.3018798828125, 9.736083984375, 10.1702880859375, 10.6044921875, 11.0386962890625, 11.472900390625, 11.9071044921875, 12.34130859375, 12.7755126953125, 13.209716796875, 13.6439208984375, 14.078125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 0.0, 4.0, 1.0, 4.0, 4.0, 6.0, 10.0, 11.0, 11.0, 14.0, 18.0, 21.0, 20.0, 28.0, 33.0, 31.0, 33.0, 33.0, 42.0, 40.0, 30.0, 39.0, 53.0, 44.0, 45.0, 38.0, 30.0, 40.0, 25.0, 37.0, 27.0, 28.0, 34.0, 24.0, 15.0, 31.0, 16.0, 18.0, 17.0, 9.0, 9.0, 9.0, 9.0, 4.0, 5.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.8671875, -6.64385986328125, -6.4205322265625, -6.19720458984375, -5.973876953125, -5.75054931640625, -5.5272216796875, -5.30389404296875, -5.08056640625, -4.85723876953125, -4.6339111328125, -4.41058349609375, -4.187255859375, -3.96392822265625, -3.7406005859375, -3.51727294921875, -3.2939453125, -3.07061767578125, -2.8472900390625, -2.62396240234375, -2.400634765625, -2.17730712890625, -1.9539794921875, -1.73065185546875, -1.50732421875, -1.28399658203125, -1.0606689453125, -0.83734130859375, -0.614013671875, -0.39068603515625, -0.1673583984375, 0.05596923828125, 0.279296875, 0.50262451171875, 0.7259521484375, 0.94927978515625, 1.172607421875, 1.39593505859375, 1.6192626953125, 1.84259033203125, 2.06591796875, 2.28924560546875, 2.5125732421875, 2.73590087890625, 2.959228515625, 3.18255615234375, 3.4058837890625, 3.62921142578125, 3.8525390625, 4.07586669921875, 4.2991943359375, 4.52252197265625, 4.745849609375, 4.96917724609375, 5.1925048828125, 5.41583251953125, 5.63916015625, 5.86248779296875, 6.0858154296875, 6.30914306640625, 6.532470703125, 6.75579833984375, 6.9791259765625, 7.20245361328125, 7.42578125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 7.0, 9.0, 26.0, 28.0, 41.0, 84.0, 108.0, 226.0, 421.0, 833.0, 2070.0, 6444.0, 26670.0, 156522.0, 581484.0, 224385.0, 36195.0, 8282.0, 2624.0, 1006.0, 488.0, 242.0, 135.0, 72.0, 59.0, 38.0, 17.0, 18.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.515625, -23.785888671875, -23.05615234375, -22.326416015625, -21.5966796875, -20.866943359375, -20.13720703125, -19.407470703125, -18.677734375, -17.947998046875, -17.21826171875, -16.488525390625, -15.7587890625, -15.029052734375, -14.29931640625, -13.569580078125, -12.83984375, -12.110107421875, -11.38037109375, -10.650634765625, -9.9208984375, -9.191162109375, -8.46142578125, -7.731689453125, -7.001953125, -6.272216796875, -5.54248046875, -4.812744140625, -4.0830078125, -3.353271484375, -2.62353515625, -1.893798828125, -1.1640625, -0.434326171875, 0.29541015625, 1.025146484375, 1.7548828125, 2.484619140625, 3.21435546875, 3.944091796875, 4.673828125, 5.403564453125, 6.13330078125, 6.863037109375, 7.5927734375, 8.322509765625, 9.05224609375, 9.781982421875, 10.51171875, 11.241455078125, 11.97119140625, 12.700927734375, 13.4306640625, 14.160400390625, 14.89013671875, 15.619873046875, 16.349609375, 17.079345703125, 17.80908203125, 18.538818359375, 19.2685546875, 19.998291015625, 20.72802734375, 21.457763671875, 22.1875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 0.0, 14.0, 8.0, 27.0, 13.0, 12.0, 27.0, 27.0, 30.0, 30.0, 40.0, 51.0, 52.0, 72.0, 68.0, 85.0, 83.0, 62.0, 48.0, 31.0, 39.0, 35.0, 23.0, 20.0, 19.0, 13.0, 13.0, 9.0, 9.0, 9.0, 5.0, 3.0, 9.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009889602661132812, -0.0009561926126480103, -0.0009234249591827393, -0.0008906573057174683, -0.0008578896522521973, -0.0008251219987869263, -0.0007923543453216553, -0.0007595866918563843, -0.0007268190383911133, -0.0006940513849258423, -0.0006612837314605713, -0.0006285160779953003, -0.0005957484245300293, -0.0005629807710647583, -0.0005302131175994873, -0.0004974454641342163, -0.0004646778106689453, -0.0004319101572036743, -0.0003991425037384033, -0.0003663748502731323, -0.00033360719680786133, -0.00030083954334259033, -0.00026807188987731934, -0.00023530423641204834, -0.00020253658294677734, -0.00016976892948150635, -0.00013700127601623535, -0.00010423362255096436, -7.146596908569336e-05, -3.869831562042236e-05, -5.930662155151367e-06, 2.683699131011963e-05, 5.9604644775390625e-05, 9.237229824066162e-05, 0.00012513995170593262, 0.0001579076051712036, 0.0001906752586364746, 0.0002234429121017456, 0.0002562105655670166, 0.0002889782190322876, 0.0003217458724975586, 0.0003545135259628296, 0.0003872811794281006, 0.0004200488328933716, 0.0004528164863586426, 0.0004855841398239136, 0.0005183517932891846, 0.0005511194467544556, 0.0005838871002197266, 0.0006166547536849976, 0.0006494224071502686, 0.0006821900606155396, 0.0007149577140808105, 0.0007477253675460815, 0.0007804930210113525, 0.0008132606744766235, 0.0008460283279418945, 0.0008787959814071655, 0.0009115636348724365, 0.0009443312883377075, 0.0009770989418029785, 0.0010098665952682495, 0.0010426342487335205, 0.0010754019021987915, 0.0011081695556640625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 0.0, 1.0, 3.0, 4.0, 7.0, 12.0, 23.0, 31.0, 55.0, 77.0, 130.0, 190.0, 333.0, 563.0, 1189.0, 2951.0, 8626.0, 32440.0, 176346.0, 597892.0, 180053.0, 33265.0, 8761.0, 3017.0, 1187.0, 620.0, 311.0, 166.0, 105.0, 65.0, 48.0, 25.0, 22.0, 9.0, 6.0, 10.0, 2.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.453125, -29.618896484375, -28.78466796875, -27.950439453125, -27.1162109375, -26.281982421875, -25.44775390625, -24.613525390625, -23.779296875, -22.945068359375, -22.11083984375, -21.276611328125, -20.4423828125, -19.608154296875, -18.77392578125, -17.939697265625, -17.10546875, -16.271240234375, -15.43701171875, -14.602783203125, -13.7685546875, -12.934326171875, -12.10009765625, -11.265869140625, -10.431640625, -9.597412109375, -8.76318359375, -7.928955078125, -7.0947265625, -6.260498046875, -5.42626953125, -4.592041015625, -3.7578125, -2.923583984375, -2.08935546875, -1.255126953125, -0.4208984375, 0.413330078125, 1.24755859375, 2.081787109375, 2.916015625, 3.750244140625, 4.58447265625, 5.418701171875, 6.2529296875, 7.087158203125, 7.92138671875, 8.755615234375, 9.58984375, 10.424072265625, 11.25830078125, 12.092529296875, 12.9267578125, 13.760986328125, 14.59521484375, 15.429443359375, 16.263671875, 17.097900390625, 17.93212890625, 18.766357421875, 19.6005859375, 20.434814453125, 21.26904296875, 22.103271484375, 22.9375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 13.0, 3.0, 9.0, 11.0, 14.0, 15.0, 29.0, 24.0, 46.0, 51.0, 70.0, 97.0, 96.0, 80.0, 96.0, 78.0, 61.0, 51.0, 37.0, 38.0, 20.0, 17.0, 9.0, 7.0, 7.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0], "bins": [-15.8203125, -15.4365234375, -15.052734375, -14.6689453125, -14.28515625, -13.9013671875, -13.517578125, -13.1337890625, -12.75, -12.3662109375, -11.982421875, -11.5986328125, -11.21484375, -10.8310546875, -10.447265625, -10.0634765625, -9.6796875, -9.2958984375, -8.912109375, -8.5283203125, -8.14453125, -7.7607421875, -7.376953125, -6.9931640625, -6.609375, -6.2255859375, -5.841796875, -5.4580078125, -5.07421875, -4.6904296875, -4.306640625, -3.9228515625, -3.5390625, -3.1552734375, -2.771484375, -2.3876953125, -2.00390625, -1.6201171875, -1.236328125, -0.8525390625, -0.46875, -0.0849609375, 0.298828125, 0.6826171875, 1.06640625, 1.4501953125, 1.833984375, 2.2177734375, 2.6015625, 2.9853515625, 3.369140625, 3.7529296875, 4.13671875, 4.5205078125, 4.904296875, 5.2880859375, 5.671875, 6.0556640625, 6.439453125, 6.8232421875, 7.20703125, 7.5908203125, 7.974609375, 8.3583984375, 8.7421875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 16.0, 18.0, 102.0, 379.0, 354.0, 91.0, 31.0, 8.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-324.14141845703125, -313.6930847167969, -303.2447509765625, -292.7964172363281, -282.34808349609375, -271.8997497558594, -261.451416015625, -251.00308227539062, -240.55474853515625, -230.10641479492188, -219.6580810546875, -209.20974731445312, -198.76141357421875, -188.31307983398438, -177.86474609375, -167.41641235351562, -156.96807861328125, -146.51974487304688, -136.0714111328125, -125.62307739257812, -115.17474365234375, -104.72640991210938, -94.278076171875, -83.82974243164062, -73.38140869140625, -62.933074951171875, -52.4847412109375, -42.036407470703125, -31.58807373046875, -21.139739990234375, -10.69140625, -0.243072509765625, 10.205291748046875, 20.65362548828125, 31.101959228515625, 41.55029296875, 51.998626708984375, 62.44696044921875, 72.89529418945312, 83.3436279296875, 93.79196166992188, 104.24029541015625, 114.68862915039062, 125.136962890625, 135.58529663085938, 146.03363037109375, 156.48196411132812, 166.9302978515625, 177.37863159179688, 187.82696533203125, 198.27529907226562, 208.7236328125, 219.17196655273438, 229.62030029296875, 240.06863403320312, 250.5169677734375, 260.9653015136719, 271.41363525390625, 281.8619689941406, 292.310302734375, 302.7586364746094, 313.20697021484375, 323.6553039550781, 334.1036376953125, 344.5519714355469]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 9.0, 8.0, 10.0, 8.0, 10.0, 13.0, 15.0, 28.0, 38.0, 33.0, 33.0, 48.0, 61.0, 60.0, 44.0, 59.0, 46.0, 55.0, 53.0, 43.0, 47.0, 45.0, 36.0, 36.0, 29.0, 32.0, 25.0, 18.0, 15.0, 6.0, 13.0, 5.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-68.93733215332031, -66.72986602783203, -64.52239990234375, -62.31493377685547, -60.10746383666992, -57.89999771118164, -55.69253158569336, -53.48506546020508, -51.27759552001953, -49.07012939453125, -46.86266326904297, -44.65519714355469, -42.44772720336914, -40.24026107788086, -38.03279495239258, -35.8253288269043, -33.617862701416016, -31.410396575927734, -29.20292854309082, -26.99546241760254, -24.787994384765625, -22.580528259277344, -20.373062133789062, -18.16559600830078, -15.958127975463867, -13.75066089630127, -11.543193817138672, -9.33572769165039, -7.128260612487793, -4.920793533325195, -2.713327407836914, -0.5058603286743164, 1.7016067504882812, 3.9090735912323, 6.116540431976318, 8.324007034301758, 10.531474113464355, 12.738941192626953, 14.946407318115234, 17.153873443603516, 19.36134147644043, 21.56880760192871, 23.776275634765625, 25.983741760253906, 28.191207885742188, 30.3986759185791, 32.60614013671875, 34.8136100769043, 37.02107620239258, 39.22854232788086, 41.43600845336914, 43.64347839355469, 45.85094451904297, 48.05841064453125, 50.26587677001953, 52.47334289550781, 54.680809020996094, 56.888275146484375, 59.095741271972656, 61.30320739746094, 63.510677337646484, 65.7181396484375, 67.92561340332031, 70.1330795288086, 72.34054565429688]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 16.0, 12.0, 26.0, 40.0, 88.0, 111.0, 223.0, 696.0, 3553.0, 55195.0, 4069766.0, 59576.0, 3751.0, 715.0, 223.0, 98.0, 65.0, 29.0, 21.0, 22.0, 13.0, 9.0, 7.0, 1.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.3125, -64.44921875, -61.5859375, -58.72265625, -55.859375, -52.99609375, -50.1328125, -47.26953125, -44.40625, -41.54296875, -38.6796875, -35.81640625, -32.953125, -30.08984375, -27.2265625, -24.36328125, -21.5, -18.63671875, -15.7734375, -12.91015625, -10.046875, -7.18359375, -4.3203125, -1.45703125, 1.40625, 4.26953125, 7.1328125, 9.99609375, 12.859375, 15.72265625, 18.5859375, 21.44921875, 24.3125, 27.17578125, 30.0390625, 32.90234375, 35.765625, 38.62890625, 41.4921875, 44.35546875, 47.21875, 50.08203125, 52.9453125, 55.80859375, 58.671875, 61.53515625, 64.3984375, 67.26171875, 70.125, 72.98828125, 75.8515625, 78.71484375, 81.578125, 84.44140625, 87.3046875, 90.16796875, 93.03125, 95.89453125, 98.7578125, 101.62109375, 104.484375, 107.34765625, 110.2109375, 113.07421875, 115.9375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 10.0, 15.0, 19.0, 36.0, 59.0, 48.0, 52.0, 73.0, 87.0, 91.0, 66.0, 82.0, 71.0, 66.0, 59.0, 44.0, 25.0, 19.0, 19.0, 18.0, 8.0, 5.0, 4.0, 2.0, 1.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.083984375, -2.004180908203125, -1.92437744140625, -1.844573974609375, -1.7647705078125, -1.684967041015625, -1.60516357421875, -1.525360107421875, -1.445556640625, -1.365753173828125, -1.28594970703125, -1.206146240234375, -1.1263427734375, -1.046539306640625, -0.96673583984375, -0.886932373046875, -0.80712890625, -0.727325439453125, -0.64752197265625, -0.567718505859375, -0.4879150390625, -0.408111572265625, -0.32830810546875, -0.248504638671875, -0.168701171875, -0.088897705078125, -0.00909423828125, 0.070709228515625, 0.1505126953125, 0.230316162109375, 0.31011962890625, 0.389923095703125, 0.4697265625, 0.549530029296875, 0.62933349609375, 0.709136962890625, 0.7889404296875, 0.868743896484375, 0.94854736328125, 1.028350830078125, 1.108154296875, 1.187957763671875, 1.26776123046875, 1.347564697265625, 1.4273681640625, 1.507171630859375, 1.58697509765625, 1.666778564453125, 1.74658203125, 1.826385498046875, 1.90618896484375, 1.985992431640625, 2.0657958984375, 2.145599365234375, 2.22540283203125, 2.305206298828125, 2.385009765625, 2.464813232421875, 2.54461669921875, 2.624420166015625, 2.7042236328125, 2.784027099609375, 2.86383056640625, 2.943634033203125, 3.0234375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 5.0, 9.0, 9.0, 13.0, 17.0, 17.0, 25.0, 45.0, 84.0, 163.0, 347.0, 676.0, 1834.0, 5560.0, 19365.0, 90993.0, 988979.0, 2906613.0, 139163.0, 28002.0, 7822.0, 2529.0, 958.0, 430.0, 221.0, 120.0, 72.0, 40.0, 41.0, 25.0, 16.0, 21.0, 20.0, 4.0, 9.0, 9.0, 3.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.40625, -25.466796875, -24.52734375, -23.587890625, -22.6484375, -21.708984375, -20.76953125, -19.830078125, -18.890625, -17.951171875, -17.01171875, -16.072265625, -15.1328125, -14.193359375, -13.25390625, -12.314453125, -11.375, -10.435546875, -9.49609375, -8.556640625, -7.6171875, -6.677734375, -5.73828125, -4.798828125, -3.859375, -2.919921875, -1.98046875, -1.041015625, -0.1015625, 0.837890625, 1.77734375, 2.716796875, 3.65625, 4.595703125, 5.53515625, 6.474609375, 7.4140625, 8.353515625, 9.29296875, 10.232421875, 11.171875, 12.111328125, 13.05078125, 13.990234375, 14.9296875, 15.869140625, 16.80859375, 17.748046875, 18.6875, 19.626953125, 20.56640625, 21.505859375, 22.4453125, 23.384765625, 24.32421875, 25.263671875, 26.203125, 27.142578125, 28.08203125, 29.021484375, 29.9609375, 30.900390625, 31.83984375, 32.779296875, 33.71875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 4.0, 9.0, 12.0, 14.0, 15.0, 30.0, 56.0, 106.0, 156.0, 413.0, 1697.0, 835.0, 323.0, 124.0, 103.0, 67.0, 38.0, 29.0, 20.0, 9.0, 8.0, 7.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.01171875, -2.79425048828125, -2.5767822265625, -2.35931396484375, -2.141845703125, -1.92437744140625, -1.7069091796875, -1.48944091796875, -1.27197265625, -1.05450439453125, -0.8370361328125, -0.61956787109375, -0.402099609375, -0.18463134765625, 0.0328369140625, 0.25030517578125, 0.4677734375, 0.68524169921875, 0.9027099609375, 1.12017822265625, 1.337646484375, 1.55511474609375, 1.7725830078125, 1.99005126953125, 2.20751953125, 2.42498779296875, 2.6424560546875, 2.85992431640625, 3.077392578125, 3.29486083984375, 3.5123291015625, 3.72979736328125, 3.947265625, 4.16473388671875, 4.3822021484375, 4.59967041015625, 4.817138671875, 5.03460693359375, 5.2520751953125, 5.46954345703125, 5.68701171875, 5.90447998046875, 6.1219482421875, 6.33941650390625, 6.556884765625, 6.77435302734375, 6.9918212890625, 7.20928955078125, 7.4267578125, 7.64422607421875, 7.8616943359375, 8.07916259765625, 8.296630859375, 8.51409912109375, 8.7315673828125, 8.94903564453125, 9.16650390625, 9.38397216796875, 9.6014404296875, 9.81890869140625, 10.036376953125, 10.25384521484375, 10.4713134765625, 10.68878173828125, 10.90625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 8.0, 7.0, 18.0, 42.0, 60.0, 83.0, 169.0, 171.0, 158.0, 124.0, 73.0, 38.0, 20.0, 19.0, 9.0, 3.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.883766174316406, -50.42533874511719, -48.966915130615234, -47.508487701416016, -46.0500602722168, -44.591636657714844, -43.133209228515625, -41.674781799316406, -40.21635437011719, -38.75792694091797, -37.299503326416016, -35.8410758972168, -34.38264846801758, -32.924224853515625, -31.465797424316406, -30.007369995117188, -28.548946380615234, -27.09052085876465, -25.63209342956543, -24.173667907714844, -22.715240478515625, -21.25681495666504, -19.798389434814453, -18.339962005615234, -16.88153648376465, -15.423110008239746, -13.964683532714844, -12.506258010864258, -11.047831535339355, -9.589405059814453, -8.130979537963867, -6.672553062438965, -5.2141265869140625, -3.7557003498077393, -2.297274112701416, -0.8388481140136719, 0.6195783615112305, 2.078004837036133, 3.5364303588867188, 4.994856834411621, 6.453283309936523, 7.911709785461426, 9.370136260986328, 10.828561782836914, 12.286988258361816, 13.745414733886719, 15.203840255737305, 16.66226577758789, 18.12069320678711, 19.579118728637695, 21.037546157836914, 22.4959716796875, 23.95439910888672, 25.412824630737305, 26.87125015258789, 28.32967758178711, 29.788103103637695, 31.24652862548828, 32.7049560546875, 34.16338348388672, 35.62180709838867, 37.08023452758789, 38.538658142089844, 39.99708557128906, 41.45551300048828]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 3.0, 6.0, 9.0, 10.0, 13.0, 18.0, 16.0, 20.0, 30.0, 38.0, 40.0, 45.0, 51.0, 58.0, 51.0, 50.0, 59.0, 55.0, 41.0, 43.0, 55.0, 53.0, 44.0, 35.0, 29.0, 25.0, 23.0, 25.0, 17.0, 8.0, 12.0, 6.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.520193099975586, -20.81964874267578, -20.119104385375977, -19.418560028076172, -18.718013763427734, -18.01746940612793, -17.316925048828125, -16.61638069152832, -15.9158353805542, -15.215291023254395, -14.514745712280273, -13.814201354980469, -13.113656997680664, -12.413111686706543, -11.712567329406738, -11.012022018432617, -10.311477661132812, -9.610933303833008, -8.910387992858887, -8.209843635559082, -7.509298801422119, -6.808753967285156, -6.108209609985352, -5.407664775848389, -4.707119941711426, -4.006575107574463, -3.306030511856079, -2.6054859161376953, -1.9049410820007324, -1.2043962478637695, -0.5038518905639648, 0.19669294357299805, 0.8972358703613281, 1.5977805852890015, 2.298325300216675, 2.9988698959350586, 3.6994147300720215, 4.399959564208984, 5.100503921508789, 5.801048755645752, 6.501593589782715, 7.202138423919678, 7.902683258056641, 8.603227615356445, 9.30377197265625, 10.004317283630371, 10.704861640930176, 11.405406951904297, 12.105951309204102, 12.806495666503906, 13.507040977478027, 14.207585334777832, 14.908130645751953, 15.608675003051758, 16.309219360351562, 17.009763717651367, 17.710308074951172, 18.410852432250977, 19.11139678955078, 19.81194305419922, 20.512487411499023, 21.213031768798828, 21.913576126098633, 22.614120483398438, 23.314666748046875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 2.0, 5.0, 13.0, 12.0, 23.0, 37.0, 42.0, 64.0, 88.0, 111.0, 142.0, 217.0, 333.0, 466.0, 680.0, 1202.0, 2016.0, 4011.0, 8722.0, 21599.0, 58766.0, 159175.0, 371943.0, 257817.0, 98171.0, 36096.0, 13898.0, 5833.0, 2857.0, 1509.0, 847.0, 565.0, 394.0, 249.0, 176.0, 119.0, 92.0, 68.0, 51.0, 41.0, 23.0, 21.0, 14.0, 12.0, 6.0, 8.0, 0.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.1171875, -10.7305908203125, -10.343994140625, -9.9573974609375, -9.57080078125, -9.1842041015625, -8.797607421875, -8.4110107421875, -8.0244140625, -7.6378173828125, -7.251220703125, -6.8646240234375, -6.47802734375, -6.0914306640625, -5.704833984375, -5.3182373046875, -4.931640625, -4.5450439453125, -4.158447265625, -3.7718505859375, -3.38525390625, -2.9986572265625, -2.612060546875, -2.2254638671875, -1.8388671875, -1.4522705078125, -1.065673828125, -0.6790771484375, -0.29248046875, 0.0941162109375, 0.480712890625, 0.8673095703125, 1.25390625, 1.6405029296875, 2.027099609375, 2.4136962890625, 2.80029296875, 3.1868896484375, 3.573486328125, 3.9600830078125, 4.3466796875, 4.7332763671875, 5.119873046875, 5.5064697265625, 5.89306640625, 6.2796630859375, 6.666259765625, 7.0528564453125, 7.439453125, 7.8260498046875, 8.212646484375, 8.5992431640625, 8.98583984375, 9.3724365234375, 9.759033203125, 10.1456298828125, 10.5322265625, 10.9188232421875, 11.305419921875, 11.6920166015625, 12.07861328125, 12.4652099609375, 12.851806640625, 13.2384033203125, 13.625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 11.0, 17.0, 21.0, 34.0, 42.0, 46.0, 59.0, 70.0, 67.0, 81.0, 79.0, 79.0, 65.0, 74.0, 58.0, 50.0, 33.0, 36.0, 17.0, 18.0, 10.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.234375, -2.158721923828125, -2.08306884765625, -2.007415771484375, -1.9317626953125, -1.856109619140625, -1.78045654296875, -1.704803466796875, -1.629150390625, -1.553497314453125, -1.47784423828125, -1.402191162109375, -1.3265380859375, -1.250885009765625, -1.17523193359375, -1.099578857421875, -1.02392578125, -0.948272705078125, -0.87261962890625, -0.796966552734375, -0.7213134765625, -0.645660400390625, -0.57000732421875, -0.494354248046875, -0.418701171875, -0.343048095703125, -0.26739501953125, -0.191741943359375, -0.1160888671875, -0.040435791015625, 0.03521728515625, 0.110870361328125, 0.1865234375, 0.262176513671875, 0.33782958984375, 0.413482666015625, 0.4891357421875, 0.564788818359375, 0.64044189453125, 0.716094970703125, 0.791748046875, 0.867401123046875, 0.94305419921875, 1.018707275390625, 1.0943603515625, 1.170013427734375, 1.24566650390625, 1.321319580078125, 1.39697265625, 1.472625732421875, 1.54827880859375, 1.623931884765625, 1.6995849609375, 1.775238037109375, 1.85089111328125, 1.926544189453125, 2.002197265625, 2.077850341796875, 2.15350341796875, 2.229156494140625, 2.3048095703125, 2.380462646484375, 2.45611572265625, 2.531768798828125, 2.607421875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 4.0, 11.0, 14.0, 16.0, 30.0, 27.0, 32.0, 48.0, 96.0, 132.0, 228.0, 397.0, 559.0, 1160.0, 2924.0, 11125.0, 57890.0, 362636.0, 503786.0, 84772.0, 15564.0, 3941.0, 1386.0, 654.0, 343.0, 258.0, 161.0, 104.0, 83.0, 44.0, 30.0, 28.0, 15.0, 18.0, 13.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.234375, -19.562255859375, -18.89013671875, -18.218017578125, -17.5458984375, -16.873779296875, -16.20166015625, -15.529541015625, -14.857421875, -14.185302734375, -13.51318359375, -12.841064453125, -12.1689453125, -11.496826171875, -10.82470703125, -10.152587890625, -9.48046875, -8.808349609375, -8.13623046875, -7.464111328125, -6.7919921875, -6.119873046875, -5.44775390625, -4.775634765625, -4.103515625, -3.431396484375, -2.75927734375, -2.087158203125, -1.4150390625, -0.742919921875, -0.07080078125, 0.601318359375, 1.2734375, 1.945556640625, 2.61767578125, 3.289794921875, 3.9619140625, 4.634033203125, 5.30615234375, 5.978271484375, 6.650390625, 7.322509765625, 7.99462890625, 8.666748046875, 9.3388671875, 10.010986328125, 10.68310546875, 11.355224609375, 12.02734375, 12.699462890625, 13.37158203125, 14.043701171875, 14.7158203125, 15.387939453125, 16.06005859375, 16.732177734375, 17.404296875, 18.076416015625, 18.74853515625, 19.420654296875, 20.0927734375, 20.764892578125, 21.43701171875, 22.109130859375, 22.78125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 3.0, 4.0, 3.0, 7.0, 9.0, 15.0, 10.0, 20.0, 13.0, 27.0, 28.0, 26.0, 33.0, 42.0, 34.0, 38.0, 39.0, 44.0, 61.0, 44.0, 44.0, 58.0, 51.0, 38.0, 45.0, 37.0, 46.0, 25.0, 31.0, 20.0, 24.0, 19.0, 14.0, 10.0, 3.0, 10.0, 6.0, 7.0, 5.0, 7.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.26953125, -6.99053955078125, -6.7115478515625, -6.43255615234375, -6.153564453125, -5.87457275390625, -5.5955810546875, -5.31658935546875, -5.03759765625, -4.75860595703125, -4.4796142578125, -4.20062255859375, -3.921630859375, -3.64263916015625, -3.3636474609375, -3.08465576171875, -2.8056640625, -2.52667236328125, -2.2476806640625, -1.96868896484375, -1.689697265625, -1.41070556640625, -1.1317138671875, -0.85272216796875, -0.57373046875, -0.29473876953125, -0.0157470703125, 0.26324462890625, 0.542236328125, 0.82122802734375, 1.1002197265625, 1.37921142578125, 1.658203125, 1.93719482421875, 2.2161865234375, 2.49517822265625, 2.774169921875, 3.05316162109375, 3.3321533203125, 3.61114501953125, 3.89013671875, 4.16912841796875, 4.4481201171875, 4.72711181640625, 5.006103515625, 5.28509521484375, 5.5640869140625, 5.84307861328125, 6.1220703125, 6.40106201171875, 6.6800537109375, 6.95904541015625, 7.238037109375, 7.51702880859375, 7.7960205078125, 8.07501220703125, 8.35400390625, 8.63299560546875, 8.9119873046875, 9.19097900390625, 9.469970703125, 9.74896240234375, 10.0279541015625, 10.30694580078125, 10.5859375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 5.0, 5.0, 7.0, 11.0, 6.0, 16.0, 30.0, 50.0, 67.0, 117.0, 195.0, 345.0, 749.0, 1761.0, 4603.0, 15379.0, 71138.0, 366693.0, 465447.0, 93577.0, 19192.0, 5369.0, 1957.0, 843.0, 424.0, 224.0, 110.0, 62.0, 40.0, 35.0, 26.0, 18.0, 11.0, 11.0, 4.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-12.6015625, -12.2318115234375, -11.862060546875, -11.4923095703125, -11.12255859375, -10.7528076171875, -10.383056640625, -10.0133056640625, -9.6435546875, -9.2738037109375, -8.904052734375, -8.5343017578125, -8.16455078125, -7.7947998046875, -7.425048828125, -7.0552978515625, -6.685546875, -6.3157958984375, -5.946044921875, -5.5762939453125, -5.20654296875, -4.8367919921875, -4.467041015625, -4.0972900390625, -3.7275390625, -3.3577880859375, -2.988037109375, -2.6182861328125, -2.24853515625, -1.8787841796875, -1.509033203125, -1.1392822265625, -0.76953125, -0.3997802734375, -0.030029296875, 0.3397216796875, 0.70947265625, 1.0792236328125, 1.448974609375, 1.8187255859375, 2.1884765625, 2.5582275390625, 2.927978515625, 3.2977294921875, 3.66748046875, 4.0372314453125, 4.406982421875, 4.7767333984375, 5.146484375, 5.5162353515625, 5.885986328125, 6.2557373046875, 6.62548828125, 6.9952392578125, 7.364990234375, 7.7347412109375, 8.1044921875, 8.4742431640625, 8.843994140625, 9.2137451171875, 9.58349609375, 9.9532470703125, 10.322998046875, 10.6927490234375, 11.0625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 9.0, 3.0, 17.0, 11.0, 18.0, 15.0, 19.0, 18.0, 27.0, 28.0, 42.0, 51.0, 64.0, 67.0, 69.0, 82.0, 85.0, 75.0, 52.0, 46.0, 31.0, 30.0, 19.0, 21.0, 24.0, 12.0, 16.0, 8.0, 11.0, 5.0, 7.0, 5.0, 1.0, 4.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007662773132324219, -0.0007448047399520874, -0.0007233321666717529, -0.0007018595933914185, -0.000680387020111084, -0.0006589144468307495, -0.000637441873550415, -0.0006159693002700806, -0.0005944967269897461, -0.0005730241537094116, -0.0005515515804290771, -0.0005300790071487427, -0.0005086064338684082, -0.00048713386058807373, -0.00046566128730773926, -0.0004441887140274048, -0.0004227161407470703, -0.00040124356746673584, -0.00037977099418640137, -0.0003582984209060669, -0.0003368258476257324, -0.00031535327434539795, -0.0002938807010650635, -0.000272408127784729, -0.00025093555450439453, -0.00022946298122406006, -0.00020799040794372559, -0.0001865178346633911, -0.00016504526138305664, -0.00014357268810272217, -0.0001221001148223877, -0.00010062754154205322, -7.915496826171875e-05, -5.768239498138428e-05, -3.6209821701049805e-05, -1.4737248420715332e-05, 6.735324859619141e-06, 2.8207898139953613e-05, 4.9680471420288086e-05, 7.115304470062256e-05, 9.262561798095703e-05, 0.0001140981912612915, 0.00013557076454162598, 0.00015704333782196045, 0.00017851591110229492, 0.0001999884843826294, 0.00022146105766296387, 0.00024293363094329834, 0.0002644062042236328, 0.0002858787775039673, 0.00030735135078430176, 0.00032882392406463623, 0.0003502964973449707, 0.0003717690706253052, 0.00039324164390563965, 0.0004147142171859741, 0.0004361867904663086, 0.00045765936374664307, 0.00047913193702697754, 0.000500604510307312, 0.0005220770835876465, 0.000543549656867981, 0.0005650222301483154, 0.0005864948034286499, 0.0006079673767089844]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 5.0, 8.0, 13.0, 10.0, 22.0, 21.0, 46.0, 53.0, 85.0, 154.0, 248.0, 455.0, 803.0, 1574.0, 3612.0, 9435.0, 35851.0, 206754.0, 594655.0, 152435.0, 27925.0, 8097.0, 3159.0, 1418.0, 696.0, 382.0, 227.0, 149.0, 76.0, 45.0, 54.0, 21.0, 16.0, 6.0, 12.0, 9.0, 9.0, 2.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.5546875, -14.0599365234375, -13.565185546875, -13.0704345703125, -12.57568359375, -12.0809326171875, -11.586181640625, -11.0914306640625, -10.5966796875, -10.1019287109375, -9.607177734375, -9.1124267578125, -8.61767578125, -8.1229248046875, -7.628173828125, -7.1334228515625, -6.638671875, -6.1439208984375, -5.649169921875, -5.1544189453125, -4.65966796875, -4.1649169921875, -3.670166015625, -3.1754150390625, -2.6806640625, -2.1859130859375, -1.691162109375, -1.1964111328125, -0.70166015625, -0.2069091796875, 0.287841796875, 0.7825927734375, 1.27734375, 1.7720947265625, 2.266845703125, 2.7615966796875, 3.25634765625, 3.7510986328125, 4.245849609375, 4.7406005859375, 5.2353515625, 5.7301025390625, 6.224853515625, 6.7196044921875, 7.21435546875, 7.7091064453125, 8.203857421875, 8.6986083984375, 9.193359375, 9.6881103515625, 10.182861328125, 10.6776123046875, 11.17236328125, 11.6671142578125, 12.161865234375, 12.6566162109375, 13.1513671875, 13.6461181640625, 14.140869140625, 14.6356201171875, 15.13037109375, 15.6251220703125, 16.119873046875, 16.6146240234375, 17.109375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 3.0, 10.0, 7.0, 21.0, 31.0, 46.0, 62.0, 71.0, 123.0, 142.0, 143.0, 95.0, 86.0, 58.0, 28.0, 29.0, 10.0, 8.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-12.578125, -12.2452392578125, -11.912353515625, -11.5794677734375, -11.24658203125, -10.9136962890625, -10.580810546875, -10.2479248046875, -9.9150390625, -9.5821533203125, -9.249267578125, -8.9163818359375, -8.58349609375, -8.2506103515625, -7.917724609375, -7.5848388671875, -7.251953125, -6.9190673828125, -6.586181640625, -6.2532958984375, -5.92041015625, -5.5875244140625, -5.254638671875, -4.9217529296875, -4.5888671875, -4.2559814453125, -3.923095703125, -3.5902099609375, -3.25732421875, -2.9244384765625, -2.591552734375, -2.2586669921875, -1.92578125, -1.5928955078125, -1.260009765625, -0.9271240234375, -0.59423828125, -0.2613525390625, 0.071533203125, 0.4044189453125, 0.7373046875, 1.0701904296875, 1.403076171875, 1.7359619140625, 2.06884765625, 2.4017333984375, 2.734619140625, 3.0675048828125, 3.400390625, 3.7332763671875, 4.066162109375, 4.3990478515625, 4.73193359375, 5.0648193359375, 5.397705078125, 5.7305908203125, 6.0634765625, 6.3963623046875, 6.729248046875, 7.0621337890625, 7.39501953125, 7.7279052734375, 8.060791015625, 8.3936767578125, 8.7265625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 18.0, 13.0, 55.0, 141.0, 245.0, 259.0, 165.0, 64.0, 23.0, 10.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.38150024414062, -152.00714111328125, -146.63279724121094, -141.25843811035156, -135.8840789794922, -130.5097198486328, -125.1353759765625, -119.76101684570312, -114.38665771484375, -109.0123062133789, -103.63794708251953, -98.26359558105469, -92.88923645019531, -87.51488494873047, -82.14053344726562, -76.76617431640625, -71.3918228149414, -66.01747131347656, -60.64311218261719, -55.268760681152344, -49.89440155029297, -44.520050048828125, -39.145694732666016, -33.771339416503906, -28.396984100341797, -23.022628784179688, -17.648273468017578, -12.273920059204102, -6.899564743041992, -1.5252094268798828, 3.8491439819335938, 9.223499298095703, 14.597854614257812, 19.972209930419922, 25.34656524658203, 30.720918655395508, 36.09527587890625, 41.469627380371094, 46.8439826965332, 52.21833801269531, 57.59269332885742, 62.96704864501953, 68.34140014648438, 73.71575927734375, 79.0901107788086, 84.46446990966797, 89.83882141113281, 95.21318054199219, 100.58753204345703, 105.96188354492188, 111.33624267578125, 116.7105941772461, 122.08495330810547, 127.45930480957031, 132.8336639404297, 138.2080078125, 143.58236694335938, 148.95672607421875, 154.33106994628906, 159.70542907714844, 165.0797882080078, 170.4541473388672, 175.8284912109375, 181.20285034179688, 186.57720947265625]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 6.0, 7.0, 10.0, 10.0, 16.0, 11.0, 19.0, 21.0, 28.0, 30.0, 43.0, 36.0, 39.0, 39.0, 46.0, 45.0, 54.0, 58.0, 48.0, 54.0, 52.0, 49.0, 36.0, 40.0, 42.0, 28.0, 17.0, 18.0, 16.0, 11.0, 14.0, 11.0, 11.0, 4.0, 9.0, 8.0, 5.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-67.77264404296875, -65.85935974121094, -63.94607162475586, -62.03278732299805, -60.119503021240234, -58.206214904785156, -56.292930603027344, -54.37964630126953, -52.46636199951172, -50.553077697753906, -48.63978958129883, -46.726505279541016, -44.8132209777832, -42.899932861328125, -40.98664855957031, -39.0733642578125, -37.16007614135742, -35.24679183959961, -33.33350372314453, -31.42021942138672, -29.506935119628906, -27.59364891052246, -25.680362701416016, -23.767078399658203, -21.853792190551758, -19.940505981445312, -18.0272216796875, -16.113935470581055, -14.200650215148926, -12.287364959716797, -10.374078750610352, -8.460793495178223, -6.547508239746094, -4.634222984313965, -2.7209372520446777, -0.8076515197753906, 1.1056337356567383, 3.018918991088867, 4.9322052001953125, 6.845490455627441, 8.75877571105957, 10.6720609664917, 12.585346221923828, 14.498632431030273, 16.41191864013672, 18.32520294189453, 20.238489151000977, 22.151775360107422, 24.065059661865234, 25.97834587097168, 27.891630172729492, 29.804916381835938, 31.71820068359375, 33.63148498535156, 35.54477310180664, 37.45805740356445, 39.37134552001953, 41.284629821777344, 43.19791793823242, 45.111202239990234, 47.02448654174805, 48.937774658203125, 50.85105895996094, 52.76434326171875, 54.67762756347656]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 8.0, 13.0, 18.0, 26.0, 38.0, 43.0, 74.0, 108.0, 191.0, 364.0, 827.0, 2145.0, 6733.0, 29652.0, 333826.0, 3724411.0, 76079.0, 13479.0, 3828.0, 1264.0, 487.0, 239.0, 131.0, 95.0, 72.0, 33.0, 28.0, 16.0, 16.0, 14.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.71875, -28.58642578125, -27.4541015625, -26.32177734375, -25.189453125, -24.05712890625, -22.9248046875, -21.79248046875, -20.66015625, -19.52783203125, -18.3955078125, -17.26318359375, -16.130859375, -14.99853515625, -13.8662109375, -12.73388671875, -11.6015625, -10.46923828125, -9.3369140625, -8.20458984375, -7.072265625, -5.93994140625, -4.8076171875, -3.67529296875, -2.54296875, -1.41064453125, -0.2783203125, 0.85400390625, 1.986328125, 3.11865234375, 4.2509765625, 5.38330078125, 6.515625, 7.64794921875, 8.7802734375, 9.91259765625, 11.044921875, 12.17724609375, 13.3095703125, 14.44189453125, 15.57421875, 16.70654296875, 17.8388671875, 18.97119140625, 20.103515625, 21.23583984375, 22.3681640625, 23.50048828125, 24.6328125, 25.76513671875, 26.8974609375, 28.02978515625, 29.162109375, 30.29443359375, 31.4267578125, 32.55908203125, 33.69140625, 34.82373046875, 35.9560546875, 37.08837890625, 38.220703125, 39.35302734375, 40.4853515625, 41.61767578125, 42.75]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 5.0, 16.0, 28.0, 30.0, 21.0, 25.0, 39.0, 54.0, 68.0, 59.0, 71.0, 70.0, 70.0, 61.0, 74.0, 54.0, 50.0, 37.0, 38.0, 31.0, 22.0, 13.0, 15.0, 11.0, 9.0, 10.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.53515625, -2.458465576171875, -2.38177490234375, -2.305084228515625, -2.2283935546875, -2.151702880859375, -2.07501220703125, -1.998321533203125, -1.921630859375, -1.844940185546875, -1.76824951171875, -1.691558837890625, -1.6148681640625, -1.538177490234375, -1.46148681640625, -1.384796142578125, -1.30810546875, -1.231414794921875, -1.15472412109375, -1.078033447265625, -1.0013427734375, -0.924652099609375, -0.84796142578125, -0.771270751953125, -0.694580078125, -0.617889404296875, -0.54119873046875, -0.464508056640625, -0.3878173828125, -0.311126708984375, -0.23443603515625, -0.157745361328125, -0.0810546875, -0.004364013671875, 0.07232666015625, 0.149017333984375, 0.2257080078125, 0.302398681640625, 0.37908935546875, 0.455780029296875, 0.532470703125, 0.609161376953125, 0.68585205078125, 0.762542724609375, 0.8392333984375, 0.915924072265625, 0.99261474609375, 1.069305419921875, 1.14599609375, 1.222686767578125, 1.29937744140625, 1.376068115234375, 1.4527587890625, 1.529449462890625, 1.60614013671875, 1.682830810546875, 1.759521484375, 1.836212158203125, 1.91290283203125, 1.989593505859375, 2.0662841796875, 2.142974853515625, 2.21966552734375, 2.296356201171875, 2.373046875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 3.0, 8.0, 8.0, 10.0, 6.0, 13.0, 13.0, 17.0, 16.0, 24.0, 20.0, 19.0, 43.0, 58.0, 95.0, 204.0, 404.0, 957.0, 2876.0, 9986.0, 46851.0, 523579.0, 3451449.0, 128880.0, 20852.0, 5175.0, 1508.0, 595.0, 261.0, 109.0, 53.0, 48.0, 20.0, 14.0, 13.0, 22.0, 11.0, 23.0, 11.0, 6.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.3125, -26.465576171875, -25.61865234375, -24.771728515625, -23.9248046875, -23.077880859375, -22.23095703125, -21.384033203125, -20.537109375, -19.690185546875, -18.84326171875, -17.996337890625, -17.1494140625, -16.302490234375, -15.45556640625, -14.608642578125, -13.76171875, -12.914794921875, -12.06787109375, -11.220947265625, -10.3740234375, -9.527099609375, -8.68017578125, -7.833251953125, -6.986328125, -6.139404296875, -5.29248046875, -4.445556640625, -3.5986328125, -2.751708984375, -1.90478515625, -1.057861328125, -0.2109375, 0.635986328125, 1.48291015625, 2.329833984375, 3.1767578125, 4.023681640625, 4.87060546875, 5.717529296875, 6.564453125, 7.411376953125, 8.25830078125, 9.105224609375, 9.9521484375, 10.799072265625, 11.64599609375, 12.492919921875, 13.33984375, 14.186767578125, 15.03369140625, 15.880615234375, 16.7275390625, 17.574462890625, 18.42138671875, 19.268310546875, 20.115234375, 20.962158203125, 21.80908203125, 22.656005859375, 23.5029296875, 24.349853515625, 25.19677734375, 26.043701171875, 26.890625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 7.0, 10.0, 13.0, 21.0, 26.0, 50.0, 81.0, 156.0, 303.0, 1178.0, 1425.0, 370.0, 166.0, 107.0, 58.0, 26.0, 28.0, 14.0, 11.0, 9.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.5078125, -9.301239013671875, -9.09466552734375, -8.888092041015625, -8.6815185546875, -8.474945068359375, -8.26837158203125, -8.061798095703125, -7.855224609375, -7.648651123046875, -7.44207763671875, -7.235504150390625, -7.0289306640625, -6.822357177734375, -6.61578369140625, -6.409210205078125, -6.20263671875, -5.996063232421875, -5.78948974609375, -5.582916259765625, -5.3763427734375, -5.169769287109375, -4.96319580078125, -4.756622314453125, -4.550048828125, -4.343475341796875, -4.13690185546875, -3.930328369140625, -3.7237548828125, -3.517181396484375, -3.31060791015625, -3.104034423828125, -2.8974609375, -2.690887451171875, -2.48431396484375, -2.277740478515625, -2.0711669921875, -1.864593505859375, -1.65802001953125, -1.451446533203125, -1.244873046875, -1.038299560546875, -0.83172607421875, -0.625152587890625, -0.4185791015625, -0.212005615234375, -0.00543212890625, 0.201141357421875, 0.40771484375, 0.614288330078125, 0.82086181640625, 1.027435302734375, 1.2340087890625, 1.440582275390625, 1.64715576171875, 1.853729248046875, 2.060302734375, 2.266876220703125, 2.47344970703125, 2.680023193359375, 2.8865966796875, 3.093170166015625, 3.29974365234375, 3.506317138671875, 3.712890625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 11.0, 18.0, 54.0, 170.0, 372.0, 283.0, 70.0, 23.0, 5.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-149.37835693359375, -146.6397705078125, -143.90118408203125, -141.16259765625, -138.4239959716797, -135.68540954589844, -132.9468231201172, -130.20823669433594, -127.46965026855469, -124.73106384277344, -121.99246978759766, -119.2538833618164, -116.51529693603516, -113.77670288085938, -111.03811645507812, -108.29953002929688, -105.5609359741211, -102.82234954833984, -100.08375549316406, -97.34516906738281, -94.60658264160156, -91.86799621582031, -89.12940216064453, -86.39081573486328, -83.6522216796875, -80.91363525390625, -78.17504119873047, -75.43645477294922, -72.69786834716797, -69.95927429199219, -67.22068786621094, -64.48210144042969, -61.74351501464844, -59.00492477416992, -56.26633834838867, -53.527748107910156, -50.789161682128906, -48.05057144165039, -45.311981201171875, -42.573394775390625, -39.83480453491211, -37.096214294433594, -34.357627868652344, -31.619037628173828, -28.880449295043945, -26.141860961914062, -23.403270721435547, -20.664682388305664, -17.92609405517578, -15.187505722045898, -12.4489164352417, -9.7103271484375, -6.971738815307617, -4.233150482177734, -1.4945602416992188, 1.244028091430664, 3.982616424560547, 6.721205234527588, 9.459794044494629, 12.198383331298828, 14.936971664428711, 17.675559997558594, 20.41415023803711, 23.152738571166992, 25.891326904296875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 7.0, 7.0, 8.0, 12.0, 16.0, 43.0, 46.0, 64.0, 74.0, 68.0, 75.0, 90.0, 82.0, 101.0, 82.0, 73.0, 41.0, 25.0, 35.0, 17.0, 13.0, 14.0, 4.0, 7.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-41.807220458984375, -40.90155029296875, -39.99587631225586, -39.090206146240234, -38.184532165527344, -37.27886199951172, -36.37318801879883, -35.4675178527832, -34.56184387207031, -33.65617370605469, -32.7504997253418, -31.84482765197754, -30.93915557861328, -30.033483505249023, -29.127811431884766, -28.22214126586914, -27.316469192504883, -26.410797119140625, -25.505125045776367, -24.59945297241211, -23.69378089904785, -22.788108825683594, -21.88243865966797, -20.976764678955078, -20.071094512939453, -19.165422439575195, -18.259750366210938, -17.35407829284668, -16.448406219482422, -15.542734146118164, -14.637063026428223, -13.731390953063965, -12.82571792602539, -11.920045852661133, -11.014373779296875, -10.108701705932617, -9.20302963256836, -8.297357559204102, -7.39168643951416, -6.486014366149902, -5.5803422927856445, -4.674670219421387, -3.768998384475708, -2.8633265495300293, -1.9576544761657715, -1.0519824028015137, -0.14631080627441406, 0.7593612670898438, 1.6650333404541016, 2.5707054138183594, 3.476377248764038, 4.382049083709717, 5.287721157073975, 6.193393230438232, 7.099064826965332, 8.00473690032959, 8.910408973693848, 9.816081047058105, 10.721753120422363, 11.627424240112305, 12.533096313476562, 13.43876838684082, 14.344440460205078, 15.250112533569336, 16.155784606933594]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 2.0, 5.0, 3.0, 8.0, 14.0, 21.0, 28.0, 39.0, 49.0, 75.0, 99.0, 180.0, 249.0, 413.0, 749.0, 1354.0, 2557.0, 5375.0, 12235.0, 33650.0, 106745.0, 305304.0, 363269.0, 142258.0, 44814.0, 15650.0, 6502.0, 3149.0, 1548.0, 832.0, 493.0, 296.0, 194.0, 105.0, 104.0, 59.0, 40.0, 27.0, 20.0, 13.0, 8.0, 10.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.9609375, -11.588623046875, -11.21630859375, -10.843994140625, -10.4716796875, -10.099365234375, -9.72705078125, -9.354736328125, -8.982421875, -8.610107421875, -8.23779296875, -7.865478515625, -7.4931640625, -7.120849609375, -6.74853515625, -6.376220703125, -6.00390625, -5.631591796875, -5.25927734375, -4.886962890625, -4.5146484375, -4.142333984375, -3.77001953125, -3.397705078125, -3.025390625, -2.653076171875, -2.28076171875, -1.908447265625, -1.5361328125, -1.163818359375, -0.79150390625, -0.419189453125, -0.046875, 0.325439453125, 0.69775390625, 1.070068359375, 1.4423828125, 1.814697265625, 2.18701171875, 2.559326171875, 2.931640625, 3.303955078125, 3.67626953125, 4.048583984375, 4.4208984375, 4.793212890625, 5.16552734375, 5.537841796875, 5.91015625, 6.282470703125, 6.65478515625, 7.027099609375, 7.3994140625, 7.771728515625, 8.14404296875, 8.516357421875, 8.888671875, 9.260986328125, 9.63330078125, 10.005615234375, 10.3779296875, 10.750244140625, 11.12255859375, 11.494873046875, 11.8671875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 12.0, 15.0, 22.0, 27.0, 39.0, 46.0, 72.0, 66.0, 87.0, 72.0, 81.0, 70.0, 75.0, 69.0, 60.0, 49.0, 32.0, 38.0, 16.0, 19.0, 9.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.974609375, -2.88592529296875, -2.7972412109375, -2.70855712890625, -2.619873046875, -2.53118896484375, -2.4425048828125, -2.35382080078125, -2.26513671875, -2.17645263671875, -2.0877685546875, -1.99908447265625, -1.910400390625, -1.82171630859375, -1.7330322265625, -1.64434814453125, -1.5556640625, -1.46697998046875, -1.3782958984375, -1.28961181640625, -1.200927734375, -1.11224365234375, -1.0235595703125, -0.93487548828125, -0.84619140625, -0.75750732421875, -0.6688232421875, -0.58013916015625, -0.491455078125, -0.40277099609375, -0.3140869140625, -0.22540283203125, -0.13671875, -0.04803466796875, 0.0406494140625, 0.12933349609375, 0.218017578125, 0.30670166015625, 0.3953857421875, 0.48406982421875, 0.57275390625, 0.66143798828125, 0.7501220703125, 0.83880615234375, 0.927490234375, 1.01617431640625, 1.1048583984375, 1.19354248046875, 1.2822265625, 1.37091064453125, 1.4595947265625, 1.54827880859375, 1.636962890625, 1.72564697265625, 1.8143310546875, 1.90301513671875, 1.99169921875, 2.08038330078125, 2.1690673828125, 2.25775146484375, 2.346435546875, 2.43511962890625, 2.5238037109375, 2.61248779296875, 2.701171875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 14.0, 13.0, 27.0, 19.0, 42.0, 47.0, 74.0, 93.0, 125.0, 165.0, 294.0, 476.0, 912.0, 1831.0, 5178.0, 16884.0, 66197.0, 270711.0, 467689.0, 162084.0, 38509.0, 10481.0, 3362.0, 1384.0, 704.0, 378.0, 263.0, 183.0, 121.0, 81.0, 56.0, 45.0, 24.0, 23.0, 15.0, 14.0, 7.0, 8.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.046875, -13.637451171875, -13.22802734375, -12.818603515625, -12.4091796875, -11.999755859375, -11.59033203125, -11.180908203125, -10.771484375, -10.362060546875, -9.95263671875, -9.543212890625, -9.1337890625, -8.724365234375, -8.31494140625, -7.905517578125, -7.49609375, -7.086669921875, -6.67724609375, -6.267822265625, -5.8583984375, -5.448974609375, -5.03955078125, -4.630126953125, -4.220703125, -3.811279296875, -3.40185546875, -2.992431640625, -2.5830078125, -2.173583984375, -1.76416015625, -1.354736328125, -0.9453125, -0.535888671875, -0.12646484375, 0.282958984375, 0.6923828125, 1.101806640625, 1.51123046875, 1.920654296875, 2.330078125, 2.739501953125, 3.14892578125, 3.558349609375, 3.9677734375, 4.377197265625, 4.78662109375, 5.196044921875, 5.60546875, 6.014892578125, 6.42431640625, 6.833740234375, 7.2431640625, 7.652587890625, 8.06201171875, 8.471435546875, 8.880859375, 9.290283203125, 9.69970703125, 10.109130859375, 10.5185546875, 10.927978515625, 11.33740234375, 11.746826171875, 12.15625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 0.0, 2.0, 7.0, 4.0, 7.0, 6.0, 10.0, 7.0, 10.0, 15.0, 12.0, 28.0, 21.0, 29.0, 44.0, 42.0, 32.0, 33.0, 29.0, 38.0, 47.0, 43.0, 45.0, 48.0, 44.0, 34.0, 37.0, 46.0, 42.0, 37.0, 18.0, 29.0, 26.0, 15.0, 25.0, 13.0, 12.0, 11.0, 13.0, 9.0, 7.0, 6.0, 3.0, 4.0, 3.0, 1.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-7.84375, -7.6044921875, -7.365234375, -7.1259765625, -6.88671875, -6.6474609375, -6.408203125, -6.1689453125, -5.9296875, -5.6904296875, -5.451171875, -5.2119140625, -4.97265625, -4.7333984375, -4.494140625, -4.2548828125, -4.015625, -3.7763671875, -3.537109375, -3.2978515625, -3.05859375, -2.8193359375, -2.580078125, -2.3408203125, -2.1015625, -1.8623046875, -1.623046875, -1.3837890625, -1.14453125, -0.9052734375, -0.666015625, -0.4267578125, -0.1875, 0.0517578125, 0.291015625, 0.5302734375, 0.76953125, 1.0087890625, 1.248046875, 1.4873046875, 1.7265625, 1.9658203125, 2.205078125, 2.4443359375, 2.68359375, 2.9228515625, 3.162109375, 3.4013671875, 3.640625, 3.8798828125, 4.119140625, 4.3583984375, 4.59765625, 4.8369140625, 5.076171875, 5.3154296875, 5.5546875, 5.7939453125, 6.033203125, 6.2724609375, 6.51171875, 6.7509765625, 6.990234375, 7.2294921875, 7.46875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 3.0, 3.0, 2.0, 7.0, 12.0, 14.0, 18.0, 27.0, 40.0, 98.0, 131.0, 210.0, 383.0, 658.0, 1254.0, 3059.0, 9016.0, 37338.0, 233581.0, 585218.0, 141699.0, 24450.0, 6430.0, 2387.0, 1103.0, 566.0, 305.0, 205.0, 120.0, 75.0, 44.0, 29.0, 23.0, 20.0, 4.0, 4.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3203125, -9.023193359375, -8.72607421875, -8.428955078125, -8.1318359375, -7.834716796875, -7.53759765625, -7.240478515625, -6.943359375, -6.646240234375, -6.34912109375, -6.052001953125, -5.7548828125, -5.457763671875, -5.16064453125, -4.863525390625, -4.56640625, -4.269287109375, -3.97216796875, -3.675048828125, -3.3779296875, -3.080810546875, -2.78369140625, -2.486572265625, -2.189453125, -1.892333984375, -1.59521484375, -1.298095703125, -1.0009765625, -0.703857421875, -0.40673828125, -0.109619140625, 0.1875, 0.484619140625, 0.78173828125, 1.078857421875, 1.3759765625, 1.673095703125, 1.97021484375, 2.267333984375, 2.564453125, 2.861572265625, 3.15869140625, 3.455810546875, 3.7529296875, 4.050048828125, 4.34716796875, 4.644287109375, 4.94140625, 5.238525390625, 5.53564453125, 5.832763671875, 6.1298828125, 6.427001953125, 6.72412109375, 7.021240234375, 7.318359375, 7.615478515625, 7.91259765625, 8.209716796875, 8.5068359375, 8.803955078125, 9.10107421875, 9.398193359375, 9.6953125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 5.0, 1.0, 2.0, 4.0, 8.0, 6.0, 11.0, 9.0, 8.0, 18.0, 10.0, 20.0, 26.0, 37.0, 44.0, 52.0, 50.0, 67.0, 84.0, 94.0, 89.0, 73.0, 59.0, 33.0, 30.0, 32.0, 18.0, 31.0, 17.0, 10.0, 10.0, 9.0, 8.0, 12.0, 6.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0005640983581542969, -0.0005454421043395996, -0.0005267858505249023, -0.0005081295967102051, -0.0004894733428955078, -0.00047081708908081055, -0.0004521608352661133, -0.000433504581451416, -0.00041484832763671875, -0.0003961920738220215, -0.0003775358200073242, -0.00035887956619262695, -0.0003402233123779297, -0.0003215670585632324, -0.00030291080474853516, -0.0002842545509338379, -0.0002655982971191406, -0.00024694204330444336, -0.0002282857894897461, -0.00020962953567504883, -0.00019097328186035156, -0.0001723170280456543, -0.00015366077423095703, -0.00013500452041625977, -0.0001163482666015625, -9.769201278686523e-05, -7.903575897216797e-05, -6.03795051574707e-05, -4.172325134277344e-05, -2.3066997528076172e-05, -4.410743713378906e-06, 1.424551010131836e-05, 3.2901763916015625e-05, 5.155801773071289e-05, 7.021427154541016e-05, 8.887052536010742e-05, 0.00010752677917480469, 0.00012618303298950195, 0.00014483928680419922, 0.00016349554061889648, 0.00018215179443359375, 0.00020080804824829102, 0.00021946430206298828, 0.00023812055587768555, 0.0002567768096923828, 0.0002754330635070801, 0.00029408931732177734, 0.0003127455711364746, 0.0003314018249511719, 0.00035005807876586914, 0.0003687143325805664, 0.00038737058639526367, 0.00040602684020996094, 0.0004246830940246582, 0.00044333934783935547, 0.00046199560165405273, 0.00048065185546875, 0.0004993081092834473, 0.0005179643630981445, 0.0005366206169128418, 0.0005552768707275391, 0.0005739331245422363, 0.0005925893783569336, 0.0006112456321716309, 0.0006299018859863281]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 10.0, 9.0, 12.0, 14.0, 18.0, 26.0, 23.0, 58.0, 78.0, 139.0, 228.0, 435.0, 924.0, 1962.0, 5690.0, 21629.0, 134753.0, 670496.0, 175255.0, 25771.0, 6590.0, 2290.0, 959.0, 433.0, 265.0, 165.0, 111.0, 57.0, 38.0, 34.0, 23.0, 15.0, 10.0, 13.0, 6.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-16.28125, -15.8590087890625, -15.436767578125, -15.0145263671875, -14.59228515625, -14.1700439453125, -13.747802734375, -13.3255615234375, -12.9033203125, -12.4810791015625, -12.058837890625, -11.6365966796875, -11.21435546875, -10.7921142578125, -10.369873046875, -9.9476318359375, -9.525390625, -9.1031494140625, -8.680908203125, -8.2586669921875, -7.83642578125, -7.4141845703125, -6.991943359375, -6.5697021484375, -6.1474609375, -5.7252197265625, -5.302978515625, -4.8807373046875, -4.45849609375, -4.0362548828125, -3.614013671875, -3.1917724609375, -2.76953125, -2.3472900390625, -1.925048828125, -1.5028076171875, -1.08056640625, -0.6583251953125, -0.236083984375, 0.1861572265625, 0.6083984375, 1.0306396484375, 1.452880859375, 1.8751220703125, 2.29736328125, 2.7196044921875, 3.141845703125, 3.5640869140625, 3.986328125, 4.4085693359375, 4.830810546875, 5.2530517578125, 5.67529296875, 6.0975341796875, 6.519775390625, 6.9420166015625, 7.3642578125, 7.7864990234375, 8.208740234375, 8.6309814453125, 9.05322265625, 9.4754638671875, 9.897705078125, 10.3199462890625, 10.7421875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 10.0, 6.0, 5.0, 14.0, 25.0, 27.0, 39.0, 40.0, 61.0, 55.0, 94.0, 115.0, 91.0, 92.0, 85.0, 61.0, 45.0, 35.0, 24.0, 16.0, 17.0, 15.0, 5.0, 8.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5078125, -5.2772216796875, -5.046630859375, -4.8160400390625, -4.58544921875, -4.3548583984375, -4.124267578125, -3.8936767578125, -3.6630859375, -3.4324951171875, -3.201904296875, -2.9713134765625, -2.74072265625, -2.5101318359375, -2.279541015625, -2.0489501953125, -1.818359375, -1.5877685546875, -1.357177734375, -1.1265869140625, -0.89599609375, -0.6654052734375, -0.434814453125, -0.2042236328125, 0.0263671875, 0.2569580078125, 0.487548828125, 0.7181396484375, 0.94873046875, 1.1793212890625, 1.409912109375, 1.6405029296875, 1.87109375, 2.1016845703125, 2.332275390625, 2.5628662109375, 2.79345703125, 3.0240478515625, 3.254638671875, 3.4852294921875, 3.7158203125, 3.9464111328125, 4.177001953125, 4.4075927734375, 4.63818359375, 4.8687744140625, 5.099365234375, 5.3299560546875, 5.560546875, 5.7911376953125, 6.021728515625, 6.2523193359375, 6.48291015625, 6.7135009765625, 6.944091796875, 7.1746826171875, 7.4052734375, 7.6358642578125, 7.866455078125, 8.0970458984375, 8.32763671875, 8.5582275390625, 8.788818359375, 9.0194091796875, 9.25]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 5.0, 7.0, 8.0, 17.0, 42.0, 116.0, 151.0, 231.0, 163.0, 116.0, 69.0, 22.0, 25.0, 16.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.38772583007812, -120.80936431884766, -117.23101043701172, -113.65264892578125, -110.07429504394531, -106.49593353271484, -102.91757202148438, -99.33921813964844, -95.76085662841797, -92.1824951171875, -88.60414123535156, -85.0257797241211, -81.44741821289062, -77.86906433105469, -74.29070281982422, -70.71234130859375, -67.13398742675781, -63.55562973022461, -59.977272033691406, -56.39891052246094, -52.820552825927734, -49.24219512939453, -45.66383361816406, -42.08547592163086, -38.507118225097656, -34.92876052856445, -31.350400924682617, -27.77204132080078, -24.193683624267578, -20.615325927734375, -17.03696632385254, -13.458606719970703, -9.880256652832031, -6.301898002624512, -2.723539352416992, 0.8548192977905273, 4.433177947998047, 8.01153564453125, 11.589895248413086, 15.168254852294922, 18.746612548828125, 22.324970245361328, 25.903329849243164, 29.481689453125, 33.0600471496582, 36.638404846191406, 40.216766357421875, 43.79512405395508, 47.37348175048828, 50.951839447021484, 54.53019714355469, 58.108558654785156, 61.68691635131836, 65.26527404785156, 68.84363555908203, 72.4219970703125, 76.00035095214844, 79.5787124633789, 83.15706634521484, 86.73542785644531, 90.31378173828125, 93.89214324951172, 97.47050476074219, 101.04885864257812, 104.6272201538086]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 7.0, 12.0, 7.0, 10.0, 8.0, 14.0, 23.0, 26.0, 17.0, 29.0, 28.0, 31.0, 42.0, 32.0, 54.0, 56.0, 52.0, 45.0, 52.0, 41.0, 35.0, 48.0, 48.0, 38.0, 33.0, 27.0, 27.0, 27.0, 24.0, 12.0, 15.0, 11.0, 15.0, 9.0, 8.0, 9.0, 6.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-57.3864631652832, -55.79595947265625, -54.20545196533203, -52.61494827270508, -51.024444580078125, -49.433937072753906, -47.84343338012695, -46.2529296875, -44.66242218017578, -43.07191848754883, -41.48141098022461, -39.890907287597656, -38.3004035949707, -36.709896087646484, -35.11939239501953, -33.52888488769531, -31.938383102416992, -30.347877502441406, -28.757373809814453, -27.166868209838867, -25.57636260986328, -23.985858917236328, -22.395353317260742, -20.804847717285156, -19.214344024658203, -17.623838424682617, -16.033334732055664, -14.442829132080078, -12.852323532104492, -11.261818885803223, -9.671314239501953, -8.080808639526367, -6.490303039550781, -4.8997979164123535, -3.309293031692505, -1.7187881469726562, -0.12828302383422852, 1.4622220993041992, 3.0527267456054688, 4.643232345581055, 6.233736991882324, 7.824242115020752, 9.41474723815918, 11.00525188446045, 12.595756530761719, 14.186262130737305, 15.776766777038574, 17.367271423339844, 18.95777702331543, 20.548282623291016, 22.13878631591797, 23.729291915893555, 25.31979751586914, 26.910301208496094, 28.50080680847168, 30.091312408447266, 31.68181610107422, 33.27231979370117, 34.86282730102539, 36.453330993652344, 38.0438346862793, 39.634342193603516, 41.22484588623047, 42.81535339355469, 44.40585708618164]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 4.0, 7.0, 6.0, 6.0, 6.0, 13.0, 20.0, 23.0, 37.0, 34.0, 72.0, 118.0, 211.0, 329.0, 537.0, 844.0, 1803.0, 3876.0, 9161.0, 27830.0, 140349.0, 3661536.0, 284149.0, 40863.0, 12293.0, 4982.0, 2297.0, 1194.0, 621.0, 365.0, 238.0, 161.0, 77.0, 61.0, 42.0, 37.0, 22.0, 12.0, 9.0, 8.0, 6.0, 11.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.8984375, -14.3782958984375, -13.858154296875, -13.3380126953125, -12.81787109375, -12.2977294921875, -11.777587890625, -11.2574462890625, -10.7373046875, -10.2171630859375, -9.697021484375, -9.1768798828125, -8.65673828125, -8.1365966796875, -7.616455078125, -7.0963134765625, -6.576171875, -6.0560302734375, -5.535888671875, -5.0157470703125, -4.49560546875, -3.9754638671875, -3.455322265625, -2.9351806640625, -2.4150390625, -1.8948974609375, -1.374755859375, -0.8546142578125, -0.33447265625, 0.1856689453125, 0.705810546875, 1.2259521484375, 1.74609375, 2.2662353515625, 2.786376953125, 3.3065185546875, 3.82666015625, 4.3468017578125, 4.866943359375, 5.3870849609375, 5.9072265625, 6.4273681640625, 6.947509765625, 7.4676513671875, 7.98779296875, 8.5079345703125, 9.028076171875, 9.5482177734375, 10.068359375, 10.5885009765625, 11.108642578125, 11.6287841796875, 12.14892578125, 12.6690673828125, 13.189208984375, 13.7093505859375, 14.2294921875, 14.7496337890625, 15.269775390625, 15.7899169921875, 16.31005859375, 16.8302001953125, 17.350341796875, 17.8704833984375, 18.390625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 16.0, 18.0, 22.0, 33.0, 40.0, 64.0, 64.0, 71.0, 92.0, 91.0, 72.0, 85.0, 69.0, 66.0, 57.0, 40.0, 30.0, 23.0, 10.0, 14.0, 9.0, 3.0, 3.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.310546875, -3.212921142578125, -3.11529541015625, -3.017669677734375, -2.9200439453125, -2.822418212890625, -2.72479248046875, -2.627166748046875, -2.529541015625, -2.431915283203125, -2.33428955078125, -2.236663818359375, -2.1390380859375, -2.041412353515625, -1.94378662109375, -1.846160888671875, -1.74853515625, -1.650909423828125, -1.55328369140625, -1.455657958984375, -1.3580322265625, -1.260406494140625, -1.16278076171875, -1.065155029296875, -0.967529296875, -0.869903564453125, -0.77227783203125, -0.674652099609375, -0.5770263671875, -0.479400634765625, -0.38177490234375, -0.284149169921875, -0.1865234375, -0.088897705078125, 0.00872802734375, 0.106353759765625, 0.2039794921875, 0.301605224609375, 0.39923095703125, 0.496856689453125, 0.594482421875, 0.692108154296875, 0.78973388671875, 0.887359619140625, 0.9849853515625, 1.082611083984375, 1.18023681640625, 1.277862548828125, 1.37548828125, 1.473114013671875, 1.57073974609375, 1.668365478515625, 1.7659912109375, 1.863616943359375, 1.96124267578125, 2.058868408203125, 2.156494140625, 2.254119873046875, 2.35174560546875, 2.449371337890625, 2.5469970703125, 2.644622802734375, 2.74224853515625, 2.839874267578125, 2.9375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 4.0, 5.0, 10.0, 15.0, 12.0, 29.0, 32.0, 45.0, 83.0, 110.0, 128.0, 200.0, 341.0, 581.0, 981.0, 1707.0, 3121.0, 6209.0, 13646.0, 34934.0, 116352.0, 836136.0, 2885560.0, 208411.0, 51281.0, 17801.0, 7933.0, 3803.0, 1908.0, 1134.0, 654.0, 399.0, 242.0, 161.0, 84.0, 78.0, 56.0, 32.0, 30.0, 14.0, 10.0, 4.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0], "bins": [-13.3828125, -13.0323486328125, -12.681884765625, -12.3314208984375, -11.98095703125, -11.6304931640625, -11.280029296875, -10.9295654296875, -10.5791015625, -10.2286376953125, -9.878173828125, -9.5277099609375, -9.17724609375, -8.8267822265625, -8.476318359375, -8.1258544921875, -7.775390625, -7.4249267578125, -7.074462890625, -6.7239990234375, -6.37353515625, -6.0230712890625, -5.672607421875, -5.3221435546875, -4.9716796875, -4.6212158203125, -4.270751953125, -3.9202880859375, -3.56982421875, -3.2193603515625, -2.868896484375, -2.5184326171875, -2.16796875, -1.8175048828125, -1.467041015625, -1.1165771484375, -0.76611328125, -0.4156494140625, -0.065185546875, 0.2852783203125, 0.6357421875, 0.9862060546875, 1.336669921875, 1.6871337890625, 2.03759765625, 2.3880615234375, 2.738525390625, 3.0889892578125, 3.439453125, 3.7899169921875, 4.140380859375, 4.4908447265625, 4.84130859375, 5.1917724609375, 5.542236328125, 5.8927001953125, 6.2431640625, 6.5936279296875, 6.944091796875, 7.2945556640625, 7.64501953125, 7.9954833984375, 8.345947265625, 8.6964111328125, 9.046875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 6.0, 4.0, 5.0, 9.0, 10.0, 5.0, 8.0, 29.0, 38.0, 54.0, 71.0, 126.0, 308.0, 751.0, 1729.0, 461.0, 203.0, 96.0, 49.0, 33.0, 21.0, 17.0, 14.0, 5.0, 10.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.71875, -5.569244384765625, -5.41973876953125, -5.270233154296875, -5.1207275390625, -4.971221923828125, -4.82171630859375, -4.672210693359375, -4.522705078125, -4.373199462890625, -4.22369384765625, -4.074188232421875, -3.9246826171875, -3.775177001953125, -3.62567138671875, -3.476165771484375, -3.32666015625, -3.177154541015625, -3.02764892578125, -2.878143310546875, -2.7286376953125, -2.579132080078125, -2.42962646484375, -2.280120849609375, -2.130615234375, -1.981109619140625, -1.83160400390625, -1.682098388671875, -1.5325927734375, -1.383087158203125, -1.23358154296875, -1.084075927734375, -0.9345703125, -0.785064697265625, -0.63555908203125, -0.486053466796875, -0.3365478515625, -0.187042236328125, -0.03753662109375, 0.111968994140625, 0.261474609375, 0.410980224609375, 0.56048583984375, 0.709991455078125, 0.8594970703125, 1.009002685546875, 1.15850830078125, 1.308013916015625, 1.45751953125, 1.607025146484375, 1.75653076171875, 1.906036376953125, 2.0555419921875, 2.205047607421875, 2.35455322265625, 2.504058837890625, 2.653564453125, 2.803070068359375, 2.95257568359375, 3.102081298828125, 3.2515869140625, 3.401092529296875, 3.55059814453125, 3.700103759765625, 3.849609375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 3.0, 11.0, 41.0, 88.0, 208.0, 296.0, 212.0, 101.0, 32.0, 12.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-90.55015563964844, -88.82869720458984, -87.10724639892578, -85.38578796386719, -83.66433715820312, -81.94287872314453, -80.22142791748047, -78.49996948242188, -76.77851867675781, -75.05706024169922, -73.33560943603516, -71.61415100097656, -69.8927001953125, -68.1712417602539, -66.44979095458984, -64.72833251953125, -63.00687789916992, -61.285423278808594, -59.563968658447266, -57.84251403808594, -56.12105941772461, -54.39960479736328, -52.67814636230469, -50.956695556640625, -49.23523712158203, -47.5137825012207, -45.792327880859375, -44.07087326049805, -42.34941864013672, -40.62796401977539, -38.90650939941406, -37.18505096435547, -35.46359634399414, -33.74214172363281, -32.020687103271484, -30.299232482910156, -28.577777862548828, -26.8563232421875, -25.13486671447754, -23.41341209411621, -21.691957473754883, -19.970502853393555, -18.249048233032227, -16.527591705322266, -14.806138038635254, -13.084683418273926, -11.363227844238281, -9.641773223876953, -7.920318603515625, -6.198863983154297, -4.4774088859558105, -2.755953788757324, -1.034499168395996, 0.686955451965332, 2.4084110260009766, 4.129865646362305, 5.851320266723633, 7.572774887084961, 9.294229507446289, 11.015685081481934, 12.737139701843262, 14.45859432220459, 16.180049896240234, 17.901504516601562, 19.62295913696289]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 8.0, 8.0, 11.0, 9.0, 17.0, 16.0, 24.0, 17.0, 25.0, 38.0, 33.0, 40.0, 43.0, 37.0, 39.0, 53.0, 59.0, 41.0, 55.0, 38.0, 53.0, 44.0, 36.0, 39.0, 37.0, 26.0, 19.0, 18.0, 18.0, 16.0, 17.0, 10.0, 11.0, 9.0, 8.0, 5.0, 4.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.817390441894531, -14.38209056854248, -13.94679069519043, -13.511490821838379, -13.076190948486328, -12.640891075134277, -12.205591201782227, -11.770292282104492, -11.334991455078125, -10.899691581726074, -10.464391708374023, -10.029091835021973, -9.593791961669922, -9.158492088317871, -8.72319221496582, -8.287893295288086, -7.852593421936035, -7.417293548583984, -6.981993675231934, -6.546693801879883, -6.111393928527832, -5.676094055175781, -5.240794658660889, -4.805494785308838, -4.370194911956787, -3.9348950386047363, -3.4995951652526855, -3.064295530319214, -2.628995656967163, -2.1936957836151123, -1.7583961486816406, -1.3230962753295898, -0.8877954483032227, -0.45249563455581665, -0.017195820808410645, 0.4181039333343506, 0.8534038066864014, 1.2887036800384521, 1.7240033149719238, 2.1593031883239746, 2.5946030616760254, 3.029902935028076, 3.465202808380127, 3.9005024433135986, 4.33580207824707, 4.771101951599121, 5.206401824951172, 5.641701698303223, 6.077001571655273, 6.512301445007324, 6.947601318359375, 7.382901191711426, 7.818201065063477, 8.253500938415527, 8.688800811767578, 9.124099731445312, 9.55940055847168, 9.99470043182373, 10.430000305175781, 10.865300178527832, 11.300600051879883, 11.735899925231934, 12.171199798583984, 12.606498718261719, 13.04179859161377]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 9.0, 14.0, 13.0, 12.0, 28.0, 28.0, 74.0, 68.0, 108.0, 158.0, 217.0, 376.0, 635.0, 1079.0, 2070.0, 4127.0, 8954.0, 21911.0, 59319.0, 164309.0, 344826.0, 269049.0, 105345.0, 37721.0, 14694.0, 6299.0, 3134.0, 1662.0, 841.0, 502.0, 324.0, 208.0, 139.0, 92.0, 61.0, 42.0, 26.0, 16.0, 18.0, 11.0, 10.0, 9.0, 6.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0546875, -8.769775390625, -8.48486328125, -8.199951171875, -7.9150390625, -7.630126953125, -7.34521484375, -7.060302734375, -6.775390625, -6.490478515625, -6.20556640625, -5.920654296875, -5.6357421875, -5.350830078125, -5.06591796875, -4.781005859375, -4.49609375, -4.211181640625, -3.92626953125, -3.641357421875, -3.3564453125, -3.071533203125, -2.78662109375, -2.501708984375, -2.216796875, -1.931884765625, -1.64697265625, -1.362060546875, -1.0771484375, -0.792236328125, -0.50732421875, -0.222412109375, 0.0625, 0.347412109375, 0.63232421875, 0.917236328125, 1.2021484375, 1.487060546875, 1.77197265625, 2.056884765625, 2.341796875, 2.626708984375, 2.91162109375, 3.196533203125, 3.4814453125, 3.766357421875, 4.05126953125, 4.336181640625, 4.62109375, 4.906005859375, 5.19091796875, 5.475830078125, 5.7607421875, 6.045654296875, 6.33056640625, 6.615478515625, 6.900390625, 7.185302734375, 7.47021484375, 7.755126953125, 8.0400390625, 8.324951171875, 8.60986328125, 8.894775390625, 9.1796875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 11.0, 17.0, 21.0, 30.0, 33.0, 53.0, 57.0, 63.0, 82.0, 84.0, 96.0, 71.0, 72.0, 68.0, 52.0, 59.0, 33.0, 24.0, 15.0, 19.0, 14.0, 7.0, 7.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.203125, -3.11053466796875, -3.0179443359375, -2.92535400390625, -2.832763671875, -2.74017333984375, -2.6475830078125, -2.55499267578125, -2.46240234375, -2.36981201171875, -2.2772216796875, -2.18463134765625, -2.092041015625, -1.99945068359375, -1.9068603515625, -1.81427001953125, -1.7216796875, -1.62908935546875, -1.5364990234375, -1.44390869140625, -1.351318359375, -1.25872802734375, -1.1661376953125, -1.07354736328125, -0.98095703125, -0.88836669921875, -0.7957763671875, -0.70318603515625, -0.610595703125, -0.51800537109375, -0.4254150390625, -0.33282470703125, -0.240234375, -0.14764404296875, -0.0550537109375, 0.03753662109375, 0.130126953125, 0.22271728515625, 0.3153076171875, 0.40789794921875, 0.50048828125, 0.59307861328125, 0.6856689453125, 0.77825927734375, 0.870849609375, 0.96343994140625, 1.0560302734375, 1.14862060546875, 1.2412109375, 1.33380126953125, 1.4263916015625, 1.51898193359375, 1.611572265625, 1.70416259765625, 1.7967529296875, 1.88934326171875, 1.98193359375, 2.07452392578125, 2.1671142578125, 2.25970458984375, 2.352294921875, 2.44488525390625, 2.5374755859375, 2.63006591796875, 2.72265625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 7.0, 8.0, 10.0, 14.0, 24.0, 39.0, 47.0, 78.0, 108.0, 193.0, 294.0, 560.0, 1272.0, 4015.0, 16013.0, 90844.0, 506287.0, 358142.0, 54990.0, 10451.0, 2962.0, 1031.0, 481.0, 228.0, 166.0, 99.0, 52.0, 39.0, 25.0, 19.0, 13.0, 10.0, 8.0, 8.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.25, -16.7552490234375, -16.260498046875, -15.7657470703125, -15.27099609375, -14.7762451171875, -14.281494140625, -13.7867431640625, -13.2919921875, -12.7972412109375, -12.302490234375, -11.8077392578125, -11.31298828125, -10.8182373046875, -10.323486328125, -9.8287353515625, -9.333984375, -8.8392333984375, -8.344482421875, -7.8497314453125, -7.35498046875, -6.8602294921875, -6.365478515625, -5.8707275390625, -5.3759765625, -4.8812255859375, -4.386474609375, -3.8917236328125, -3.39697265625, -2.9022216796875, -2.407470703125, -1.9127197265625, -1.41796875, -0.9232177734375, -0.428466796875, 0.0662841796875, 0.56103515625, 1.0557861328125, 1.550537109375, 2.0452880859375, 2.5400390625, 3.0347900390625, 3.529541015625, 4.0242919921875, 4.51904296875, 5.0137939453125, 5.508544921875, 6.0032958984375, 6.498046875, 6.9927978515625, 7.487548828125, 7.9822998046875, 8.47705078125, 8.9718017578125, 9.466552734375, 9.9613037109375, 10.4560546875, 10.9508056640625, 11.445556640625, 11.9403076171875, 12.43505859375, 12.9298095703125, 13.424560546875, 13.9193115234375, 14.4140625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 7.0, 7.0, 8.0, 6.0, 8.0, 11.0, 9.0, 15.0, 15.0, 24.0, 18.0, 16.0, 23.0, 30.0, 35.0, 27.0, 40.0, 41.0, 46.0, 35.0, 41.0, 37.0, 45.0, 46.0, 38.0, 39.0, 31.0, 36.0, 30.0, 23.0, 34.0, 25.0, 29.0, 26.0, 18.0, 21.0, 10.0, 7.0, 8.0, 9.0, 10.0, 5.0, 4.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.7578125, -7.51922607421875, -7.2806396484375, -7.04205322265625, -6.803466796875, -6.56488037109375, -6.3262939453125, -6.08770751953125, -5.84912109375, -5.61053466796875, -5.3719482421875, -5.13336181640625, -4.894775390625, -4.65618896484375, -4.4176025390625, -4.17901611328125, -3.9404296875, -3.70184326171875, -3.4632568359375, -3.22467041015625, -2.986083984375, -2.74749755859375, -2.5089111328125, -2.27032470703125, -2.03173828125, -1.79315185546875, -1.5545654296875, -1.31597900390625, -1.077392578125, -0.83880615234375, -0.6002197265625, -0.36163330078125, -0.123046875, 0.11553955078125, 0.3541259765625, 0.59271240234375, 0.831298828125, 1.06988525390625, 1.3084716796875, 1.54705810546875, 1.78564453125, 2.02423095703125, 2.2628173828125, 2.50140380859375, 2.739990234375, 2.97857666015625, 3.2171630859375, 3.45574951171875, 3.6943359375, 3.93292236328125, 4.1715087890625, 4.41009521484375, 4.648681640625, 4.88726806640625, 5.1258544921875, 5.36444091796875, 5.60302734375, 5.84161376953125, 6.0802001953125, 6.31878662109375, 6.557373046875, 6.79595947265625, 7.0345458984375, 7.27313232421875, 7.51171875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 2.0, 5.0, 2.0, 8.0, 10.0, 8.0, 15.0, 19.0, 22.0, 25.0, 50.0, 67.0, 112.0, 150.0, 256.0, 499.0, 988.0, 2559.0, 8405.0, 37389.0, 229489.0, 585997.0, 147047.0, 25176.0, 6246.0, 2041.0, 839.0, 437.0, 250.0, 159.0, 87.0, 62.0, 38.0, 29.0, 22.0, 13.0, 6.0, 3.0, 7.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0], "bins": [-8.09375, -7.85833740234375, -7.6229248046875, -7.38751220703125, -7.152099609375, -6.91668701171875, -6.6812744140625, -6.44586181640625, -6.21044921875, -5.97503662109375, -5.7396240234375, -5.50421142578125, -5.268798828125, -5.03338623046875, -4.7979736328125, -4.56256103515625, -4.3271484375, -4.09173583984375, -3.8563232421875, -3.62091064453125, -3.385498046875, -3.15008544921875, -2.9146728515625, -2.67926025390625, -2.44384765625, -2.20843505859375, -1.9730224609375, -1.73760986328125, -1.502197265625, -1.26678466796875, -1.0313720703125, -0.79595947265625, -0.560546875, -0.32513427734375, -0.0897216796875, 0.14569091796875, 0.381103515625, 0.61651611328125, 0.8519287109375, 1.08734130859375, 1.32275390625, 1.55816650390625, 1.7935791015625, 2.02899169921875, 2.264404296875, 2.49981689453125, 2.7352294921875, 2.97064208984375, 3.2060546875, 3.44146728515625, 3.6768798828125, 3.91229248046875, 4.147705078125, 4.38311767578125, 4.6185302734375, 4.85394287109375, 5.08935546875, 5.32476806640625, 5.5601806640625, 5.79559326171875, 6.031005859375, 6.26641845703125, 6.5018310546875, 6.73724365234375, 6.97265625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 5.0, 4.0, 6.0, 8.0, 14.0, 19.0, 21.0, 39.0, 53.0, 62.0, 71.0, 102.0, 122.0, 106.0, 94.0, 77.0, 61.0, 38.0, 22.0, 12.0, 19.0, 13.0, 4.0, 8.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006051063537597656, -0.0005825385451316833, -0.0005599707365036011, -0.0005374029278755188, -0.0005148351192474365, -0.0004922673106193542, -0.00046969950199127197, -0.0004471316933631897, -0.0004245638847351074, -0.00040199607610702515, -0.00037942826747894287, -0.0003568604588508606, -0.0003342926502227783, -0.00031172484159469604, -0.00028915703296661377, -0.0002665892243385315, -0.00024402141571044922, -0.00022145360708236694, -0.00019888579845428467, -0.0001763179898262024, -0.00015375018119812012, -0.00013118237257003784, -0.00010861456394195557, -8.604675531387329e-05, -6.347894668579102e-05, -4.091113805770874e-05, -1.8343329429626465e-05, 4.2244791984558105e-06, 2.6792287826538086e-05, 4.936009645462036e-05, 7.192790508270264e-05, 9.449571371078491e-05, 0.00011706352233886719, 0.00013963133096694946, 0.00016219913959503174, 0.00018476694822311401, 0.0002073347568511963, 0.00022990256547927856, 0.00025247037410736084, 0.0002750381827354431, 0.0002976059913635254, 0.00032017379999160767, 0.00034274160861968994, 0.0003653094172477722, 0.0003878772258758545, 0.00041044503450393677, 0.00043301284313201904, 0.0004555806517601013, 0.0004781484603881836, 0.0005007162690162659, 0.0005232840776443481, 0.0005458518862724304, 0.0005684196949005127, 0.000590987503528595, 0.0006135553121566772, 0.0006361231207847595, 0.0006586909294128418, 0.0006812587380409241, 0.0007038265466690063, 0.0007263943552970886, 0.0007489621639251709, 0.0007715299725532532, 0.0007940977811813354, 0.0008166655898094177, 0.0008392333984375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 13.0, 8.0, 15.0, 11.0, 38.0, 66.0, 140.0, 467.0, 1966.0, 13041.0, 487665.0, 528404.0, 13901.0, 1991.0, 487.0, 159.0, 71.0, 37.0, 25.0, 19.0, 7.0, 5.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-29.28125, -28.6004638671875, -27.919677734375, -27.2388916015625, -26.55810546875, -25.8773193359375, -25.196533203125, -24.5157470703125, -23.8349609375, -23.1541748046875, -22.473388671875, -21.7926025390625, -21.11181640625, -20.4310302734375, -19.750244140625, -19.0694580078125, -18.388671875, -17.7078857421875, -17.027099609375, -16.3463134765625, -15.66552734375, -14.9847412109375, -14.303955078125, -13.6231689453125, -12.9423828125, -12.2615966796875, -11.580810546875, -10.9000244140625, -10.21923828125, -9.5384521484375, -8.857666015625, -8.1768798828125, -7.49609375, -6.8153076171875, -6.134521484375, -5.4537353515625, -4.77294921875, -4.0921630859375, -3.411376953125, -2.7305908203125, -2.0498046875, -1.3690185546875, -0.688232421875, -0.0074462890625, 0.67333984375, 1.3541259765625, 2.034912109375, 2.7156982421875, 3.396484375, 4.0772705078125, 4.758056640625, 5.4388427734375, 6.11962890625, 6.8004150390625, 7.481201171875, 8.1619873046875, 8.8427734375, 9.5235595703125, 10.204345703125, 10.8851318359375, 11.56591796875, 12.2467041015625, 12.927490234375, 13.6082763671875, 14.2890625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 2.0, 5.0, 2.0, 13.0, 7.0, 7.0, 19.0, 18.0, 30.0, 56.0, 50.0, 65.0, 92.0, 92.0, 88.0, 95.0, 69.0, 73.0, 47.0, 48.0, 34.0, 19.0, 16.0, 14.0, 4.0, 7.0, 5.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.30859375, -5.12701416015625, -4.9454345703125, -4.76385498046875, -4.582275390625, -4.40069580078125, -4.2191162109375, -4.03753662109375, -3.85595703125, -3.67437744140625, -3.4927978515625, -3.31121826171875, -3.129638671875, -2.94805908203125, -2.7664794921875, -2.58489990234375, -2.4033203125, -2.22174072265625, -2.0401611328125, -1.85858154296875, -1.677001953125, -1.49542236328125, -1.3138427734375, -1.13226318359375, -0.95068359375, -0.76910400390625, -0.5875244140625, -0.40594482421875, -0.224365234375, -0.04278564453125, 0.1387939453125, 0.32037353515625, 0.501953125, 0.68353271484375, 0.8651123046875, 1.04669189453125, 1.228271484375, 1.40985107421875, 1.5914306640625, 1.77301025390625, 1.95458984375, 2.13616943359375, 2.3177490234375, 2.49932861328125, 2.680908203125, 2.86248779296875, 3.0440673828125, 3.22564697265625, 3.4072265625, 3.58880615234375, 3.7703857421875, 3.95196533203125, 4.133544921875, 4.31512451171875, 4.4967041015625, 4.67828369140625, 4.85986328125, 5.04144287109375, 5.2230224609375, 5.40460205078125, 5.586181640625, 5.76776123046875, 5.9493408203125, 6.13092041015625, 6.3125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 21.0, 45.0, 148.0, 303.0, 304.0, 117.0, 39.0, 16.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.99029541015625, -126.26513671875, -120.53997802734375, -114.8148193359375, -109.08966064453125, -103.364501953125, -97.63935089111328, -91.91419219970703, -86.18903350830078, -80.46387481689453, -74.73871612548828, -69.01356506347656, -63.28840255737305, -57.5632438659668, -51.83808898925781, -46.11293029785156, -40.38777160644531, -34.66261291503906, -28.937456130981445, -23.212299346923828, -17.487140655517578, -11.761981964111328, -6.036827087402344, -0.31166839599609375, 5.413490295410156, 11.13864803314209, 16.863805770874023, 22.58896255493164, 28.31412124633789, 34.03927993774414, 39.764434814453125, 45.489593505859375, 51.214752197265625, 56.939910888671875, 62.665069580078125, 68.39022827148438, 74.11538696289062, 79.84054565429688, 85.5656967163086, 91.29085540771484, 97.0160140991211, 102.74117279052734, 108.4663314819336, 114.19148254394531, 119.91664123535156, 125.64179992675781, 131.36695861816406, 137.0921173095703, 142.81727600097656, 148.5424346923828, 154.26759338378906, 159.9927520751953, 165.71791076660156, 171.4430694580078, 177.168212890625, 182.89337158203125, 188.6185302734375, 194.34368896484375, 200.06884765625, 205.79400634765625, 211.5191650390625, 217.24432373046875, 222.969482421875, 228.69464111328125, 234.4197998046875]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 4.0, 4.0, 7.0, 7.0, 10.0, 5.0, 9.0, 13.0, 20.0, 24.0, 27.0, 22.0, 38.0, 42.0, 38.0, 68.0, 50.0, 57.0, 56.0, 54.0, 43.0, 56.0, 55.0, 47.0, 39.0, 41.0, 31.0, 34.0, 20.0, 21.0, 18.0, 16.0, 7.0, 6.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.749053955078125, -39.8594856262207, -37.96991729736328, -36.080352783203125, -34.1907844543457, -32.30121612548828, -30.41164779663086, -28.522079467773438, -26.63251304626465, -24.742944717407227, -22.853378295898438, -20.963809967041016, -19.074241638183594, -17.184675216674805, -15.295106887817383, -13.405539512634277, -11.515972137451172, -9.626404762268066, -7.736836910247803, -5.847269058227539, -3.9577016830444336, -2.068134307861328, -0.17856597900390625, 1.7110013961791992, 3.6005687713623047, 5.49013614654541, 7.379703998565674, 9.269271850585938, 11.158839225769043, 13.048406600952148, 14.93797492980957, 16.82754135131836, 18.71710968017578, 20.606678009033203, 22.496244430541992, 24.385812759399414, 26.275379180908203, 28.164947509765625, 30.054515838623047, 31.94408416748047, 33.833648681640625, 35.72321701049805, 37.61278533935547, 39.502349853515625, 41.39191818237305, 43.28148651123047, 45.17105484008789, 47.06062316894531, 48.950191497802734, 50.839759826660156, 52.72932815551758, 54.618896484375, 56.508460998535156, 58.39802932739258, 60.28759765625, 62.17716598510742, 64.06673431396484, 65.956298828125, 67.84587097167969, 69.73543548583984, 71.62500762939453, 73.51457214355469, 75.40414428710938, 77.29370880126953, 79.18327331542969]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 8.0, 0.0, 5.0, 12.0, 13.0, 18.0, 21.0, 35.0, 49.0, 90.0, 113.0, 229.0, 345.0, 529.0, 999.0, 2186.0, 4918.0, 13395.0, 46892.0, 316795.0, 3548753.0, 202627.0, 36221.0, 11095.0, 4449.0, 2024.0, 1013.0, 541.0, 319.0, 177.0, 123.0, 94.0, 42.0, 44.0, 27.0, 15.0, 19.0, 10.0, 11.0, 8.0, 4.0, 4.0, 5.0, 4.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.8828125, -14.3934326171875, -13.904052734375, -13.4146728515625, -12.92529296875, -12.4359130859375, -11.946533203125, -11.4571533203125, -10.9677734375, -10.4783935546875, -9.989013671875, -9.4996337890625, -9.01025390625, -8.5208740234375, -8.031494140625, -7.5421142578125, -7.052734375, -6.5633544921875, -6.073974609375, -5.5845947265625, -5.09521484375, -4.6058349609375, -4.116455078125, -3.6270751953125, -3.1376953125, -2.6483154296875, -2.158935546875, -1.6695556640625, -1.18017578125, -0.6907958984375, -0.201416015625, 0.2879638671875, 0.77734375, 1.2667236328125, 1.756103515625, 2.2454833984375, 2.73486328125, 3.2242431640625, 3.713623046875, 4.2030029296875, 4.6923828125, 5.1817626953125, 5.671142578125, 6.1605224609375, 6.64990234375, 7.1392822265625, 7.628662109375, 8.1180419921875, 8.607421875, 9.0968017578125, 9.586181640625, 10.0755615234375, 10.56494140625, 11.0543212890625, 11.543701171875, 12.0330810546875, 12.5224609375, 13.0118408203125, 13.501220703125, 13.9906005859375, 14.47998046875, 14.9693603515625, 15.458740234375, 15.9481201171875, 16.4375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 12.0, 15.0, 33.0, 36.0, 38.0, 45.0, 61.0, 87.0, 76.0, 97.0, 99.0, 68.0, 67.0, 64.0, 56.0, 42.0, 29.0, 27.0, 11.0, 14.0, 6.0, 4.0, 2.0, 2.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.41015625, -3.30999755859375, -3.2098388671875, -3.10968017578125, -3.009521484375, -2.90936279296875, -2.8092041015625, -2.70904541015625, -2.60888671875, -2.50872802734375, -2.4085693359375, -2.30841064453125, -2.208251953125, -2.10809326171875, -2.0079345703125, -1.90777587890625, -1.8076171875, -1.70745849609375, -1.6072998046875, -1.50714111328125, -1.406982421875, -1.30682373046875, -1.2066650390625, -1.10650634765625, -1.00634765625, -0.90618896484375, -0.8060302734375, -0.70587158203125, -0.605712890625, -0.50555419921875, -0.4053955078125, -0.30523681640625, -0.205078125, -0.10491943359375, -0.0047607421875, 0.09539794921875, 0.195556640625, 0.29571533203125, 0.3958740234375, 0.49603271484375, 0.59619140625, 0.69635009765625, 0.7965087890625, 0.89666748046875, 0.996826171875, 1.09698486328125, 1.1971435546875, 1.29730224609375, 1.3974609375, 1.49761962890625, 1.5977783203125, 1.69793701171875, 1.798095703125, 1.89825439453125, 1.9984130859375, 2.09857177734375, 2.19873046875, 2.29888916015625, 2.3990478515625, 2.49920654296875, 2.599365234375, 2.69952392578125, 2.7996826171875, 2.89984130859375, 3.0]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 5.0, 12.0, 18.0, 22.0, 26.0, 54.0, 72.0, 145.0, 237.0, 445.0, 980.0, 2191.0, 5305.0, 15313.0, 61327.0, 518449.0, 3308478.0, 225669.0, 37515.0, 10829.0, 3850.0, 1646.0, 749.0, 370.0, 212.0, 117.0, 84.0, 54.0, 15.0, 19.0, 25.0, 12.0, 11.0, 8.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9921875, -12.54931640625, -12.1064453125, -11.66357421875, -11.220703125, -10.77783203125, -10.3349609375, -9.89208984375, -9.44921875, -9.00634765625, -8.5634765625, -8.12060546875, -7.677734375, -7.23486328125, -6.7919921875, -6.34912109375, -5.90625, -5.46337890625, -5.0205078125, -4.57763671875, -4.134765625, -3.69189453125, -3.2490234375, -2.80615234375, -2.36328125, -1.92041015625, -1.4775390625, -1.03466796875, -0.591796875, -0.14892578125, 0.2939453125, 0.73681640625, 1.1796875, 1.62255859375, 2.0654296875, 2.50830078125, 2.951171875, 3.39404296875, 3.8369140625, 4.27978515625, 4.72265625, 5.16552734375, 5.6083984375, 6.05126953125, 6.494140625, 6.93701171875, 7.3798828125, 7.82275390625, 8.265625, 8.70849609375, 9.1513671875, 9.59423828125, 10.037109375, 10.47998046875, 10.9228515625, 11.36572265625, 11.80859375, 12.25146484375, 12.6943359375, 13.13720703125, 13.580078125, 14.02294921875, 14.4658203125, 14.90869140625, 15.3515625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 7.0, 7.0, 6.0, 14.0, 20.0, 28.0, 50.0, 68.0, 114.0, 247.0, 473.0, 1398.0, 835.0, 326.0, 171.0, 105.0, 64.0, 33.0, 27.0, 21.0, 13.0, 10.0, 5.0, 8.0, 5.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -4.0172119140625, -3.823486328125, -3.6297607421875, -3.43603515625, -3.2423095703125, -3.048583984375, -2.8548583984375, -2.6611328125, -2.4674072265625, -2.273681640625, -2.0799560546875, -1.88623046875, -1.6925048828125, -1.498779296875, -1.3050537109375, -1.111328125, -0.9176025390625, -0.723876953125, -0.5301513671875, -0.33642578125, -0.1427001953125, 0.051025390625, 0.2447509765625, 0.4384765625, 0.6322021484375, 0.825927734375, 1.0196533203125, 1.21337890625, 1.4071044921875, 1.600830078125, 1.7945556640625, 1.98828125, 2.1820068359375, 2.375732421875, 2.5694580078125, 2.76318359375, 2.9569091796875, 3.150634765625, 3.3443603515625, 3.5380859375, 3.7318115234375, 3.925537109375, 4.1192626953125, 4.31298828125, 4.5067138671875, 4.700439453125, 4.8941650390625, 5.087890625, 5.2816162109375, 5.475341796875, 5.6690673828125, 5.86279296875, 6.0565185546875, 6.250244140625, 6.4439697265625, 6.6376953125, 6.8314208984375, 7.025146484375, 7.2188720703125, 7.41259765625, 7.6063232421875, 7.800048828125, 7.9937744140625, 8.1875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 15.0, 51.0, 129.0, 279.0, 279.0, 152.0, 61.0, 14.0, 13.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.25927734375, -108.72966766357422, -106.20006561279297, -103.67045593261719, -101.1408462524414, -98.61123657226562, -96.08163452148438, -93.5520248413086, -91.02241516113281, -88.49280548095703, -85.96320343017578, -83.43359375, -80.90398406982422, -78.37437438964844, -75.84477233886719, -73.3151626586914, -70.78555297851562, -68.25594329833984, -65.7263412475586, -63.19673156738281, -60.66712188720703, -58.137516021728516, -55.60791015625, -53.07830047607422, -50.54869842529297, -48.01909255981445, -45.48948287963867, -42.959877014160156, -40.430267333984375, -37.90066146850586, -35.371055603027344, -32.84144592285156, -30.31183624267578, -27.782228469848633, -25.252620697021484, -22.72301483154297, -20.193405151367188, -17.663799285888672, -15.134191513061523, -12.604583740234375, -10.074975967407227, -7.545368194580078, -5.015760898590088, -2.4861536026000977, 0.04345417022705078, 2.573061943054199, 5.102668762207031, 7.63227653503418, 10.161884307861328, 12.691492080688477, 15.221099853515625, 17.75070571899414, 20.280315399169922, 22.809921264648438, 25.339529037475586, 27.869136810302734, 30.398744583129883, 32.92835235595703, 35.45795822143555, 37.98756790161133, 40.517173767089844, 43.046783447265625, 45.57638931274414, 48.105995178222656, 50.63560485839844]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 4.0, 10.0, 9.0, 12.0, 18.0, 20.0, 28.0, 27.0, 48.0, 36.0, 62.0, 49.0, 62.0, 61.0, 66.0, 75.0, 54.0, 71.0, 57.0, 46.0, 31.0, 37.0, 23.0, 22.0, 29.0, 19.0, 13.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.810993194580078, -30.957103729248047, -30.103214263916016, -29.249324798583984, -28.395437240600586, -27.541547775268555, -26.687658309936523, -25.833768844604492, -24.979881286621094, -24.125991821289062, -23.27210235595703, -22.418212890625, -21.5643253326416, -20.71043586730957, -19.85654640197754, -19.002656936645508, -18.148767471313477, -17.294878005981445, -16.440988540649414, -15.5871000289917, -14.733211517333984, -13.879322052001953, -13.025432586669922, -12.17154312133789, -11.317654609680176, -10.463765144348145, -9.60987663269043, -8.755987167358398, -7.902098178863525, -7.048209190368652, -6.194319725036621, -5.340430736541748, -4.486543655395508, -3.6326546669006348, -2.7787654399871826, -1.9248762130737305, -1.0709872245788574, -0.21709823608398438, 0.6367912292480469, 1.49068021774292, 2.344569206237793, 3.198458194732666, 4.052347183227539, 4.90623664855957, 5.760125637054443, 6.614014625549316, 7.467904090881348, 8.321792602539062, 9.175682067871094, 10.029571533203125, 10.88346004486084, 11.737349510192871, 12.591238021850586, 13.445127487182617, 14.299016952514648, 15.15290641784668, 16.006793975830078, 16.86068344116211, 17.71457290649414, 18.568462371826172, 19.42234992980957, 20.2762393951416, 21.130128860473633, 21.984018325805664, 22.837907791137695]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 3.0, 7.0, 7.0, 13.0, 25.0, 17.0, 31.0, 42.0, 71.0, 122.0, 149.0, 238.0, 404.0, 881.0, 1692.0, 4075.0, 11605.0, 41861.0, 167079.0, 502992.0, 233720.0, 58097.0, 15827.0, 5179.0, 2099.0, 1015.0, 507.0, 299.0, 167.0, 106.0, 80.0, 41.0, 38.0, 29.0, 12.0, 17.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.703125, -10.25, -9.796875, -9.34375, -8.890625, -8.4375, -7.984375, -7.53125, -7.078125, -6.625, -6.171875, -5.71875, -5.265625, -4.8125, -4.359375, -3.90625, -3.453125, -3.0, -2.546875, -2.09375, -1.640625, -1.1875, -0.734375, -0.28125, 0.171875, 0.625, 1.078125, 1.53125, 1.984375, 2.4375, 2.890625, 3.34375, 3.796875, 4.25, 4.703125, 5.15625, 5.609375, 6.0625, 6.515625, 6.96875, 7.421875, 7.875, 8.328125, 8.78125, 9.234375, 9.6875, 10.140625, 10.59375, 11.046875, 11.5, 11.953125, 12.40625, 12.859375, 13.3125, 13.765625, 14.21875, 14.671875, 15.125, 15.578125, 16.03125, 16.484375, 16.9375, 17.390625, 17.84375, 18.296875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 6.0, 3.0, 7.0, 16.0, 31.0, 44.0, 50.0, 73.0, 80.0, 90.0, 90.0, 108.0, 79.0, 83.0, 66.0, 61.0, 35.0, 25.0, 19.0, 14.0, 8.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.08203125, -3.96875, -3.85546875, -3.7421875, -3.62890625, -3.515625, -3.40234375, -3.2890625, -3.17578125, -3.0625, -2.94921875, -2.8359375, -2.72265625, -2.609375, -2.49609375, -2.3828125, -2.26953125, -2.15625, -2.04296875, -1.9296875, -1.81640625, -1.703125, -1.58984375, -1.4765625, -1.36328125, -1.25, -1.13671875, -1.0234375, -0.91015625, -0.796875, -0.68359375, -0.5703125, -0.45703125, -0.34375, -0.23046875, -0.1171875, -0.00390625, 0.109375, 0.22265625, 0.3359375, 0.44921875, 0.5625, 0.67578125, 0.7890625, 0.90234375, 1.015625, 1.12890625, 1.2421875, 1.35546875, 1.46875, 1.58203125, 1.6953125, 1.80859375, 1.921875, 2.03515625, 2.1484375, 2.26171875, 2.375, 2.48828125, 2.6015625, 2.71484375, 2.828125, 2.94140625, 3.0546875, 3.16796875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 7.0, 5.0, 7.0, 15.0, 8.0, 19.0, 28.0, 58.0, 68.0, 88.0, 132.0, 208.0, 331.0, 604.0, 1270.0, 2794.0, 7060.0, 19857.0, 61575.0, 197206.0, 446688.0, 210360.0, 65400.0, 21229.0, 7604.0, 2973.0, 1355.0, 627.0, 330.0, 220.0, 126.0, 89.0, 46.0, 57.0, 28.0, 32.0, 20.0, 11.0, 6.0, 2.0, 6.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.453125, -10.141357421875, -9.82958984375, -9.517822265625, -9.2060546875, -8.894287109375, -8.58251953125, -8.270751953125, -7.958984375, -7.647216796875, -7.33544921875, -7.023681640625, -6.7119140625, -6.400146484375, -6.08837890625, -5.776611328125, -5.46484375, -5.153076171875, -4.84130859375, -4.529541015625, -4.2177734375, -3.906005859375, -3.59423828125, -3.282470703125, -2.970703125, -2.658935546875, -2.34716796875, -2.035400390625, -1.7236328125, -1.411865234375, -1.10009765625, -0.788330078125, -0.4765625, -0.164794921875, 0.14697265625, 0.458740234375, 0.7705078125, 1.082275390625, 1.39404296875, 1.705810546875, 2.017578125, 2.329345703125, 2.64111328125, 2.952880859375, 3.2646484375, 3.576416015625, 3.88818359375, 4.199951171875, 4.51171875, 4.823486328125, 5.13525390625, 5.447021484375, 5.7587890625, 6.070556640625, 6.38232421875, 6.694091796875, 7.005859375, 7.317626953125, 7.62939453125, 7.941162109375, 8.2529296875, 8.564697265625, 8.87646484375, 9.188232421875, 9.5]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 2.0, 1.0, 10.0, 12.0, 9.0, 9.0, 15.0, 15.0, 16.0, 23.0, 20.0, 25.0, 23.0, 29.0, 25.0, 31.0, 27.0, 40.0, 36.0, 45.0, 43.0, 40.0, 44.0, 46.0, 39.0, 43.0, 36.0, 30.0, 25.0, 24.0, 37.0, 27.0, 22.0, 24.0, 14.0, 17.0, 15.0, 13.0, 10.0, 3.0, 3.0, 8.0, 11.0, 5.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.72265625, -7.48712158203125, -7.2515869140625, -7.01605224609375, -6.780517578125, -6.54498291015625, -6.3094482421875, -6.07391357421875, -5.83837890625, -5.60284423828125, -5.3673095703125, -5.13177490234375, -4.896240234375, -4.66070556640625, -4.4251708984375, -4.18963623046875, -3.9541015625, -3.71856689453125, -3.4830322265625, -3.24749755859375, -3.011962890625, -2.77642822265625, -2.5408935546875, -2.30535888671875, -2.06982421875, -1.83428955078125, -1.5987548828125, -1.36322021484375, -1.127685546875, -0.89215087890625, -0.6566162109375, -0.42108154296875, -0.185546875, 0.04998779296875, 0.2855224609375, 0.52105712890625, 0.756591796875, 0.99212646484375, 1.2276611328125, 1.46319580078125, 1.69873046875, 1.93426513671875, 2.1697998046875, 2.40533447265625, 2.640869140625, 2.87640380859375, 3.1119384765625, 3.34747314453125, 3.5830078125, 3.81854248046875, 4.0540771484375, 4.28961181640625, 4.525146484375, 4.76068115234375, 4.9962158203125, 5.23175048828125, 5.46728515625, 5.70281982421875, 5.9383544921875, 6.17388916015625, 6.409423828125, 6.64495849609375, 6.8804931640625, 7.11602783203125, 7.3515625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 13.0, 15.0, 10.0, 19.0, 25.0, 37.0, 54.0, 87.0, 131.0, 228.0, 442.0, 906.0, 2164.0, 5792.0, 18763.0, 81614.0, 388692.0, 425420.0, 92185.0, 21208.0, 6305.0, 2272.0, 1002.0, 494.0, 254.0, 139.0, 101.0, 50.0, 34.0, 33.0, 15.0, 8.0, 8.0, 7.0, 6.0, 3.0, 7.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-6.23828125, -6.065185546875, -5.89208984375, -5.718994140625, -5.5458984375, -5.372802734375, -5.19970703125, -5.026611328125, -4.853515625, -4.680419921875, -4.50732421875, -4.334228515625, -4.1611328125, -3.988037109375, -3.81494140625, -3.641845703125, -3.46875, -3.295654296875, -3.12255859375, -2.949462890625, -2.7763671875, -2.603271484375, -2.43017578125, -2.257080078125, -2.083984375, -1.910888671875, -1.73779296875, -1.564697265625, -1.3916015625, -1.218505859375, -1.04541015625, -0.872314453125, -0.69921875, -0.526123046875, -0.35302734375, -0.179931640625, -0.0068359375, 0.166259765625, 0.33935546875, 0.512451171875, 0.685546875, 0.858642578125, 1.03173828125, 1.204833984375, 1.3779296875, 1.551025390625, 1.72412109375, 1.897216796875, 2.0703125, 2.243408203125, 2.41650390625, 2.589599609375, 2.7626953125, 2.935791015625, 3.10888671875, 3.281982421875, 3.455078125, 3.628173828125, 3.80126953125, 3.974365234375, 4.1474609375, 4.320556640625, 4.49365234375, 4.666748046875, 4.83984375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 3.0, 9.0, 7.0, 10.0, 10.0, 17.0, 24.0, 19.0, 23.0, 31.0, 49.0, 52.0, 79.0, 121.0, 128.0, 117.0, 67.0, 53.0, 39.0, 25.0, 15.0, 21.0, 15.0, 10.0, 14.0, 6.0, 9.0, 8.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005936622619628906, -0.0005747750401496887, -0.0005558878183364868, -0.0005370005965232849, -0.000518113374710083, -0.0004992261528968811, -0.0004803389310836792, -0.0004614517092704773, -0.0004425644874572754, -0.0004236772656440735, -0.0004047900438308716, -0.0003859028220176697, -0.0003670156002044678, -0.00034812837839126587, -0.00032924115657806396, -0.00031035393476486206, -0.00029146671295166016, -0.00027257949113845825, -0.00025369226932525635, -0.00023480504751205444, -0.00021591782569885254, -0.00019703060388565063, -0.00017814338207244873, -0.00015925616025924683, -0.00014036893844604492, -0.00012148171663284302, -0.00010259449481964111, -8.370727300643921e-05, -6.48200511932373e-05, -4.59328293800354e-05, -2.7045607566833496e-05, -8.158385753631592e-06, 1.0728836059570312e-05, 2.9616057872772217e-05, 4.850327968597412e-05, 6.739050149917603e-05, 8.627772331237793e-05, 0.00010516494512557983, 0.00012405216693878174, 0.00014293938875198364, 0.00016182661056518555, 0.00018071383237838745, 0.00019960105419158936, 0.00021848827600479126, 0.00023737549781799316, 0.00025626271963119507, 0.00027514994144439697, 0.0002940371632575989, 0.0003129243850708008, 0.0003318116068840027, 0.0003506988286972046, 0.0003695860505104065, 0.0003884732723236084, 0.0004073604941368103, 0.0004262477159500122, 0.0004451349377632141, 0.000464022159576416, 0.0004829093813896179, 0.0005017966032028198, 0.0005206838250160217, 0.0005395710468292236, 0.0005584582686424255, 0.0005773454904556274, 0.0005962327122688293, 0.0006151199340820312]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 7.0, 8.0, 7.0, 11.0, 9.0, 17.0, 22.0, 29.0, 40.0, 71.0, 86.0, 151.0, 248.0, 408.0, 739.0, 1362.0, 2650.0, 6040.0, 16390.0, 60611.0, 269303.0, 491988.0, 145232.0, 34103.0, 10435.0, 4108.0, 1978.0, 1046.0, 540.0, 311.0, 218.0, 115.0, 85.0, 50.0, 36.0, 26.0, 15.0, 20.0, 10.0, 7.0, 6.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.7890625, -5.60980224609375, -5.4305419921875, -5.25128173828125, -5.072021484375, -4.89276123046875, -4.7135009765625, -4.53424072265625, -4.35498046875, -4.17572021484375, -3.9964599609375, -3.81719970703125, -3.637939453125, -3.45867919921875, -3.2794189453125, -3.10015869140625, -2.9208984375, -2.74163818359375, -2.5623779296875, -2.38311767578125, -2.203857421875, -2.02459716796875, -1.8453369140625, -1.66607666015625, -1.48681640625, -1.30755615234375, -1.1282958984375, -0.94903564453125, -0.769775390625, -0.59051513671875, -0.4112548828125, -0.23199462890625, -0.052734375, 0.12652587890625, 0.3057861328125, 0.48504638671875, 0.664306640625, 0.84356689453125, 1.0228271484375, 1.20208740234375, 1.38134765625, 1.56060791015625, 1.7398681640625, 1.91912841796875, 2.098388671875, 2.27764892578125, 2.4569091796875, 2.63616943359375, 2.8154296875, 2.99468994140625, 3.1739501953125, 3.35321044921875, 3.532470703125, 3.71173095703125, 3.8909912109375, 4.07025146484375, 4.24951171875, 4.42877197265625, 4.6080322265625, 4.78729248046875, 4.966552734375, 5.14581298828125, 5.3250732421875, 5.50433349609375, 5.68359375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 9.0, 7.0, 14.0, 15.0, 30.0, 59.0, 73.0, 88.0, 113.0, 107.0, 125.0, 100.0, 71.0, 62.0, 45.0, 19.0, 22.0, 11.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3125, -5.10528564453125, -4.8980712890625, -4.69085693359375, -4.483642578125, -4.27642822265625, -4.0692138671875, -3.86199951171875, -3.65478515625, -3.44757080078125, -3.2403564453125, -3.03314208984375, -2.825927734375, -2.61871337890625, -2.4114990234375, -2.20428466796875, -1.9970703125, -1.78985595703125, -1.5826416015625, -1.37542724609375, -1.168212890625, -0.96099853515625, -0.7537841796875, -0.54656982421875, -0.33935546875, -0.13214111328125, 0.0750732421875, 0.28228759765625, 0.489501953125, 0.69671630859375, 0.9039306640625, 1.11114501953125, 1.318359375, 1.52557373046875, 1.7327880859375, 1.94000244140625, 2.147216796875, 2.35443115234375, 2.5616455078125, 2.76885986328125, 2.97607421875, 3.18328857421875, 3.3905029296875, 3.59771728515625, 3.804931640625, 4.01214599609375, 4.2193603515625, 4.42657470703125, 4.6337890625, 4.84100341796875, 5.0482177734375, 5.25543212890625, 5.462646484375, 5.66986083984375, 5.8770751953125, 6.08428955078125, 6.29150390625, 6.49871826171875, 6.7059326171875, 6.91314697265625, 7.120361328125, 7.32757568359375, 7.5347900390625, 7.74200439453125, 7.94921875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 3.0, 9.0, 24.0, 26.0, 45.0, 87.0, 135.0, 166.0, 176.0, 113.0, 75.0, 44.0, 35.0, 22.0, 16.0, 11.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-105.77217102050781, -103.22450256347656, -100.67684173583984, -98.1291732788086, -95.58150482177734, -93.03384399414062, -90.48617553710938, -87.93850708007812, -85.39083862304688, -82.84317016601562, -80.2955093383789, -77.74784088134766, -75.2001724243164, -72.65251159667969, -70.10484313964844, -67.55717468261719, -65.00951385498047, -62.461849212646484, -59.914180755615234, -57.36651611328125, -54.81884765625, -52.271183013916016, -49.72351837158203, -47.17584991455078, -44.6281852722168, -42.08052062988281, -39.53285217285156, -36.98518753051758, -34.437522888183594, -31.889854431152344, -29.34218978881836, -26.794523239135742, -24.246849060058594, -21.699182510375977, -19.15151596069336, -16.603851318359375, -14.056184768676758, -11.50851821899414, -8.96085262298584, -6.413187026977539, -3.865520477294922, -1.317854404449463, 1.229811668395996, 3.777477741241455, 6.325143814086914, 8.872810363769531, 11.420475959777832, 13.968141555786133, 16.51580810546875, 19.063474655151367, 21.611141204833984, 24.15880584716797, 26.706472396850586, 29.254138946533203, 31.801803588867188, 34.34947204589844, 36.89713668823242, 39.444801330566406, 41.992469787597656, 44.54013442993164, 47.087799072265625, 49.635467529296875, 52.18313217163086, 54.730796813964844, 57.278465270996094]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 9.0, 10.0, 13.0, 15.0, 25.0, 26.0, 45.0, 59.0, 55.0, 79.0, 83.0, 92.0, 92.0, 83.0, 69.0, 59.0, 56.0, 41.0, 30.0, 25.0, 20.0, 15.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-89.35663604736328, -86.5654296875, -83.77422332763672, -80.98301696777344, -78.19181060791016, -75.40060424804688, -72.60939025878906, -69.81819152832031, -67.0269775390625, -64.23577117919922, -61.44456481933594, -58.653358459472656, -55.862152099609375, -53.070945739746094, -50.27973556518555, -47.488529205322266, -44.69732666015625, -41.90612030029297, -39.11491394042969, -36.323707580566406, -33.532501220703125, -30.74129295349121, -27.950084686279297, -25.158878326416016, -22.367671966552734, -19.576465606689453, -16.785259246826172, -13.994050979614258, -11.202844619750977, -8.411638259887695, -5.620429992675781, -2.8292236328125, -0.03802490234375, 2.7531819343566895, 5.544388771057129, 8.335596084594727, 11.126802444458008, 13.918008804321289, 16.709217071533203, 19.500423431396484, 22.291629791259766, 25.082836151123047, 27.874042510986328, 30.665250778198242, 33.456459045410156, 36.24766540527344, 39.03887176513672, 41.830078125, 44.62128448486328, 47.41249084472656, 50.203697204589844, 52.994903564453125, 55.786109924316406, 58.57731628417969, 61.368526458740234, 64.15972900390625, 66.95094299316406, 69.74214935302734, 72.53335571289062, 75.3245620727539, 78.11576843261719, 80.90697479248047, 83.69818115234375, 86.48939514160156, 89.28059387207031]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 4.0, 7.0, 11.0, 23.0, 26.0, 37.0, 62.0, 100.0, 162.0, 347.0, 650.0, 1391.0, 3697.0, 12347.0, 83807.0, 3899350.0, 166136.0, 17690.0, 4780.0, 1840.0, 826.0, 441.0, 204.0, 105.0, 62.0, 66.0, 30.0, 21.0, 11.0, 13.0, 10.0, 9.0, 3.0, 3.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0546875, -14.3890380859375, -13.723388671875, -13.0577392578125, -12.39208984375, -11.7264404296875, -11.060791015625, -10.3951416015625, -9.7294921875, -9.0638427734375, -8.398193359375, -7.7325439453125, -7.06689453125, -6.4012451171875, -5.735595703125, -5.0699462890625, -4.404296875, -3.7386474609375, -3.072998046875, -2.4073486328125, -1.74169921875, -1.0760498046875, -0.410400390625, 0.2552490234375, 0.9208984375, 1.5865478515625, 2.252197265625, 2.9178466796875, 3.58349609375, 4.2491455078125, 4.914794921875, 5.5804443359375, 6.24609375, 6.9117431640625, 7.577392578125, 8.2430419921875, 8.90869140625, 9.5743408203125, 10.239990234375, 10.9056396484375, 11.5712890625, 12.2369384765625, 12.902587890625, 13.5682373046875, 14.23388671875, 14.8995361328125, 15.565185546875, 16.2308349609375, 16.896484375, 17.5621337890625, 18.227783203125, 18.8934326171875, 19.55908203125, 20.2247314453125, 20.890380859375, 21.5560302734375, 22.2216796875, 22.8873291015625, 23.552978515625, 24.2186279296875, 24.88427734375, 25.5499267578125, 26.215576171875, 26.8812255859375, 27.546875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 6.0, 8.0, 13.0, 23.0, 29.0, 57.0, 74.0, 100.0, 102.0, 106.0, 129.0, 82.0, 89.0, 57.0, 48.0, 31.0, 19.0, 12.0, 7.0, 3.0, 3.0, 0.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.078125, -3.94140625, -3.8046875, -3.66796875, -3.53125, -3.39453125, -3.2578125, -3.12109375, -2.984375, -2.84765625, -2.7109375, -2.57421875, -2.4375, -2.30078125, -2.1640625, -2.02734375, -1.890625, -1.75390625, -1.6171875, -1.48046875, -1.34375, -1.20703125, -1.0703125, -0.93359375, -0.796875, -0.66015625, -0.5234375, -0.38671875, -0.25, -0.11328125, 0.0234375, 0.16015625, 0.296875, 0.43359375, 0.5703125, 0.70703125, 0.84375, 0.98046875, 1.1171875, 1.25390625, 1.390625, 1.52734375, 1.6640625, 1.80078125, 1.9375, 2.07421875, 2.2109375, 2.34765625, 2.484375, 2.62109375, 2.7578125, 2.89453125, 3.03125, 3.16796875, 3.3046875, 3.44140625, 3.578125, 3.71484375, 3.8515625, 3.98828125, 4.125, 4.26171875, 4.3984375, 4.53515625, 4.671875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 9.0, 12.0, 10.0, 22.0, 16.0, 35.0, 40.0, 76.0, 95.0, 161.0, 240.0, 431.0, 801.0, 1575.0, 3250.0, 7841.0, 23085.0, 112989.0, 3016098.0, 924865.0, 72479.0, 17970.0, 6591.0, 2725.0, 1222.0, 639.0, 368.0, 201.0, 131.0, 89.0, 66.0, 50.0, 35.0, 17.0, 21.0, 5.0, 4.0, 4.0, 4.0, 5.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.7265625, -12.3394775390625, -11.952392578125, -11.5653076171875, -11.17822265625, -10.7911376953125, -10.404052734375, -10.0169677734375, -9.6298828125, -9.2427978515625, -8.855712890625, -8.4686279296875, -8.08154296875, -7.6944580078125, -7.307373046875, -6.9202880859375, -6.533203125, -6.1461181640625, -5.759033203125, -5.3719482421875, -4.98486328125, -4.5977783203125, -4.210693359375, -3.8236083984375, -3.4365234375, -3.0494384765625, -2.662353515625, -2.2752685546875, -1.88818359375, -1.5010986328125, -1.114013671875, -0.7269287109375, -0.33984375, 0.0472412109375, 0.434326171875, 0.8214111328125, 1.20849609375, 1.5955810546875, 1.982666015625, 2.3697509765625, 2.7568359375, 3.1439208984375, 3.531005859375, 3.9180908203125, 4.30517578125, 4.6922607421875, 5.079345703125, 5.4664306640625, 5.853515625, 6.2406005859375, 6.627685546875, 7.0147705078125, 7.40185546875, 7.7889404296875, 8.176025390625, 8.5631103515625, 8.9501953125, 9.3372802734375, 9.724365234375, 10.1114501953125, 10.49853515625, 10.8856201171875, 11.272705078125, 11.6597900390625, 12.046875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 7.0, 8.0, 14.0, 21.0, 49.0, 79.0, 193.0, 654.0, 2098.0, 527.0, 188.0, 71.0, 44.0, 36.0, 19.0, 22.0, 10.0, 7.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.734375, -6.53289794921875, -6.3314208984375, -6.12994384765625, -5.928466796875, -5.72698974609375, -5.5255126953125, -5.32403564453125, -5.12255859375, -4.92108154296875, -4.7196044921875, -4.51812744140625, -4.316650390625, -4.11517333984375, -3.9136962890625, -3.71221923828125, -3.5107421875, -3.30926513671875, -3.1077880859375, -2.90631103515625, -2.704833984375, -2.50335693359375, -2.3018798828125, -2.10040283203125, -1.89892578125, -1.69744873046875, -1.4959716796875, -1.29449462890625, -1.093017578125, -0.89154052734375, -0.6900634765625, -0.48858642578125, -0.287109375, -0.08563232421875, 0.1158447265625, 0.31732177734375, 0.518798828125, 0.72027587890625, 0.9217529296875, 1.12322998046875, 1.32470703125, 1.52618408203125, 1.7276611328125, 1.92913818359375, 2.130615234375, 2.33209228515625, 2.5335693359375, 2.73504638671875, 2.9365234375, 3.13800048828125, 3.3394775390625, 3.54095458984375, 3.742431640625, 3.94390869140625, 4.1453857421875, 4.34686279296875, 4.54833984375, 4.74981689453125, 4.9512939453125, 5.15277099609375, 5.354248046875, 5.55572509765625, 5.7572021484375, 5.95867919921875, 6.16015625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 9.0, 15.0, 67.0, 223.0, 306.0, 240.0, 93.0, 34.0, 9.0, 7.0, 2.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-87.4576644897461, -85.57437133789062, -83.69107818603516, -81.80778503417969, -79.92449188232422, -78.04119873046875, -76.15791320800781, -74.27462005615234, -72.39132690429688, -70.5080337524414, -68.62474060058594, -66.74144744873047, -64.858154296875, -62.9748649597168, -61.09157180786133, -59.20827865600586, -57.32498550415039, -55.44169235229492, -53.55839920043945, -51.67510986328125, -49.79181671142578, -47.90852355957031, -46.025230407714844, -44.141937255859375, -42.258644104003906, -40.37535095214844, -38.49205780029297, -36.6087646484375, -34.7254753112793, -32.84218215942383, -30.95888900756836, -29.07559585571289, -27.192306518554688, -25.30901336669922, -23.425722122192383, -21.542428970336914, -19.659137725830078, -17.77584457397461, -15.89255142211914, -14.009259223937988, -12.125967025756836, -10.242674827575684, -8.359382629394531, -6.4760894775390625, -4.59279727935791, -2.709505081176758, -0.8262119293212891, 1.0570802688598633, 2.9403724670410156, 4.823664665222168, 6.7069573402404785, 8.590250015258789, 10.473542213439941, 12.356834411621094, 14.240127563476562, 16.12342071533203, 18.006711959838867, 19.890005111694336, 21.773296356201172, 23.65658950805664, 25.53988265991211, 27.423173904418945, 29.306467056274414, 31.18975830078125, 33.07305145263672]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 9.0, 24.0, 36.0, 43.0, 65.0, 71.0, 74.0, 81.0, 81.0, 113.0, 92.0, 81.0, 53.0, 54.0, 35.0, 31.0, 17.0, 18.0, 10.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.312828063964844, -33.473060607910156, -32.633296966552734, -31.793529510498047, -30.953763961791992, -30.113998413085938, -29.274232864379883, -28.434467315673828, -27.59469985961914, -26.754934310913086, -25.91516876220703, -25.075401306152344, -24.23563575744629, -23.395870208740234, -22.55610466003418, -21.716339111328125, -20.876571655273438, -20.036806106567383, -19.197040557861328, -18.35727310180664, -17.517507553100586, -16.67774200439453, -15.837976455688477, -14.998209953308105, -14.158445358276367, -13.318679809570312, -12.478913307189941, -11.639147758483887, -10.799381256103516, -9.959615707397461, -9.119850158691406, -8.280083656311035, -7.440317153930664, -6.600551128387451, -5.760785102844238, -4.921019554138184, -4.0812530517578125, -3.241487503051758, -2.401721477508545, -1.561955451965332, -0.7221894264221191, 0.11757653951644897, 0.9573425054550171, 1.7971084117889404, 2.6368744373321533, 3.476640224456787, 4.31640625, 5.156172275543213, 5.995938301086426, 6.835704326629639, 7.675470352172852, 8.515235900878906, 9.355002403259277, 10.194767951965332, 11.034534454345703, 11.874300003051758, 12.714065551757812, 13.553831100463867, 14.393597602844238, 15.233363151550293, 16.073129653930664, 16.91289520263672, 17.752660751342773, 18.592426300048828, 19.432193756103516]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 8.0, 7.0, 22.0, 35.0, 30.0, 52.0, 76.0, 89.0, 157.0, 248.0, 399.0, 643.0, 1227.0, 2347.0, 5046.0, 12691.0, 36180.0, 113865.0, 347826.0, 351552.0, 116091.0, 36576.0, 12922.0, 5058.0, 2388.0, 1211.0, 693.0, 409.0, 235.0, 137.0, 91.0, 83.0, 39.0, 27.0, 27.0, 24.0, 9.0, 6.0, 5.0, 11.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.2890625, -10.912841796875, -10.53662109375, -10.160400390625, -9.7841796875, -9.407958984375, -9.03173828125, -8.655517578125, -8.279296875, -7.903076171875, -7.52685546875, -7.150634765625, -6.7744140625, -6.398193359375, -6.02197265625, -5.645751953125, -5.26953125, -4.893310546875, -4.51708984375, -4.140869140625, -3.7646484375, -3.388427734375, -3.01220703125, -2.635986328125, -2.259765625, -1.883544921875, -1.50732421875, -1.131103515625, -0.7548828125, -0.378662109375, -0.00244140625, 0.373779296875, 0.75, 1.126220703125, 1.50244140625, 1.878662109375, 2.2548828125, 2.631103515625, 3.00732421875, 3.383544921875, 3.759765625, 4.135986328125, 4.51220703125, 4.888427734375, 5.2646484375, 5.640869140625, 6.01708984375, 6.393310546875, 6.76953125, 7.145751953125, 7.52197265625, 7.898193359375, 8.2744140625, 8.650634765625, 9.02685546875, 9.403076171875, 9.779296875, 10.155517578125, 10.53173828125, 10.907958984375, 11.2841796875, 11.660400390625, 12.03662109375, 12.412841796875, 12.7890625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 11.0, 10.0, 16.0, 26.0, 25.0, 58.0, 71.0, 79.0, 65.0, 83.0, 90.0, 97.0, 79.0, 73.0, 56.0, 42.0, 29.0, 30.0, 14.0, 19.0, 9.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.03515625, -3.92474365234375, -3.8143310546875, -3.70391845703125, -3.593505859375, -3.48309326171875, -3.3726806640625, -3.26226806640625, -3.15185546875, -3.04144287109375, -2.9310302734375, -2.82061767578125, -2.710205078125, -2.59979248046875, -2.4893798828125, -2.37896728515625, -2.2685546875, -2.15814208984375, -2.0477294921875, -1.93731689453125, -1.826904296875, -1.71649169921875, -1.6060791015625, -1.49566650390625, -1.38525390625, -1.27484130859375, -1.1644287109375, -1.05401611328125, -0.943603515625, -0.83319091796875, -0.7227783203125, -0.61236572265625, -0.501953125, -0.39154052734375, -0.2811279296875, -0.17071533203125, -0.060302734375, 0.05010986328125, 0.1605224609375, 0.27093505859375, 0.38134765625, 0.49176025390625, 0.6021728515625, 0.71258544921875, 0.822998046875, 0.93341064453125, 1.0438232421875, 1.15423583984375, 1.2646484375, 1.37506103515625, 1.4854736328125, 1.59588623046875, 1.706298828125, 1.81671142578125, 1.9271240234375, 2.03753662109375, 2.14794921875, 2.25836181640625, 2.3687744140625, 2.47918701171875, 2.589599609375, 2.70001220703125, 2.8104248046875, 2.92083740234375, 3.03125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 7.0, 3.0, 5.0, 8.0, 10.0, 24.0, 35.0, 52.0, 79.0, 147.0, 265.0, 566.0, 1481.0, 6934.0, 64676.0, 672824.0, 275161.0, 21369.0, 3147.0, 888.0, 388.0, 193.0, 104.0, 71.0, 41.0, 20.0, 22.0, 8.0, 13.0, 3.0, 12.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.1875, -26.50390625, -25.8203125, -25.13671875, -24.453125, -23.76953125, -23.0859375, -22.40234375, -21.71875, -21.03515625, -20.3515625, -19.66796875, -18.984375, -18.30078125, -17.6171875, -16.93359375, -16.25, -15.56640625, -14.8828125, -14.19921875, -13.515625, -12.83203125, -12.1484375, -11.46484375, -10.78125, -10.09765625, -9.4140625, -8.73046875, -8.046875, -7.36328125, -6.6796875, -5.99609375, -5.3125, -4.62890625, -3.9453125, -3.26171875, -2.578125, -1.89453125, -1.2109375, -0.52734375, 0.15625, 0.83984375, 1.5234375, 2.20703125, 2.890625, 3.57421875, 4.2578125, 4.94140625, 5.625, 6.30859375, 6.9921875, 7.67578125, 8.359375, 9.04296875, 9.7265625, 10.41015625, 11.09375, 11.77734375, 12.4609375, 13.14453125, 13.828125, 14.51171875, 15.1953125, 15.87890625, 16.5625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 8.0, 9.0, 4.0, 7.0, 10.0, 17.0, 9.0, 25.0, 29.0, 35.0, 30.0, 43.0, 31.0, 48.0, 37.0, 42.0, 55.0, 44.0, 54.0, 47.0, 35.0, 46.0, 48.0, 48.0, 32.0, 29.0, 31.0, 25.0, 24.0, 26.0, 21.0, 13.0, 15.0, 2.0, 8.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-10.484375, -10.1929931640625, -9.901611328125, -9.6102294921875, -9.31884765625, -9.0274658203125, -8.736083984375, -8.4447021484375, -8.1533203125, -7.8619384765625, -7.570556640625, -7.2791748046875, -6.98779296875, -6.6964111328125, -6.405029296875, -6.1136474609375, -5.822265625, -5.5308837890625, -5.239501953125, -4.9481201171875, -4.65673828125, -4.3653564453125, -4.073974609375, -3.7825927734375, -3.4912109375, -3.1998291015625, -2.908447265625, -2.6170654296875, -2.32568359375, -2.0343017578125, -1.742919921875, -1.4515380859375, -1.16015625, -0.8687744140625, -0.577392578125, -0.2860107421875, 0.00537109375, 0.2967529296875, 0.588134765625, 0.8795166015625, 1.1708984375, 1.4622802734375, 1.753662109375, 2.0450439453125, 2.33642578125, 2.6278076171875, 2.919189453125, 3.2105712890625, 3.501953125, 3.7933349609375, 4.084716796875, 4.3760986328125, 4.66748046875, 4.9588623046875, 5.250244140625, 5.5416259765625, 5.8330078125, 6.1243896484375, 6.415771484375, 6.7071533203125, 6.99853515625, 7.2899169921875, 7.581298828125, 7.8726806640625, 8.1640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 2.0, 2.0, 4.0, 4.0, 6.0, 10.0, 8.0, 19.0, 35.0, 31.0, 47.0, 109.0, 163.0, 271.0, 535.0, 1139.0, 2744.0, 7921.0, 31181.0, 185307.0, 618057.0, 161045.0, 27754.0, 7298.0, 2615.0, 1056.0, 509.0, 255.0, 165.0, 87.0, 72.0, 38.0, 17.0, 13.0, 14.0, 5.0, 5.0, 3.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.1171875, -6.89794921875, -6.6787109375, -6.45947265625, -6.240234375, -6.02099609375, -5.8017578125, -5.58251953125, -5.36328125, -5.14404296875, -4.9248046875, -4.70556640625, -4.486328125, -4.26708984375, -4.0478515625, -3.82861328125, -3.609375, -3.39013671875, -3.1708984375, -2.95166015625, -2.732421875, -2.51318359375, -2.2939453125, -2.07470703125, -1.85546875, -1.63623046875, -1.4169921875, -1.19775390625, -0.978515625, -0.75927734375, -0.5400390625, -0.32080078125, -0.1015625, 0.11767578125, 0.3369140625, 0.55615234375, 0.775390625, 0.99462890625, 1.2138671875, 1.43310546875, 1.65234375, 1.87158203125, 2.0908203125, 2.31005859375, 2.529296875, 2.74853515625, 2.9677734375, 3.18701171875, 3.40625, 3.62548828125, 3.8447265625, 4.06396484375, 4.283203125, 4.50244140625, 4.7216796875, 4.94091796875, 5.16015625, 5.37939453125, 5.5986328125, 5.81787109375, 6.037109375, 6.25634765625, 6.4755859375, 6.69482421875, 6.9140625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 15.0, 5.0, 12.0, 17.0, 18.0, 38.0, 40.0, 47.0, 84.0, 127.0, 196.0, 122.0, 87.0, 65.0, 33.0, 40.0, 23.0, 10.0, 12.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010662078857421875, -0.0010392367839813232, -0.001012265682220459, -0.0009852945804595947, -0.0009583234786987305, -0.0009313523769378662, -0.000904381275177002, -0.0008774101734161377, -0.0008504390716552734, -0.0008234679698944092, -0.0007964968681335449, -0.0007695257663726807, -0.0007425546646118164, -0.0007155835628509521, -0.0006886124610900879, -0.0006616413593292236, -0.0006346702575683594, -0.0006076991558074951, -0.0005807280540466309, -0.0005537569522857666, -0.0005267858505249023, -0.0004998147487640381, -0.00047284364700317383, -0.00044587254524230957, -0.0004189014434814453, -0.00039193034172058105, -0.0003649592399597168, -0.00033798813819885254, -0.0003110170364379883, -0.000284045934677124, -0.00025707483291625977, -0.0002301037311553955, -0.00020313262939453125, -0.000176161527633667, -0.00014919042587280273, -0.00012221932411193848, -9.524822235107422e-05, -6.827712059020996e-05, -4.13060188293457e-05, -1.4334917068481445e-05, 1.2636184692382812e-05, 3.960728645324707e-05, 6.657838821411133e-05, 9.354948997497559e-05, 0.00012052059173583984, 0.0001474916934967041, 0.00017446279525756836, 0.00020143389701843262, 0.00022840499877929688, 0.00025537610054016113, 0.0002823472023010254, 0.00030931830406188965, 0.0003362894058227539, 0.00036326050758361816, 0.0003902316093444824, 0.0004172027111053467, 0.00044417381286621094, 0.0004711449146270752, 0.0004981160163879395, 0.0005250871181488037, 0.000552058219909668, 0.0005790293216705322, 0.0006060004234313965, 0.0006329715251922607, 0.000659942626953125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 2.0, 6.0, 5.0, 5.0, 12.0, 26.0, 12.0, 21.0, 34.0, 52.0, 88.0, 123.0, 200.0, 325.0, 634.0, 1315.0, 3209.0, 9389.0, 40373.0, 288078.0, 589879.0, 88824.0, 17030.0, 5022.0, 1901.0, 853.0, 426.0, 219.0, 170.0, 94.0, 74.0, 38.0, 25.0, 23.0, 16.0, 17.0, 14.0, 1.0, 7.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.09375, -7.842529296875, -7.59130859375, -7.340087890625, -7.0888671875, -6.837646484375, -6.58642578125, -6.335205078125, -6.083984375, -5.832763671875, -5.58154296875, -5.330322265625, -5.0791015625, -4.827880859375, -4.57666015625, -4.325439453125, -4.07421875, -3.822998046875, -3.57177734375, -3.320556640625, -3.0693359375, -2.818115234375, -2.56689453125, -2.315673828125, -2.064453125, -1.813232421875, -1.56201171875, -1.310791015625, -1.0595703125, -0.808349609375, -0.55712890625, -0.305908203125, -0.0546875, 0.196533203125, 0.44775390625, 0.698974609375, 0.9501953125, 1.201416015625, 1.45263671875, 1.703857421875, 1.955078125, 2.206298828125, 2.45751953125, 2.708740234375, 2.9599609375, 3.211181640625, 3.46240234375, 3.713623046875, 3.96484375, 4.216064453125, 4.46728515625, 4.718505859375, 4.9697265625, 5.220947265625, 5.47216796875, 5.723388671875, 5.974609375, 6.225830078125, 6.47705078125, 6.728271484375, 6.9794921875, 7.230712890625, 7.48193359375, 7.733154296875, 7.984375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 9.0, 9.0, 12.0, 17.0, 21.0, 38.0, 41.0, 55.0, 70.0, 84.0, 88.0, 94.0, 110.0, 91.0, 67.0, 58.0, 39.0, 25.0, 24.0, 15.0, 8.0, 6.0, 9.0, 8.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.01953125, -4.8419189453125, -4.664306640625, -4.4866943359375, -4.30908203125, -4.1314697265625, -3.953857421875, -3.7762451171875, -3.5986328125, -3.4210205078125, -3.243408203125, -3.0657958984375, -2.88818359375, -2.7105712890625, -2.532958984375, -2.3553466796875, -2.177734375, -2.0001220703125, -1.822509765625, -1.6448974609375, -1.46728515625, -1.2896728515625, -1.112060546875, -0.9344482421875, -0.7568359375, -0.5792236328125, -0.401611328125, -0.2239990234375, -0.04638671875, 0.1312255859375, 0.308837890625, 0.4864501953125, 0.6640625, 0.8416748046875, 1.019287109375, 1.1968994140625, 1.37451171875, 1.5521240234375, 1.729736328125, 1.9073486328125, 2.0849609375, 2.2625732421875, 2.440185546875, 2.6177978515625, 2.79541015625, 2.9730224609375, 3.150634765625, 3.3282470703125, 3.505859375, 3.6834716796875, 3.861083984375, 4.0386962890625, 4.21630859375, 4.3939208984375, 4.571533203125, 4.7491455078125, 4.9267578125, 5.1043701171875, 5.281982421875, 5.4595947265625, 5.63720703125, 5.8148193359375, 5.992431640625, 6.1700439453125, 6.34765625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 8.0, 18.0, 46.0, 99.0, 191.0, 254.0, 187.0, 104.0, 56.0, 18.0, 6.0, 8.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.26921844482422, -75.263427734375, -71.25764465332031, -67.2518539428711, -63.246063232421875, -59.240272521972656, -55.2344856262207, -51.22869873046875, -47.22290802001953, -43.21711730957031, -39.21133041381836, -35.205543518066406, -31.199752807617188, -27.1939640045166, -23.188175201416016, -19.18238639831543, -15.176597595214844, -11.170808792114258, -7.165019989013672, -3.159231185913086, 0.8465576171875, 4.852346420288086, 8.858135223388672, 12.863924026489258, 16.869712829589844, 20.87550163269043, 24.881290435791016, 28.8870792388916, 32.89286804199219, 36.898658752441406, 40.90444564819336, 44.91023254394531, 48.916015625, 52.92180633544922, 56.92759323120117, 60.933380126953125, 64.93917083740234, 68.94496154785156, 72.95074462890625, 76.95653533935547, 80.96232604980469, 84.9681167602539, 88.97390747070312, 92.97969055175781, 96.98548126220703, 100.99127197265625, 104.99705505371094, 109.00284576416016, 113.00863647460938, 117.0144271850586, 121.02021789550781, 125.0260009765625, 129.03179931640625, 133.03758239746094, 137.04336547851562, 141.04916381835938, 145.05494689941406, 149.06072998046875, 153.0665283203125, 157.0723114013672, 161.07809448242188, 165.08389282226562, 169.0896759033203, 173.09547424316406, 177.10125732421875]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 6.0, 5.0, 9.0, 8.0, 14.0, 8.0, 17.0, 19.0, 26.0, 42.0, 46.0, 46.0, 50.0, 36.0, 63.0, 54.0, 58.0, 58.0, 60.0, 62.0, 40.0, 42.0, 45.0, 35.0, 30.0, 20.0, 26.0, 14.0, 11.0, 15.0, 11.0, 8.0, 4.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.68226623535156, -50.92022705078125, -49.15818405151367, -47.39614486694336, -45.63410186767578, -43.87206268310547, -42.11001968383789, -40.34798049926758, -38.5859375, -36.82389831542969, -35.06185531616211, -33.2998161315918, -31.53777313232422, -29.775733947753906, -28.013690948486328, -26.251651763916016, -24.48961067199707, -22.727569580078125, -20.96552848815918, -19.203487396240234, -17.44144630432129, -15.67940616607666, -13.917365074157715, -12.15532398223877, -10.393282890319824, -8.631241798400879, -6.869200706481934, -5.1071600914001465, -3.345118999481201, -1.583078384399414, 0.17896270751953125, 1.9410037994384766, 3.703044891357422, 5.465085983276367, 7.2271270751953125, 8.989168167114258, 10.751209259033203, 12.513249397277832, 14.275290489196777, 16.037330627441406, 17.799373626708984, 19.56141471862793, 21.323455810546875, 23.08549690246582, 24.847537994384766, 26.609577178955078, 28.371620178222656, 30.13365936279297, 31.895700454711914, 33.65774154663086, 35.41978073120117, 37.18182373046875, 38.94386291503906, 40.70590591430664, 42.46794509887695, 44.22998809814453, 45.992027282714844, 47.754066467285156, 49.516109466552734, 51.27814865112305, 53.040191650390625, 54.80223083496094, 56.564273834228516, 58.32631301879883, 60.088356018066406]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 3.0, 6.0, 14.0, 14.0, 13.0, 21.0, 24.0, 37.0, 49.0, 74.0, 104.0, 175.0, 279.0, 467.0, 811.0, 1566.0, 3082.0, 6984.0, 20442.0, 95988.0, 3488167.0, 506223.0, 46614.0, 12766.0, 4897.0, 2329.0, 1214.0, 675.0, 392.0, 295.0, 143.0, 107.0, 84.0, 59.0, 36.0, 32.0, 24.0, 16.0, 13.0, 9.0, 8.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.96875, -15.466552734375, -14.96435546875, -14.462158203125, -13.9599609375, -13.457763671875, -12.95556640625, -12.453369140625, -11.951171875, -11.448974609375, -10.94677734375, -10.444580078125, -9.9423828125, -9.440185546875, -8.93798828125, -8.435791015625, -7.93359375, -7.431396484375, -6.92919921875, -6.427001953125, -5.9248046875, -5.422607421875, -4.92041015625, -4.418212890625, -3.916015625, -3.413818359375, -2.91162109375, -2.409423828125, -1.9072265625, -1.405029296875, -0.90283203125, -0.400634765625, 0.1015625, 0.603759765625, 1.10595703125, 1.608154296875, 2.1103515625, 2.612548828125, 3.11474609375, 3.616943359375, 4.119140625, 4.621337890625, 5.12353515625, 5.625732421875, 6.1279296875, 6.630126953125, 7.13232421875, 7.634521484375, 8.13671875, 8.638916015625, 9.14111328125, 9.643310546875, 10.1455078125, 10.647705078125, 11.14990234375, 11.652099609375, 12.154296875, 12.656494140625, 13.15869140625, 13.660888671875, 14.1630859375, 14.665283203125, 15.16748046875, 15.669677734375, 16.171875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 13.0, 10.0, 17.0, 23.0, 29.0, 51.0, 57.0, 72.0, 86.0, 89.0, 93.0, 75.0, 100.0, 69.0, 60.0, 51.0, 32.0, 18.0, 15.0, 18.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.078125, -3.956787109375, -3.83544921875, -3.714111328125, -3.5927734375, -3.471435546875, -3.35009765625, -3.228759765625, -3.107421875, -2.986083984375, -2.86474609375, -2.743408203125, -2.6220703125, -2.500732421875, -2.37939453125, -2.258056640625, -2.13671875, -2.015380859375, -1.89404296875, -1.772705078125, -1.6513671875, -1.530029296875, -1.40869140625, -1.287353515625, -1.166015625, -1.044677734375, -0.92333984375, -0.802001953125, -0.6806640625, -0.559326171875, -0.43798828125, -0.316650390625, -0.1953125, -0.073974609375, 0.04736328125, 0.168701171875, 0.2900390625, 0.411376953125, 0.53271484375, 0.654052734375, 0.775390625, 0.896728515625, 1.01806640625, 1.139404296875, 1.2607421875, 1.382080078125, 1.50341796875, 1.624755859375, 1.74609375, 1.867431640625, 1.98876953125, 2.110107421875, 2.2314453125, 2.352783203125, 2.47412109375, 2.595458984375, 2.716796875, 2.838134765625, 2.95947265625, 3.080810546875, 3.2021484375, 3.323486328125, 3.44482421875, 3.566162109375, 3.6875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 7.0, 9.0, 14.0, 16.0, 19.0, 33.0, 41.0, 71.0, 97.0, 139.0, 180.0, 282.0, 418.0, 643.0, 1151.0, 2148.0, 4255.0, 9896.0, 27425.0, 111850.0, 1986901.0, 1889971.0, 111796.0, 27465.0, 10086.0, 4262.0, 2073.0, 1072.0, 650.0, 422.0, 255.0, 191.0, 127.0, 89.0, 70.0, 57.0, 35.0, 26.0, 8.0, 12.0, 8.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.125, -10.787841796875, -10.45068359375, -10.113525390625, -9.7763671875, -9.439208984375, -9.10205078125, -8.764892578125, -8.427734375, -8.090576171875, -7.75341796875, -7.416259765625, -7.0791015625, -6.741943359375, -6.40478515625, -6.067626953125, -5.73046875, -5.393310546875, -5.05615234375, -4.718994140625, -4.3818359375, -4.044677734375, -3.70751953125, -3.370361328125, -3.033203125, -2.696044921875, -2.35888671875, -2.021728515625, -1.6845703125, -1.347412109375, -1.01025390625, -0.673095703125, -0.3359375, 0.001220703125, 0.33837890625, 0.675537109375, 1.0126953125, 1.349853515625, 1.68701171875, 2.024169921875, 2.361328125, 2.698486328125, 3.03564453125, 3.372802734375, 3.7099609375, 4.047119140625, 4.38427734375, 4.721435546875, 5.05859375, 5.395751953125, 5.73291015625, 6.070068359375, 6.4072265625, 6.744384765625, 7.08154296875, 7.418701171875, 7.755859375, 8.093017578125, 8.43017578125, 8.767333984375, 9.1044921875, 9.441650390625, 9.77880859375, 10.115966796875, 10.453125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 7.0, 6.0, 9.0, 6.0, 9.0, 13.0, 22.0, 51.0, 75.0, 190.0, 590.0, 2070.0, 614.0, 170.0, 88.0, 59.0, 24.0, 25.0, 12.0, 12.0, 7.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.484375, -7.2305908203125, -6.976806640625, -6.7230224609375, -6.46923828125, -6.2154541015625, -5.961669921875, -5.7078857421875, -5.4541015625, -5.2003173828125, -4.946533203125, -4.6927490234375, -4.43896484375, -4.1851806640625, -3.931396484375, -3.6776123046875, -3.423828125, -3.1700439453125, -2.916259765625, -2.6624755859375, -2.40869140625, -2.1549072265625, -1.901123046875, -1.6473388671875, -1.3935546875, -1.1397705078125, -0.885986328125, -0.6322021484375, -0.37841796875, -0.1246337890625, 0.129150390625, 0.3829345703125, 0.63671875, 0.8905029296875, 1.144287109375, 1.3980712890625, 1.65185546875, 1.9056396484375, 2.159423828125, 2.4132080078125, 2.6669921875, 2.9207763671875, 3.174560546875, 3.4283447265625, 3.68212890625, 3.9359130859375, 4.189697265625, 4.4434814453125, 4.697265625, 4.9510498046875, 5.204833984375, 5.4586181640625, 5.71240234375, 5.9661865234375, 6.219970703125, 6.4737548828125, 6.7275390625, 6.9813232421875, 7.235107421875, 7.4888916015625, 7.74267578125, 7.9964599609375, 8.250244140625, 8.5040283203125, 8.7578125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 10.0, 22.0, 105.0, 255.0, 323.0, 197.0, 71.0, 13.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.9449462890625, -82.5320816040039, -80.11921691894531, -77.70635986328125, -75.29349517822266, -72.88063049316406, -70.46776580810547, -68.05490112304688, -65.64203643798828, -63.22917175292969, -60.81631088256836, -58.403446197509766, -55.99058151245117, -53.577720642089844, -51.16485595703125, -48.751991271972656, -46.33913040161133, -43.926265716552734, -41.513404846191406, -39.10054016113281, -36.68767547607422, -34.274810791015625, -31.861949920654297, -29.449085235595703, -27.036222457885742, -24.62335968017578, -22.210494995117188, -19.797632217407227, -17.384769439697266, -14.971904754638672, -12.559041976928711, -10.146177291870117, -7.733314514160156, -5.320450782775879, -2.9075875282287598, -0.4947242736816406, 1.9181394577026367, 4.331003189086914, 6.743865966796875, 9.156730651855469, 11.56959342956543, 13.982457160949707, 16.395320892333984, 18.808183670043945, 21.221046447753906, 23.6339111328125, 26.04677391052246, 28.459638595581055, 30.872501373291016, 33.28536605834961, 35.69822692871094, 38.11109161376953, 40.523956298828125, 42.93682098388672, 45.34968185424805, 47.76254653930664, 50.17540740966797, 52.58827209472656, 55.00113296508789, 57.413997650146484, 59.82686233520508, 62.239723205566406, 64.652587890625, 67.0654525756836, 69.47831726074219]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 14.0, 17.0, 27.0, 38.0, 61.0, 76.0, 98.0, 92.0, 107.0, 126.0, 80.0, 84.0, 61.0, 43.0, 29.0, 28.0, 12.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.38896179199219, -37.16796112060547, -35.94696044921875, -34.72595977783203, -33.50495910644531, -32.283958435058594, -31.062959671020508, -29.84195899963379, -28.62095832824707, -27.39995765686035, -26.178956985473633, -24.957956314086914, -23.736957550048828, -22.51595687866211, -21.29495620727539, -20.073955535888672, -18.852954864501953, -17.631954193115234, -16.410953521728516, -15.189953804016113, -13.968953132629395, -12.747952461242676, -11.526952743530273, -10.305952072143555, -9.084951400756836, -7.863950729370117, -6.642950534820557, -5.421950340270996, -4.200949668884277, -2.9799489974975586, -1.758948802947998, -0.5379486083984375, 0.6830482482910156, 1.9040486812591553, 3.125049114227295, 4.3460493087768555, 5.567049980163574, 6.788050651550293, 8.009050369262695, 9.230051040649414, 10.451051712036133, 11.672052383422852, 12.89305305480957, 14.114052772521973, 15.335053443908691, 16.556053161621094, 17.777053833007812, 18.99805450439453, 20.21905517578125, 21.44005584716797, 22.661056518554688, 23.882057189941406, 25.103057861328125, 26.324058532714844, 27.54505729675293, 28.76605796813965, 29.987058639526367, 31.208059310913086, 32.42905807495117, 33.65005874633789, 34.87105941772461, 36.09206008911133, 37.31306076049805, 38.534061431884766, 39.755062103271484]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 9.0, 18.0, 15.0, 23.0, 41.0, 62.0, 103.0, 150.0, 273.0, 434.0, 718.0, 1377.0, 2911.0, 6729.0, 18323.0, 62125.0, 327444.0, 505146.0, 84442.0, 22924.0, 8173.0, 3415.0, 1648.0, 802.0, 435.0, 245.0, 163.0, 111.0, 88.0, 70.0, 40.0, 17.0, 17.0, 10.0, 15.0, 8.0, 6.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.0546875, -14.61328125, -14.171875, -13.73046875, -13.2890625, -12.84765625, -12.40625, -11.96484375, -11.5234375, -11.08203125, -10.640625, -10.19921875, -9.7578125, -9.31640625, -8.875, -8.43359375, -7.9921875, -7.55078125, -7.109375, -6.66796875, -6.2265625, -5.78515625, -5.34375, -4.90234375, -4.4609375, -4.01953125, -3.578125, -3.13671875, -2.6953125, -2.25390625, -1.8125, -1.37109375, -0.9296875, -0.48828125, -0.046875, 0.39453125, 0.8359375, 1.27734375, 1.71875, 2.16015625, 2.6015625, 3.04296875, 3.484375, 3.92578125, 4.3671875, 4.80859375, 5.25, 5.69140625, 6.1328125, 6.57421875, 7.015625, 7.45703125, 7.8984375, 8.33984375, 8.78125, 9.22265625, 9.6640625, 10.10546875, 10.546875, 10.98828125, 11.4296875, 11.87109375, 12.3125, 12.75390625, 13.1953125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 9.0, 10.0, 14.0, 18.0, 28.0, 43.0, 49.0, 92.0, 55.0, 86.0, 82.0, 112.0, 87.0, 61.0, 69.0, 50.0, 35.0, 28.0, 18.0, 15.0, 11.0, 9.0, 8.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.05859375, -3.942840576171875, -3.82708740234375, -3.711334228515625, -3.5955810546875, -3.479827880859375, -3.36407470703125, -3.248321533203125, -3.132568359375, -3.016815185546875, -2.90106201171875, -2.785308837890625, -2.6695556640625, -2.553802490234375, -2.43804931640625, -2.322296142578125, -2.20654296875, -2.090789794921875, -1.97503662109375, -1.859283447265625, -1.7435302734375, -1.627777099609375, -1.51202392578125, -1.396270751953125, -1.280517578125, -1.164764404296875, -1.04901123046875, -0.933258056640625, -0.8175048828125, -0.701751708984375, -0.58599853515625, -0.470245361328125, -0.3544921875, -0.238739013671875, -0.12298583984375, -0.007232666015625, 0.1085205078125, 0.224273681640625, 0.34002685546875, 0.455780029296875, 0.571533203125, 0.687286376953125, 0.80303955078125, 0.918792724609375, 1.0345458984375, 1.150299072265625, 1.26605224609375, 1.381805419921875, 1.49755859375, 1.613311767578125, 1.72906494140625, 1.844818115234375, 1.9605712890625, 2.076324462890625, 2.19207763671875, 2.307830810546875, 2.423583984375, 2.539337158203125, 2.65509033203125, 2.770843505859375, 2.8865966796875, 3.002349853515625, 3.11810302734375, 3.233856201171875, 3.349609375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 5.0, 15.0, 18.0, 18.0, 27.0, 60.0, 65.0, 121.0, 254.0, 515.0, 1449.0, 5697.0, 46605.0, 804783.0, 171898.0, 12990.0, 2455.0, 806.0, 343.0, 149.0, 91.0, 57.0, 28.0, 19.0, 20.0, 13.0, 17.0, 8.0, 4.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-26.328125, -25.54736328125, -24.7666015625, -23.98583984375, -23.205078125, -22.42431640625, -21.6435546875, -20.86279296875, -20.08203125, -19.30126953125, -18.5205078125, -17.73974609375, -16.958984375, -16.17822265625, -15.3974609375, -14.61669921875, -13.8359375, -13.05517578125, -12.2744140625, -11.49365234375, -10.712890625, -9.93212890625, -9.1513671875, -8.37060546875, -7.58984375, -6.80908203125, -6.0283203125, -5.24755859375, -4.466796875, -3.68603515625, -2.9052734375, -2.12451171875, -1.34375, -0.56298828125, 0.2177734375, 0.99853515625, 1.779296875, 2.56005859375, 3.3408203125, 4.12158203125, 4.90234375, 5.68310546875, 6.4638671875, 7.24462890625, 8.025390625, 8.80615234375, 9.5869140625, 10.36767578125, 11.1484375, 11.92919921875, 12.7099609375, 13.49072265625, 14.271484375, 15.05224609375, 15.8330078125, 16.61376953125, 17.39453125, 18.17529296875, 18.9560546875, 19.73681640625, 20.517578125, 21.29833984375, 22.0791015625, 22.85986328125, 23.640625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 4.0, 2.0, 9.0, 10.0, 10.0, 14.0, 18.0, 27.0, 19.0, 26.0, 43.0, 47.0, 49.0, 50.0, 62.0, 72.0, 54.0, 57.0, 55.0, 65.0, 69.0, 49.0, 42.0, 26.0, 21.0, 21.0, 23.0, 20.0, 13.0, 8.0, 6.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.71875, -10.325927734375, -9.93310546875, -9.540283203125, -9.1474609375, -8.754638671875, -8.36181640625, -7.968994140625, -7.576171875, -7.183349609375, -6.79052734375, -6.397705078125, -6.0048828125, -5.612060546875, -5.21923828125, -4.826416015625, -4.43359375, -4.040771484375, -3.64794921875, -3.255126953125, -2.8623046875, -2.469482421875, -2.07666015625, -1.683837890625, -1.291015625, -0.898193359375, -0.50537109375, -0.112548828125, 0.2802734375, 0.673095703125, 1.06591796875, 1.458740234375, 1.8515625, 2.244384765625, 2.63720703125, 3.030029296875, 3.4228515625, 3.815673828125, 4.20849609375, 4.601318359375, 4.994140625, 5.386962890625, 5.77978515625, 6.172607421875, 6.5654296875, 6.958251953125, 7.35107421875, 7.743896484375, 8.13671875, 8.529541015625, 8.92236328125, 9.315185546875, 9.7080078125, 10.100830078125, 10.49365234375, 10.886474609375, 11.279296875, 11.672119140625, 12.06494140625, 12.457763671875, 12.8505859375, 13.243408203125, 13.63623046875, 14.029052734375, 14.421875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 2.0, 2.0, 9.0, 14.0, 17.0, 16.0, 16.0, 32.0, 44.0, 67.0, 147.0, 177.0, 325.0, 587.0, 1101.0, 2428.0, 7149.0, 43345.0, 726034.0, 238489.0, 20129.0, 4553.0, 1782.0, 889.0, 470.0, 258.0, 148.0, 90.0, 71.0, 51.0, 26.0, 15.0, 18.0, 15.0, 8.0, 12.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0703125, -9.7435302734375, -9.416748046875, -9.0899658203125, -8.76318359375, -8.4364013671875, -8.109619140625, -7.7828369140625, -7.4560546875, -7.1292724609375, -6.802490234375, -6.4757080078125, -6.14892578125, -5.8221435546875, -5.495361328125, -5.1685791015625, -4.841796875, -4.5150146484375, -4.188232421875, -3.8614501953125, -3.53466796875, -3.2078857421875, -2.881103515625, -2.5543212890625, -2.2275390625, -1.9007568359375, -1.573974609375, -1.2471923828125, -0.92041015625, -0.5936279296875, -0.266845703125, 0.0599365234375, 0.38671875, 0.7135009765625, 1.040283203125, 1.3670654296875, 1.69384765625, 2.0206298828125, 2.347412109375, 2.6741943359375, 3.0009765625, 3.3277587890625, 3.654541015625, 3.9813232421875, 4.30810546875, 4.6348876953125, 4.961669921875, 5.2884521484375, 5.615234375, 5.9420166015625, 6.268798828125, 6.5955810546875, 6.92236328125, 7.2491455078125, 7.575927734375, 7.9027099609375, 8.2294921875, 8.5562744140625, 8.883056640625, 9.2098388671875, 9.53662109375, 9.8634033203125, 10.190185546875, 10.5169677734375, 10.84375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 5.0, 11.0, 14.0, 16.0, 20.0, 11.0, 22.0, 19.0, 39.0, 38.0, 170.0, 270.0, 119.0, 56.0, 38.0, 23.0, 17.0, 17.0, 12.0, 18.0, 6.0, 14.0, 8.0, 4.0, 3.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0008330345153808594, -0.0008094832301139832, -0.0007859319448471069, -0.0007623806595802307, -0.0007388293743133545, -0.0007152780890464783, -0.000691726803779602, -0.0006681755185127258, -0.0006446242332458496, -0.0006210729479789734, -0.0005975216627120972, -0.000573970377445221, -0.0005504190921783447, -0.0005268678069114685, -0.0005033165216445923, -0.00047976523637771606, -0.00045621395111083984, -0.0004326626658439636, -0.0004091113805770874, -0.0003855600953102112, -0.00036200881004333496, -0.00033845752477645874, -0.0003149062395095825, -0.0002913549542427063, -0.0002678036689758301, -0.00024425238370895386, -0.00022070109844207764, -0.00019714981317520142, -0.0001735985279083252, -0.00015004724264144897, -0.00012649595737457275, -0.00010294467210769653, -7.939338684082031e-05, -5.584210157394409e-05, -3.229081630706787e-05, -8.73953104019165e-06, 1.481175422668457e-05, 3.836303949356079e-05, 6.191432476043701e-05, 8.546561002731323e-05, 0.00010901689529418945, 0.00013256818056106567, 0.0001561194658279419, 0.00017967075109481812, 0.00020322203636169434, 0.00022677332162857056, 0.0002503246068954468, 0.000273875892162323, 0.0002974271774291992, 0.00032097846269607544, 0.00034452974796295166, 0.0003680810332298279, 0.0003916323184967041, 0.0004151836037635803, 0.00043873488903045654, 0.00046228617429733276, 0.000485837459564209, 0.0005093887448310852, 0.0005329400300979614, 0.0005564913153648376, 0.0005800426006317139, 0.0006035938858985901, 0.0006271451711654663, 0.0006506964564323425, 0.0006742477416992188]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 3.0, 5.0, 13.0, 22.0, 28.0, 42.0, 70.0, 172.0, 391.0, 792.0, 2342.0, 14920.0, 805832.0, 213150.0, 7872.0, 1706.0, 599.0, 280.0, 140.0, 78.0, 28.0, 19.0, 19.0, 8.0, 4.0, 2.0, 5.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.6875, -17.003662109375, -16.31982421875, -15.635986328125, -14.9521484375, -14.268310546875, -13.58447265625, -12.900634765625, -12.216796875, -11.532958984375, -10.84912109375, -10.165283203125, -9.4814453125, -8.797607421875, -8.11376953125, -7.429931640625, -6.74609375, -6.062255859375, -5.37841796875, -4.694580078125, -4.0107421875, -3.326904296875, -2.64306640625, -1.959228515625, -1.275390625, -0.591552734375, 0.09228515625, 0.776123046875, 1.4599609375, 2.143798828125, 2.82763671875, 3.511474609375, 4.1953125, 4.879150390625, 5.56298828125, 6.246826171875, 6.9306640625, 7.614501953125, 8.29833984375, 8.982177734375, 9.666015625, 10.349853515625, 11.03369140625, 11.717529296875, 12.4013671875, 13.085205078125, 13.76904296875, 14.452880859375, 15.13671875, 15.820556640625, 16.50439453125, 17.188232421875, 17.8720703125, 18.555908203125, 19.23974609375, 19.923583984375, 20.607421875, 21.291259765625, 21.97509765625, 22.658935546875, 23.3427734375, 24.026611328125, 24.71044921875, 25.394287109375, 26.078125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 11.0, 11.0, 13.0, 20.0, 38.0, 52.0, 106.0, 210.0, 242.0, 104.0, 68.0, 38.0, 16.0, 11.0, 9.0, 7.0, 4.0, 7.0, 3.0, 3.0, 2.0, 3.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0390625, -12.6319580078125, -12.224853515625, -11.8177490234375, -11.41064453125, -11.0035400390625, -10.596435546875, -10.1893310546875, -9.7822265625, -9.3751220703125, -8.968017578125, -8.5609130859375, -8.15380859375, -7.7467041015625, -7.339599609375, -6.9324951171875, -6.525390625, -6.1182861328125, -5.711181640625, -5.3040771484375, -4.89697265625, -4.4898681640625, -4.082763671875, -3.6756591796875, -3.2685546875, -2.8614501953125, -2.454345703125, -2.0472412109375, -1.64013671875, -1.2330322265625, -0.825927734375, -0.4188232421875, -0.01171875, 0.3953857421875, 0.802490234375, 1.2095947265625, 1.61669921875, 2.0238037109375, 2.430908203125, 2.8380126953125, 3.2451171875, 3.6522216796875, 4.059326171875, 4.4664306640625, 4.87353515625, 5.2806396484375, 5.687744140625, 6.0948486328125, 6.501953125, 6.9090576171875, 7.316162109375, 7.7232666015625, 8.13037109375, 8.5374755859375, 8.944580078125, 9.3516845703125, 9.7587890625, 10.1658935546875, 10.572998046875, 10.9801025390625, 11.38720703125, 11.7943115234375, 12.201416015625, 12.6085205078125, 13.015625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 17.0, 60.0, 228.0, 389.0, 230.0, 52.0, 22.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-352.475830078125, -345.645751953125, -338.815673828125, -331.985595703125, -325.155517578125, -318.3254089355469, -311.4953308105469, -304.6652526855469, -297.8351745605469, -291.0050964355469, -284.1750183105469, -277.3449401855469, -270.51483154296875, -263.68475341796875, -256.85467529296875, -250.02459716796875, -243.19451904296875, -236.36444091796875, -229.53436279296875, -222.7042694091797, -215.8741912841797, -209.0441131591797, -202.21401977539062, -195.38394165039062, -188.55386352539062, -181.72378540039062, -174.89370727539062, -168.06361389160156, -161.23353576660156, -154.40345764160156, -147.5733642578125, -140.7432861328125, -133.9132080078125, -127.0831298828125, -120.25304412841797, -113.42295837402344, -106.59288024902344, -99.76280212402344, -92.9327163696289, -86.10263061523438, -79.2725601196289, -72.44247436523438, -65.61239624023438, -58.78231430053711, -51.952232360839844, -45.12215042114258, -38.29206848144531, -31.461986541748047, -24.63190460205078, -17.801822662353516, -10.97174072265625, -4.141658782958984, 2.6884231567382812, 9.518505096435547, 16.348587036132812, 23.178668975830078, 30.008750915527344, 36.83883285522461, 43.668914794921875, 50.49899673461914, 57.329078674316406, 64.15916442871094, 70.98924255371094, 77.81932067871094, 84.64940643310547]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 8.0, 7.0, 13.0, 22.0, 17.0, 30.0, 33.0, 40.0, 28.0, 44.0, 55.0, 58.0, 52.0, 46.0, 64.0, 71.0, 70.0, 64.0, 48.0, 47.0, 36.0, 27.0, 24.0, 29.0, 15.0, 13.0, 15.0, 6.0, 10.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.13520812988281, -67.0077133178711, -64.88021850585938, -62.752723693847656, -60.62522888183594, -58.49773406982422, -56.370243072509766, -54.24274826049805, -52.11525344848633, -49.98775863647461, -47.86026382446289, -45.73276901245117, -43.60527801513672, -41.477783203125, -39.35028839111328, -37.22279357910156, -35.095298767089844, -32.967803955078125, -30.840309143066406, -28.71281623840332, -26.5853214263916, -24.457826614379883, -22.330333709716797, -20.202838897705078, -18.07534408569336, -15.94784927368164, -13.820355415344238, -11.692861557006836, -9.565366744995117, -7.437871932983398, -5.310378074645996, -3.1828842163085938, -1.055389404296875, 1.0721049308776855, 3.199599266052246, 5.327093601226807, 7.454587936401367, 9.582082748413086, 11.709576606750488, 13.83707046508789, 15.96456527709961, 18.092060089111328, 20.219554901123047, 22.347047805786133, 24.47454261779785, 26.60203742980957, 28.729530334472656, 30.857025146484375, 32.984519958496094, 35.11201477050781, 37.23950958251953, 39.36700439453125, 41.49449920654297, 43.62199401855469, 45.74948501586914, 47.87697982788086, 50.00447463989258, 52.1319694519043, 54.259464263916016, 56.386959075927734, 58.51445007324219, 60.641944885253906, 62.769439697265625, 64.89693450927734, 67.02442932128906]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 5.0, 3.0, 15.0, 11.0, 20.0, 48.0, 54.0, 90.0, 147.0, 345.0, 1243.0, 6768.0, 121817.0, 4029583.0, 29018.0, 3516.0, 882.0, 349.0, 133.0, 85.0, 47.0, 37.0, 22.0, 16.0, 11.0, 6.0, 6.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.09375, -39.69140625, -38.2890625, -36.88671875, -35.484375, -34.08203125, -32.6796875, -31.27734375, -29.875, -28.47265625, -27.0703125, -25.66796875, -24.265625, -22.86328125, -21.4609375, -20.05859375, -18.65625, -17.25390625, -15.8515625, -14.44921875, -13.046875, -11.64453125, -10.2421875, -8.83984375, -7.4375, -6.03515625, -4.6328125, -3.23046875, -1.828125, -0.42578125, 0.9765625, 2.37890625, 3.78125, 5.18359375, 6.5859375, 7.98828125, 9.390625, 10.79296875, 12.1953125, 13.59765625, 15.0, 16.40234375, 17.8046875, 19.20703125, 20.609375, 22.01171875, 23.4140625, 24.81640625, 26.21875, 27.62109375, 29.0234375, 30.42578125, 31.828125, 33.23046875, 34.6328125, 36.03515625, 37.4375, 38.83984375, 40.2421875, 41.64453125, 43.046875, 44.44921875, 45.8515625, 47.25390625, 48.65625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 6.0, 12.0, 10.0, 17.0, 29.0, 35.0, 57.0, 79.0, 79.0, 102.0, 94.0, 83.0, 94.0, 67.0, 66.0, 44.0, 34.0, 33.0, 16.0, 10.0, 10.0, 7.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25390625, -4.12518310546875, -3.9964599609375, -3.86773681640625, -3.739013671875, -3.61029052734375, -3.4815673828125, -3.35284423828125, -3.22412109375, -3.09539794921875, -2.9666748046875, -2.83795166015625, -2.709228515625, -2.58050537109375, -2.4517822265625, -2.32305908203125, -2.1943359375, -2.06561279296875, -1.9368896484375, -1.80816650390625, -1.679443359375, -1.55072021484375, -1.4219970703125, -1.29327392578125, -1.16455078125, -1.03582763671875, -0.9071044921875, -0.77838134765625, -0.649658203125, -0.52093505859375, -0.3922119140625, -0.26348876953125, -0.134765625, -0.00604248046875, 0.1226806640625, 0.25140380859375, 0.380126953125, 0.50885009765625, 0.6375732421875, 0.76629638671875, 0.89501953125, 1.02374267578125, 1.1524658203125, 1.28118896484375, 1.409912109375, 1.53863525390625, 1.6673583984375, 1.79608154296875, 1.9248046875, 2.05352783203125, 2.1822509765625, 2.31097412109375, 2.439697265625, 2.56842041015625, 2.6971435546875, 2.82586669921875, 2.95458984375, 3.08331298828125, 3.2120361328125, 3.34075927734375, 3.469482421875, 3.59820556640625, 3.7269287109375, 3.85565185546875, 3.984375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 9.0, 9.0, 16.0, 21.0, 24.0, 37.0, 56.0, 61.0, 92.0, 141.0, 217.0, 337.0, 665.0, 1470.0, 4122.0, 15232.0, 89908.0, 3506648.0, 525058.0, 37104.0, 8286.0, 2549.0, 952.0, 433.0, 253.0, 171.0, 124.0, 72.0, 59.0, 50.0, 31.0, 21.0, 22.0, 18.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.5, -16.98193359375, -16.4638671875, -15.94580078125, -15.427734375, -14.90966796875, -14.3916015625, -13.87353515625, -13.35546875, -12.83740234375, -12.3193359375, -11.80126953125, -11.283203125, -10.76513671875, -10.2470703125, -9.72900390625, -9.2109375, -8.69287109375, -8.1748046875, -7.65673828125, -7.138671875, -6.62060546875, -6.1025390625, -5.58447265625, -5.06640625, -4.54833984375, -4.0302734375, -3.51220703125, -2.994140625, -2.47607421875, -1.9580078125, -1.43994140625, -0.921875, -0.40380859375, 0.1142578125, 0.63232421875, 1.150390625, 1.66845703125, 2.1865234375, 2.70458984375, 3.22265625, 3.74072265625, 4.2587890625, 4.77685546875, 5.294921875, 5.81298828125, 6.3310546875, 6.84912109375, 7.3671875, 7.88525390625, 8.4033203125, 8.92138671875, 9.439453125, 9.95751953125, 10.4755859375, 10.99365234375, 11.51171875, 12.02978515625, 12.5478515625, 13.06591796875, 13.583984375, 14.10205078125, 14.6201171875, 15.13818359375, 15.65625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 11.0, 10.0, 17.0, 41.0, 82.0, 176.0, 793.0, 2304.0, 424.0, 93.0, 47.0, 24.0, 19.0, 12.0, 9.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.79296875, -7.50726318359375, -7.2215576171875, -6.93585205078125, -6.650146484375, -6.36444091796875, -6.0787353515625, -5.79302978515625, -5.50732421875, -5.22161865234375, -4.9359130859375, -4.65020751953125, -4.364501953125, -4.07879638671875, -3.7930908203125, -3.50738525390625, -3.2216796875, -2.93597412109375, -2.6502685546875, -2.36456298828125, -2.078857421875, -1.79315185546875, -1.5074462890625, -1.22174072265625, -0.93603515625, -0.65032958984375, -0.3646240234375, -0.07891845703125, 0.206787109375, 0.49249267578125, 0.7781982421875, 1.06390380859375, 1.349609375, 1.63531494140625, 1.9210205078125, 2.20672607421875, 2.492431640625, 2.77813720703125, 3.0638427734375, 3.34954833984375, 3.63525390625, 3.92095947265625, 4.2066650390625, 4.49237060546875, 4.778076171875, 5.06378173828125, 5.3494873046875, 5.63519287109375, 5.9208984375, 6.20660400390625, 6.4923095703125, 6.77801513671875, 7.063720703125, 7.34942626953125, 7.6351318359375, 7.92083740234375, 8.20654296875, 8.49224853515625, 8.7779541015625, 9.06365966796875, 9.349365234375, 9.63507080078125, 9.9207763671875, 10.20648193359375, 10.4921875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 19.0, 50.0, 153.0, 267.0, 296.0, 145.0, 50.0, 13.0, 7.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.16471481323242, -44.06044006347656, -41.95616149902344, -39.85188293457031, -37.74760818481445, -35.643333435058594, -33.53905487060547, -31.434778213500977, -29.330501556396484, -27.226224899291992, -25.1219482421875, -23.017671585083008, -20.913394927978516, -18.809118270874023, -16.70484161376953, -14.600564956665039, -12.496288299560547, -10.392011642456055, -8.287734985351562, -6.18345832824707, -4.079181671142578, -1.974905014038086, 0.12937164306640625, 2.2336483001708984, 4.337924957275391, 6.442201614379883, 8.546478271484375, 10.650754928588867, 12.75503158569336, 14.859308242797852, 16.963584899902344, 19.067861557006836, 21.172142028808594, 23.276418685913086, 25.380695343017578, 27.48497200012207, 29.589248657226562, 31.693525314331055, 33.79780197143555, 35.902076721191406, 38.00635528564453, 40.110633850097656, 42.214908599853516, 44.319183349609375, 46.4234619140625, 48.527740478515625, 50.632015228271484, 52.736289978027344, 54.84056854248047, 56.944847106933594, 59.04912185668945, 61.15339660644531, 63.25767517089844, 65.36195373535156, 67.46623229980469, 69.57050323486328, 71.6747817993164, 73.77906036376953, 75.88333129882812, 77.98760986328125, 80.09188842773438, 82.1961669921875, 84.30044555664062, 86.40471649169922, 88.50899505615234]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 5.0, 12.0, 30.0, 32.0, 30.0, 66.0, 49.0, 70.0, 70.0, 80.0, 70.0, 72.0, 71.0, 62.0, 62.0, 50.0, 48.0, 41.0, 20.0, 12.0, 19.0, 10.0, 8.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.1035041809082, -31.309825897216797, -30.51614761352539, -29.722469329833984, -28.928789138793945, -28.13511085510254, -27.341432571411133, -26.547754287719727, -25.754074096679688, -24.96039581298828, -24.166717529296875, -23.37303924560547, -22.57935905456543, -21.785680770874023, -20.992002487182617, -20.19832420349121, -19.404645919799805, -18.6109676361084, -17.817289352416992, -17.023609161376953, -16.229930877685547, -15.43625259399414, -14.642574310302734, -13.848896026611328, -13.055216789245605, -12.2615385055542, -11.467859268188477, -10.67418098449707, -9.880502700805664, -9.086823463439941, -8.293145179748535, -7.499466419219971, -6.705789566040039, -5.912110805511475, -5.11843204498291, -4.324753761291504, -3.5310750007629395, -2.737396240234375, -1.9437179565429688, -1.1500391960144043, -0.35636043548583984, 0.43731820583343506, 1.23099684715271, 2.0246753692626953, 2.8183541297912598, 3.612032890319824, 4.4057111740112305, 5.199389934539795, 5.993068695068359, 6.786747455596924, 7.580426216125488, 8.374104499816895, 9.167783737182617, 9.961462020874023, 10.75514030456543, 11.548818588256836, 12.342497825622559, 13.136176109313965, 13.929855346679688, 14.723533630371094, 15.5172119140625, 16.310890197753906, 17.104568481445312, 17.89824867248535, 18.691926956176758]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 8.0, 8.0, 13.0, 19.0, 28.0, 48.0, 87.0, 159.0, 235.0, 415.0, 887.0, 1890.0, 4715.0, 16204.0, 72632.0, 560115.0, 321466.0, 50521.0, 11856.0, 3936.0, 1636.0, 781.0, 358.0, 212.0, 126.0, 66.0, 44.0, 32.0, 23.0, 9.0, 10.0, 2.0, 4.0, 5.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.046875, -19.50341796875, -18.9599609375, -18.41650390625, -17.873046875, -17.32958984375, -16.7861328125, -16.24267578125, -15.69921875, -15.15576171875, -14.6123046875, -14.06884765625, -13.525390625, -12.98193359375, -12.4384765625, -11.89501953125, -11.3515625, -10.80810546875, -10.2646484375, -9.72119140625, -9.177734375, -8.63427734375, -8.0908203125, -7.54736328125, -7.00390625, -6.46044921875, -5.9169921875, -5.37353515625, -4.830078125, -4.28662109375, -3.7431640625, -3.19970703125, -2.65625, -2.11279296875, -1.5693359375, -1.02587890625, -0.482421875, 0.06103515625, 0.6044921875, 1.14794921875, 1.69140625, 2.23486328125, 2.7783203125, 3.32177734375, 3.865234375, 4.40869140625, 4.9521484375, 5.49560546875, 6.0390625, 6.58251953125, 7.1259765625, 7.66943359375, 8.212890625, 8.75634765625, 9.2998046875, 9.84326171875, 10.38671875, 10.93017578125, 11.4736328125, 12.01708984375, 12.560546875, 13.10400390625, 13.6474609375, 14.19091796875, 14.734375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 8.0, 9.0, 16.0, 20.0, 29.0, 35.0, 60.0, 75.0, 83.0, 78.0, 99.0, 71.0, 82.0, 81.0, 56.0, 42.0, 31.0, 35.0, 26.0, 14.0, 11.0, 11.0, 4.0, 5.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.3203125, -4.200897216796875, -4.08148193359375, -3.962066650390625, -3.8426513671875, -3.723236083984375, -3.60382080078125, -3.484405517578125, -3.364990234375, -3.245574951171875, -3.12615966796875, -3.006744384765625, -2.8873291015625, -2.767913818359375, -2.64849853515625, -2.529083251953125, -2.40966796875, -2.290252685546875, -2.17083740234375, -2.051422119140625, -1.9320068359375, -1.812591552734375, -1.69317626953125, -1.573760986328125, -1.454345703125, -1.334930419921875, -1.21551513671875, -1.096099853515625, -0.9766845703125, -0.857269287109375, -0.73785400390625, -0.618438720703125, -0.4990234375, -0.379608154296875, -0.26019287109375, -0.140777587890625, -0.0213623046875, 0.098052978515625, 0.21746826171875, 0.336883544921875, 0.456298828125, 0.575714111328125, 0.69512939453125, 0.814544677734375, 0.9339599609375, 1.053375244140625, 1.17279052734375, 1.292205810546875, 1.41162109375, 1.531036376953125, 1.65045166015625, 1.769866943359375, 1.8892822265625, 2.008697509765625, 2.12811279296875, 2.247528076171875, 2.366943359375, 2.486358642578125, 2.60577392578125, 2.725189208984375, 2.8446044921875, 2.964019775390625, 3.08343505859375, 3.202850341796875, 3.322265625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 2.0, 10.0, 10.0, 9.0, 22.0, 26.0, 37.0, 38.0, 68.0, 98.0, 154.0, 230.0, 362.0, 626.0, 1117.0, 2311.0, 4956.0, 11517.0, 29057.0, 80155.0, 279950.0, 454499.0, 114425.0, 40589.0, 15496.0, 6553.0, 2856.0, 1433.0, 760.0, 413.0, 243.0, 155.0, 108.0, 71.0, 49.0, 44.0, 29.0, 17.0, 20.0, 6.0, 7.0, 6.0, 6.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.54296875, -7.29290771484375, -7.0428466796875, -6.79278564453125, -6.542724609375, -6.29266357421875, -6.0426025390625, -5.79254150390625, -5.54248046875, -5.29241943359375, -5.0423583984375, -4.79229736328125, -4.542236328125, -4.29217529296875, -4.0421142578125, -3.79205322265625, -3.5419921875, -3.29193115234375, -3.0418701171875, -2.79180908203125, -2.541748046875, -2.29168701171875, -2.0416259765625, -1.79156494140625, -1.54150390625, -1.29144287109375, -1.0413818359375, -0.79132080078125, -0.541259765625, -0.29119873046875, -0.0411376953125, 0.20892333984375, 0.458984375, 0.70904541015625, 0.9591064453125, 1.20916748046875, 1.459228515625, 1.70928955078125, 1.9593505859375, 2.20941162109375, 2.45947265625, 2.70953369140625, 2.9595947265625, 3.20965576171875, 3.459716796875, 3.70977783203125, 3.9598388671875, 4.20989990234375, 4.4599609375, 4.71002197265625, 4.9600830078125, 5.21014404296875, 5.460205078125, 5.71026611328125, 5.9603271484375, 6.21038818359375, 6.46044921875, 6.71051025390625, 6.9605712890625, 7.21063232421875, 7.460693359375, 7.71075439453125, 7.9608154296875, 8.21087646484375, 8.4609375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 8.0, 6.0, 15.0, 11.0, 21.0, 11.0, 21.0, 26.0, 17.0, 27.0, 28.0, 39.0, 38.0, 33.0, 34.0, 48.0, 58.0, 54.0, 38.0, 45.0, 50.0, 39.0, 39.0, 30.0, 38.0, 35.0, 23.0, 26.0, 23.0, 12.0, 18.0, 19.0, 14.0, 9.0, 9.0, 4.0, 10.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.2734375, -8.99267578125, -8.7119140625, -8.43115234375, -8.150390625, -7.86962890625, -7.5888671875, -7.30810546875, -7.02734375, -6.74658203125, -6.4658203125, -6.18505859375, -5.904296875, -5.62353515625, -5.3427734375, -5.06201171875, -4.78125, -4.50048828125, -4.2197265625, -3.93896484375, -3.658203125, -3.37744140625, -3.0966796875, -2.81591796875, -2.53515625, -2.25439453125, -1.9736328125, -1.69287109375, -1.412109375, -1.13134765625, -0.8505859375, -0.56982421875, -0.2890625, -0.00830078125, 0.2724609375, 0.55322265625, 0.833984375, 1.11474609375, 1.3955078125, 1.67626953125, 1.95703125, 2.23779296875, 2.5185546875, 2.79931640625, 3.080078125, 3.36083984375, 3.6416015625, 3.92236328125, 4.203125, 4.48388671875, 4.7646484375, 5.04541015625, 5.326171875, 5.60693359375, 5.8876953125, 6.16845703125, 6.44921875, 6.72998046875, 7.0107421875, 7.29150390625, 7.572265625, 7.85302734375, 8.1337890625, 8.41455078125, 8.6953125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 1.0, 5.0, 4.0, 1.0, 3.0, 4.0, 9.0, 12.0, 11.0, 23.0, 29.0, 43.0, 78.0, 111.0, 189.0, 359.0, 619.0, 1333.0, 2807.0, 7600.0, 22888.0, 84273.0, 403252.0, 404508.0, 84288.0, 23049.0, 7384.0, 2823.0, 1275.0, 664.0, 335.0, 224.0, 125.0, 72.0, 50.0, 34.0, 14.0, 16.0, 8.0, 7.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.572265625, -3.46063232421875, -3.3489990234375, -3.23736572265625, -3.125732421875, -3.01409912109375, -2.9024658203125, -2.79083251953125, -2.67919921875, -2.56756591796875, -2.4559326171875, -2.34429931640625, -2.232666015625, -2.12103271484375, -2.0093994140625, -1.89776611328125, -1.7861328125, -1.67449951171875, -1.5628662109375, -1.45123291015625, -1.339599609375, -1.22796630859375, -1.1163330078125, -1.00469970703125, -0.89306640625, -0.78143310546875, -0.6697998046875, -0.55816650390625, -0.446533203125, -0.33489990234375, -0.2232666015625, -0.11163330078125, 0.0, 0.11163330078125, 0.2232666015625, 0.33489990234375, 0.446533203125, 0.55816650390625, 0.6697998046875, 0.78143310546875, 0.89306640625, 1.00469970703125, 1.1163330078125, 1.22796630859375, 1.339599609375, 1.45123291015625, 1.5628662109375, 1.67449951171875, 1.7861328125, 1.89776611328125, 2.0093994140625, 2.12103271484375, 2.232666015625, 2.34429931640625, 2.4559326171875, 2.56756591796875, 2.67919921875, 2.79083251953125, 2.9024658203125, 3.01409912109375, 3.125732421875, 3.23736572265625, 3.3489990234375, 3.46063232421875, 3.572265625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 5.0, 5.0, 6.0, 4.0, 9.0, 13.0, 17.0, 17.0, 23.0, 26.0, 54.0, 93.0, 219.0, 214.0, 99.0, 49.0, 24.0, 23.0, 22.0, 11.0, 9.0, 14.0, 5.0, 7.0, 8.0, 5.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003807544708251953, -0.000362638384103775, -0.00034452229738235474, -0.00032640621066093445, -0.00030829012393951416, -0.00029017403721809387, -0.0002720579504966736, -0.0002539418637752533, -0.000235825777053833, -0.00021770969033241272, -0.00019959360361099243, -0.00018147751688957214, -0.00016336143016815186, -0.00014524534344673157, -0.00012712925672531128, -0.00010901317000389099, -9.08970832824707e-05, -7.278099656105042e-05, -5.466490983963013e-05, -3.654882311820984e-05, -1.843273639678955e-05, -3.166496753692627e-07, 1.7799437046051025e-05, 3.5915523767471313e-05, 5.40316104888916e-05, 7.214769721031189e-05, 9.026378393173218e-05, 0.00010837987065315247, 0.00012649595737457275, 0.00014461204409599304, 0.00016272813081741333, 0.00018084421753883362, 0.0001989603042602539, 0.0002170763909816742, 0.00023519247770309448, 0.00025330856442451477, 0.00027142465114593506, 0.00028954073786735535, 0.00030765682458877563, 0.0003257729113101959, 0.0003438889980316162, 0.0003620050847530365, 0.0003801211714744568, 0.0003982372581958771, 0.00041635334491729736, 0.00043446943163871765, 0.00045258551836013794, 0.00047070160508155823, 0.0004888176918029785, 0.0005069337785243988, 0.0005250498652458191, 0.0005431659519672394, 0.0005612820386886597, 0.00057939812541008, 0.0005975142121315002, 0.0006156302988529205, 0.0006337463855743408, 0.0006518624722957611, 0.0006699785590171814, 0.0006880946457386017, 0.000706210732460022, 0.0007243268191814423, 0.0007424429059028625, 0.0007605589926242828, 0.0007786750793457031]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 10.0, 14.0, 32.0, 41.0, 53.0, 104.0, 159.0, 302.0, 642.0, 1450.0, 3541.0, 10300.0, 37945.0, 186309.0, 607173.0, 153155.0, 32414.0, 9089.0, 3150.0, 1393.0, 587.0, 283.0, 163.0, 81.0, 52.0, 36.0, 28.0, 15.0, 7.0, 12.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.26953125, -3.13006591796875, -2.9906005859375, -2.85113525390625, -2.711669921875, -2.57220458984375, -2.4327392578125, -2.29327392578125, -2.15380859375, -2.01434326171875, -1.8748779296875, -1.73541259765625, -1.595947265625, -1.45648193359375, -1.3170166015625, -1.17755126953125, -1.0380859375, -0.89862060546875, -0.7591552734375, -0.61968994140625, -0.480224609375, -0.34075927734375, -0.2012939453125, -0.06182861328125, 0.07763671875, 0.21710205078125, 0.3565673828125, 0.49603271484375, 0.635498046875, 0.77496337890625, 0.9144287109375, 1.05389404296875, 1.193359375, 1.33282470703125, 1.4722900390625, 1.61175537109375, 1.751220703125, 1.89068603515625, 2.0301513671875, 2.16961669921875, 2.30908203125, 2.44854736328125, 2.5880126953125, 2.72747802734375, 2.866943359375, 3.00640869140625, 3.1458740234375, 3.28533935546875, 3.4248046875, 3.56427001953125, 3.7037353515625, 3.84320068359375, 3.982666015625, 4.12213134765625, 4.2615966796875, 4.40106201171875, 4.54052734375, 4.67999267578125, 4.8194580078125, 4.95892333984375, 5.098388671875, 5.23785400390625, 5.3773193359375, 5.51678466796875, 5.65625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 5.0, 1.0, 1.0, 4.0, 6.0, 3.0, 8.0, 11.0, 13.0, 19.0, 22.0, 30.0, 49.0, 50.0, 76.0, 105.0, 148.0, 121.0, 81.0, 56.0, 47.0, 45.0, 26.0, 20.0, 10.0, 11.0, 12.0, 7.0, 6.0, 4.0, 2.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.232421875, -3.089996337890625, -2.94757080078125, -2.805145263671875, -2.6627197265625, -2.520294189453125, -2.37786865234375, -2.235443115234375, -2.093017578125, -1.950592041015625, -1.80816650390625, -1.665740966796875, -1.5233154296875, -1.380889892578125, -1.23846435546875, -1.096038818359375, -0.95361328125, -0.811187744140625, -0.66876220703125, -0.526336669921875, -0.3839111328125, -0.241485595703125, -0.09906005859375, 0.043365478515625, 0.185791015625, 0.328216552734375, 0.47064208984375, 0.613067626953125, 0.7554931640625, 0.897918701171875, 1.04034423828125, 1.182769775390625, 1.3251953125, 1.467620849609375, 1.61004638671875, 1.752471923828125, 1.8948974609375, 2.037322998046875, 2.17974853515625, 2.322174072265625, 2.464599609375, 2.607025146484375, 2.74945068359375, 2.891876220703125, 3.0343017578125, 3.176727294921875, 3.31915283203125, 3.461578369140625, 3.60400390625, 3.746429443359375, 3.88885498046875, 4.031280517578125, 4.1737060546875, 4.316131591796875, 4.45855712890625, 4.600982666015625, 4.743408203125, 4.885833740234375, 5.02825927734375, 5.170684814453125, 5.3131103515625, 5.455535888671875, 5.59796142578125, 5.740386962890625, 5.8828125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 10.0, 11.0, 16.0, 34.0, 26.0, 42.0, 76.0, 93.0, 104.0, 134.0, 117.0, 111.0, 64.0, 55.0, 34.0, 23.0, 14.0, 12.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-70.6212158203125, -68.93730926513672, -67.2533950805664, -65.56948852539062, -63.88557815551758, -62.2016716003418, -60.51776123046875, -58.83385467529297, -57.14994430541992, -55.466033935546875, -53.782127380371094, -52.09821701049805, -50.414306640625, -48.73040008544922, -47.04648971557617, -45.362579345703125, -43.678672790527344, -41.9947624206543, -40.310855865478516, -38.62694549560547, -36.94303512573242, -35.25912857055664, -33.575218200683594, -31.89130973815918, -30.2073974609375, -28.523488998413086, -26.83957862854004, -25.155670166015625, -23.47176170349121, -21.787853240966797, -20.10394287109375, -18.420034408569336, -16.736125946044922, -15.052216529846191, -13.368308067321777, -11.684398651123047, -10.000490188598633, -8.316580772399902, -6.632671356201172, -4.948762893676758, -3.2648534774780273, -1.5809444189071655, 0.10296463966369629, 1.7868738174438477, 3.47078275680542, 5.154691696166992, 6.838601112365723, 8.522509574890137, 10.206418991088867, 11.890328407287598, 13.574236869812012, 15.258146286010742, 16.942054748535156, 18.625965118408203, 20.309873580932617, 21.99378204345703, 23.677692413330078, 25.361600875854492, 27.04551124572754, 28.729419708251953, 30.413328170776367, 32.09723663330078, 33.78114700317383, 35.465057373046875, 37.148963928222656]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 9.0, 7.0, 6.0, 7.0, 15.0, 11.0, 15.0, 22.0, 23.0, 28.0, 39.0, 35.0, 37.0, 49.0, 55.0, 54.0, 44.0, 48.0, 54.0, 40.0, 43.0, 60.0, 31.0, 37.0, 43.0, 37.0, 38.0, 24.0, 18.0, 18.0, 18.0, 13.0, 7.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.81719970703125, -40.212703704833984, -38.60820770263672, -37.00370788574219, -35.39921188354492, -33.794715881347656, -32.19021987915039, -30.585723876953125, -28.981225967407227, -27.37672996520996, -25.772232055664062, -24.167736053466797, -22.56324005126953, -20.958742141723633, -19.354246139526367, -17.74974822998047, -16.145252227783203, -14.540755271911621, -12.936258316040039, -11.331762313842773, -9.727265357971191, -8.12276840209961, -6.518272399902344, -4.913775444030762, -3.3092784881591797, -1.7047817707061768, -0.10028505325317383, 1.50421142578125, 3.108708381652832, 4.713205337524414, 6.31770133972168, 7.922198295593262, 9.526691436767578, 11.13118839263916, 12.735685348510742, 14.340181350708008, 15.94467830657959, 17.549175262451172, 19.153671264648438, 20.758167266845703, 22.3626651763916, 23.967161178588867, 25.571659088134766, 27.17615509033203, 28.780651092529297, 30.385149002075195, 31.98964500427246, 33.59414291381836, 35.198638916015625, 36.80313491821289, 38.407630920410156, 40.01213073730469, 41.61662673950195, 43.22112274169922, 44.825618743896484, 46.43011474609375, 48.03461456298828, 49.63911056518555, 51.24360656738281, 52.848106384277344, 54.45260238647461, 56.057098388671875, 57.66159439086914, 59.266090393066406, 60.87058639526367]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 8.0, 12.0, 10.0, 16.0, 21.0, 41.0, 46.0, 110.0, 135.0, 244.0, 493.0, 997.0, 2404.0, 7183.0, 30602.0, 471167.0, 3605964.0, 57018.0, 11093.0, 3591.0, 1452.0, 733.0, 374.0, 190.0, 130.0, 87.0, 50.0, 34.0, 32.0, 12.0, 10.0, 10.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.0, -22.1533203125, -21.306640625, -20.4599609375, -19.61328125, -18.7666015625, -17.919921875, -17.0732421875, -16.2265625, -15.3798828125, -14.533203125, -13.6865234375, -12.83984375, -11.9931640625, -11.146484375, -10.2998046875, -9.453125, -8.6064453125, -7.759765625, -6.9130859375, -6.06640625, -5.2197265625, -4.373046875, -3.5263671875, -2.6796875, -1.8330078125, -0.986328125, -0.1396484375, 0.70703125, 1.5537109375, 2.400390625, 3.2470703125, 4.09375, 4.9404296875, 5.787109375, 6.6337890625, 7.48046875, 8.3271484375, 9.173828125, 10.0205078125, 10.8671875, 11.7138671875, 12.560546875, 13.4072265625, 14.25390625, 15.1005859375, 15.947265625, 16.7939453125, 17.640625, 18.4873046875, 19.333984375, 20.1806640625, 21.02734375, 21.8740234375, 22.720703125, 23.5673828125, 24.4140625, 25.2607421875, 26.107421875, 26.9541015625, 27.80078125, 28.6474609375, 29.494140625, 30.3408203125, 31.1875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 9.0, 10.0, 10.0, 31.0, 35.0, 56.0, 65.0, 79.0, 85.0, 92.0, 97.0, 75.0, 67.0, 63.0, 55.0, 46.0, 35.0, 30.0, 13.0, 13.0, 6.0, 8.0, 5.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.328125, -4.19488525390625, -4.0616455078125, -3.92840576171875, -3.795166015625, -3.66192626953125, -3.5286865234375, -3.39544677734375, -3.26220703125, -3.12896728515625, -2.9957275390625, -2.86248779296875, -2.729248046875, -2.59600830078125, -2.4627685546875, -2.32952880859375, -2.1962890625, -2.06304931640625, -1.9298095703125, -1.79656982421875, -1.663330078125, -1.53009033203125, -1.3968505859375, -1.26361083984375, -1.13037109375, -0.99713134765625, -0.8638916015625, -0.73065185546875, -0.597412109375, -0.46417236328125, -0.3309326171875, -0.19769287109375, -0.064453125, 0.06878662109375, 0.2020263671875, 0.33526611328125, 0.468505859375, 0.60174560546875, 0.7349853515625, 0.86822509765625, 1.00146484375, 1.13470458984375, 1.2679443359375, 1.40118408203125, 1.534423828125, 1.66766357421875, 1.8009033203125, 1.93414306640625, 2.0673828125, 2.20062255859375, 2.3338623046875, 2.46710205078125, 2.600341796875, 2.73358154296875, 2.8668212890625, 3.00006103515625, 3.13330078125, 3.26654052734375, 3.3997802734375, 3.53302001953125, 3.666259765625, 3.79949951171875, 3.9327392578125, 4.06597900390625, 4.19921875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 4.0, 2.0, 5.0, 6.0, 13.0, 14.0, 22.0, 28.0, 46.0, 63.0, 118.0, 166.0, 259.0, 422.0, 633.0, 1102.0, 2025.0, 3847.0, 8029.0, 19285.0, 58664.0, 299652.0, 3340233.0, 356380.0, 64850.0, 20781.0, 8483.0, 4053.0, 2124.0, 1186.0, 647.0, 409.0, 249.0, 170.0, 106.0, 68.0, 47.0, 35.0, 25.0, 10.0, 10.0, 10.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.5546875, -10.239990234375, -9.92529296875, -9.610595703125, -9.2958984375, -8.981201171875, -8.66650390625, -8.351806640625, -8.037109375, -7.722412109375, -7.40771484375, -7.093017578125, -6.7783203125, -6.463623046875, -6.14892578125, -5.834228515625, -5.51953125, -5.204833984375, -4.89013671875, -4.575439453125, -4.2607421875, -3.946044921875, -3.63134765625, -3.316650390625, -3.001953125, -2.687255859375, -2.37255859375, -2.057861328125, -1.7431640625, -1.428466796875, -1.11376953125, -0.799072265625, -0.484375, -0.169677734375, 0.14501953125, 0.459716796875, 0.7744140625, 1.089111328125, 1.40380859375, 1.718505859375, 2.033203125, 2.347900390625, 2.66259765625, 2.977294921875, 3.2919921875, 3.606689453125, 3.92138671875, 4.236083984375, 4.55078125, 4.865478515625, 5.18017578125, 5.494873046875, 5.8095703125, 6.124267578125, 6.43896484375, 6.753662109375, 7.068359375, 7.383056640625, 7.69775390625, 8.012451171875, 8.3271484375, 8.641845703125, 8.95654296875, 9.271240234375, 9.5859375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 5.0, 4.0, 12.0, 5.0, 9.0, 13.0, 20.0, 15.0, 32.0, 58.0, 78.0, 196.0, 412.0, 1853.0, 786.0, 239.0, 120.0, 71.0, 34.0, 21.0, 25.0, 8.0, 12.0, 9.0, 5.0, 6.0, 3.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.34765625, -6.1748046875, -6.001953125, -5.8291015625, -5.65625, -5.4833984375, -5.310546875, -5.1376953125, -4.96484375, -4.7919921875, -4.619140625, -4.4462890625, -4.2734375, -4.1005859375, -3.927734375, -3.7548828125, -3.58203125, -3.4091796875, -3.236328125, -3.0634765625, -2.890625, -2.7177734375, -2.544921875, -2.3720703125, -2.19921875, -2.0263671875, -1.853515625, -1.6806640625, -1.5078125, -1.3349609375, -1.162109375, -0.9892578125, -0.81640625, -0.6435546875, -0.470703125, -0.2978515625, -0.125, 0.0478515625, 0.220703125, 0.3935546875, 0.56640625, 0.7392578125, 0.912109375, 1.0849609375, 1.2578125, 1.4306640625, 1.603515625, 1.7763671875, 1.94921875, 2.1220703125, 2.294921875, 2.4677734375, 2.640625, 2.8134765625, 2.986328125, 3.1591796875, 3.33203125, 3.5048828125, 3.677734375, 3.8505859375, 4.0234375, 4.1962890625, 4.369140625, 4.5419921875, 4.71484375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 6.0, 10.0, 15.0, 44.0, 54.0, 94.0, 144.0, 193.0, 175.0, 101.0, 77.0, 42.0, 18.0, 9.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.78074645996094, -35.65587615966797, -34.531005859375, -33.40613555908203, -32.28126525878906, -31.156394958496094, -30.031524658203125, -28.906654357910156, -27.781784057617188, -26.65691375732422, -25.53204345703125, -24.40717315673828, -23.282302856445312, -22.157432556152344, -21.032562255859375, -19.907691955566406, -18.782821655273438, -17.65795135498047, -16.5330810546875, -15.408210754394531, -14.283340454101562, -13.158470153808594, -12.033599853515625, -10.908729553222656, -9.783859252929688, -8.658988952636719, -7.53411865234375, -6.409248352050781, -5.2843780517578125, -4.159507751464844, -3.034637451171875, -1.9097671508789062, -0.7848968505859375, 0.33997344970703125, 1.46484375, 2.5897140502929688, 3.7145843505859375, 4.839454650878906, 5.964324951171875, 7.089195251464844, 8.214065551757812, 9.338935852050781, 10.46380615234375, 11.588676452636719, 12.713546752929688, 13.838417053222656, 14.963287353515625, 16.088157653808594, 17.213027954101562, 18.33789825439453, 19.4627685546875, 20.58763885498047, 21.712509155273438, 22.837379455566406, 23.962249755859375, 25.087120056152344, 26.211990356445312, 27.33686065673828, 28.46173095703125, 29.58660125732422, 30.711471557617188, 31.836341857910156, 32.961212158203125, 34.086082458496094, 35.21095275878906]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 7.0, 6.0, 16.0, 19.0, 23.0, 31.0, 29.0, 38.0, 43.0, 55.0, 70.0, 59.0, 73.0, 74.0, 67.0, 63.0, 61.0, 67.0, 42.0, 40.0, 28.0, 33.0, 25.0, 12.0, 8.0, 7.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.62228775024414, -29.81966209411621, -29.01703453063965, -28.21440887451172, -27.411781311035156, -26.609155654907227, -25.806529998779297, -25.003902435302734, -24.201276779174805, -23.398651123046875, -22.596023559570312, -21.793397903442383, -20.99077033996582, -20.18814468383789, -19.385517120361328, -18.5828914642334, -17.78026580810547, -16.97764015197754, -16.175012588500977, -15.372386932373047, -14.5697603225708, -13.767133712768555, -12.964507102966309, -12.161880493164062, -11.3592529296875, -10.556626319885254, -9.753999710083008, -8.951374053955078, -8.148747444152832, -7.346120834350586, -6.54349422454834, -5.740868091583252, -4.938241958618164, -4.135615348815918, -3.33298921585083, -2.530362606048584, -1.727736234664917, -0.92510986328125, -0.1224832534790039, 0.680142879486084, 1.48276948928833, 2.285395860671997, 3.088022232055664, 3.89064884185791, 4.693275451660156, 5.495901584625244, 6.29852819442749, 7.101154327392578, 7.903780937194824, 8.70640754699707, 9.509034156799316, 10.311660766601562, 11.114286422729492, 11.916913032531738, 12.719539642333984, 13.522165298461914, 14.324792861938477, 15.127419471740723, 15.930046081542969, 16.7326717376709, 17.53529930114746, 18.33792495727539, 19.140552520751953, 19.943178176879883, 20.745803833007812]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 4.0, 11.0, 6.0, 17.0, 21.0, 34.0, 45.0, 77.0, 118.0, 213.0, 326.0, 552.0, 1018.0, 1860.0, 3842.0, 9505.0, 29307.0, 101891.0, 336977.0, 384941.0, 122479.0, 35130.0, 11071.0, 4494.0, 1971.0, 1117.0, 641.0, 345.0, 194.0, 103.0, 78.0, 53.0, 40.0, 22.0, 14.0, 11.0, 5.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.5859375, -10.179931640625, -9.77392578125, -9.367919921875, -8.9619140625, -8.555908203125, -8.14990234375, -7.743896484375, -7.337890625, -6.931884765625, -6.52587890625, -6.119873046875, -5.7138671875, -5.307861328125, -4.90185546875, -4.495849609375, -4.08984375, -3.683837890625, -3.27783203125, -2.871826171875, -2.4658203125, -2.059814453125, -1.65380859375, -1.247802734375, -0.841796875, -0.435791015625, -0.02978515625, 0.376220703125, 0.7822265625, 1.188232421875, 1.59423828125, 2.000244140625, 2.40625, 2.812255859375, 3.21826171875, 3.624267578125, 4.0302734375, 4.436279296875, 4.84228515625, 5.248291015625, 5.654296875, 6.060302734375, 6.46630859375, 6.872314453125, 7.2783203125, 7.684326171875, 8.09033203125, 8.496337890625, 8.90234375, 9.308349609375, 9.71435546875, 10.120361328125, 10.5263671875, 10.932373046875, 11.33837890625, 11.744384765625, 12.150390625, 12.556396484375, 12.96240234375, 13.368408203125, 13.7744140625, 14.180419921875, 14.58642578125, 14.992431640625, 15.3984375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 7.0, 6.0, 5.0, 13.0, 10.0, 21.0, 34.0, 49.0, 64.0, 52.0, 74.0, 84.0, 72.0, 85.0, 69.0, 67.0, 55.0, 56.0, 42.0, 40.0, 26.0, 20.0, 15.0, 8.0, 10.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.52734375, -4.40264892578125, -4.2779541015625, -4.15325927734375, -4.028564453125, -3.90386962890625, -3.7791748046875, -3.65447998046875, -3.52978515625, -3.40509033203125, -3.2803955078125, -3.15570068359375, -3.031005859375, -2.90631103515625, -2.7816162109375, -2.65692138671875, -2.5322265625, -2.40753173828125, -2.2828369140625, -2.15814208984375, -2.033447265625, -1.90875244140625, -1.7840576171875, -1.65936279296875, -1.53466796875, -1.40997314453125, -1.2852783203125, -1.16058349609375, -1.035888671875, -0.91119384765625, -0.7864990234375, -0.66180419921875, -0.537109375, -0.41241455078125, -0.2877197265625, -0.16302490234375, -0.038330078125, 0.08636474609375, 0.2110595703125, 0.33575439453125, 0.46044921875, 0.58514404296875, 0.7098388671875, 0.83453369140625, 0.959228515625, 1.08392333984375, 1.2086181640625, 1.33331298828125, 1.4580078125, 1.58270263671875, 1.7073974609375, 1.83209228515625, 1.956787109375, 2.08148193359375, 2.2061767578125, 2.33087158203125, 2.45556640625, 2.58026123046875, 2.7049560546875, 2.82965087890625, 2.954345703125, 3.07904052734375, 3.2037353515625, 3.32843017578125, 3.453125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 9.0, 12.0, 13.0, 12.0, 18.0, 29.0, 45.0, 66.0, 89.0, 144.0, 203.0, 275.0, 452.0, 823.0, 1827.0, 6502.0, 45840.0, 462614.0, 472210.0, 46813.0, 6496.0, 1801.0, 826.0, 444.0, 264.0, 217.0, 138.0, 109.0, 82.0, 48.0, 35.0, 23.0, 14.0, 15.0, 11.0, 7.0, 7.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.5, -16.916748046875, -16.33349609375, -15.750244140625, -15.1669921875, -14.583740234375, -14.00048828125, -13.417236328125, -12.833984375, -12.250732421875, -11.66748046875, -11.084228515625, -10.5009765625, -9.917724609375, -9.33447265625, -8.751220703125, -8.16796875, -7.584716796875, -7.00146484375, -6.418212890625, -5.8349609375, -5.251708984375, -4.66845703125, -4.085205078125, -3.501953125, -2.918701171875, -2.33544921875, -1.752197265625, -1.1689453125, -0.585693359375, -0.00244140625, 0.580810546875, 1.1640625, 1.747314453125, 2.33056640625, 2.913818359375, 3.4970703125, 4.080322265625, 4.66357421875, 5.246826171875, 5.830078125, 6.413330078125, 6.99658203125, 7.579833984375, 8.1630859375, 8.746337890625, 9.32958984375, 9.912841796875, 10.49609375, 11.079345703125, 11.66259765625, 12.245849609375, 12.8291015625, 13.412353515625, 13.99560546875, 14.578857421875, 15.162109375, 15.745361328125, 16.32861328125, 16.911865234375, 17.4951171875, 18.078369140625, 18.66162109375, 19.244873046875, 19.828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 9.0, 6.0, 10.0, 11.0, 10.0, 16.0, 23.0, 15.0, 28.0, 35.0, 27.0, 31.0, 38.0, 47.0, 45.0, 39.0, 53.0, 56.0, 54.0, 48.0, 48.0, 41.0, 52.0, 44.0, 33.0, 28.0, 26.0, 25.0, 22.0, 10.0, 20.0, 11.0, 7.0, 12.0, 7.0, 5.0, 1.0, 1.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.5078125, -13.1177978515625, -12.727783203125, -12.3377685546875, -11.94775390625, -11.5577392578125, -11.167724609375, -10.7777099609375, -10.3876953125, -9.9976806640625, -9.607666015625, -9.2176513671875, -8.82763671875, -8.4376220703125, -8.047607421875, -7.6575927734375, -7.267578125, -6.8775634765625, -6.487548828125, -6.0975341796875, -5.70751953125, -5.3175048828125, -4.927490234375, -4.5374755859375, -4.1474609375, -3.7574462890625, -3.367431640625, -2.9774169921875, -2.58740234375, -2.1973876953125, -1.807373046875, -1.4173583984375, -1.02734375, -0.6373291015625, -0.247314453125, 0.1427001953125, 0.53271484375, 0.9227294921875, 1.312744140625, 1.7027587890625, 2.0927734375, 2.4827880859375, 2.872802734375, 3.2628173828125, 3.65283203125, 4.0428466796875, 4.432861328125, 4.8228759765625, 5.212890625, 5.6029052734375, 5.992919921875, 6.3829345703125, 6.77294921875, 7.1629638671875, 7.552978515625, 7.9429931640625, 8.3330078125, 8.7230224609375, 9.113037109375, 9.5030517578125, 9.89306640625, 10.2830810546875, 10.673095703125, 11.0631103515625, 11.453125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 3.0, 8.0, 10.0, 34.0, 79.0, 244.0, 1219.0, 1022885.0, 23321.0, 484.0, 142.0, 57.0, 24.0, 27.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.9375, -75.00390625, -73.0703125, -71.13671875, -69.203125, -67.26953125, -65.3359375, -63.40234375, -61.46875, -59.53515625, -57.6015625, -55.66796875, -53.734375, -51.80078125, -49.8671875, -47.93359375, -46.0, -44.06640625, -42.1328125, -40.19921875, -38.265625, -36.33203125, -34.3984375, -32.46484375, -30.53125, -28.59765625, -26.6640625, -24.73046875, -22.796875, -20.86328125, -18.9296875, -16.99609375, -15.0625, -13.12890625, -11.1953125, -9.26171875, -7.328125, -5.39453125, -3.4609375, -1.52734375, 0.40625, 2.33984375, 4.2734375, 6.20703125, 8.140625, 10.07421875, 12.0078125, 13.94140625, 15.875, 17.80859375, 19.7421875, 21.67578125, 23.609375, 25.54296875, 27.4765625, 29.41015625, 31.34375, 33.27734375, 35.2109375, 37.14453125, 39.078125, 41.01171875, 42.9453125, 44.87890625, 46.8125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 6.0, 22.0, 24.0, 32.0, 44.0, 54.0, 83.0, 168.0, 202.0, 95.0, 68.0, 49.0, 34.0, 37.0, 23.0, 16.0, 13.0, 3.0, 8.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0011129379272460938, -0.0010852590203285217, -0.0010575801134109497, -0.0010299012064933777, -0.0010022222995758057, -0.0009745433926582336, -0.0009468644857406616, -0.0009191855788230896, -0.0008915066719055176, -0.0008638277649879456, -0.0008361488580703735, -0.0008084699511528015, -0.0007807910442352295, -0.0007531121373176575, -0.0007254332304000854, -0.0006977543234825134, -0.0006700754165649414, -0.0006423965096473694, -0.0006147176027297974, -0.0005870386958122253, -0.0005593597888946533, -0.0005316808819770813, -0.0005040019750595093, -0.00047632306814193726, -0.00044864416122436523, -0.0004209652543067932, -0.0003932863473892212, -0.00036560744047164917, -0.00033792853355407715, -0.0003102496266365051, -0.0002825707197189331, -0.0002548918128013611, -0.00022721290588378906, -0.00019953399896621704, -0.00017185509204864502, -0.000144176185131073, -0.00011649727821350098, -8.881837129592896e-05, -6.113946437835693e-05, -3.346055746078491e-05, -5.781650543212891e-06, 2.189725637435913e-05, 4.957616329193115e-05, 7.725507020950317e-05, 0.0001049339771270752, 0.00013261288404464722, 0.00016029179096221924, 0.00018797069787979126, 0.00021564960479736328, 0.0002433285117149353, 0.0002710074186325073, 0.00029868632555007935, 0.00032636523246765137, 0.0003540441393852234, 0.0003817230463027954, 0.00040940195322036743, 0.00043708086013793945, 0.0004647597670555115, 0.0004924386739730835, 0.0005201175808906555, 0.0005477964878082275, 0.0005754753947257996, 0.0006031543016433716, 0.0006308332085609436, 0.0006585121154785156]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 12.0, 14.0, 24.0, 46.0, 64.0, 108.0, 208.0, 1196.0, 209095.0, 835675.0, 1619.0, 231.0, 101.0, 69.0, 39.0, 27.0, 10.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.3125, -44.53515625, -42.7578125, -40.98046875, -39.203125, -37.42578125, -35.6484375, -33.87109375, -32.09375, -30.31640625, -28.5390625, -26.76171875, -24.984375, -23.20703125, -21.4296875, -19.65234375, -17.875, -16.09765625, -14.3203125, -12.54296875, -10.765625, -8.98828125, -7.2109375, -5.43359375, -3.65625, -1.87890625, -0.1015625, 1.67578125, 3.453125, 5.23046875, 7.0078125, 8.78515625, 10.5625, 12.33984375, 14.1171875, 15.89453125, 17.671875, 19.44921875, 21.2265625, 23.00390625, 24.78125, 26.55859375, 28.3359375, 30.11328125, 31.890625, 33.66796875, 35.4453125, 37.22265625, 39.0, 40.77734375, 42.5546875, 44.33203125, 46.109375, 47.88671875, 49.6640625, 51.44140625, 53.21875, 54.99609375, 56.7734375, 58.55078125, 60.328125, 62.10546875, 63.8828125, 65.66015625, 67.4375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 12.0, 22.0, 136.0, 464.0, 273.0, 58.0, 17.0, 11.0, 9.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-58.0, -56.8798828125, -55.759765625, -54.6396484375, -53.51953125, -52.3994140625, -51.279296875, -50.1591796875, -49.0390625, -47.9189453125, -46.798828125, -45.6787109375, -44.55859375, -43.4384765625, -42.318359375, -41.1982421875, -40.078125, -38.9580078125, -37.837890625, -36.7177734375, -35.59765625, -34.4775390625, -33.357421875, -32.2373046875, -31.1171875, -29.9970703125, -28.876953125, -27.7568359375, -26.63671875, -25.5166015625, -24.396484375, -23.2763671875, -22.15625, -21.0361328125, -19.916015625, -18.7958984375, -17.67578125, -16.5556640625, -15.435546875, -14.3154296875, -13.1953125, -12.0751953125, -10.955078125, -9.8349609375, -8.71484375, -7.5947265625, -6.474609375, -5.3544921875, -4.234375, -3.1142578125, -1.994140625, -0.8740234375, 0.24609375, 1.3662109375, 2.486328125, 3.6064453125, 4.7265625, 5.8466796875, 6.966796875, 8.0869140625, 9.20703125, 10.3271484375, 11.447265625, 12.5673828125, 13.6875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 22.0, 341.0, 589.0, 46.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-796.689453125, -778.2695922851562, -759.8497314453125, -741.429931640625, -723.0100708007812, -704.5902099609375, -686.17041015625, -667.7505493164062, -649.3306884765625, -630.9108276367188, -612.490966796875, -594.0711669921875, -575.6513061523438, -557.2314453125, -538.8116455078125, -520.3917846679688, -501.971923828125, -483.55206298828125, -465.1322326660156, -446.71240234375, -428.29254150390625, -409.8726806640625, -391.4528503417969, -373.03302001953125, -354.6131591796875, -336.19329833984375, -317.7734680175781, -299.3536376953125, -280.93377685546875, -262.513916015625, -244.09408569335938, -225.6742401123047, -207.25439453125, -188.8345489501953, -170.41470336914062, -151.99485778808594, -133.57501220703125, -115.15516662597656, -96.73532104492188, -78.31547546386719, -59.8956298828125, -41.47578430175781, -23.055938720703125, -4.6360931396484375, 13.78375244140625, 32.20359802246094, 50.623443603515625, 69.04328918457031, 87.463134765625, 105.88298034667969, 124.30282592773438, 142.72267150878906, 161.14251708984375, 179.56236267089844, 197.98220825195312, 216.4020538330078, 234.8218994140625, 253.2417449951172, 271.6615905761719, 290.0814208984375, 308.50128173828125, 326.921142578125, 345.3409729003906, 363.76080322265625, 382.1806640625]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 9.0, 8.0, 6.0, 13.0, 15.0, 11.0, 14.0, 14.0, 19.0, 20.0, 22.0, 27.0, 21.0, 27.0, 34.0, 40.0, 24.0, 37.0, 27.0, 37.0, 45.0, 30.0, 49.0, 41.0, 45.0, 49.0, 25.0, 33.0, 32.0, 31.0, 28.0, 22.0, 18.0, 24.0, 16.0, 15.0, 16.0, 10.0, 11.0, 4.0, 4.0, 5.0, 2.0, 7.0, 4.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.77617645263672, -52.00102996826172, -50.225887298583984, -48.450740814208984, -46.675594329833984, -44.90045166015625, -43.12530517578125, -41.35015869140625, -39.575016021728516, -37.799869537353516, -36.02472686767578, -34.24958038330078, -32.47443389892578, -30.699291229248047, -28.924144744873047, -27.14900016784668, -25.37385368347168, -23.598709106445312, -21.823562622070312, -20.048418045043945, -18.273273468017578, -16.498126983642578, -14.722982406616211, -12.947837829589844, -11.17269229888916, -9.397546768188477, -7.622402191162109, -5.847256660461426, -4.0721116065979, -2.296966552734375, -0.5218210220336914, 1.2533235549926758, 3.0284690856933594, 4.803614139556885, 6.57875919342041, 8.353904724121094, 10.129049301147461, 11.904194831848145, 13.679340362548828, 15.454484939575195, 17.229629516601562, 19.00477409362793, 20.77992057800293, 22.555065155029297, 24.330209732055664, 26.10535430908203, 27.88050079345703, 29.6556453704834, 31.4307918548584, 33.205936431884766, 34.981082916259766, 36.7562255859375, 38.5313720703125, 40.3065185546875, 42.0816650390625, 43.856807708740234, 45.631954193115234, 47.407100677490234, 49.18224334716797, 50.95738983154297, 52.73253631591797, 54.5076789855957, 56.2828254699707, 58.05796813964844, 59.83311462402344]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 6.0, 3.0, 11.0, 19.0, 29.0, 30.0, 45.0, 79.0, 88.0, 164.0, 278.0, 370.0, 701.0, 1400.0, 2801.0, 6663.0, 18515.0, 74063.0, 776945.0, 3127326.0, 139362.0, 28779.0, 9101.0, 3663.0, 1581.0, 876.0, 511.0, 287.0, 212.0, 111.0, 91.0, 47.0, 42.0, 20.0, 17.0, 15.0, 9.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-14.1953125, -13.7799072265625, -13.364501953125, -12.9490966796875, -12.53369140625, -12.1182861328125, -11.702880859375, -11.2874755859375, -10.8720703125, -10.4566650390625, -10.041259765625, -9.6258544921875, -9.21044921875, -8.7950439453125, -8.379638671875, -7.9642333984375, -7.548828125, -7.1334228515625, -6.718017578125, -6.3026123046875, -5.88720703125, -5.4718017578125, -5.056396484375, -4.6409912109375, -4.2255859375, -3.8101806640625, -3.394775390625, -2.9793701171875, -2.56396484375, -2.1485595703125, -1.733154296875, -1.3177490234375, -0.90234375, -0.4869384765625, -0.071533203125, 0.3438720703125, 0.75927734375, 1.1746826171875, 1.590087890625, 2.0054931640625, 2.4208984375, 2.8363037109375, 3.251708984375, 3.6671142578125, 4.08251953125, 4.4979248046875, 4.913330078125, 5.3287353515625, 5.744140625, 6.1595458984375, 6.574951171875, 6.9903564453125, 7.40576171875, 7.8211669921875, 8.236572265625, 8.6519775390625, 9.0673828125, 9.4827880859375, 9.898193359375, 10.3135986328125, 10.72900390625, 11.1444091796875, 11.559814453125, 11.9752197265625, 12.390625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 8.0, 6.0, 2.0, 5.0, 11.0, 13.0, 24.0, 33.0, 38.0, 39.0, 57.0, 63.0, 52.0, 67.0, 70.0, 58.0, 57.0, 72.0, 70.0, 42.0, 47.0, 45.0, 38.0, 20.0, 19.0, 12.0, 7.0, 6.0, 2.0, 3.0, 5.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5234375, -4.398590087890625, -4.27374267578125, -4.148895263671875, -4.0240478515625, -3.899200439453125, -3.77435302734375, -3.649505615234375, -3.524658203125, -3.399810791015625, -3.27496337890625, -3.150115966796875, -3.0252685546875, -2.900421142578125, -2.77557373046875, -2.650726318359375, -2.52587890625, -2.401031494140625, -2.27618408203125, -2.151336669921875, -2.0264892578125, -1.901641845703125, -1.77679443359375, -1.651947021484375, -1.527099609375, -1.402252197265625, -1.27740478515625, -1.152557373046875, -1.0277099609375, -0.902862548828125, -0.77801513671875, -0.653167724609375, -0.5283203125, -0.403472900390625, -0.27862548828125, -0.153778076171875, -0.0289306640625, 0.095916748046875, 0.22076416015625, 0.345611572265625, 0.470458984375, 0.595306396484375, 0.72015380859375, 0.845001220703125, 0.9698486328125, 1.094696044921875, 1.21954345703125, 1.344390869140625, 1.46923828125, 1.594085693359375, 1.71893310546875, 1.843780517578125, 1.9686279296875, 2.093475341796875, 2.21832275390625, 2.343170166015625, 2.468017578125, 2.592864990234375, 2.71771240234375, 2.842559814453125, 2.9674072265625, 3.092254638671875, 3.21710205078125, 3.341949462890625, 3.466796875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 11.0, 9.0, 19.0, 40.0, 51.0, 85.0, 131.0, 238.0, 347.0, 625.0, 1096.0, 2393.0, 5674.0, 15633.0, 60783.0, 483667.0, 3298725.0, 261910.0, 41974.0, 12079.0, 4407.0, 1996.0, 993.0, 545.0, 300.0, 206.0, 124.0, 79.0, 43.0, 30.0, 23.0, 12.0, 15.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.7578125, -12.41650390625, -12.0751953125, -11.73388671875, -11.392578125, -11.05126953125, -10.7099609375, -10.36865234375, -10.02734375, -9.68603515625, -9.3447265625, -9.00341796875, -8.662109375, -8.32080078125, -7.9794921875, -7.63818359375, -7.296875, -6.95556640625, -6.6142578125, -6.27294921875, -5.931640625, -5.59033203125, -5.2490234375, -4.90771484375, -4.56640625, -4.22509765625, -3.8837890625, -3.54248046875, -3.201171875, -2.85986328125, -2.5185546875, -2.17724609375, -1.8359375, -1.49462890625, -1.1533203125, -0.81201171875, -0.470703125, -0.12939453125, 0.2119140625, 0.55322265625, 0.89453125, 1.23583984375, 1.5771484375, 1.91845703125, 2.259765625, 2.60107421875, 2.9423828125, 3.28369140625, 3.625, 3.96630859375, 4.3076171875, 4.64892578125, 4.990234375, 5.33154296875, 5.6728515625, 6.01416015625, 6.35546875, 6.69677734375, 7.0380859375, 7.37939453125, 7.720703125, 8.06201171875, 8.4033203125, 8.74462890625, 9.0859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 6.0, 1.0, 2.0, 17.0, 11.0, 17.0, 19.0, 42.0, 54.0, 101.0, 184.0, 482.0, 1645.0, 923.0, 275.0, 119.0, 55.0, 31.0, 21.0, 23.0, 7.0, 13.0, 6.0, 4.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.46875, -8.22528076171875, -7.9818115234375, -7.73834228515625, -7.494873046875, -7.25140380859375, -7.0079345703125, -6.76446533203125, -6.52099609375, -6.27752685546875, -6.0340576171875, -5.79058837890625, -5.547119140625, -5.30364990234375, -5.0601806640625, -4.81671142578125, -4.5732421875, -4.32977294921875, -4.0863037109375, -3.84283447265625, -3.599365234375, -3.35589599609375, -3.1124267578125, -2.86895751953125, -2.62548828125, -2.38201904296875, -2.1385498046875, -1.89508056640625, -1.651611328125, -1.40814208984375, -1.1646728515625, -0.92120361328125, -0.677734375, -0.43426513671875, -0.1907958984375, 0.05267333984375, 0.296142578125, 0.53961181640625, 0.7830810546875, 1.02655029296875, 1.27001953125, 1.51348876953125, 1.7569580078125, 2.00042724609375, 2.243896484375, 2.48736572265625, 2.7308349609375, 2.97430419921875, 3.2177734375, 3.46124267578125, 3.7047119140625, 3.94818115234375, 4.191650390625, 4.43511962890625, 4.6785888671875, 4.92205810546875, 5.16552734375, 5.40899658203125, 5.6524658203125, 5.89593505859375, 6.139404296875, 6.38287353515625, 6.6263427734375, 6.86981201171875, 7.11328125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 8.0, 17.0, 14.0, 40.0, 104.0, 188.0, 261.0, 234.0, 95.0, 28.0, 8.0, 2.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.065826416015625, -54.70390319824219, -52.34197998046875, -49.98005676269531, -47.618133544921875, -45.25621032714844, -42.894290924072266, -40.53236770629883, -38.17044448852539, -35.80852127075195, -33.446598052978516, -31.08467674255371, -28.722753524780273, -26.360830307006836, -23.99890899658203, -21.636985778808594, -19.275062561035156, -16.91313934326172, -14.551217079162598, -12.189294815063477, -9.827371597290039, -7.465448379516602, -5.1035261154174805, -2.7416038513183594, -0.3796806335449219, 1.9822421073913574, 4.344164848327637, 6.706087589263916, 9.068010330200195, 11.429933547973633, 13.791855812072754, 16.153778076171875, 18.515708923339844, 20.87763214111328, 23.23955535888672, 25.601476669311523, 27.96339988708496, 30.3253231048584, 32.6872444152832, 35.04916763305664, 37.41109085083008, 39.773014068603516, 42.13493728637695, 44.49686050415039, 46.85877990722656, 49.220703125, 51.58262634277344, 53.944549560546875, 56.30647277832031, 58.66839599609375, 61.03031921386719, 63.392242431640625, 65.75416564941406, 68.1160888671875, 70.47801208496094, 72.83993530273438, 75.20185852050781, 77.56378173828125, 79.92570495605469, 82.28762817382812, 84.64955139160156, 87.011474609375, 89.37339782714844, 91.73532104492188, 94.09723663330078]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 6.0, 3.0, 6.0, 14.0, 7.0, 14.0, 25.0, 23.0, 20.0, 33.0, 29.0, 32.0, 39.0, 50.0, 42.0, 48.0, 46.0, 47.0, 53.0, 44.0, 47.0, 40.0, 45.0, 39.0, 44.0, 37.0, 43.0, 22.0, 17.0, 19.0, 21.0, 16.0, 10.0, 5.0, 5.0, 6.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.25265121459961, -26.316022872924805, -25.37939453125, -24.442768096923828, -23.506139755249023, -22.56951141357422, -21.632884979248047, -20.696256637573242, -19.759628295898438, -18.822999954223633, -17.886371612548828, -16.949745178222656, -16.01311683654785, -15.076488494873047, -14.139861106872559, -13.20323371887207, -12.266605377197266, -11.329977035522461, -10.393349647521973, -9.456722259521484, -8.52009391784668, -7.583466053009033, -6.646838188171387, -5.71021032333374, -4.773582458496094, -3.8369545936584473, -2.900326728820801, -1.9636988639831543, -1.0270709991455078, -0.09044313430786133, 0.8461847305297852, 1.7828125953674316, 2.719440460205078, 3.6560683250427246, 4.592696189880371, 5.529324054718018, 6.465951919555664, 7.4025797843933105, 8.339207649230957, 9.275835037231445, 10.21246337890625, 11.149091720581055, 12.085719108581543, 13.022346496582031, 13.958974838256836, 14.89560317993164, 15.832230567932129, 16.768857955932617, 17.705486297607422, 18.642114639282227, 19.57874298095703, 20.515369415283203, 21.451997756958008, 22.388626098632812, 23.325252532958984, 24.26188087463379, 25.198509216308594, 26.1351375579834, 27.071765899658203, 28.008392333984375, 28.94502067565918, 29.881649017333984, 30.818275451660156, 31.75490379333496, 32.691532135009766]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 6.0, 10.0, 8.0, 10.0, 26.0, 37.0, 52.0, 68.0, 102.0, 187.0, 314.0, 520.0, 973.0, 2020.0, 4400.0, 11810.0, 39820.0, 161253.0, 467606.0, 265551.0, 64350.0, 17860.0, 6061.0, 2560.0, 1270.0, 674.0, 377.0, 219.0, 136.0, 96.0, 45.0, 35.0, 24.0, 17.0, 11.0, 8.0, 5.0, 3.0, 1.0, 4.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-14.578125, -14.145263671875, -13.71240234375, -13.279541015625, -12.8466796875, -12.413818359375, -11.98095703125, -11.548095703125, -11.115234375, -10.682373046875, -10.24951171875, -9.816650390625, -9.3837890625, -8.950927734375, -8.51806640625, -8.085205078125, -7.65234375, -7.219482421875, -6.78662109375, -6.353759765625, -5.9208984375, -5.488037109375, -5.05517578125, -4.622314453125, -4.189453125, -3.756591796875, -3.32373046875, -2.890869140625, -2.4580078125, -2.025146484375, -1.59228515625, -1.159423828125, -0.7265625, -0.293701171875, 0.13916015625, 0.572021484375, 1.0048828125, 1.437744140625, 1.87060546875, 2.303466796875, 2.736328125, 3.169189453125, 3.60205078125, 4.034912109375, 4.4677734375, 4.900634765625, 5.33349609375, 5.766357421875, 6.19921875, 6.632080078125, 7.06494140625, 7.497802734375, 7.9306640625, 8.363525390625, 8.79638671875, 9.229248046875, 9.662109375, 10.094970703125, 10.52783203125, 10.960693359375, 11.3935546875, 11.826416015625, 12.25927734375, 12.692138671875, 13.125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 2.0, 1.0, 5.0, 6.0, 13.0, 17.0, 11.0, 20.0, 29.0, 36.0, 48.0, 43.0, 58.0, 60.0, 58.0, 79.0, 68.0, 59.0, 62.0, 62.0, 61.0, 43.0, 29.0, 34.0, 28.0, 16.0, 13.0, 10.0, 7.0, 3.0, 1.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.64453125, -4.516357421875, -4.38818359375, -4.260009765625, -4.1318359375, -4.003662109375, -3.87548828125, -3.747314453125, -3.619140625, -3.490966796875, -3.36279296875, -3.234619140625, -3.1064453125, -2.978271484375, -2.85009765625, -2.721923828125, -2.59375, -2.465576171875, -2.33740234375, -2.209228515625, -2.0810546875, -1.952880859375, -1.82470703125, -1.696533203125, -1.568359375, -1.440185546875, -1.31201171875, -1.183837890625, -1.0556640625, -0.927490234375, -0.79931640625, -0.671142578125, -0.54296875, -0.414794921875, -0.28662109375, -0.158447265625, -0.0302734375, 0.097900390625, 0.22607421875, 0.354248046875, 0.482421875, 0.610595703125, 0.73876953125, 0.866943359375, 0.9951171875, 1.123291015625, 1.25146484375, 1.379638671875, 1.5078125, 1.635986328125, 1.76416015625, 1.892333984375, 2.0205078125, 2.148681640625, 2.27685546875, 2.405029296875, 2.533203125, 2.661376953125, 2.78955078125, 2.917724609375, 3.0458984375, 3.174072265625, 3.30224609375, 3.430419921875, 3.55859375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 1.0, 6.0, 10.0, 11.0, 12.0, 23.0, 30.0, 29.0, 54.0, 82.0, 122.0, 194.0, 375.0, 640.0, 1382.0, 4538.0, 35086.0, 763389.0, 225253.0, 12603.0, 2560.0, 923.0, 479.0, 272.0, 152.0, 96.0, 67.0, 45.0, 22.0, 24.0, 18.0, 18.0, 10.0, 5.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.625, -34.600830078125, -33.57666015625, -32.552490234375, -31.5283203125, -30.504150390625, -29.47998046875, -28.455810546875, -27.431640625, -26.407470703125, -25.38330078125, -24.359130859375, -23.3349609375, -22.310791015625, -21.28662109375, -20.262451171875, -19.23828125, -18.214111328125, -17.18994140625, -16.165771484375, -15.1416015625, -14.117431640625, -13.09326171875, -12.069091796875, -11.044921875, -10.020751953125, -8.99658203125, -7.972412109375, -6.9482421875, -5.924072265625, -4.89990234375, -3.875732421875, -2.8515625, -1.827392578125, -0.80322265625, 0.220947265625, 1.2451171875, 2.269287109375, 3.29345703125, 4.317626953125, 5.341796875, 6.365966796875, 7.39013671875, 8.414306640625, 9.4384765625, 10.462646484375, 11.48681640625, 12.510986328125, 13.53515625, 14.559326171875, 15.58349609375, 16.607666015625, 17.6318359375, 18.656005859375, 19.68017578125, 20.704345703125, 21.728515625, 22.752685546875, 23.77685546875, 24.801025390625, 25.8251953125, 26.849365234375, 27.87353515625, 28.897705078125, 29.921875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 2.0, 4.0, 8.0, 6.0, 8.0, 8.0, 13.0, 12.0, 18.0, 7.0, 22.0, 13.0, 19.0, 35.0, 22.0, 40.0, 39.0, 38.0, 45.0, 57.0, 36.0, 51.0, 36.0, 47.0, 48.0, 38.0, 36.0, 43.0, 34.0, 26.0, 32.0, 18.0, 29.0, 16.0, 14.0, 10.0, 21.0, 6.0, 10.0, 9.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-14.3203125, -13.8558349609375, -13.391357421875, -12.9268798828125, -12.46240234375, -11.9979248046875, -11.533447265625, -11.0689697265625, -10.6044921875, -10.1400146484375, -9.675537109375, -9.2110595703125, -8.74658203125, -8.2821044921875, -7.817626953125, -7.3531494140625, -6.888671875, -6.4241943359375, -5.959716796875, -5.4952392578125, -5.03076171875, -4.5662841796875, -4.101806640625, -3.6373291015625, -3.1728515625, -2.7083740234375, -2.243896484375, -1.7794189453125, -1.31494140625, -0.8504638671875, -0.385986328125, 0.0784912109375, 0.54296875, 1.0074462890625, 1.471923828125, 1.9364013671875, 2.40087890625, 2.8653564453125, 3.329833984375, 3.7943115234375, 4.2587890625, 4.7232666015625, 5.187744140625, 5.6522216796875, 6.11669921875, 6.5811767578125, 7.045654296875, 7.5101318359375, 7.974609375, 8.4390869140625, 8.903564453125, 9.3680419921875, 9.83251953125, 10.2969970703125, 10.761474609375, 11.2259521484375, 11.6904296875, 12.1549072265625, 12.619384765625, 13.0838623046875, 13.54833984375, 14.0128173828125, 14.477294921875, 14.9417724609375, 15.40625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 0.0, 4.0, 6.0, 17.0, 13.0, 22.0, 38.0, 95.0, 280.0, 832.0, 3241.0, 67171.0, 940450.0, 32740.0, 2592.0, 631.0, 195.0, 91.0, 55.0, 23.0, 18.0, 16.0, 4.0, 8.0, 0.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.296875, -19.781982421875, -19.26708984375, -18.752197265625, -18.2373046875, -17.722412109375, -17.20751953125, -16.692626953125, -16.177734375, -15.662841796875, -15.14794921875, -14.633056640625, -14.1181640625, -13.603271484375, -13.08837890625, -12.573486328125, -12.05859375, -11.543701171875, -11.02880859375, -10.513916015625, -9.9990234375, -9.484130859375, -8.96923828125, -8.454345703125, -7.939453125, -7.424560546875, -6.90966796875, -6.394775390625, -5.8798828125, -5.364990234375, -4.85009765625, -4.335205078125, -3.8203125, -3.305419921875, -2.79052734375, -2.275634765625, -1.7607421875, -1.245849609375, -0.73095703125, -0.216064453125, 0.298828125, 0.813720703125, 1.32861328125, 1.843505859375, 2.3583984375, 2.873291015625, 3.38818359375, 3.903076171875, 4.41796875, 4.932861328125, 5.44775390625, 5.962646484375, 6.4775390625, 6.992431640625, 7.50732421875, 8.022216796875, 8.537109375, 9.052001953125, 9.56689453125, 10.081787109375, 10.5966796875, 11.111572265625, 11.62646484375, 12.141357421875, 12.65625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 6.0, 4.0, 8.0, 10.0, 20.0, 14.0, 16.0, 27.0, 23.0, 44.0, 46.0, 56.0, 59.0, 62.0, 60.0, 86.0, 78.0, 56.0, 50.0, 48.0, 46.0, 38.0, 23.0, 23.0, 15.0, 16.0, 9.0, 12.0, 12.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0005693435668945312, -0.0005539208650588989, -0.0005384981632232666, -0.0005230754613876343, -0.000507652759552002, -0.0004922300577163696, -0.0004768073558807373, -0.000461384654045105, -0.00044596195220947266, -0.00043053925037384033, -0.000415116548538208, -0.0003996938467025757, -0.00038427114486694336, -0.00036884844303131104, -0.0003534257411956787, -0.0003380030393600464, -0.00032258033752441406, -0.00030715763568878174, -0.0002917349338531494, -0.0002763122320175171, -0.00026088953018188477, -0.00024546682834625244, -0.00023004412651062012, -0.0002146214246749878, -0.00019919872283935547, -0.00018377602100372314, -0.00016835331916809082, -0.0001529306173324585, -0.00013750791549682617, -0.00012208521366119385, -0.00010666251182556152, -9.12398099899292e-05, -7.581710815429688e-05, -6.039440631866455e-05, -4.4971704483032227e-05, -2.9549002647399902e-05, -1.4126300811767578e-05, 1.296401023864746e-06, 1.671910285949707e-05, 3.2141804695129395e-05, 4.756450653076172e-05, 6.298720836639404e-05, 7.840991020202637e-05, 9.383261203765869e-05, 0.00010925531387329102, 0.00012467801570892334, 0.00014010071754455566, 0.000155523419380188, 0.0001709461212158203, 0.00018636882305145264, 0.00020179152488708496, 0.00021721422672271729, 0.0002326369285583496, 0.00024805963039398193, 0.00026348233222961426, 0.0002789050340652466, 0.0002943277359008789, 0.00030975043773651123, 0.00032517313957214355, 0.0003405958414077759, 0.0003560185432434082, 0.00037144124507904053, 0.00038686394691467285, 0.0004022866487503052, 0.0004177093505859375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 9.0, 4.0, 10.0, 14.0, 16.0, 26.0, 43.0, 88.0, 191.0, 388.0, 1331.0, 23888.0, 993325.0, 26876.0, 1496.0, 425.0, 153.0, 107.0, 54.0, 36.0, 17.0, 14.0, 13.0, 4.0, 6.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.375, -21.561767578125, -20.74853515625, -19.935302734375, -19.1220703125, -18.308837890625, -17.49560546875, -16.682373046875, -15.869140625, -15.055908203125, -14.24267578125, -13.429443359375, -12.6162109375, -11.802978515625, -10.98974609375, -10.176513671875, -9.36328125, -8.550048828125, -7.73681640625, -6.923583984375, -6.1103515625, -5.297119140625, -4.48388671875, -3.670654296875, -2.857421875, -2.044189453125, -1.23095703125, -0.417724609375, 0.3955078125, 1.208740234375, 2.02197265625, 2.835205078125, 3.6484375, 4.461669921875, 5.27490234375, 6.088134765625, 6.9013671875, 7.714599609375, 8.52783203125, 9.341064453125, 10.154296875, 10.967529296875, 11.78076171875, 12.593994140625, 13.4072265625, 14.220458984375, 15.03369140625, 15.846923828125, 16.66015625, 17.473388671875, 18.28662109375, 19.099853515625, 19.9130859375, 20.726318359375, 21.53955078125, 22.352783203125, 23.166015625, 23.979248046875, 24.79248046875, 25.605712890625, 26.4189453125, 27.232177734375, 28.04541015625, 28.858642578125, 29.671875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 5.0, 9.0, 11.0, 18.0, 30.0, 48.0, 102.0, 217.0, 230.0, 138.0, 59.0, 38.0, 23.0, 13.0, 7.0, 13.0, 7.0, 3.0, 0.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5, -14.9697265625, -14.439453125, -13.9091796875, -13.37890625, -12.8486328125, -12.318359375, -11.7880859375, -11.2578125, -10.7275390625, -10.197265625, -9.6669921875, -9.13671875, -8.6064453125, -8.076171875, -7.5458984375, -7.015625, -6.4853515625, -5.955078125, -5.4248046875, -4.89453125, -4.3642578125, -3.833984375, -3.3037109375, -2.7734375, -2.2431640625, -1.712890625, -1.1826171875, -0.65234375, -0.1220703125, 0.408203125, 0.9384765625, 1.46875, 1.9990234375, 2.529296875, 3.0595703125, 3.58984375, 4.1201171875, 4.650390625, 5.1806640625, 5.7109375, 6.2412109375, 6.771484375, 7.3017578125, 7.83203125, 8.3623046875, 8.892578125, 9.4228515625, 9.953125, 10.4833984375, 11.013671875, 11.5439453125, 12.07421875, 12.6044921875, 13.134765625, 13.6650390625, 14.1953125, 14.7255859375, 15.255859375, 15.7861328125, 16.31640625, 16.8466796875, 17.376953125, 17.9072265625, 18.4375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 9.0, 47.0, 445.0, 438.0, 56.0, 10.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-708.0048217773438, -693.8768310546875, -679.7488403320312, -665.620849609375, -651.4928588867188, -637.3648681640625, -623.23681640625, -609.10888671875, -594.9808349609375, -580.8528442382812, -566.724853515625, -552.5968627929688, -538.4688720703125, -524.3408813476562, -510.2128601074219, -496.0848693847656, -481.9569091796875, -467.82891845703125, -453.700927734375, -439.57293701171875, -425.4449157714844, -411.3169250488281, -397.1889343261719, -383.0609436035156, -368.93292236328125, -354.804931640625, -340.67694091796875, -326.5489501953125, -312.4209289550781, -298.2929382324219, -284.1649475097656, -270.0369567871094, -255.90895080566406, -241.7809600830078, -227.6529541015625, -213.52496337890625, -199.39697265625, -185.26898193359375, -171.14097595214844, -157.0129852294922, -142.88497924804688, -128.75698852539062, -114.62899017333984, -100.50099182128906, -86.37300109863281, -72.24500274658203, -58.11700439453125, -43.989013671875, -29.86102294921875, -15.733027458190918, -1.605031967163086, 12.522964477539062, 26.650959014892578, 40.778953552246094, 54.906951904296875, 69.03494262695312, 83.1629409790039, 97.29093933105469, 111.41893005371094, 125.54692840576172, 139.6749267578125, 153.80291748046875, 167.930908203125, 182.05889892578125, 196.18690490722656]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 7.0, 8.0, 10.0, 8.0, 20.0, 12.0, 23.0, 26.0, 31.0, 32.0, 42.0, 30.0, 43.0, 54.0, 54.0, 51.0, 64.0, 58.0, 58.0, 41.0, 46.0, 51.0, 31.0, 32.0, 35.0, 24.0, 21.0, 23.0, 23.0, 15.0, 11.0, 3.0, 5.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.16397094726562, -77.36493682861328, -74.56590270996094, -71.76686096191406, -68.96782684326172, -66.16879272460938, -63.36975860595703, -60.57072448730469, -57.77168655395508, -54.972652435302734, -52.173614501953125, -49.37458038330078, -46.57554626464844, -43.77650833129883, -40.977474212646484, -38.178436279296875, -35.37940216064453, -32.58036804199219, -29.781330108642578, -26.982295989990234, -24.183259963989258, -21.38422393798828, -18.585189819335938, -15.786153793334961, -12.987117767333984, -10.188081741333008, -7.389046669006348, -4.5900115966796875, -1.790975570678711, 1.0080604553222656, 3.8070945739746094, 6.606130599975586, 9.405166625976562, 12.204202651977539, 15.0032377243042, 17.80227279663086, 20.601308822631836, 23.400344848632812, 26.199378967285156, 28.998414993286133, 31.79745101928711, 34.59648513793945, 37.39552307128906, 40.194557189941406, 42.99359130859375, 45.79262924194336, 48.5916633605957, 51.39070129394531, 54.189735412597656, 56.98876953125, 59.78780746459961, 62.58684158325195, 65.38587951660156, 68.1849136352539, 70.98394775390625, 73.7829818725586, 76.58201599121094, 79.38105010986328, 82.18008422851562, 84.9791259765625, 87.77816009521484, 90.57719421386719, 93.37622833251953, 96.17526245117188, 98.97430419921875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 9.0, 9.0, 21.0, 33.0, 45.0, 99.0, 179.0, 444.0, 2595.0, 94515.0, 4088802.0, 6242.0, 815.0, 198.0, 100.0, 61.0, 45.0, 24.0, 14.0, 9.0, 6.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.125, -46.5302734375, -44.935546875, -43.3408203125, -41.74609375, -40.1513671875, -38.556640625, -36.9619140625, -35.3671875, -33.7724609375, -32.177734375, -30.5830078125, -28.98828125, -27.3935546875, -25.798828125, -24.2041015625, -22.609375, -21.0146484375, -19.419921875, -17.8251953125, -16.23046875, -14.6357421875, -13.041015625, -11.4462890625, -9.8515625, -8.2568359375, -6.662109375, -5.0673828125, -3.47265625, -1.8779296875, -0.283203125, 1.3115234375, 2.90625, 4.5009765625, 6.095703125, 7.6904296875, 9.28515625, 10.8798828125, 12.474609375, 14.0693359375, 15.6640625, 17.2587890625, 18.853515625, 20.4482421875, 22.04296875, 23.6376953125, 25.232421875, 26.8271484375, 28.421875, 30.0166015625, 31.611328125, 33.2060546875, 34.80078125, 36.3955078125, 37.990234375, 39.5849609375, 41.1796875, 42.7744140625, 44.369140625, 45.9638671875, 47.55859375, 49.1533203125, 50.748046875, 52.3427734375, 53.9375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 8.0, 8.0, 11.0, 9.0, 14.0, 16.0, 27.0, 26.0, 35.0, 32.0, 46.0, 56.0, 55.0, 77.0, 69.0, 69.0, 73.0, 63.0, 42.0, 56.0, 45.0, 31.0, 27.0, 18.0, 14.0, 12.0, 15.0, 7.0, 5.0, 7.0, 7.0, 7.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.42578125, -5.27874755859375, -5.1317138671875, -4.98468017578125, -4.837646484375, -4.69061279296875, -4.5435791015625, -4.39654541015625, -4.24951171875, -4.10247802734375, -3.9554443359375, -3.80841064453125, -3.661376953125, -3.51434326171875, -3.3673095703125, -3.22027587890625, -3.0732421875, -2.92620849609375, -2.7791748046875, -2.63214111328125, -2.485107421875, -2.33807373046875, -2.1910400390625, -2.04400634765625, -1.89697265625, -1.74993896484375, -1.6029052734375, -1.45587158203125, -1.308837890625, -1.16180419921875, -1.0147705078125, -0.86773681640625, -0.720703125, -0.57366943359375, -0.4266357421875, -0.27960205078125, -0.132568359375, 0.01446533203125, 0.1614990234375, 0.30853271484375, 0.45556640625, 0.60260009765625, 0.7496337890625, 0.89666748046875, 1.043701171875, 1.19073486328125, 1.3377685546875, 1.48480224609375, 1.6318359375, 1.77886962890625, 1.9259033203125, 2.07293701171875, 2.219970703125, 2.36700439453125, 2.5140380859375, 2.66107177734375, 2.80810546875, 2.95513916015625, 3.1021728515625, 3.24920654296875, 3.396240234375, 3.54327392578125, 3.6903076171875, 3.83734130859375, 3.984375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 8.0, 7.0, 9.0, 13.0, 10.0, 17.0, 16.0, 22.0, 38.0, 46.0, 57.0, 94.0, 158.0, 249.0, 435.0, 786.0, 1781.0, 4301.0, 12903.0, 56165.0, 1037441.0, 2998423.0, 59263.0, 13626.0, 4496.0, 1912.0, 839.0, 472.0, 254.0, 130.0, 81.0, 59.0, 43.0, 25.0, 18.0, 23.0, 11.0, 8.0, 10.0, 9.0, 5.0, 1.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 5.0], "bins": [-9.671875, -9.4033203125, -9.134765625, -8.8662109375, -8.59765625, -8.3291015625, -8.060546875, -7.7919921875, -7.5234375, -7.2548828125, -6.986328125, -6.7177734375, -6.44921875, -6.1806640625, -5.912109375, -5.6435546875, -5.375, -5.1064453125, -4.837890625, -4.5693359375, -4.30078125, -4.0322265625, -3.763671875, -3.4951171875, -3.2265625, -2.9580078125, -2.689453125, -2.4208984375, -2.15234375, -1.8837890625, -1.615234375, -1.3466796875, -1.078125, -0.8095703125, -0.541015625, -0.2724609375, -0.00390625, 0.2646484375, 0.533203125, 0.8017578125, 1.0703125, 1.3388671875, 1.607421875, 1.8759765625, 2.14453125, 2.4130859375, 2.681640625, 2.9501953125, 3.21875, 3.4873046875, 3.755859375, 4.0244140625, 4.29296875, 4.5615234375, 4.830078125, 5.0986328125, 5.3671875, 5.6357421875, 5.904296875, 6.1728515625, 6.44140625, 6.7099609375, 6.978515625, 7.2470703125, 7.515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 12.0, 9.0, 19.0, 44.0, 102.0, 204.0, 2823.0, 554.0, 158.0, 66.0, 27.0, 23.0, 12.0, 11.0, 6.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.595703125, -3.5188751220703125, -3.442047119140625, -3.3652191162109375, -3.28839111328125, -3.2115631103515625, -3.134735107421875, -3.0579071044921875, -2.9810791015625, -2.9042510986328125, -2.827423095703125, -2.7505950927734375, -2.67376708984375, -2.5969390869140625, -2.520111083984375, -2.4432830810546875, -2.366455078125, -2.2896270751953125, -2.212799072265625, -2.1359710693359375, -2.05914306640625, -1.9823150634765625, -1.905487060546875, -1.8286590576171875, -1.7518310546875, -1.6750030517578125, -1.598175048828125, -1.5213470458984375, -1.44451904296875, -1.3676910400390625, -1.290863037109375, -1.2140350341796875, -1.13720703125, -1.0603790283203125, -0.983551025390625, -0.9067230224609375, -0.82989501953125, -0.7530670166015625, -0.676239013671875, -0.5994110107421875, -0.5225830078125, -0.4457550048828125, -0.368927001953125, -0.2920989990234375, -0.21527099609375, -0.1384429931640625, -0.061614990234375, 0.0152130126953125, 0.092041015625, 0.1688690185546875, 0.245697021484375, 0.3225250244140625, 0.39935302734375, 0.4761810302734375, 0.553009033203125, 0.6298370361328125, 0.7066650390625, 0.7834930419921875, 0.860321044921875, 0.9371490478515625, 1.01397705078125, 1.0908050537109375, 1.167633056640625, 1.2444610595703125, 1.3212890625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 11.0, 11.0, 29.0, 50.0, 73.0, 121.0, 146.0, 180.0, 144.0, 105.0, 66.0, 32.0, 19.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.632227897644043, -11.285164833068848, -10.938101768493652, -10.591038703918457, -10.243974685668945, -9.89691162109375, -9.549848556518555, -9.20278549194336, -8.855722427368164, -8.508659362792969, -8.161596298217773, -7.81453275680542, -7.467469692230225, -7.120406627655029, -6.773343086242676, -6.4262800216674805, -6.079216957092285, -5.73215389251709, -5.3850908279418945, -5.038027286529541, -4.690964221954346, -4.34390115737915, -3.996837854385376, -3.6497745513916016, -3.3027114868164062, -2.955648422241211, -2.6085851192474365, -2.261521816253662, -1.9144587516784668, -1.567395567893982, -1.220332384109497, -0.8732690811157227, -0.5262060165405273, -0.17914283275604248, 0.16792035102844238, 0.5149835348129272, 0.8620467185974121, 1.209109902381897, 1.5561730861663818, 1.9032363891601562, 2.2502994537353516, 2.597362518310547, 2.9444258213043213, 3.2914891242980957, 3.638552188873291, 3.9856152534484863, 4.33267879486084, 4.679741859436035, 5.0268049240112305, 5.373867988586426, 5.720931053161621, 6.067994594573975, 6.41505765914917, 6.762120723724365, 7.109184265136719, 7.456247329711914, 7.803310394287109, 8.150373458862305, 8.4974365234375, 8.844499588012695, 9.19156265258789, 9.538626670837402, 9.885689735412598, 10.232752799987793, 10.579815864562988]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 2.0, 8.0, 3.0, 5.0, 9.0, 9.0, 17.0, 15.0, 15.0, 12.0, 15.0, 16.0, 23.0, 28.0, 30.0, 29.0, 37.0, 47.0, 43.0, 30.0, 42.0, 41.0, 36.0, 36.0, 34.0, 39.0, 36.0, 29.0, 41.0, 34.0, 30.0, 25.0, 34.0, 25.0, 16.0, 16.0, 12.0, 16.0, 10.0, 14.0, 10.0, 7.0, 8.0, 5.0, 3.0, 4.0, 0.0, 7.0, 1.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.253279685974121, -3.142451286315918, -3.031622886657715, -2.9207944869995117, -2.8099658489227295, -2.6991374492645264, -2.5883090496063232, -2.47748064994812, -2.366652250289917, -2.255823850631714, -2.1449954509735107, -2.0341668128967285, -1.923338532447815, -1.8125100135803223, -1.7016816139221191, -1.590853214263916, -1.4800246953964233, -1.3691962957382202, -1.2583677768707275, -1.1475393772125244, -1.0367109775543213, -0.9258825182914734, -0.8150540590286255, -0.7042256593704224, -0.5933972001075745, -0.48256877064704895, -0.37174034118652344, -0.26091188192367554, -0.15008345246315002, -0.03925502300262451, 0.07157343626022339, 0.1824018359184265, 0.2932302951812744, 0.4040587246417999, 0.5148871541023254, 0.6257156133651733, 0.7365440130233765, 0.8473724722862244, 0.9582009315490723, 1.0690293312072754, 1.1798577308654785, 1.2906861305236816, 1.4015146493911743, 1.5123430490493774, 1.6231714487075806, 1.7339999675750732, 1.8448283672332764, 1.9556567668914795, 2.0664854049682617, 2.177313804626465, 2.288142204284668, 2.398970603942871, 2.5097992420196533, 2.6206276416778564, 2.7314560413360596, 2.8422844409942627, 2.953112840652466, 3.063941240310669, 3.174769639968872, 3.2855982780456543, 3.3964266777038574, 3.5072550773620605, 3.6180834770202637, 3.728911876678467, 3.83974027633667]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 5.0, 5.0, 11.0, 12.0, 27.0, 37.0, 52.0, 95.0, 156.0, 264.0, 549.0, 1137.0, 2882.0, 8141.0, 30467.0, 155314.0, 528731.0, 254896.0, 47302.0, 11803.0, 3853.0, 1442.0, 640.0, 315.0, 140.0, 103.0, 65.0, 37.0, 29.0, 18.0, 8.0, 8.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.9609375, -15.486572265625, -15.01220703125, -14.537841796875, -14.0634765625, -13.589111328125, -13.11474609375, -12.640380859375, -12.166015625, -11.691650390625, -11.21728515625, -10.742919921875, -10.2685546875, -9.794189453125, -9.31982421875, -8.845458984375, -8.37109375, -7.896728515625, -7.42236328125, -6.947998046875, -6.4736328125, -5.999267578125, -5.52490234375, -5.050537109375, -4.576171875, -4.101806640625, -3.62744140625, -3.153076171875, -2.6787109375, -2.204345703125, -1.72998046875, -1.255615234375, -0.78125, -0.306884765625, 0.16748046875, 0.641845703125, 1.1162109375, 1.590576171875, 2.06494140625, 2.539306640625, 3.013671875, 3.488037109375, 3.96240234375, 4.436767578125, 4.9111328125, 5.385498046875, 5.85986328125, 6.334228515625, 6.80859375, 7.282958984375, 7.75732421875, 8.231689453125, 8.7060546875, 9.180419921875, 9.65478515625, 10.129150390625, 10.603515625, 11.077880859375, 11.55224609375, 12.026611328125, 12.5009765625, 12.975341796875, 13.44970703125, 13.924072265625, 14.3984375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 7.0, 5.0, 8.0, 10.0, 13.0, 12.0, 22.0, 22.0, 33.0, 29.0, 29.0, 41.0, 62.0, 65.0, 59.0, 61.0, 89.0, 54.0, 58.0, 52.0, 57.0, 34.0, 30.0, 33.0, 19.0, 19.0, 15.0, 12.0, 10.0, 8.0, 6.0, 7.0, 7.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.35546875, -5.210693359375, -5.06591796875, -4.921142578125, -4.7763671875, -4.631591796875, -4.48681640625, -4.342041015625, -4.197265625, -4.052490234375, -3.90771484375, -3.762939453125, -3.6181640625, -3.473388671875, -3.32861328125, -3.183837890625, -3.0390625, -2.894287109375, -2.74951171875, -2.604736328125, -2.4599609375, -2.315185546875, -2.17041015625, -2.025634765625, -1.880859375, -1.736083984375, -1.59130859375, -1.446533203125, -1.3017578125, -1.156982421875, -1.01220703125, -0.867431640625, -0.72265625, -0.577880859375, -0.43310546875, -0.288330078125, -0.1435546875, 0.001220703125, 0.14599609375, 0.290771484375, 0.435546875, 0.580322265625, 0.72509765625, 0.869873046875, 1.0146484375, 1.159423828125, 1.30419921875, 1.448974609375, 1.59375, 1.738525390625, 1.88330078125, 2.028076171875, 2.1728515625, 2.317626953125, 2.46240234375, 2.607177734375, 2.751953125, 2.896728515625, 3.04150390625, 3.186279296875, 3.3310546875, 3.475830078125, 3.62060546875, 3.765380859375, 3.91015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 3.0, 8.0, 12.0, 19.0, 30.0, 35.0, 53.0, 87.0, 135.0, 238.0, 601.0, 1976.0, 15475.0, 975728.0, 49443.0, 3197.0, 762.0, 316.0, 150.0, 99.0, 56.0, 38.0, 20.0, 21.0, 9.0, 6.0, 9.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-64.1875, -62.3349609375, -60.482421875, -58.6298828125, -56.77734375, -54.9248046875, -53.072265625, -51.2197265625, -49.3671875, -47.5146484375, -45.662109375, -43.8095703125, -41.95703125, -40.1044921875, -38.251953125, -36.3994140625, -34.546875, -32.6943359375, -30.841796875, -28.9892578125, -27.13671875, -25.2841796875, -23.431640625, -21.5791015625, -19.7265625, -17.8740234375, -16.021484375, -14.1689453125, -12.31640625, -10.4638671875, -8.611328125, -6.7587890625, -4.90625, -3.0537109375, -1.201171875, 0.6513671875, 2.50390625, 4.3564453125, 6.208984375, 8.0615234375, 9.9140625, 11.7666015625, 13.619140625, 15.4716796875, 17.32421875, 19.1767578125, 21.029296875, 22.8818359375, 24.734375, 26.5869140625, 28.439453125, 30.2919921875, 32.14453125, 33.9970703125, 35.849609375, 37.7021484375, 39.5546875, 41.4072265625, 43.259765625, 45.1123046875, 46.96484375, 48.8173828125, 50.669921875, 52.5224609375, 54.375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 8.0, 5.0, 13.0, 6.0, 16.0, 21.0, 29.0, 45.0, 34.0, 57.0, 70.0, 64.0, 79.0, 74.0, 75.0, 70.0, 52.0, 51.0, 46.0, 45.0, 32.0, 25.0, 23.0, 14.0, 12.0, 5.0, 5.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.296875, -28.45751953125, -27.6181640625, -26.77880859375, -25.939453125, -25.10009765625, -24.2607421875, -23.42138671875, -22.58203125, -21.74267578125, -20.9033203125, -20.06396484375, -19.224609375, -18.38525390625, -17.5458984375, -16.70654296875, -15.8671875, -15.02783203125, -14.1884765625, -13.34912109375, -12.509765625, -11.67041015625, -10.8310546875, -9.99169921875, -9.15234375, -8.31298828125, -7.4736328125, -6.63427734375, -5.794921875, -4.95556640625, -4.1162109375, -3.27685546875, -2.4375, -1.59814453125, -0.7587890625, 0.08056640625, 0.919921875, 1.75927734375, 2.5986328125, 3.43798828125, 4.27734375, 5.11669921875, 5.9560546875, 6.79541015625, 7.634765625, 8.47412109375, 9.3134765625, 10.15283203125, 10.9921875, 11.83154296875, 12.6708984375, 13.51025390625, 14.349609375, 15.18896484375, 16.0283203125, 16.86767578125, 17.70703125, 18.54638671875, 19.3857421875, 20.22509765625, 21.064453125, 21.90380859375, 22.7431640625, 23.58251953125, 24.421875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 7.0, 7.0, 6.0, 10.0, 17.0, 24.0, 24.0, 35.0, 63.0, 78.0, 142.0, 308.0, 1073.0, 11376.0, 992823.0, 39950.0, 1699.0, 390.0, 175.0, 101.0, 64.0, 39.0, 32.0, 30.0, 18.0, 16.0, 9.0, 7.0, 5.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.1875, -25.49169921875, -24.7958984375, -24.10009765625, -23.404296875, -22.70849609375, -22.0126953125, -21.31689453125, -20.62109375, -19.92529296875, -19.2294921875, -18.53369140625, -17.837890625, -17.14208984375, -16.4462890625, -15.75048828125, -15.0546875, -14.35888671875, -13.6630859375, -12.96728515625, -12.271484375, -11.57568359375, -10.8798828125, -10.18408203125, -9.48828125, -8.79248046875, -8.0966796875, -7.40087890625, -6.705078125, -6.00927734375, -5.3134765625, -4.61767578125, -3.921875, -3.22607421875, -2.5302734375, -1.83447265625, -1.138671875, -0.44287109375, 0.2529296875, 0.94873046875, 1.64453125, 2.34033203125, 3.0361328125, 3.73193359375, 4.427734375, 5.12353515625, 5.8193359375, 6.51513671875, 7.2109375, 7.90673828125, 8.6025390625, 9.29833984375, 9.994140625, 10.68994140625, 11.3857421875, 12.08154296875, 12.77734375, 13.47314453125, 14.1689453125, 14.86474609375, 15.560546875, 16.25634765625, 16.9521484375, 17.64794921875, 18.34375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 10.0, 12.0, 14.0, 20.0, 16.0, 25.0, 42.0, 44.0, 44.0, 63.0, 88.0, 79.0, 72.0, 67.0, 78.0, 52.0, 53.0, 62.0, 36.0, 25.0, 21.0, 15.0, 10.0, 16.0, 6.0, 10.0, 3.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004734992980957031, -0.0004563257098197937, -0.0004391521215438843, -0.00042197853326797485, -0.00040480494499206543, -0.000387631356716156, -0.0003704577684402466, -0.00035328418016433716, -0.00033611059188842773, -0.0003189370036125183, -0.0003017634153366089, -0.00028458982706069946, -0.00026741623878479004, -0.0002502426505088806, -0.0002330690622329712, -0.00021589547395706177, -0.00019872188568115234, -0.00018154829740524292, -0.0001643747091293335, -0.00014720112085342407, -0.00013002753257751465, -0.00011285394430160522, -9.56803560256958e-05, -7.850676774978638e-05, -6.133317947387695e-05, -4.415959119796753e-05, -2.6986002922058105e-05, -9.812414646148682e-06, 7.361173629760742e-06, 2.4534761905670166e-05, 4.170835018157959e-05, 5.8881938457489014e-05, 7.605552673339844e-05, 9.322911500930786e-05, 0.00011040270328521729, 0.0001275762915611267, 0.00014474987983703613, 0.00016192346811294556, 0.00017909705638885498, 0.0001962706446647644, 0.00021344423294067383, 0.00023061782121658325, 0.0002477914094924927, 0.0002649649977684021, 0.0002821385860443115, 0.00029931217432022095, 0.00031648576259613037, 0.0003336593508720398, 0.0003508329391479492, 0.00036800652742385864, 0.00038518011569976807, 0.0004023537039756775, 0.0004195272922515869, 0.00043670088052749634, 0.00045387446880340576, 0.0004710480570793152, 0.0004882216453552246, 0.000505395233631134, 0.0005225688219070435, 0.0005397424101829529, 0.0005569159984588623, 0.0005740895867347717, 0.0005912631750106812, 0.0006084367632865906, 0.0006256103515625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 5.0, 9.0, 14.0, 4.0, 12.0, 14.0, 12.0, 20.0, 43.0, 53.0, 78.0, 139.0, 310.0, 781.0, 2607.0, 23620.0, 994002.0, 22780.0, 2588.0, 752.0, 314.0, 124.0, 83.0, 43.0, 40.0, 27.0, 25.0, 17.0, 6.0, 8.0, 4.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.625, -21.9287109375, -21.232421875, -20.5361328125, -19.83984375, -19.1435546875, -18.447265625, -17.7509765625, -17.0546875, -16.3583984375, -15.662109375, -14.9658203125, -14.26953125, -13.5732421875, -12.876953125, -12.1806640625, -11.484375, -10.7880859375, -10.091796875, -9.3955078125, -8.69921875, -8.0029296875, -7.306640625, -6.6103515625, -5.9140625, -5.2177734375, -4.521484375, -3.8251953125, -3.12890625, -2.4326171875, -1.736328125, -1.0400390625, -0.34375, 0.3525390625, 1.048828125, 1.7451171875, 2.44140625, 3.1376953125, 3.833984375, 4.5302734375, 5.2265625, 5.9228515625, 6.619140625, 7.3154296875, 8.01171875, 8.7080078125, 9.404296875, 10.1005859375, 10.796875, 11.4931640625, 12.189453125, 12.8857421875, 13.58203125, 14.2783203125, 14.974609375, 15.6708984375, 16.3671875, 17.0634765625, 17.759765625, 18.4560546875, 19.15234375, 19.8486328125, 20.544921875, 21.2412109375, 21.9375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 10.0, 10.0, 19.0, 41.0, 89.0, 193.0, 234.0, 190.0, 95.0, 48.0, 10.0, 8.0, 14.0, 6.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.15625, -15.658935546875, -15.16162109375, -14.664306640625, -14.1669921875, -13.669677734375, -13.17236328125, -12.675048828125, -12.177734375, -11.680419921875, -11.18310546875, -10.685791015625, -10.1884765625, -9.691162109375, -9.19384765625, -8.696533203125, -8.19921875, -7.701904296875, -7.20458984375, -6.707275390625, -6.2099609375, -5.712646484375, -5.21533203125, -4.718017578125, -4.220703125, -3.723388671875, -3.22607421875, -2.728759765625, -2.2314453125, -1.734130859375, -1.23681640625, -0.739501953125, -0.2421875, 0.255126953125, 0.75244140625, 1.249755859375, 1.7470703125, 2.244384765625, 2.74169921875, 3.239013671875, 3.736328125, 4.233642578125, 4.73095703125, 5.228271484375, 5.7255859375, 6.222900390625, 6.72021484375, 7.217529296875, 7.71484375, 8.212158203125, 8.70947265625, 9.206787109375, 9.7041015625, 10.201416015625, 10.69873046875, 11.196044921875, 11.693359375, 12.190673828125, 12.68798828125, 13.185302734375, 13.6826171875, 14.179931640625, 14.67724609375, 15.174560546875, 15.671875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 101.0, 714.0, 169.0, 16.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-883.8162841796875, -863.9818725585938, -844.1473999023438, -824.31298828125, -804.478515625, -784.6441040039062, -764.8096923828125, -744.9752197265625, -725.1408081054688, -705.306396484375, -685.471923828125, -665.6375122070312, -645.8031005859375, -625.9686279296875, -606.1342163085938, -586.2998046875, -566.46533203125, -546.6309204101562, -526.7964477539062, -506.9620361328125, -487.1275939941406, -467.29315185546875, -447.458740234375, -427.6242980957031, -407.78985595703125, -387.9554138183594, -368.1209716796875, -348.28656005859375, -328.4521179199219, -308.61767578125, -288.78326416015625, -268.9488220214844, -249.11441040039062, -229.27996826171875, -209.44554138183594, -189.61111450195312, -169.77667236328125, -149.94223022460938, -130.10780334472656, -110.27337646484375, -90.43893432617188, -70.60449981689453, -50.77006530761719, -30.935630798339844, -11.1011962890625, 8.733238220214844, 28.567672729492188, 48.402099609375, 68.23654174804688, 88.07097625732422, 107.90541076660156, 127.7398452758789, 147.57427978515625, 167.40872192382812, 187.24314880371094, 207.07757568359375, 226.91201782226562, 246.7464599609375, 266.58087158203125, 286.4153137207031, 306.249755859375, 326.0841979980469, 345.91864013671875, 365.7530517578125, 385.5874938964844]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 12.0, 8.0, 14.0, 20.0, 15.0, 24.0, 37.0, 43.0, 43.0, 47.0, 52.0, 64.0, 55.0, 60.0, 70.0, 72.0, 47.0, 63.0, 51.0, 35.0, 42.0, 32.0, 25.0, 30.0, 8.0, 13.0, 15.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.65264892578125, -71.89319610595703, -68.13375091552734, -64.37429809570312, -60.61484909057617, -56.85540008544922, -53.095947265625, -49.33649826049805, -45.577049255371094, -41.81760025024414, -38.05815124511719, -34.29869842529297, -30.539249420166016, -26.779800415039062, -23.020349502563477, -19.26089859008789, -15.501449584960938, -11.741999626159668, -7.982549667358398, -4.223099708557129, -0.4636497497558594, 3.2957992553710938, 7.05525016784668, 10.814701080322266, 14.574150085449219, 18.333599090576172, 22.093050003051758, 25.852500915527344, 29.611949920654297, 33.37139892578125, 37.13085174560547, 40.89030075073242, 44.649749755859375, 48.40919876098633, 52.16864776611328, 55.9281005859375, 59.68754959106445, 63.446998596191406, 67.20645141601562, 70.96589660644531, 74.72534942626953, 78.48480224609375, 82.24424743652344, 86.00370025634766, 89.76315307617188, 93.52259826660156, 97.28205108642578, 101.04150390625, 104.80094909667969, 108.5604019165039, 112.3198471069336, 116.07929992675781, 119.8387451171875, 123.59819793701172, 127.35765075683594, 131.11709594726562, 134.87655639648438, 138.63600158691406, 142.3954620361328, 146.1549072265625, 149.9143524169922, 153.67379760742188, 157.43325805664062, 161.1927032470703, 164.9521484375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 0.0, 6.0, 3.0, 9.0, 21.0, 26.0, 62.0, 95.0, 217.0, 395.0, 944.0, 3122.0, 14858.0, 241633.0, 3892382.0, 32656.0, 5234.0, 1562.0, 535.0, 214.0, 135.0, 63.0, 41.0, 23.0, 16.0, 15.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.140625, -15.60595703125, -15.0712890625, -14.53662109375, -14.001953125, -13.46728515625, -12.9326171875, -12.39794921875, -11.86328125, -11.32861328125, -10.7939453125, -10.25927734375, -9.724609375, -9.18994140625, -8.6552734375, -8.12060546875, -7.5859375, -7.05126953125, -6.5166015625, -5.98193359375, -5.447265625, -4.91259765625, -4.3779296875, -3.84326171875, -3.30859375, -2.77392578125, -2.2392578125, -1.70458984375, -1.169921875, -0.63525390625, -0.1005859375, 0.43408203125, 0.96875, 1.50341796875, 2.0380859375, 2.57275390625, 3.107421875, 3.64208984375, 4.1767578125, 4.71142578125, 5.24609375, 5.78076171875, 6.3154296875, 6.85009765625, 7.384765625, 7.91943359375, 8.4541015625, 8.98876953125, 9.5234375, 10.05810546875, 10.5927734375, 11.12744140625, 11.662109375, 12.19677734375, 12.7314453125, 13.26611328125, 13.80078125, 14.33544921875, 14.8701171875, 15.40478515625, 15.939453125, 16.47412109375, 17.0087890625, 17.54345703125, 18.078125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 1.0, 5.0, 10.0, 8.0, 13.0, 13.0, 20.0, 17.0, 31.0, 37.0, 45.0, 59.0, 64.0, 66.0, 74.0, 76.0, 83.0, 65.0, 66.0, 53.0, 48.0, 34.0, 22.0, 28.0, 10.0, 10.0, 7.0, 11.0, 6.0, 6.0, 1.0, 4.0, 5.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.41796875, -6.2303466796875, -6.042724609375, -5.8551025390625, -5.66748046875, -5.4798583984375, -5.292236328125, -5.1046142578125, -4.9169921875, -4.7293701171875, -4.541748046875, -4.3541259765625, -4.16650390625, -3.9788818359375, -3.791259765625, -3.6036376953125, -3.416015625, -3.2283935546875, -3.040771484375, -2.8531494140625, -2.66552734375, -2.4779052734375, -2.290283203125, -2.1026611328125, -1.9150390625, -1.7274169921875, -1.539794921875, -1.3521728515625, -1.16455078125, -0.9769287109375, -0.789306640625, -0.6016845703125, -0.4140625, -0.2264404296875, -0.038818359375, 0.1488037109375, 0.33642578125, 0.5240478515625, 0.711669921875, 0.8992919921875, 1.0869140625, 1.2745361328125, 1.462158203125, 1.6497802734375, 1.83740234375, 2.0250244140625, 2.212646484375, 2.4002685546875, 2.587890625, 2.7755126953125, 2.963134765625, 3.1507568359375, 3.33837890625, 3.5260009765625, 3.713623046875, 3.9012451171875, 4.0888671875, 4.2764892578125, 4.464111328125, 4.6517333984375, 4.83935546875, 5.0269775390625, 5.214599609375, 5.4022216796875, 5.58984375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 11.0, 14.0, 20.0, 27.0, 35.0, 51.0, 90.0, 115.0, 154.0, 197.0, 319.0, 502.0, 817.0, 1556.0, 3357.0, 8953.0, 31515.0, 166978.0, 3668638.0, 250194.0, 40903.0, 11209.0, 4156.0, 1785.0, 906.0, 562.0, 359.0, 237.0, 188.0, 129.0, 87.0, 70.0, 59.0, 27.0, 16.0, 12.0, 8.0, 12.0, 11.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.3515625, -8.12939453125, -7.9072265625, -7.68505859375, -7.462890625, -7.24072265625, -7.0185546875, -6.79638671875, -6.57421875, -6.35205078125, -6.1298828125, -5.90771484375, -5.685546875, -5.46337890625, -5.2412109375, -5.01904296875, -4.796875, -4.57470703125, -4.3525390625, -4.13037109375, -3.908203125, -3.68603515625, -3.4638671875, -3.24169921875, -3.01953125, -2.79736328125, -2.5751953125, -2.35302734375, -2.130859375, -1.90869140625, -1.6865234375, -1.46435546875, -1.2421875, -1.02001953125, -0.7978515625, -0.57568359375, -0.353515625, -0.13134765625, 0.0908203125, 0.31298828125, 0.53515625, 0.75732421875, 0.9794921875, 1.20166015625, 1.423828125, 1.64599609375, 1.8681640625, 2.09033203125, 2.3125, 2.53466796875, 2.7568359375, 2.97900390625, 3.201171875, 3.42333984375, 3.6455078125, 3.86767578125, 4.08984375, 4.31201171875, 4.5341796875, 4.75634765625, 4.978515625, 5.20068359375, 5.4228515625, 5.64501953125, 5.8671875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 16.0, 26.0, 39.0, 78.0, 198.0, 2543.0, 823.0, 191.0, 80.0, 39.0, 18.0, 12.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.611328125, -3.5108642578125, -3.410400390625, -3.3099365234375, -3.20947265625, -3.1090087890625, -3.008544921875, -2.9080810546875, -2.8076171875, -2.7071533203125, -2.606689453125, -2.5062255859375, -2.40576171875, -2.3052978515625, -2.204833984375, -2.1043701171875, -2.00390625, -1.9034423828125, -1.802978515625, -1.7025146484375, -1.60205078125, -1.5015869140625, -1.401123046875, -1.3006591796875, -1.2001953125, -1.0997314453125, -0.999267578125, -0.8988037109375, -0.79833984375, -0.6978759765625, -0.597412109375, -0.4969482421875, -0.396484375, -0.2960205078125, -0.195556640625, -0.0950927734375, 0.00537109375, 0.1058349609375, 0.206298828125, 0.3067626953125, 0.4072265625, 0.5076904296875, 0.608154296875, 0.7086181640625, 0.80908203125, 0.9095458984375, 1.010009765625, 1.1104736328125, 1.2109375, 1.3114013671875, 1.411865234375, 1.5123291015625, 1.61279296875, 1.7132568359375, 1.813720703125, 1.9141845703125, 2.0146484375, 2.1151123046875, 2.215576171875, 2.3160400390625, 2.41650390625, 2.5169677734375, 2.617431640625, 2.7178955078125, 2.818359375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 7.0, 41.0, 138.0, 293.0, 353.0, 134.0, 31.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.61065673828125, -42.66753387451172, -41.72441482543945, -40.78129196166992, -39.838172912597656, -38.895050048828125, -37.95193099975586, -37.00880813598633, -36.06568908691406, -35.12256622314453, -34.179447174072266, -33.236324310302734, -32.29320526123047, -31.35008430480957, -30.406963348388672, -29.46384048461914, -28.520719528198242, -27.577598571777344, -26.634477615356445, -25.691356658935547, -24.74823570251465, -23.80511474609375, -22.86199188232422, -21.918872833251953, -20.975749969482422, -20.032629013061523, -19.089508056640625, -18.146387100219727, -17.203266143798828, -16.26014518737793, -15.317023277282715, -14.373902320861816, -13.430784225463867, -12.487663269042969, -11.54454231262207, -10.601421356201172, -9.658300399780273, -8.715179443359375, -7.77205753326416, -6.828936576843262, -5.885815620422363, -4.942694664001465, -3.9995734691619873, -3.0564522743225098, -2.1133313179016113, -1.170210361480713, -0.22708892822265625, 0.7160320281982422, 1.6591529846191406, 2.602273941040039, 3.5453951358795166, 4.488516330718994, 5.431637287139893, 6.374758243560791, 7.317879676818848, 8.261000633239746, 9.204121589660645, 10.147242546081543, 11.090363502502441, 12.033485412597656, 12.976606369018555, 13.919727325439453, 14.862848281860352, 15.80596923828125, 16.74909019470215]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 4.0, 14.0, 9.0, 11.0, 14.0, 19.0, 18.0, 27.0, 33.0, 32.0, 28.0, 58.0, 49.0, 59.0, 55.0, 58.0, 57.0, 60.0, 53.0, 48.0, 50.0, 36.0, 44.0, 26.0, 36.0, 25.0, 19.0, 16.0, 11.0, 11.0, 10.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.727115631103516, -7.502989292144775, -7.278862476348877, -7.054736137390137, -6.8306097984313965, -6.606483459472656, -6.382356643676758, -6.158230304718018, -5.934103965759277, -5.709977626800537, -5.485850811004639, -5.261724472045898, -5.037598133087158, -4.813471794128418, -4.5893449783325195, -4.365218639373779, -4.141091823577881, -3.9169652462005615, -3.6928389072418213, -3.468712329864502, -3.2445859909057617, -3.0204594135284424, -2.796332836151123, -2.572206497192383, -2.3480799198150635, -2.123953342437744, -1.899827003479004, -1.6757004261016846, -1.4515739679336548, -1.227447509765625, -1.0033209323883057, -0.7791944742202759, -0.5550680160522461, -0.3309415280818939, -0.10681504011154175, 0.11731147766113281, 0.3414379358291626, 0.5655643939971924, 0.7896909713745117, 1.0138174295425415, 1.2379438877105713, 1.462070345878601, 1.6861968040466309, 1.9103233814239502, 2.1344499588012695, 2.3585762977600098, 2.582702875137329, 2.8068294525146484, 3.0309557914733887, 3.255082368850708, 3.4792087078094482, 3.7033352851867676, 3.927461624145508, 4.151588439941406, 4.3757147789001465, 4.599841117858887, 4.823967933654785, 5.048094272613525, 5.272221088409424, 5.496347427368164, 5.720473766326904, 5.9446001052856445, 6.168726921081543, 6.392853260040283, 6.616979598999023]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 11.0, 16.0, 19.0, 26.0, 48.0, 88.0, 154.0, 295.0, 613.0, 1477.0, 4054.0, 15208.0, 94212.0, 629325.0, 261009.0, 31129.0, 6897.0, 2195.0, 906.0, 373.0, 213.0, 104.0, 70.0, 34.0, 30.0, 14.0, 7.0, 5.0, 8.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.53125, -17.981689453125, -17.43212890625, -16.882568359375, -16.3330078125, -15.783447265625, -15.23388671875, -14.684326171875, -14.134765625, -13.585205078125, -13.03564453125, -12.486083984375, -11.9365234375, -11.386962890625, -10.83740234375, -10.287841796875, -9.73828125, -9.188720703125, -8.63916015625, -8.089599609375, -7.5400390625, -6.990478515625, -6.44091796875, -5.891357421875, -5.341796875, -4.792236328125, -4.24267578125, -3.693115234375, -3.1435546875, -2.593994140625, -2.04443359375, -1.494873046875, -0.9453125, -0.395751953125, 0.15380859375, 0.703369140625, 1.2529296875, 1.802490234375, 2.35205078125, 2.901611328125, 3.451171875, 4.000732421875, 4.55029296875, 5.099853515625, 5.6494140625, 6.198974609375, 6.74853515625, 7.298095703125, 7.84765625, 8.397216796875, 8.94677734375, 9.496337890625, 10.0458984375, 10.595458984375, 11.14501953125, 11.694580078125, 12.244140625, 12.793701171875, 13.34326171875, 13.892822265625, 14.4423828125, 14.991943359375, 15.54150390625, 16.091064453125, 16.640625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 3.0, 5.0, 7.0, 8.0, 7.0, 18.0, 16.0, 20.0, 32.0, 32.0, 42.0, 51.0, 60.0, 63.0, 72.0, 83.0, 75.0, 65.0, 66.0, 67.0, 43.0, 34.0, 33.0, 25.0, 15.0, 16.0, 6.0, 13.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.453125, -6.2607421875, -6.068359375, -5.8759765625, -5.68359375, -5.4912109375, -5.298828125, -5.1064453125, -4.9140625, -4.7216796875, -4.529296875, -4.3369140625, -4.14453125, -3.9521484375, -3.759765625, -3.5673828125, -3.375, -3.1826171875, -2.990234375, -2.7978515625, -2.60546875, -2.4130859375, -2.220703125, -2.0283203125, -1.8359375, -1.6435546875, -1.451171875, -1.2587890625, -1.06640625, -0.8740234375, -0.681640625, -0.4892578125, -0.296875, -0.1044921875, 0.087890625, 0.2802734375, 0.47265625, 0.6650390625, 0.857421875, 1.0498046875, 1.2421875, 1.4345703125, 1.626953125, 1.8193359375, 2.01171875, 2.2041015625, 2.396484375, 2.5888671875, 2.78125, 2.9736328125, 3.166015625, 3.3583984375, 3.55078125, 3.7431640625, 3.935546875, 4.1279296875, 4.3203125, 4.5126953125, 4.705078125, 4.8974609375, 5.08984375, 5.2822265625, 5.474609375, 5.6669921875, 5.859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 8.0, 5.0, 9.0, 6.0, 10.0, 28.0, 35.0, 50.0, 108.0, 182.0, 477.0, 1463.0, 8809.0, 926256.0, 105773.0, 3831.0, 847.0, 316.0, 132.0, 78.0, 57.0, 29.0, 13.0, 12.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-64.375, -62.525390625, -60.67578125, -58.826171875, -56.9765625, -55.126953125, -53.27734375, -51.427734375, -49.578125, -47.728515625, -45.87890625, -44.029296875, -42.1796875, -40.330078125, -38.48046875, -36.630859375, -34.78125, -32.931640625, -31.08203125, -29.232421875, -27.3828125, -25.533203125, -23.68359375, -21.833984375, -19.984375, -18.134765625, -16.28515625, -14.435546875, -12.5859375, -10.736328125, -8.88671875, -7.037109375, -5.1875, -3.337890625, -1.48828125, 0.361328125, 2.2109375, 4.060546875, 5.91015625, 7.759765625, 9.609375, 11.458984375, 13.30859375, 15.158203125, 17.0078125, 18.857421875, 20.70703125, 22.556640625, 24.40625, 26.255859375, 28.10546875, 29.955078125, 31.8046875, 33.654296875, 35.50390625, 37.353515625, 39.203125, 41.052734375, 42.90234375, 44.751953125, 46.6015625, 48.451171875, 50.30078125, 52.150390625, 54.0]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 9.0, 12.0, 11.0, 15.0, 18.0, 39.0, 43.0, 48.0, 48.0, 67.0, 82.0, 84.0, 96.0, 76.0, 87.0, 66.0, 50.0, 52.0, 31.0, 19.0, 11.0, 8.0, 6.0, 4.0, 8.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.5625, -42.32421875, -41.0859375, -39.84765625, -38.609375, -37.37109375, -36.1328125, -34.89453125, -33.65625, -32.41796875, -31.1796875, -29.94140625, -28.703125, -27.46484375, -26.2265625, -24.98828125, -23.75, -22.51171875, -21.2734375, -20.03515625, -18.796875, -17.55859375, -16.3203125, -15.08203125, -13.84375, -12.60546875, -11.3671875, -10.12890625, -8.890625, -7.65234375, -6.4140625, -5.17578125, -3.9375, -2.69921875, -1.4609375, -0.22265625, 1.015625, 2.25390625, 3.4921875, 4.73046875, 5.96875, 7.20703125, 8.4453125, 9.68359375, 10.921875, 12.16015625, 13.3984375, 14.63671875, 15.875, 17.11328125, 18.3515625, 19.58984375, 20.828125, 22.06640625, 23.3046875, 24.54296875, 25.78125, 27.01953125, 28.2578125, 29.49609375, 30.734375, 31.97265625, 33.2109375, 34.44921875, 35.6875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 7.0, 10.0, 12.0, 11.0, 21.0, 28.0, 53.0, 91.0, 128.0, 228.0, 458.0, 1164.0, 12152.0, 1016106.0, 15669.0, 1325.0, 481.0, 253.0, 109.0, 80.0, 54.0, 23.0, 27.0, 19.0, 17.0, 5.0, 6.0, 1.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.96875, -35.058837890625, -34.14892578125, -33.239013671875, -32.3291015625, -31.419189453125, -30.50927734375, -29.599365234375, -28.689453125, -27.779541015625, -26.86962890625, -25.959716796875, -25.0498046875, -24.139892578125, -23.22998046875, -22.320068359375, -21.41015625, -20.500244140625, -19.59033203125, -18.680419921875, -17.7705078125, -16.860595703125, -15.95068359375, -15.040771484375, -14.130859375, -13.220947265625, -12.31103515625, -11.401123046875, -10.4912109375, -9.581298828125, -8.67138671875, -7.761474609375, -6.8515625, -5.941650390625, -5.03173828125, -4.121826171875, -3.2119140625, -2.302001953125, -1.39208984375, -0.482177734375, 0.427734375, 1.337646484375, 2.24755859375, 3.157470703125, 4.0673828125, 4.977294921875, 5.88720703125, 6.797119140625, 7.70703125, 8.616943359375, 9.52685546875, 10.436767578125, 11.3466796875, 12.256591796875, 13.16650390625, 14.076416015625, 14.986328125, 15.896240234375, 16.80615234375, 17.716064453125, 18.6259765625, 19.535888671875, 20.44580078125, 21.355712890625, 22.265625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 9.0, 10.0, 8.0, 18.0, 11.0, 22.0, 24.0, 24.0, 52.0, 52.0, 54.0, 77.0, 74.0, 72.0, 82.0, 62.0, 64.0, 60.0, 43.0, 35.0, 31.0, 31.0, 21.0, 14.0, 9.0, 6.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00044345855712890625, -0.00042738765478134155, -0.00041131675243377686, -0.00039524585008621216, -0.00037917494773864746, -0.00036310404539108276, -0.00034703314304351807, -0.00033096224069595337, -0.00031489133834838867, -0.000298820436000824, -0.0002827495336532593, -0.0002666786313056946, -0.0002506077289581299, -0.00023453682661056519, -0.0002184659242630005, -0.0002023950219154358, -0.0001863241195678711, -0.0001702532172203064, -0.0001541823148727417, -0.000138111412525177, -0.0001220405101776123, -0.00010596960783004761, -8.989870548248291e-05, -7.382780313491821e-05, -5.7756900787353516e-05, -4.168599843978882e-05, -2.561509609222412e-05, -9.544193744659424e-06, 6.5267086029052734e-06, 2.259761095046997e-05, 3.866851329803467e-05, 5.4739415645599365e-05, 7.081031799316406e-05, 8.688122034072876e-05, 0.00010295212268829346, 0.00011902302503585815, 0.00013509392738342285, 0.00015116482973098755, 0.00016723573207855225, 0.00018330663442611694, 0.00019937753677368164, 0.00021544843912124634, 0.00023151934146881104, 0.00024759024381637573, 0.00026366114616394043, 0.0002797320485115051, 0.0002958029508590698, 0.0003118738532066345, 0.0003279447555541992, 0.0003440156579017639, 0.0003600865602493286, 0.0003761574625968933, 0.000392228364944458, 0.0004082992672920227, 0.0004243701696395874, 0.0004404410719871521, 0.0004565119743347168, 0.0004725828766822815, 0.0004886537790298462, 0.0005047246813774109, 0.0005207955837249756, 0.0005368664860725403, 0.000552937388420105, 0.0005690082907676697, 0.0005850791931152344]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 6.0, 16.0, 17.0, 22.0, 35.0, 80.0, 140.0, 260.0, 645.0, 2885.0, 164185.0, 874205.0, 4544.0, 827.0, 336.0, 153.0, 78.0, 45.0, 39.0, 18.0, 10.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.53125, -29.361328125, -28.19140625, -27.021484375, -25.8515625, -24.681640625, -23.51171875, -22.341796875, -21.171875, -20.001953125, -18.83203125, -17.662109375, -16.4921875, -15.322265625, -14.15234375, -12.982421875, -11.8125, -10.642578125, -9.47265625, -8.302734375, -7.1328125, -5.962890625, -4.79296875, -3.623046875, -2.453125, -1.283203125, -0.11328125, 1.056640625, 2.2265625, 3.396484375, 4.56640625, 5.736328125, 6.90625, 8.076171875, 9.24609375, 10.416015625, 11.5859375, 12.755859375, 13.92578125, 15.095703125, 16.265625, 17.435546875, 18.60546875, 19.775390625, 20.9453125, 22.115234375, 23.28515625, 24.455078125, 25.625, 26.794921875, 27.96484375, 29.134765625, 30.3046875, 31.474609375, 32.64453125, 33.814453125, 34.984375, 36.154296875, 37.32421875, 38.494140625, 39.6640625, 40.833984375, 42.00390625, 43.173828125, 44.34375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 6.0, 7.0, 4.0, 13.0, 17.0, 40.0, 82.0, 224.0, 320.0, 145.0, 56.0, 35.0, 16.0, 15.0, 8.0, 9.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-43.875, -42.9661865234375, -42.057373046875, -41.1485595703125, -40.23974609375, -39.3309326171875, -38.422119140625, -37.5133056640625, -36.6044921875, -35.6956787109375, -34.786865234375, -33.8780517578125, -32.96923828125, -32.0604248046875, -31.151611328125, -30.2427978515625, -29.333984375, -28.4251708984375, -27.516357421875, -26.6075439453125, -25.69873046875, -24.7899169921875, -23.881103515625, -22.9722900390625, -22.0634765625, -21.1546630859375, -20.245849609375, -19.3370361328125, -18.42822265625, -17.5194091796875, -16.610595703125, -15.7017822265625, -14.79296875, -13.8841552734375, -12.975341796875, -12.0665283203125, -11.15771484375, -10.2489013671875, -9.340087890625, -8.4312744140625, -7.5224609375, -6.6136474609375, -5.704833984375, -4.7960205078125, -3.88720703125, -2.9783935546875, -2.069580078125, -1.1607666015625, -0.251953125, 0.6568603515625, 1.565673828125, 2.4744873046875, 3.38330078125, 4.2921142578125, 5.200927734375, 6.1097412109375, 7.0185546875, 7.9273681640625, 8.836181640625, 9.7449951171875, 10.65380859375, 11.5626220703125, 12.471435546875, 13.3802490234375, 14.2890625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 8.0, 29.0, 263.0, 580.0, 105.0, 14.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-641.8321533203125, -625.5269775390625, -609.2218017578125, -592.9165649414062, -576.6113891601562, -560.3062133789062, -544.0010375976562, -527.6958618164062, -511.3906555175781, -495.0854797363281, -478.7802734375, -462.47509765625, -446.169921875, -429.8647155761719, -413.5595397949219, -397.25433349609375, -380.94915771484375, -364.64398193359375, -348.3387756347656, -332.0335998535156, -315.7283935546875, -299.4232177734375, -283.1180419921875, -266.8128662109375, -250.50765991210938, -234.2024688720703, -217.89727783203125, -201.59210205078125, -185.2869110107422, -168.98171997070312, -152.67654418945312, -136.37135314941406, -120.066162109375, -103.76097106933594, -87.4557876586914, -71.15060424804688, -54.84541320800781, -38.54022216796875, -22.23503875732422, -5.9298553466796875, 10.375335693359375, 26.680522918701172, 42.98571014404297, 59.290897369384766, 75.59608459472656, 91.90127563476562, 108.20645904541016, 124.51164245605469, 140.81683349609375, 157.1220245361328, 173.42721557617188, 189.73239135742188, 206.03758239746094, 222.3427734375, 238.64794921875, 254.95314025878906, 271.2583312988281, 287.5635070800781, 303.86871337890625, 320.17388916015625, 336.47906494140625, 352.7842712402344, 369.0894470214844, 385.3946533203125, 401.6998291015625]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 7.0, 5.0, 10.0, 14.0, 27.0, 30.0, 32.0, 45.0, 53.0, 70.0, 79.0, 85.0, 99.0, 72.0, 62.0, 67.0, 62.0, 65.0, 36.0, 25.0, 26.0, 5.0, 7.0, 8.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.74722290039062, -132.8096466064453, -126.8720703125, -120.93449401855469, -114.99691772460938, -109.05934143066406, -103.12176513671875, -97.18418884277344, -91.24661254882812, -85.30903625488281, -79.3714599609375, -73.43388366699219, -67.49630737304688, -61.55873107910156, -55.62115478515625, -49.68357849121094, -43.746002197265625, -37.80842590332031, -31.870849609375, -25.933273315429688, -19.995697021484375, -14.058120727539062, -8.12054443359375, -2.1829681396484375, 3.754608154296875, 9.692184448242188, 15.6297607421875, 21.567337036132812, 27.504913330078125, 33.44248962402344, 39.38006591796875, 45.31764221191406, 51.25520324707031, 57.192779541015625, 63.13035583496094, 69.06793212890625, 75.00550842285156, 80.94308471679688, 86.88066101074219, 92.8182373046875, 98.75581359863281, 104.69338989257812, 110.63096618652344, 116.56854248046875, 122.50611877441406, 128.44369506835938, 134.3812713623047, 140.31884765625, 146.2564239501953, 152.19400024414062, 158.13157653808594, 164.06915283203125, 170.00672912597656, 175.94430541992188, 181.8818817138672, 187.8194580078125, 193.7570343017578, 199.69461059570312, 205.63218688964844, 211.56976318359375, 217.50733947753906, 223.44491577148438, 229.3824920654297, 235.320068359375, 241.2576446533203]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 3.0, 8.0, 12.0, 19.0, 24.0, 30.0, 65.0, 84.0, 151.0, 307.0, 1032.0, 6970.0, 4062245.0, 118450.0, 3534.0, 703.0, 289.0, 141.0, 74.0, 54.0, 30.0, 18.0, 8.0, 9.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.9375, -23.97314453125, -23.0087890625, -22.04443359375, -21.080078125, -20.11572265625, -19.1513671875, -18.18701171875, -17.22265625, -16.25830078125, -15.2939453125, -14.32958984375, -13.365234375, -12.40087890625, -11.4365234375, -10.47216796875, -9.5078125, -8.54345703125, -7.5791015625, -6.61474609375, -5.650390625, -4.68603515625, -3.7216796875, -2.75732421875, -1.79296875, -0.82861328125, 0.1357421875, 1.10009765625, 2.064453125, 3.02880859375, 3.9931640625, 4.95751953125, 5.921875, 6.88623046875, 7.8505859375, 8.81494140625, 9.779296875, 10.74365234375, 11.7080078125, 12.67236328125, 13.63671875, 14.60107421875, 15.5654296875, 16.52978515625, 17.494140625, 18.45849609375, 19.4228515625, 20.38720703125, 21.3515625, 22.31591796875, 23.2802734375, 24.24462890625, 25.208984375, 26.17333984375, 27.1376953125, 28.10205078125, 29.06640625, 30.03076171875, 30.9951171875, 31.95947265625, 32.923828125, 33.88818359375, 34.8525390625, 35.81689453125, 36.78125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 10.0, 14.0, 19.0, 39.0, 43.0, 77.0, 113.0, 129.0, 151.0, 121.0, 93.0, 69.0, 42.0, 25.0, 22.0, 11.0, 8.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3203125, -11.9132080078125, -11.506103515625, -11.0989990234375, -10.69189453125, -10.2847900390625, -9.877685546875, -9.4705810546875, -9.0634765625, -8.6563720703125, -8.249267578125, -7.8421630859375, -7.43505859375, -7.0279541015625, -6.620849609375, -6.2137451171875, -5.806640625, -5.3995361328125, -4.992431640625, -4.5853271484375, -4.17822265625, -3.7711181640625, -3.364013671875, -2.9569091796875, -2.5498046875, -2.1427001953125, -1.735595703125, -1.3284912109375, -0.92138671875, -0.5142822265625, -0.107177734375, 0.2999267578125, 0.70703125, 1.1141357421875, 1.521240234375, 1.9283447265625, 2.33544921875, 2.7425537109375, 3.149658203125, 3.5567626953125, 3.9638671875, 4.3709716796875, 4.778076171875, 5.1851806640625, 5.59228515625, 5.9993896484375, 6.406494140625, 6.8135986328125, 7.220703125, 7.6278076171875, 8.034912109375, 8.4420166015625, 8.84912109375, 9.2562255859375, 9.663330078125, 10.0704345703125, 10.4775390625, 10.8846435546875, 11.291748046875, 11.6988525390625, 12.10595703125, 12.5130615234375, 12.920166015625, 13.3272705078125, 13.734375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 8.0, 6.0, 8.0, 18.0, 14.0, 15.0, 23.0, 25.0, 41.0, 69.0, 93.0, 109.0, 132.0, 219.0, 340.0, 581.0, 1053.0, 2137.0, 5649.0, 21914.0, 216956.0, 3882162.0, 46477.0, 9658.0, 3086.0, 1359.0, 717.0, 481.0, 289.0, 195.0, 120.0, 103.0, 79.0, 46.0, 33.0, 18.0, 15.0, 13.0, 5.0, 12.0, 5.0, 5.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.3046875, -8.0203857421875, -7.736083984375, -7.4517822265625, -7.16748046875, -6.8831787109375, -6.598876953125, -6.3145751953125, -6.0302734375, -5.7459716796875, -5.461669921875, -5.1773681640625, -4.89306640625, -4.6087646484375, -4.324462890625, -4.0401611328125, -3.755859375, -3.4715576171875, -3.187255859375, -2.9029541015625, -2.61865234375, -2.3343505859375, -2.050048828125, -1.7657470703125, -1.4814453125, -1.1971435546875, -0.912841796875, -0.6285400390625, -0.34423828125, -0.0599365234375, 0.224365234375, 0.5086669921875, 0.79296875, 1.0772705078125, 1.361572265625, 1.6458740234375, 1.93017578125, 2.2144775390625, 2.498779296875, 2.7830810546875, 3.0673828125, 3.3516845703125, 3.635986328125, 3.9202880859375, 4.20458984375, 4.4888916015625, 4.773193359375, 5.0574951171875, 5.341796875, 5.6260986328125, 5.910400390625, 6.1947021484375, 6.47900390625, 6.7633056640625, 7.047607421875, 7.3319091796875, 7.6162109375, 7.9005126953125, 8.184814453125, 8.4691162109375, 8.75341796875, 9.0377197265625, 9.322021484375, 9.6063232421875, 9.890625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 14.0, 29.0, 34.0, 81.0, 388.0, 3224.0, 169.0, 50.0, 35.0, 23.0, 8.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.85546875, -1.7679443359375, -1.680419921875, -1.5928955078125, -1.50537109375, -1.4178466796875, -1.330322265625, -1.2427978515625, -1.1552734375, -1.0677490234375, -0.980224609375, -0.8927001953125, -0.80517578125, -0.7176513671875, -0.630126953125, -0.5426025390625, -0.455078125, -0.3675537109375, -0.280029296875, -0.1925048828125, -0.10498046875, -0.0174560546875, 0.070068359375, 0.1575927734375, 0.2451171875, 0.3326416015625, 0.420166015625, 0.5076904296875, 0.59521484375, 0.6827392578125, 0.770263671875, 0.8577880859375, 0.9453125, 1.0328369140625, 1.120361328125, 1.2078857421875, 1.29541015625, 1.3829345703125, 1.470458984375, 1.5579833984375, 1.6455078125, 1.7330322265625, 1.820556640625, 1.9080810546875, 1.99560546875, 2.0831298828125, 2.170654296875, 2.2581787109375, 2.345703125, 2.4332275390625, 2.520751953125, 2.6082763671875, 2.69580078125, 2.7833251953125, 2.870849609375, 2.9583740234375, 3.0458984375, 3.1334228515625, 3.220947265625, 3.3084716796875, 3.39599609375, 3.4835205078125, 3.571044921875, 3.6585693359375, 3.74609375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 18.0, 38.0, 72.0, 157.0, 216.0, 195.0, 144.0, 79.0, 35.0, 23.0, 5.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.33430290222168, -9.913188934326172, -9.492074012756348, -9.07096004486084, -8.649845123291016, -8.228731155395508, -7.807616710662842, -7.386502265930176, -6.965388298034668, -6.544273853302002, -6.123159408569336, -5.702045440673828, -5.280930995941162, -4.859816551208496, -4.43870210647583, -4.017587661743164, -3.596473217010498, -3.175358772277832, -2.754244565963745, -2.333130121231079, -1.9120157957077026, -1.4909014701843262, -1.0697870254516602, -0.6486728191375732, -0.22755837440490723, 0.19355598092079163, 0.6146703362464905, 1.0357847213745117, 1.4568990468978882, 1.8780133724212646, 2.2991278171539307, 2.7202420234680176, 3.1413564682006836, 3.5624709129333496, 3.9835851192474365, 4.404699325561523, 4.8258137702941895, 5.2469282150268555, 5.6680426597595215, 6.0891571044921875, 6.510271072387695, 6.931385517120361, 7.352499961853027, 7.773613929748535, 8.19472885131836, 8.615842819213867, 9.036956787109375, 9.4580717086792, 9.879186630249023, 10.300300598144531, 10.721415519714355, 11.142529487609863, 11.563644409179688, 11.984758377075195, 12.405872344970703, 12.826987266540527, 13.248101234436035, 13.669215202331543, 14.090330123901367, 14.511444091796875, 14.9325590133667, 15.353672981262207, 15.774787902832031, 16.19590187072754, 16.617015838623047]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 6.0, 7.0, 13.0, 11.0, 19.0, 27.0, 30.0, 46.0, 44.0, 55.0, 50.0, 55.0, 62.0, 69.0, 77.0, 72.0, 67.0, 46.0, 50.0, 48.0, 32.0, 33.0, 23.0, 18.0, 7.0, 10.0, 13.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.06987190246582, -7.850759029388428, -7.631646156311035, -7.412533283233643, -7.19342041015625, -6.974307537078857, -6.755194664001465, -6.536081314086914, -6.31696891784668, -6.097856044769287, -5.8787431716918945, -5.659630298614502, -5.440517425537109, -5.221404552459717, -5.002291679382324, -4.783178329467773, -4.564065456390381, -4.344952583312988, -4.125839710235596, -3.906726837158203, -3.6876139640808105, -3.468501091003418, -3.2493879795074463, -3.0302751064300537, -2.811162233352661, -2.5920493602752686, -2.372936487197876, -2.1538233757019043, -1.9347106218338013, -1.7155977487564087, -1.4964847564697266, -1.277371883392334, -1.0582594871520996, -0.839146614074707, -0.6200336813926697, -0.4009207487106323, -0.18180787563323975, 0.03730499744415283, 0.25641798973083496, 0.47553086280822754, 0.6946437358856201, 0.9137566089630127, 1.1328694820404053, 1.3519824743270874, 1.57109534740448, 1.7902082204818726, 2.0093212127685547, 2.2284340858459473, 2.44754695892334, 2.6666598320007324, 2.885772705078125, 3.1048855781555176, 3.32399845123291, 3.5431113243103027, 3.7622244358062744, 3.981337308883667, 4.2004499435424805, 4.419562816619873, 4.638675689697266, 4.857788562774658, 5.076901435852051, 5.296014308929443, 5.515127182006836, 5.734240531921387, 5.953353404998779]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 10.0, 18.0, 19.0, 26.0, 41.0, 59.0, 98.0, 164.0, 292.0, 555.0, 1182.0, 3121.0, 9664.0, 50001.0, 519501.0, 410160.0, 40268.0, 8392.0, 2654.0, 1092.0, 510.0, 289.0, 142.0, 97.0, 58.0, 47.0, 24.0, 19.0, 7.0, 10.0, 11.0, 6.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.4375, -16.8916015625, -16.345703125, -15.7998046875, -15.25390625, -14.7080078125, -14.162109375, -13.6162109375, -13.0703125, -12.5244140625, -11.978515625, -11.4326171875, -10.88671875, -10.3408203125, -9.794921875, -9.2490234375, -8.703125, -8.1572265625, -7.611328125, -7.0654296875, -6.51953125, -5.9736328125, -5.427734375, -4.8818359375, -4.3359375, -3.7900390625, -3.244140625, -2.6982421875, -2.15234375, -1.6064453125, -1.060546875, -0.5146484375, 0.03125, 0.5771484375, 1.123046875, 1.6689453125, 2.21484375, 2.7607421875, 3.306640625, 3.8525390625, 4.3984375, 4.9443359375, 5.490234375, 6.0361328125, 6.58203125, 7.1279296875, 7.673828125, 8.2197265625, 8.765625, 9.3115234375, 9.857421875, 10.4033203125, 10.94921875, 11.4951171875, 12.041015625, 12.5869140625, 13.1328125, 13.6787109375, 14.224609375, 14.7705078125, 15.31640625, 15.8623046875, 16.408203125, 16.9541015625, 17.5]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 2.0, 10.0, 22.0, 21.0, 50.0, 65.0, 86.0, 126.0, 137.0, 145.0, 95.0, 94.0, 52.0, 33.0, 22.0, 16.0, 9.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.671875, -12.2598876953125, -11.847900390625, -11.4359130859375, -11.02392578125, -10.6119384765625, -10.199951171875, -9.7879638671875, -9.3759765625, -8.9639892578125, -8.552001953125, -8.1400146484375, -7.72802734375, -7.3160400390625, -6.904052734375, -6.4920654296875, -6.080078125, -5.6680908203125, -5.256103515625, -4.8441162109375, -4.43212890625, -4.0201416015625, -3.608154296875, -3.1961669921875, -2.7841796875, -2.3721923828125, -1.960205078125, -1.5482177734375, -1.13623046875, -0.7242431640625, -0.312255859375, 0.0997314453125, 0.51171875, 0.9237060546875, 1.335693359375, 1.7476806640625, 2.15966796875, 2.5716552734375, 2.983642578125, 3.3956298828125, 3.8076171875, 4.2196044921875, 4.631591796875, 5.0435791015625, 5.45556640625, 5.8675537109375, 6.279541015625, 6.6915283203125, 7.103515625, 7.5155029296875, 7.927490234375, 8.3394775390625, 8.75146484375, 9.1634521484375, 9.575439453125, 9.9874267578125, 10.3994140625, 10.8114013671875, 11.223388671875, 11.6353759765625, 12.04736328125, 12.4593505859375, 12.871337890625, 13.2833251953125, 13.6953125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 8.0, 8.0, 9.0, 11.0, 27.0, 33.0, 73.0, 128.0, 233.0, 564.0, 1413.0, 6590.0, 140535.0, 880440.0, 14730.0, 2389.0, 697.0, 290.0, 149.0, 95.0, 46.0, 37.0, 19.0, 15.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.78125, -58.0322265625, -56.283203125, -54.5341796875, -52.78515625, -51.0361328125, -49.287109375, -47.5380859375, -45.7890625, -44.0400390625, -42.291015625, -40.5419921875, -38.79296875, -37.0439453125, -35.294921875, -33.5458984375, -31.796875, -30.0478515625, -28.298828125, -26.5498046875, -24.80078125, -23.0517578125, -21.302734375, -19.5537109375, -17.8046875, -16.0556640625, -14.306640625, -12.5576171875, -10.80859375, -9.0595703125, -7.310546875, -5.5615234375, -3.8125, -2.0634765625, -0.314453125, 1.4345703125, 3.18359375, 4.9326171875, 6.681640625, 8.4306640625, 10.1796875, 11.9287109375, 13.677734375, 15.4267578125, 17.17578125, 18.9248046875, 20.673828125, 22.4228515625, 24.171875, 25.9208984375, 27.669921875, 29.4189453125, 31.16796875, 32.9169921875, 34.666015625, 36.4150390625, 38.1640625, 39.9130859375, 41.662109375, 43.4111328125, 45.16015625, 46.9091796875, 48.658203125, 50.4072265625, 52.15625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 4.0, 10.0, 6.0, 22.0, 17.0, 37.0, 57.0, 97.0, 130.0, 148.0, 159.0, 120.0, 70.0, 43.0, 24.0, 18.0, 9.0, 12.0, 7.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-127.9375, -124.87890625, -121.8203125, -118.76171875, -115.703125, -112.64453125, -109.5859375, -106.52734375, -103.46875, -100.41015625, -97.3515625, -94.29296875, -91.234375, -88.17578125, -85.1171875, -82.05859375, -79.0, -75.94140625, -72.8828125, -69.82421875, -66.765625, -63.70703125, -60.6484375, -57.58984375, -54.53125, -51.47265625, -48.4140625, -45.35546875, -42.296875, -39.23828125, -36.1796875, -33.12109375, -30.0625, -27.00390625, -23.9453125, -20.88671875, -17.828125, -14.76953125, -11.7109375, -8.65234375, -5.59375, -2.53515625, 0.5234375, 3.58203125, 6.640625, 9.69921875, 12.7578125, 15.81640625, 18.875, 21.93359375, 24.9921875, 28.05078125, 31.109375, 34.16796875, 37.2265625, 40.28515625, 43.34375, 46.40234375, 49.4609375, 52.51953125, 55.578125, 58.63671875, 61.6953125, 64.75390625, 67.8125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 6.0, 8.0, 13.0, 14.0, 20.0, 24.0, 26.0, 47.0, 51.0, 62.0, 110.0, 144.0, 255.0, 534.0, 1412.0, 12939.0, 1011280.0, 18615.0, 1630.0, 570.0, 272.0, 175.0, 79.0, 69.0, 49.0, 38.0, 24.0, 25.0, 23.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-25.265625, -24.348388671875, -23.43115234375, -22.513916015625, -21.5966796875, -20.679443359375, -19.76220703125, -18.844970703125, -17.927734375, -17.010498046875, -16.09326171875, -15.176025390625, -14.2587890625, -13.341552734375, -12.42431640625, -11.507080078125, -10.58984375, -9.672607421875, -8.75537109375, -7.838134765625, -6.9208984375, -6.003662109375, -5.08642578125, -4.169189453125, -3.251953125, -2.334716796875, -1.41748046875, -0.500244140625, 0.4169921875, 1.334228515625, 2.25146484375, 3.168701171875, 4.0859375, 5.003173828125, 5.92041015625, 6.837646484375, 7.7548828125, 8.672119140625, 9.58935546875, 10.506591796875, 11.423828125, 12.341064453125, 13.25830078125, 14.175537109375, 15.0927734375, 16.010009765625, 16.92724609375, 17.844482421875, 18.76171875, 19.678955078125, 20.59619140625, 21.513427734375, 22.4306640625, 23.347900390625, 24.26513671875, 25.182373046875, 26.099609375, 27.016845703125, 27.93408203125, 28.851318359375, 29.7685546875, 30.685791015625, 31.60302734375, 32.520263671875, 33.4375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 12.0, 8.0, 10.0, 15.0, 10.0, 34.0, 50.0, 66.0, 95.0, 168.0, 187.0, 114.0, 73.0, 40.0, 27.0, 32.0, 15.0, 11.0, 11.0, 8.0, 9.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0010967254638671875, -0.001067832112312317, -0.0010389387607574463, -0.0010100454092025757, -0.000981152057647705, -0.0009522587060928345, -0.0009233653545379639, -0.0008944720029830933, -0.0008655786514282227, -0.000836685299873352, -0.0008077919483184814, -0.0007788985967636108, -0.0007500052452087402, -0.0007211118936538696, -0.000692218542098999, -0.0006633251905441284, -0.0006344318389892578, -0.0006055384874343872, -0.0005766451358795166, -0.000547751784324646, -0.0005188584327697754, -0.0004899650812149048, -0.0004610717296600342, -0.0004321783781051636, -0.00040328502655029297, -0.00037439167499542236, -0.00034549832344055176, -0.00031660497188568115, -0.00028771162033081055, -0.00025881826877593994, -0.00022992491722106934, -0.00020103156566619873, -0.00017213821411132812, -0.00014324486255645752, -0.00011435151100158691, -8.545815944671631e-05, -5.65648078918457e-05, -2.7671456336975098e-05, 1.2218952178955078e-06, 3.0115246772766113e-05, 5.900859832763672e-05, 8.790194988250732e-05, 0.00011679530143737793, 0.00014568865299224854, 0.00017458200454711914, 0.00020347535610198975, 0.00023236870765686035, 0.00026126205921173096, 0.00029015541076660156, 0.00031904876232147217, 0.0003479421138763428, 0.0003768354654312134, 0.000405728816986084, 0.0004346221685409546, 0.0004635155200958252, 0.0004924088716506958, 0.0005213022232055664, 0.000550195574760437, 0.0005790889263153076, 0.0006079822778701782, 0.0006368756294250488, 0.0006657689809799194, 0.00069466233253479, 0.0007235556840896606, 0.0007524490356445312]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 3.0, 4.0, 8.0, 13.0, 25.0, 15.0, 30.0, 56.0, 126.0, 222.0, 396.0, 952.0, 3620.0, 42531.0, 977784.0, 18674.0, 2526.0, 746.0, 386.0, 182.0, 85.0, 54.0, 42.0, 24.0, 13.0, 14.0, 7.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-32.21875, -31.379150390625, -30.53955078125, -29.699951171875, -28.8603515625, -28.020751953125, -27.18115234375, -26.341552734375, -25.501953125, -24.662353515625, -23.82275390625, -22.983154296875, -22.1435546875, -21.303955078125, -20.46435546875, -19.624755859375, -18.78515625, -17.945556640625, -17.10595703125, -16.266357421875, -15.4267578125, -14.587158203125, -13.74755859375, -12.907958984375, -12.068359375, -11.228759765625, -10.38916015625, -9.549560546875, -8.7099609375, -7.870361328125, -7.03076171875, -6.191162109375, -5.3515625, -4.511962890625, -3.67236328125, -2.832763671875, -1.9931640625, -1.153564453125, -0.31396484375, 0.525634765625, 1.365234375, 2.204833984375, 3.04443359375, 3.884033203125, 4.7236328125, 5.563232421875, 6.40283203125, 7.242431640625, 8.08203125, 8.921630859375, 9.76123046875, 10.600830078125, 11.4404296875, 12.280029296875, 13.11962890625, 13.959228515625, 14.798828125, 15.638427734375, 16.47802734375, 17.317626953125, 18.1572265625, 18.996826171875, 19.83642578125, 20.676025390625, 21.515625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 6.0, 6.0, 8.0, 14.0, 30.0, 38.0, 80.0, 164.0, 305.0, 182.0, 72.0, 23.0, 15.0, 14.0, 9.0, 4.0, 8.0, 3.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.65625, -19.77880859375, -18.9013671875, -18.02392578125, -17.146484375, -16.26904296875, -15.3916015625, -14.51416015625, -13.63671875, -12.75927734375, -11.8818359375, -11.00439453125, -10.126953125, -9.24951171875, -8.3720703125, -7.49462890625, -6.6171875, -5.73974609375, -4.8623046875, -3.98486328125, -3.107421875, -2.22998046875, -1.3525390625, -0.47509765625, 0.40234375, 1.27978515625, 2.1572265625, 3.03466796875, 3.912109375, 4.78955078125, 5.6669921875, 6.54443359375, 7.421875, 8.29931640625, 9.1767578125, 10.05419921875, 10.931640625, 11.80908203125, 12.6865234375, 13.56396484375, 14.44140625, 15.31884765625, 16.1962890625, 17.07373046875, 17.951171875, 18.82861328125, 19.7060546875, 20.58349609375, 21.4609375, 22.33837890625, 23.2158203125, 24.09326171875, 24.970703125, 25.84814453125, 26.7255859375, 27.60302734375, 28.48046875, 29.35791015625, 30.2353515625, 31.11279296875, 31.990234375, 32.86767578125, 33.7451171875, 34.62255859375, 35.5]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 6.0, 13.0, 145.0, 658.0, 155.0, 19.0, 5.0, 2.0, 1.0, 2.0], "bins": [-1140.389404296875, -1120.529296875, -1100.669189453125, -1080.8089599609375, -1060.9488525390625, -1041.0887451171875, -1021.2285766601562, -1001.368408203125, -981.50830078125, -961.648193359375, -941.7880249023438, -921.9278564453125, -902.0677490234375, -882.2076416015625, -862.3474731445312, -842.4873046875, -822.627197265625, -802.76708984375, -782.9069213867188, -763.0467529296875, -743.1866455078125, -723.3265380859375, -703.4663696289062, -683.606201171875, -663.74609375, -643.885986328125, -624.0258178710938, -604.1656494140625, -584.3055419921875, -564.4454345703125, -544.5852661132812, -524.72509765625, -504.8650207519531, -485.0048828125, -465.1447448730469, -445.28460693359375, -425.4244689941406, -405.5643310546875, -385.7041931152344, -365.84405517578125, -345.9839172363281, -326.123779296875, -306.2636413574219, -286.40350341796875, -266.5433654785156, -246.6832275390625, -226.82308959960938, -206.96295166015625, -187.10281372070312, -167.24267578125, -147.38253784179688, -127.52239990234375, -107.66226196289062, -87.8021240234375, -67.94198608398438, -48.08184814453125, -28.221710205078125, -8.361572265625, 11.498565673828125, 31.35870361328125, 51.218841552734375, 71.0789794921875, 90.93911743164062, 110.79925537109375, 130.65939331054688]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 7.0, 1.0, 4.0, 8.0, 8.0, 12.0, 12.0, 20.0, 24.0, 23.0, 31.0, 27.0, 34.0, 39.0, 47.0, 46.0, 47.0, 80.0, 67.0, 65.0, 49.0, 45.0, 48.0, 30.0, 42.0, 30.0, 22.0, 27.0, 21.0, 17.0, 16.0, 15.0, 7.0, 9.0, 6.0, 5.0, 5.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.40904235839844, -123.25886535644531, -118.10868835449219, -112.95851135253906, -107.80833435058594, -102.65815734863281, -97.50798797607422, -92.3578109741211, -87.20763397216797, -82.05745697021484, -76.90727996826172, -71.7571029663086, -66.60693359375, -61.45675277709961, -56.30657958984375, -51.156402587890625, -46.0062255859375, -40.856048583984375, -35.70587158203125, -30.55569839477539, -25.405521392822266, -20.25534439086914, -15.105169296264648, -9.954994201660156, -4.804817199707031, 0.34535884857177734, 5.495534896850586, 10.645710945129395, 15.795886993408203, 20.946063995361328, 26.09623908996582, 31.246414184570312, 36.396575927734375, 41.5467529296875, 46.696929931640625, 51.847103118896484, 56.99728012084961, 62.147457122802734, 67.2976303100586, 72.44780731201172, 77.59798431396484, 82.74816131591797, 87.8983383178711, 93.04851531982422, 98.19868469238281, 103.34886169433594, 108.49903869628906, 113.64921569824219, 118.79939270019531, 123.94956970214844, 129.09974670410156, 134.2499237060547, 139.4001007080078, 144.55027770996094, 149.70045471191406, 154.85061645507812, 160.00079345703125, 165.15097045898438, 170.3011474609375, 175.45132446289062, 180.60150146484375, 185.75167846679688, 190.90185546875, 196.05203247070312, 201.20220947265625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 9.0, 9.0, 15.0, 19.0, 50.0, 97.0, 174.0, 386.0, 1104.0, 4291.0, 62434.0, 4101634.0, 20054.0, 2539.0, 811.0, 321.0, 163.0, 67.0, 40.0, 16.0, 20.0, 6.0, 7.0, 4.0, 6.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.28125, -21.4951171875, -20.708984375, -19.9228515625, -19.13671875, -18.3505859375, -17.564453125, -16.7783203125, -15.9921875, -15.2060546875, -14.419921875, -13.6337890625, -12.84765625, -12.0615234375, -11.275390625, -10.4892578125, -9.703125, -8.9169921875, -8.130859375, -7.3447265625, -6.55859375, -5.7724609375, -4.986328125, -4.2001953125, -3.4140625, -2.6279296875, -1.841796875, -1.0556640625, -0.26953125, 0.5166015625, 1.302734375, 2.0888671875, 2.875, 3.6611328125, 4.447265625, 5.2333984375, 6.01953125, 6.8056640625, 7.591796875, 8.3779296875, 9.1640625, 9.9501953125, 10.736328125, 11.5224609375, 12.30859375, 13.0947265625, 13.880859375, 14.6669921875, 15.453125, 16.2392578125, 17.025390625, 17.8115234375, 18.59765625, 19.3837890625, 20.169921875, 20.9560546875, 21.7421875, 22.5283203125, 23.314453125, 24.1005859375, 24.88671875, 25.6728515625, 26.458984375, 27.2451171875, 28.03125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 15.0, 18.0, 20.0, 40.0, 49.0, 82.0, 119.0, 132.0, 143.0, 128.0, 84.0, 61.0, 36.0, 26.0, 23.0, 9.0, 4.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.890625, -10.438720703125, -9.98681640625, -9.534912109375, -9.0830078125, -8.631103515625, -8.17919921875, -7.727294921875, -7.275390625, -6.823486328125, -6.37158203125, -5.919677734375, -5.4677734375, -5.015869140625, -4.56396484375, -4.112060546875, -3.66015625, -3.208251953125, -2.75634765625, -2.304443359375, -1.8525390625, -1.400634765625, -0.94873046875, -0.496826171875, -0.044921875, 0.406982421875, 0.85888671875, 1.310791015625, 1.7626953125, 2.214599609375, 2.66650390625, 3.118408203125, 3.5703125, 4.022216796875, 4.47412109375, 4.926025390625, 5.3779296875, 5.829833984375, 6.28173828125, 6.733642578125, 7.185546875, 7.637451171875, 8.08935546875, 8.541259765625, 8.9931640625, 9.445068359375, 9.89697265625, 10.348876953125, 10.80078125, 11.252685546875, 11.70458984375, 12.156494140625, 12.6083984375, 13.060302734375, 13.51220703125, 13.964111328125, 14.416015625, 14.867919921875, 15.31982421875, 15.771728515625, 16.2236328125, 16.675537109375, 17.12744140625, 17.579345703125, 18.03125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 9.0, 5.0, 9.0, 11.0, 23.0, 31.0, 27.0, 38.0, 50.0, 68.0, 113.0, 196.0, 299.0, 517.0, 930.0, 1794.0, 3746.0, 9575.0, 38653.0, 618908.0, 3444122.0, 54310.0, 11910.0, 4359.0, 2096.0, 1030.0, 564.0, 331.0, 187.0, 113.0, 74.0, 51.0, 29.0, 21.0, 16.0, 16.0, 19.0, 7.0, 9.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5703125, -6.33642578125, -6.1025390625, -5.86865234375, -5.634765625, -5.40087890625, -5.1669921875, -4.93310546875, -4.69921875, -4.46533203125, -4.2314453125, -3.99755859375, -3.763671875, -3.52978515625, -3.2958984375, -3.06201171875, -2.828125, -2.59423828125, -2.3603515625, -2.12646484375, -1.892578125, -1.65869140625, -1.4248046875, -1.19091796875, -0.95703125, -0.72314453125, -0.4892578125, -0.25537109375, -0.021484375, 0.21240234375, 0.4462890625, 0.68017578125, 0.9140625, 1.14794921875, 1.3818359375, 1.61572265625, 1.849609375, 2.08349609375, 2.3173828125, 2.55126953125, 2.78515625, 3.01904296875, 3.2529296875, 3.48681640625, 3.720703125, 3.95458984375, 4.1884765625, 4.42236328125, 4.65625, 4.89013671875, 5.1240234375, 5.35791015625, 5.591796875, 5.82568359375, 6.0595703125, 6.29345703125, 6.52734375, 6.76123046875, 6.9951171875, 7.22900390625, 7.462890625, 7.69677734375, 7.9306640625, 8.16455078125, 8.3984375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 1.0, 3.0, 7.0, 10.0, 21.0, 56.0, 186.0, 2877.0, 658.0, 151.0, 51.0, 20.0, 14.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.78125, -7.59954833984375, -7.4178466796875, -7.23614501953125, -7.054443359375, -6.87274169921875, -6.6910400390625, -6.50933837890625, -6.32763671875, -6.14593505859375, -5.9642333984375, -5.78253173828125, -5.600830078125, -5.41912841796875, -5.2374267578125, -5.05572509765625, -4.8740234375, -4.69232177734375, -4.5106201171875, -4.32891845703125, -4.147216796875, -3.96551513671875, -3.7838134765625, -3.60211181640625, -3.42041015625, -3.23870849609375, -3.0570068359375, -2.87530517578125, -2.693603515625, -2.51190185546875, -2.3302001953125, -2.14849853515625, -1.966796875, -1.78509521484375, -1.6033935546875, -1.42169189453125, -1.239990234375, -1.05828857421875, -0.8765869140625, -0.69488525390625, -0.51318359375, -0.33148193359375, -0.1497802734375, 0.03192138671875, 0.213623046875, 0.39532470703125, 0.5770263671875, 0.75872802734375, 0.9404296875, 1.12213134765625, 1.3038330078125, 1.48553466796875, 1.667236328125, 1.84893798828125, 2.0306396484375, 2.21234130859375, 2.39404296875, 2.57574462890625, 2.7574462890625, 2.93914794921875, 3.120849609375, 3.30255126953125, 3.4842529296875, 3.66595458984375, 3.84765625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 13.0, 32.0, 60.0, 76.0, 150.0, 156.0, 162.0, 132.0, 80.0, 44.0, 39.0, 18.0, 10.0, 6.0, 5.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.871991157531738, -6.30872917175293, -5.745467185974121, -5.182205677032471, -4.618943691253662, -4.0556817054748535, -3.492419958114624, -2.9291582107543945, -2.365896224975586, -1.802634358406067, -1.2393724918365479, -0.6761106252670288, -0.11284875869750977, 0.45041322708129883, 1.0136749744415283, 1.5769367218017578, 2.1401987075805664, 2.703460693359375, 3.2667224407196045, 3.829984188079834, 4.393246173858643, 4.956508159637451, 5.519769668579102, 6.08303165435791, 6.646293640136719, 7.209555625915527, 7.772817611694336, 8.336079597473145, 8.899341583251953, 9.462602615356445, 10.025864601135254, 10.589126586914062, 11.152389526367188, 11.715651512145996, 12.278913497924805, 12.842175483703613, 13.405437469482422, 13.968698501586914, 14.531960487365723, 15.095222473144531, 15.65848445892334, 16.22174644470215, 16.78500747680664, 17.348270416259766, 17.911531448364258, 18.474794387817383, 19.038055419921875, 19.601318359375, 20.164579391479492, 20.727840423583984, 21.29110336303711, 21.8543643951416, 22.417627334594727, 22.98088836669922, 23.544151306152344, 24.107412338256836, 24.670673370361328, 25.23393440246582, 25.797197341918945, 26.360458374023438, 26.923721313476562, 27.486982345581055, 28.05024528503418, 28.613506317138672, 29.176769256591797]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 8.0, 11.0, 16.0, 9.0, 22.0, 28.0, 26.0, 39.0, 41.0, 52.0, 56.0, 71.0, 52.0, 41.0, 67.0, 51.0, 48.0, 57.0, 53.0, 48.0, 43.0, 35.0, 19.0, 32.0, 15.0, 9.0, 13.0, 11.0, 13.0, 8.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.107368469238281, -14.705106735229492, -14.302845001220703, -13.90058422088623, -13.498322486877441, -13.096060752868652, -12.693799018859863, -12.29153823852539, -11.889276504516602, -11.487014770507812, -11.084753036499023, -10.68249225616455, -10.280230522155762, -9.877968788146973, -9.475707054138184, -9.073446273803711, -8.671184539794922, -8.268922805786133, -7.866661548614502, -7.464399814605713, -7.062138557434082, -6.659876823425293, -6.257615089416504, -5.855353832244873, -5.453091621398926, -5.050829887390137, -4.648568630218506, -4.246306896209717, -3.844045639038086, -3.441783905029297, -3.039522409439087, -2.637260913848877, -2.234999656677246, -1.8327381610870361, -1.4304766654968262, -1.0282150506973267, -0.6259535551071167, -0.2236919403076172, 0.17856955528259277, 0.5808310508728027, 0.9830925464630127, 1.3853540420532227, 1.7876155376434326, 2.1898770332336426, 2.5921387672424316, 2.9944002628326416, 3.3966617584228516, 3.7989232540130615, 4.2011847496032715, 4.6034464836120605, 5.005707740783691, 5.4079694747924805, 5.810230731964111, 6.2124924659729, 6.614753723144531, 7.01701545715332, 7.419277191162109, 7.821538925170898, 8.223800659179688, 8.62606143951416, 9.02832317352295, 9.430584907531738, 9.832846641540527, 10.235107421875, 10.637369155883789]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 7.0, 4.0, 9.0, 15.0, 21.0, 27.0, 33.0, 68.0, 97.0, 172.0, 257.0, 510.0, 1092.0, 2818.0, 11153.0, 82528.0, 735756.0, 188035.0, 18924.0, 4067.0, 1438.0, 690.0, 328.0, 184.0, 118.0, 71.0, 38.0, 24.0, 19.0, 14.0, 10.0, 9.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-26.765625, -26.035400390625, -25.30517578125, -24.574951171875, -23.8447265625, -23.114501953125, -22.38427734375, -21.654052734375, -20.923828125, -20.193603515625, -19.46337890625, -18.733154296875, -18.0029296875, -17.272705078125, -16.54248046875, -15.812255859375, -15.08203125, -14.351806640625, -13.62158203125, -12.891357421875, -12.1611328125, -11.430908203125, -10.70068359375, -9.970458984375, -9.240234375, -8.510009765625, -7.77978515625, -7.049560546875, -6.3193359375, -5.589111328125, -4.85888671875, -4.128662109375, -3.3984375, -2.668212890625, -1.93798828125, -1.207763671875, -0.4775390625, 0.252685546875, 0.98291015625, 1.713134765625, 2.443359375, 3.173583984375, 3.90380859375, 4.634033203125, 5.3642578125, 6.094482421875, 6.82470703125, 7.554931640625, 8.28515625, 9.015380859375, 9.74560546875, 10.475830078125, 11.2060546875, 11.936279296875, 12.66650390625, 13.396728515625, 14.126953125, 14.857177734375, 15.58740234375, 16.317626953125, 17.0478515625, 17.778076171875, 18.50830078125, 19.238525390625, 19.96875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 14.0, 15.0, 19.0, 36.0, 52.0, 67.0, 115.0, 139.0, 138.0, 142.0, 75.0, 68.0, 41.0, 26.0, 28.0, 9.0, 7.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9765625, -10.5242919921875, -10.072021484375, -9.6197509765625, -9.16748046875, -8.7152099609375, -8.262939453125, -7.8106689453125, -7.3583984375, -6.9061279296875, -6.453857421875, -6.0015869140625, -5.54931640625, -5.0970458984375, -4.644775390625, -4.1925048828125, -3.740234375, -3.2879638671875, -2.835693359375, -2.3834228515625, -1.93115234375, -1.4788818359375, -1.026611328125, -0.5743408203125, -0.1220703125, 0.3302001953125, 0.782470703125, 1.2347412109375, 1.68701171875, 2.1392822265625, 2.591552734375, 3.0438232421875, 3.49609375, 3.9483642578125, 4.400634765625, 4.8529052734375, 5.30517578125, 5.7574462890625, 6.209716796875, 6.6619873046875, 7.1142578125, 7.5665283203125, 8.018798828125, 8.4710693359375, 8.92333984375, 9.3756103515625, 9.827880859375, 10.2801513671875, 10.732421875, 11.1846923828125, 11.636962890625, 12.0892333984375, 12.54150390625, 12.9937744140625, 13.446044921875, 13.8983154296875, 14.3505859375, 14.8028564453125, 15.255126953125, 15.7073974609375, 16.15966796875, 16.6119384765625, 17.064208984375, 17.5164794921875, 17.96875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 4.0, 5.0, 13.0, 9.0, 20.0, 20.0, 41.0, 66.0, 93.0, 178.0, 305.0, 732.0, 2740.0, 19727.0, 959131.0, 59092.0, 4383.0, 1020.0, 402.0, 197.0, 131.0, 86.0, 38.0, 37.0, 25.0, 20.0, 11.0, 10.0, 7.0, 2.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.59375, -49.91064453125, -48.2275390625, -46.54443359375, -44.861328125, -43.17822265625, -41.4951171875, -39.81201171875, -38.12890625, -36.44580078125, -34.7626953125, -33.07958984375, -31.396484375, -29.71337890625, -28.0302734375, -26.34716796875, -24.6640625, -22.98095703125, -21.2978515625, -19.61474609375, -17.931640625, -16.24853515625, -14.5654296875, -12.88232421875, -11.19921875, -9.51611328125, -7.8330078125, -6.14990234375, -4.466796875, -2.78369140625, -1.1005859375, 0.58251953125, 2.265625, 3.94873046875, 5.6318359375, 7.31494140625, 8.998046875, 10.68115234375, 12.3642578125, 14.04736328125, 15.73046875, 17.41357421875, 19.0966796875, 20.77978515625, 22.462890625, 24.14599609375, 25.8291015625, 27.51220703125, 29.1953125, 30.87841796875, 32.5615234375, 34.24462890625, 35.927734375, 37.61083984375, 39.2939453125, 40.97705078125, 42.66015625, 44.34326171875, 46.0263671875, 47.70947265625, 49.392578125, 51.07568359375, 52.7587890625, 54.44189453125, 56.125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 4.0, 2.0, 13.0, 10.0, 24.0, 30.0, 60.0, 93.0, 137.0, 142.0, 144.0, 118.0, 81.0, 57.0, 25.0, 19.0, 11.0, 5.0, 7.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.125, -51.6435546875, -49.162109375, -46.6806640625, -44.19921875, -41.7177734375, -39.236328125, -36.7548828125, -34.2734375, -31.7919921875, -29.310546875, -26.8291015625, -24.34765625, -21.8662109375, -19.384765625, -16.9033203125, -14.421875, -11.9404296875, -9.458984375, -6.9775390625, -4.49609375, -2.0146484375, 0.466796875, 2.9482421875, 5.4296875, 7.9111328125, 10.392578125, 12.8740234375, 15.35546875, 17.8369140625, 20.318359375, 22.7998046875, 25.28125, 27.7626953125, 30.244140625, 32.7255859375, 35.20703125, 37.6884765625, 40.169921875, 42.6513671875, 45.1328125, 47.6142578125, 50.095703125, 52.5771484375, 55.05859375, 57.5400390625, 60.021484375, 62.5029296875, 64.984375, 67.4658203125, 69.947265625, 72.4287109375, 74.91015625, 77.3916015625, 79.873046875, 82.3544921875, 84.8359375, 87.3173828125, 89.798828125, 92.2802734375, 94.76171875, 97.2431640625, 99.724609375, 102.2060546875, 104.6875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 1.0, 4.0, 6.0, 10.0, 10.0, 18.0, 18.0, 25.0, 33.0, 50.0, 59.0, 99.0, 84.0, 150.0, 162.0, 335.0, 546.0, 1216.0, 3934.0, 22008.0, 433564.0, 553691.0, 25295.0, 4254.0, 1247.0, 603.0, 318.0, 226.0, 154.0, 103.0, 85.0, 64.0, 37.0, 30.0, 20.0, 23.0, 13.0, 16.0, 11.0, 6.0, 10.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.890625, -7.644287109375, -7.39794921875, -7.151611328125, -6.9052734375, -6.658935546875, -6.41259765625, -6.166259765625, -5.919921875, -5.673583984375, -5.42724609375, -5.180908203125, -4.9345703125, -4.688232421875, -4.44189453125, -4.195556640625, -3.94921875, -3.702880859375, -3.45654296875, -3.210205078125, -2.9638671875, -2.717529296875, -2.47119140625, -2.224853515625, -1.978515625, -1.732177734375, -1.48583984375, -1.239501953125, -0.9931640625, -0.746826171875, -0.50048828125, -0.254150390625, -0.0078125, 0.238525390625, 0.48486328125, 0.731201171875, 0.9775390625, 1.223876953125, 1.47021484375, 1.716552734375, 1.962890625, 2.209228515625, 2.45556640625, 2.701904296875, 2.9482421875, 3.194580078125, 3.44091796875, 3.687255859375, 3.93359375, 4.179931640625, 4.42626953125, 4.672607421875, 4.9189453125, 5.165283203125, 5.41162109375, 5.657958984375, 5.904296875, 6.150634765625, 6.39697265625, 6.643310546875, 6.8896484375, 7.135986328125, 7.38232421875, 7.628662109375, 7.875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 8.0, 7.0, 11.0, 10.0, 11.0, 25.0, 31.0, 31.0, 59.0, 70.0, 93.0, 162.0, 156.0, 77.0, 48.0, 53.0, 35.0, 34.0, 25.0, 16.0, 13.0, 7.0, 6.0, 4.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006117820739746094, -0.0005850419402122498, -0.0005583018064498901, -0.0005315616726875305, -0.0005048215389251709, -0.0004780814051628113, -0.00045134127140045166, -0.00042460113763809204, -0.0003978610038757324, -0.0003711208701133728, -0.0003443807363510132, -0.00031764060258865356, -0.00029090046882629395, -0.0002641603350639343, -0.0002374202013015747, -0.0002106800675392151, -0.00018393993377685547, -0.00015719980001449585, -0.00013045966625213623, -0.00010371953248977661, -7.697939872741699e-05, -5.023926496505737e-05, -2.3499131202697754e-05, 3.2410025596618652e-06, 2.9981136322021484e-05, 5.6721270084381104e-05, 8.346140384674072e-05, 0.00011020153760910034, 0.00013694167137145996, 0.00016368180513381958, 0.0001904219388961792, 0.00021716207265853882, 0.00024390220642089844, 0.00027064234018325806, 0.0002973824739456177, 0.0003241226077079773, 0.0003508627414703369, 0.00037760287523269653, 0.00040434300899505615, 0.00043108314275741577, 0.0004578232765197754, 0.000484563410282135, 0.0005113035440444946, 0.0005380436778068542, 0.0005647838115692139, 0.0005915239453315735, 0.0006182640790939331, 0.0006450042128562927, 0.0006717443466186523, 0.000698484480381012, 0.0007252246141433716, 0.0007519647479057312, 0.0007787048816680908, 0.0008054450154304504, 0.0008321851491928101, 0.0008589252829551697, 0.0008856654167175293, 0.0009124055504798889, 0.0009391456842422485, 0.0009658858180046082, 0.0009926259517669678, 0.0010193660855293274, 0.001046106219291687, 0.0010728463530540466, 0.0010995864868164062]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 6.0, 2.0, 3.0, 7.0, 10.0, 17.0, 15.0, 25.0, 37.0, 47.0, 73.0, 138.0, 300.0, 998.0, 9806.0, 994406.0, 39897.0, 1835.0, 463.0, 181.0, 94.0, 67.0, 28.0, 21.0, 17.0, 18.0, 11.0, 5.0, 3.0, 4.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.671875, -20.96533203125, -20.2587890625, -19.55224609375, -18.845703125, -18.13916015625, -17.4326171875, -16.72607421875, -16.01953125, -15.31298828125, -14.6064453125, -13.89990234375, -13.193359375, -12.48681640625, -11.7802734375, -11.07373046875, -10.3671875, -9.66064453125, -8.9541015625, -8.24755859375, -7.541015625, -6.83447265625, -6.1279296875, -5.42138671875, -4.71484375, -4.00830078125, -3.3017578125, -2.59521484375, -1.888671875, -1.18212890625, -0.4755859375, 0.23095703125, 0.9375, 1.64404296875, 2.3505859375, 3.05712890625, 3.763671875, 4.47021484375, 5.1767578125, 5.88330078125, 6.58984375, 7.29638671875, 8.0029296875, 8.70947265625, 9.416015625, 10.12255859375, 10.8291015625, 11.53564453125, 12.2421875, 12.94873046875, 13.6552734375, 14.36181640625, 15.068359375, 15.77490234375, 16.4814453125, 17.18798828125, 17.89453125, 18.60107421875, 19.3076171875, 20.01416015625, 20.720703125, 21.42724609375, 22.1337890625, 22.84033203125, 23.546875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 10.0, 9.0, 11.0, 14.0, 18.0, 39.0, 56.0, 135.0, 193.0, 200.0, 112.0, 63.0, 40.0, 19.0, 17.0, 13.0, 9.0, 7.0, 2.0, 6.0, 5.0, 5.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.421875, -13.96875, -13.515625, -13.0625, -12.609375, -12.15625, -11.703125, -11.25, -10.796875, -10.34375, -9.890625, -9.4375, -8.984375, -8.53125, -8.078125, -7.625, -7.171875, -6.71875, -6.265625, -5.8125, -5.359375, -4.90625, -4.453125, -4.0, -3.546875, -3.09375, -2.640625, -2.1875, -1.734375, -1.28125, -0.828125, -0.375, 0.078125, 0.53125, 0.984375, 1.4375, 1.890625, 2.34375, 2.796875, 3.25, 3.703125, 4.15625, 4.609375, 5.0625, 5.515625, 5.96875, 6.421875, 6.875, 7.328125, 7.78125, 8.234375, 8.6875, 9.140625, 9.59375, 10.046875, 10.5, 10.953125, 11.40625, 11.859375, 12.3125, 12.765625, 13.21875, 13.671875, 14.125, 14.578125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 13.0, 48.0, 348.0, 491.0, 84.0, 15.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-699.6353759765625, -684.1427612304688, -668.6500854492188, -653.157470703125, -637.664794921875, -622.1721801757812, -606.6795654296875, -591.1868896484375, -575.6942749023438, -560.20166015625, -544.708984375, -529.2163696289062, -513.7236938476562, -498.2310791015625, -482.7384338378906, -467.24578857421875, -451.7531433105469, -436.260498046875, -420.7678527832031, -405.27520751953125, -389.7825927734375, -374.2899475097656, -358.79730224609375, -343.3046569824219, -327.81201171875, -312.3193664550781, -296.82672119140625, -281.3341064453125, -265.8414611816406, -250.34881591796875, -234.85617065429688, -219.363525390625, -203.87094116210938, -188.3782958984375, -172.8856658935547, -157.3930206298828, -141.900390625, -126.40774536132812, -110.91510009765625, -95.4224624633789, -79.92982482910156, -64.43718719482422, -48.94454574584961, -33.451904296875, -17.959266662597656, -2.4666290283203125, 13.026016235351562, 28.518653869628906, 44.01129150390625, 59.503929138183594, 74.99656677246094, 90.48921203613281, 105.98184967041016, 121.4744873046875, 136.96713256835938, 152.45977783203125, 167.95240783691406, 183.44505310058594, 198.93768310546875, 214.43032836914062, 229.9229736328125, 245.4156036376953, 260.90826416015625, 276.40087890625, 291.8935241699219]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 2.0, 1.0, 12.0, 9.0, 7.0, 14.0, 23.0, 17.0, 27.0, 23.0, 44.0, 28.0, 54.0, 55.0, 67.0, 71.0, 57.0, 56.0, 63.0, 63.0, 43.0, 37.0, 31.0, 33.0, 39.0, 29.0, 21.0, 8.0, 25.0, 10.0, 6.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.53662109375, -132.01046752929688, -126.48431396484375, -120.95816040039062, -115.43199920654297, -109.90584564208984, -104.37969207763672, -98.85353088378906, -93.32737731933594, -87.80122375488281, -82.27507019042969, -76.74891662597656, -71.2227554321289, -65.69660186767578, -60.170448303222656, -54.644290924072266, -49.118141174316406, -43.59198760986328, -38.06583023071289, -32.539676666259766, -27.013521194458008, -21.48736572265625, -15.961212158203125, -10.435054779052734, -4.908901214599609, 0.6172537803649902, 6.14340877532959, 11.669563293457031, 17.19571876525879, 22.721874237060547, 28.248027801513672, 33.77418518066406, 39.30033874511719, 44.82649230957031, 50.3526496887207, 55.87880325317383, 61.40496063232422, 66.93111419677734, 72.45726776123047, 77.98342895507812, 83.50958251953125, 89.03573608398438, 94.5618896484375, 100.08804321289062, 105.61420440673828, 111.1403579711914, 116.66651153564453, 122.19267272949219, 127.71881866455078, 133.24497985839844, 138.77113342285156, 144.2972869873047, 149.8234405517578, 155.34959411621094, 160.87574768066406, 166.4019012451172, 171.9280548095703, 177.45420837402344, 182.98036193847656, 188.5065155029297, 194.0326690673828, 199.558837890625, 205.08499145507812, 210.61114501953125, 216.13729858398438]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 15.0, 17.0, 27.0, 33.0, 65.0, 118.0, 267.0, 521.0, 1347.0, 5139.0, 36865.0, 3590343.0, 539932.0, 14117.0, 3262.0, 1111.0, 470.0, 253.0, 140.0, 80.0, 52.0, 30.0, 21.0, 16.0, 9.0, 8.0, 3.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1328125, -10.5711669921875, -10.009521484375, -9.4478759765625, -8.88623046875, -8.3245849609375, -7.762939453125, -7.2012939453125, -6.6396484375, -6.0780029296875, -5.516357421875, -4.9547119140625, -4.39306640625, -3.8314208984375, -3.269775390625, -2.7081298828125, -2.146484375, -1.5848388671875, -1.023193359375, -0.4615478515625, 0.10009765625, 0.6617431640625, 1.223388671875, 1.7850341796875, 2.3466796875, 2.9083251953125, 3.469970703125, 4.0316162109375, 4.59326171875, 5.1549072265625, 5.716552734375, 6.2781982421875, 6.83984375, 7.4014892578125, 7.963134765625, 8.5247802734375, 9.08642578125, 9.6480712890625, 10.209716796875, 10.7713623046875, 11.3330078125, 11.8946533203125, 12.456298828125, 13.0179443359375, 13.57958984375, 14.1412353515625, 14.702880859375, 15.2645263671875, 15.826171875, 16.3878173828125, 16.949462890625, 17.5111083984375, 18.07275390625, 18.6343994140625, 19.196044921875, 19.7576904296875, 20.3193359375, 20.8809814453125, 21.442626953125, 22.0042724609375, 22.56591796875, 23.1275634765625, 23.689208984375, 24.2508544921875, 24.8125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 4.0, 8.0, 10.0, 22.0, 21.0, 23.0, 38.0, 39.0, 44.0, 51.0, 73.0, 86.0, 85.0, 107.0, 58.0, 76.0, 62.0, 43.0, 26.0, 25.0, 17.0, 15.0, 10.0, 12.0, 12.0, 12.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.55859375, -6.29632568359375, -6.0340576171875, -5.77178955078125, -5.509521484375, -5.24725341796875, -4.9849853515625, -4.72271728515625, -4.46044921875, -4.19818115234375, -3.9359130859375, -3.67364501953125, -3.411376953125, -3.14910888671875, -2.8868408203125, -2.62457275390625, -2.3623046875, -2.10003662109375, -1.8377685546875, -1.57550048828125, -1.313232421875, -1.05096435546875, -0.7886962890625, -0.52642822265625, -0.26416015625, -0.00189208984375, 0.2603759765625, 0.52264404296875, 0.784912109375, 1.04718017578125, 1.3094482421875, 1.57171630859375, 1.833984375, 2.09625244140625, 2.3585205078125, 2.62078857421875, 2.883056640625, 3.14532470703125, 3.4075927734375, 3.66986083984375, 3.93212890625, 4.19439697265625, 4.4566650390625, 4.71893310546875, 4.981201171875, 5.24346923828125, 5.5057373046875, 5.76800537109375, 6.0302734375, 6.29254150390625, 6.5548095703125, 6.81707763671875, 7.079345703125, 7.34161376953125, 7.6038818359375, 7.86614990234375, 8.12841796875, 8.39068603515625, 8.6529541015625, 8.91522216796875, 9.177490234375, 9.43975830078125, 9.7020263671875, 9.96429443359375, 10.2265625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 7.0, 8.0, 8.0, 10.0, 15.0, 20.0, 30.0, 67.0, 118.0, 374.0, 932.0, 2813.0, 12900.0, 152686.0, 3943009.0, 69658.0, 8344.0, 2087.0, 671.0, 244.0, 103.0, 70.0, 29.0, 9.0, 19.0, 13.0, 5.0, 4.0, 6.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6875, -14.169921875, -13.65234375, -13.134765625, -12.6171875, -12.099609375, -11.58203125, -11.064453125, -10.546875, -10.029296875, -9.51171875, -8.994140625, -8.4765625, -7.958984375, -7.44140625, -6.923828125, -6.40625, -5.888671875, -5.37109375, -4.853515625, -4.3359375, -3.818359375, -3.30078125, -2.783203125, -2.265625, -1.748046875, -1.23046875, -0.712890625, -0.1953125, 0.322265625, 0.83984375, 1.357421875, 1.875, 2.392578125, 2.91015625, 3.427734375, 3.9453125, 4.462890625, 4.98046875, 5.498046875, 6.015625, 6.533203125, 7.05078125, 7.568359375, 8.0859375, 8.603515625, 9.12109375, 9.638671875, 10.15625, 10.673828125, 11.19140625, 11.708984375, 12.2265625, 12.744140625, 13.26171875, 13.779296875, 14.296875, 14.814453125, 15.33203125, 15.849609375, 16.3671875, 16.884765625, 17.40234375, 17.919921875, 18.4375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 6.0, 7.0, 9.0, 11.0, 18.0, 21.0, 32.0, 44.0, 140.0, 498.0, 1404.0, 1155.0, 368.0, 116.0, 76.0, 42.0, 32.0, 26.0, 10.0, 10.0, 9.0, 4.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.640625, -13.198486328125, -12.75634765625, -12.314208984375, -11.8720703125, -11.429931640625, -10.98779296875, -10.545654296875, -10.103515625, -9.661376953125, -9.21923828125, -8.777099609375, -8.3349609375, -7.892822265625, -7.45068359375, -7.008544921875, -6.56640625, -6.124267578125, -5.68212890625, -5.239990234375, -4.7978515625, -4.355712890625, -3.91357421875, -3.471435546875, -3.029296875, -2.587158203125, -2.14501953125, -1.702880859375, -1.2607421875, -0.818603515625, -0.37646484375, 0.065673828125, 0.5078125, 0.949951171875, 1.39208984375, 1.834228515625, 2.2763671875, 2.718505859375, 3.16064453125, 3.602783203125, 4.044921875, 4.487060546875, 4.92919921875, 5.371337890625, 5.8134765625, 6.255615234375, 6.69775390625, 7.139892578125, 7.58203125, 8.024169921875, 8.46630859375, 8.908447265625, 9.3505859375, 9.792724609375, 10.23486328125, 10.677001953125, 11.119140625, 11.561279296875, 12.00341796875, 12.445556640625, 12.8876953125, 13.329833984375, 13.77197265625, 14.214111328125, 14.65625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 15.0, 25.0, 56.0, 159.0, 275.0, 238.0, 118.0, 54.0, 19.0, 15.0, 5.0, 7.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.93806457519531, -69.41360473632812, -65.8891372680664, -62.36467742919922, -58.84021759033203, -55.31575393676758, -51.791290283203125, -48.26683044433594, -44.74237060546875, -41.2179069519043, -37.69344711303711, -34.168983459472656, -30.64452362060547, -27.120059967041016, -23.595598220825195, -20.071136474609375, -16.546672821044922, -13.022211074829102, -9.497749328613281, -5.9732866287231445, -2.448824882507324, 1.0756378173828125, 4.600099563598633, 8.124561309814453, 11.649023056030273, 15.173484802246094, 18.697946548461914, 22.222408294677734, 25.746871948242188, 29.271333694458008, 32.79579544067383, 36.32025909423828, 39.84471893310547, 43.36918258666992, 46.89364242553711, 50.41810607910156, 53.94256591796875, 57.4670295715332, 60.991493225097656, 64.51595306396484, 68.04041290283203, 71.56487274169922, 75.08934020996094, 78.61380004882812, 82.13825988769531, 85.6627197265625, 89.18718719482422, 92.7116470336914, 96.23611450195312, 99.76057434082031, 103.28504180908203, 106.80950164794922, 110.3339614868164, 113.85842895507812, 117.38288879394531, 120.9073486328125, 124.43180847167969, 127.95626831054688, 131.48072814941406, 135.00518798828125, 138.5296630859375, 142.0541229248047, 145.57858276367188, 149.10304260253906, 152.62750244140625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 9.0, 15.0, 13.0, 16.0, 23.0, 17.0, 26.0, 26.0, 50.0, 45.0, 51.0, 57.0, 67.0, 57.0, 71.0, 67.0, 65.0, 59.0, 61.0, 34.0, 26.0, 31.0, 22.0, 23.0, 15.0, 16.0, 8.0, 9.0, 3.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-87.04853057861328, -84.96570587158203, -82.88287353515625, -80.800048828125, -78.71721649169922, -76.63439178466797, -74.55155944824219, -72.46873474121094, -70.38591003417969, -68.30308532714844, -66.22025299072266, -64.1374282836914, -62.05459976196289, -59.971771240234375, -57.88894271850586, -55.806114196777344, -53.72328567504883, -51.64045715332031, -49.5576286315918, -47.47480010986328, -45.39197540283203, -43.309146881103516, -41.226318359375, -39.143489837646484, -37.06066131591797, -34.97783279418945, -32.89500427246094, -30.812177658081055, -28.729351043701172, -26.646522521972656, -24.56369400024414, -22.480865478515625, -20.39804458618164, -18.315216064453125, -16.232389450073242, -14.149560928344727, -12.066733360290527, -9.983905792236328, -7.9010772705078125, -5.818249702453613, -3.735422134399414, -1.6525943279266357, 0.4302334785461426, 2.5130615234375, 4.595889091491699, 6.678716659545898, 8.761545181274414, 10.844372749328613, 12.927200317382812, 15.010027885437012, 17.09285545349121, 19.175683975219727, 21.25851058959961, 23.341339111328125, 25.42416763305664, 27.506996154785156, 29.58982276916504, 31.672651290893555, 33.75547790527344, 35.83830642700195, 37.92113494873047, 40.00395965576172, 42.0867919921875, 44.16961669921875, 46.252445220947266]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 10.0, 15.0, 13.0, 28.0, 24.0, 40.0, 61.0, 89.0, 148.0, 231.0, 427.0, 817.0, 1810.0, 4706.0, 14830.0, 67038.0, 412674.0, 447939.0, 72867.0, 15893.0, 5007.0, 1922.0, 842.0, 429.0, 246.0, 133.0, 88.0, 55.0, 41.0, 35.0, 22.0, 7.0, 14.0, 12.0, 4.0, 8.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-12.3125, -11.8883056640625, -11.464111328125, -11.0399169921875, -10.61572265625, -10.1915283203125, -9.767333984375, -9.3431396484375, -8.9189453125, -8.4947509765625, -8.070556640625, -7.6463623046875, -7.22216796875, -6.7979736328125, -6.373779296875, -5.9495849609375, -5.525390625, -5.1011962890625, -4.677001953125, -4.2528076171875, -3.82861328125, -3.4044189453125, -2.980224609375, -2.5560302734375, -2.1318359375, -1.7076416015625, -1.283447265625, -0.8592529296875, -0.43505859375, -0.0108642578125, 0.413330078125, 0.8375244140625, 1.26171875, 1.6859130859375, 2.110107421875, 2.5343017578125, 2.95849609375, 3.3826904296875, 3.806884765625, 4.2310791015625, 4.6552734375, 5.0794677734375, 5.503662109375, 5.9278564453125, 6.35205078125, 6.7762451171875, 7.200439453125, 7.6246337890625, 8.048828125, 8.4730224609375, 8.897216796875, 9.3214111328125, 9.74560546875, 10.1697998046875, 10.593994140625, 11.0181884765625, 11.4423828125, 11.8665771484375, 12.290771484375, 12.7149658203125, 13.13916015625, 13.5633544921875, 13.987548828125, 14.4117431640625, 14.8359375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 3.0, 10.0, 9.0, 28.0, 24.0, 36.0, 45.0, 49.0, 78.0, 71.0, 75.0, 100.0, 80.0, 85.0, 76.0, 62.0, 37.0, 27.0, 24.0, 15.0, 13.0, 9.0, 8.0, 7.0, 10.0, 7.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.41796875, -6.15728759765625, -5.8966064453125, -5.63592529296875, -5.375244140625, -5.11456298828125, -4.8538818359375, -4.59320068359375, -4.33251953125, -4.07183837890625, -3.8111572265625, -3.55047607421875, -3.289794921875, -3.02911376953125, -2.7684326171875, -2.50775146484375, -2.2470703125, -1.98638916015625, -1.7257080078125, -1.46502685546875, -1.204345703125, -0.94366455078125, -0.6829833984375, -0.42230224609375, -0.16162109375, 0.09906005859375, 0.3597412109375, 0.62042236328125, 0.881103515625, 1.14178466796875, 1.4024658203125, 1.66314697265625, 1.923828125, 2.18450927734375, 2.4451904296875, 2.70587158203125, 2.966552734375, 3.22723388671875, 3.4879150390625, 3.74859619140625, 4.00927734375, 4.26995849609375, 4.5306396484375, 4.79132080078125, 5.052001953125, 5.31268310546875, 5.5733642578125, 5.83404541015625, 6.0947265625, 6.35540771484375, 6.6160888671875, 6.87677001953125, 7.137451171875, 7.39813232421875, 7.6588134765625, 7.91949462890625, 8.18017578125, 8.44085693359375, 8.7015380859375, 8.96221923828125, 9.222900390625, 9.48358154296875, 9.7442626953125, 10.00494384765625, 10.265625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 10.0, 8.0, 15.0, 17.0, 30.0, 42.0, 39.0, 56.0, 82.0, 113.0, 205.0, 397.0, 1154.0, 6166.0, 415719.0, 615378.0, 6775.0, 1210.0, 457.0, 241.0, 138.0, 70.0, 54.0, 37.0, 30.0, 19.0, 23.0, 19.0, 12.0, 8.0, 8.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.0, -50.32373046875, -48.6474609375, -46.97119140625, -45.294921875, -43.61865234375, -41.9423828125, -40.26611328125, -38.58984375, -36.91357421875, -35.2373046875, -33.56103515625, -31.884765625, -30.20849609375, -28.5322265625, -26.85595703125, -25.1796875, -23.50341796875, -21.8271484375, -20.15087890625, -18.474609375, -16.79833984375, -15.1220703125, -13.44580078125, -11.76953125, -10.09326171875, -8.4169921875, -6.74072265625, -5.064453125, -3.38818359375, -1.7119140625, -0.03564453125, 1.640625, 3.31689453125, 4.9931640625, 6.66943359375, 8.345703125, 10.02197265625, 11.6982421875, 13.37451171875, 15.05078125, 16.72705078125, 18.4033203125, 20.07958984375, 21.755859375, 23.43212890625, 25.1083984375, 26.78466796875, 28.4609375, 30.13720703125, 31.8134765625, 33.48974609375, 35.166015625, 36.84228515625, 38.5185546875, 40.19482421875, 41.87109375, 43.54736328125, 45.2236328125, 46.89990234375, 48.576171875, 50.25244140625, 51.9287109375, 53.60498046875, 55.28125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 4.0, 5.0, 5.0, 8.0, 16.0, 16.0, 23.0, 23.0, 46.0, 48.0, 64.0, 83.0, 87.0, 86.0, 85.0, 69.0, 69.0, 52.0, 49.0, 37.0, 27.0, 19.0, 12.0, 19.0, 5.0, 4.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-36.34375, -35.19482421875, -34.0458984375, -32.89697265625, -31.748046875, -30.59912109375, -29.4501953125, -28.30126953125, -27.15234375, -26.00341796875, -24.8544921875, -23.70556640625, -22.556640625, -21.40771484375, -20.2587890625, -19.10986328125, -17.9609375, -16.81201171875, -15.6630859375, -14.51416015625, -13.365234375, -12.21630859375, -11.0673828125, -9.91845703125, -8.76953125, -7.62060546875, -6.4716796875, -5.32275390625, -4.173828125, -3.02490234375, -1.8759765625, -0.72705078125, 0.421875, 1.57080078125, 2.7197265625, 3.86865234375, 5.017578125, 6.16650390625, 7.3154296875, 8.46435546875, 9.61328125, 10.76220703125, 11.9111328125, 13.06005859375, 14.208984375, 15.35791015625, 16.5068359375, 17.65576171875, 18.8046875, 19.95361328125, 21.1025390625, 22.25146484375, 23.400390625, 24.54931640625, 25.6982421875, 26.84716796875, 27.99609375, 29.14501953125, 30.2939453125, 31.44287109375, 32.591796875, 33.74072265625, 34.8896484375, 36.03857421875, 37.1875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 10.0, 7.0, 9.0, 7.0, 8.0, 16.0, 25.0, 47.0, 96.0, 137.0, 311.0, 805.0, 3746.0, 145418.0, 888869.0, 7105.0, 1147.0, 371.0, 161.0, 89.0, 55.0, 32.0, 26.0, 13.0, 11.0, 7.0, 4.0, 3.0, 7.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.234375, -17.608642578125, -16.98291015625, -16.357177734375, -15.7314453125, -15.105712890625, -14.47998046875, -13.854248046875, -13.228515625, -12.602783203125, -11.97705078125, -11.351318359375, -10.7255859375, -10.099853515625, -9.47412109375, -8.848388671875, -8.22265625, -7.596923828125, -6.97119140625, -6.345458984375, -5.7197265625, -5.093994140625, -4.46826171875, -3.842529296875, -3.216796875, -2.591064453125, -1.96533203125, -1.339599609375, -0.7138671875, -0.088134765625, 0.53759765625, 1.163330078125, 1.7890625, 2.414794921875, 3.04052734375, 3.666259765625, 4.2919921875, 4.917724609375, 5.54345703125, 6.169189453125, 6.794921875, 7.420654296875, 8.04638671875, 8.672119140625, 9.2978515625, 9.923583984375, 10.54931640625, 11.175048828125, 11.80078125, 12.426513671875, 13.05224609375, 13.677978515625, 14.3037109375, 14.929443359375, 15.55517578125, 16.180908203125, 16.806640625, 17.432373046875, 18.05810546875, 18.683837890625, 19.3095703125, 19.935302734375, 20.56103515625, 21.186767578125, 21.8125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 10.0, 4.0, 10.0, 25.0, 29.0, 13.0, 41.0, 51.0, 83.0, 186.0, 208.0, 123.0, 64.0, 43.0, 26.0, 25.0, 17.0, 11.0, 10.0, 8.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011768341064453125, -0.001140296459197998, -0.0011037588119506836, -0.0010672211647033691, -0.0010306835174560547, -0.0009941458702087402, -0.0009576082229614258, -0.0009210705757141113, -0.0008845329284667969, -0.0008479952812194824, -0.000811457633972168, -0.0007749199867248535, -0.0007383823394775391, -0.0007018446922302246, -0.0006653070449829102, -0.0006287693977355957, -0.0005922317504882812, -0.0005556941032409668, -0.0005191564559936523, -0.0004826188087463379, -0.00044608116149902344, -0.000409543514251709, -0.00037300586700439453, -0.0003364682197570801, -0.0002999305725097656, -0.00026339292526245117, -0.00022685527801513672, -0.00019031763076782227, -0.0001537799835205078, -0.00011724233627319336, -8.07046890258789e-05, -4.416704177856445e-05, -7.62939453125e-06, 2.8908252716064453e-05, 6.54458999633789e-05, 0.00010198354721069336, 0.0001385211944580078, 0.00017505884170532227, 0.00021159648895263672, 0.00024813413619995117, 0.0002846717834472656, 0.0003212094306945801, 0.00035774707794189453, 0.000394284725189209, 0.00043082237243652344, 0.0004673600196838379, 0.0005038976669311523, 0.0005404353141784668, 0.0005769729614257812, 0.0006135106086730957, 0.0006500482559204102, 0.0006865859031677246, 0.0007231235504150391, 0.0007596611976623535, 0.000796198844909668, 0.0008327364921569824, 0.0008692741394042969, 0.0009058117866516113, 0.0009423494338989258, 0.0009788870811462402, 0.0010154247283935547, 0.0010519623756408691, 0.0010885000228881836, 0.001125037670135498, 0.0011615753173828125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 6.0, 14.0, 9.0, 20.0, 16.0, 35.0, 39.0, 49.0, 81.0, 119.0, 203.0, 384.0, 852.0, 3233.0, 26524.0, 948772.0, 61017.0, 4848.0, 1208.0, 437.0, 238.0, 147.0, 94.0, 54.0, 43.0, 29.0, 23.0, 19.0, 6.0, 11.0, 8.0, 2.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.078125, -16.61181640625, -16.1455078125, -15.67919921875, -15.212890625, -14.74658203125, -14.2802734375, -13.81396484375, -13.34765625, -12.88134765625, -12.4150390625, -11.94873046875, -11.482421875, -11.01611328125, -10.5498046875, -10.08349609375, -9.6171875, -9.15087890625, -8.6845703125, -8.21826171875, -7.751953125, -7.28564453125, -6.8193359375, -6.35302734375, -5.88671875, -5.42041015625, -4.9541015625, -4.48779296875, -4.021484375, -3.55517578125, -3.0888671875, -2.62255859375, -2.15625, -1.68994140625, -1.2236328125, -0.75732421875, -0.291015625, 0.17529296875, 0.6416015625, 1.10791015625, 1.57421875, 2.04052734375, 2.5068359375, 2.97314453125, 3.439453125, 3.90576171875, 4.3720703125, 4.83837890625, 5.3046875, 5.77099609375, 6.2373046875, 6.70361328125, 7.169921875, 7.63623046875, 8.1025390625, 8.56884765625, 9.03515625, 9.50146484375, 9.9677734375, 10.43408203125, 10.900390625, 11.36669921875, 11.8330078125, 12.29931640625, 12.765625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 9.0, 6.0, 9.0, 7.0, 9.0, 8.0, 10.0, 19.0, 26.0, 51.0, 69.0, 95.0, 133.0, 176.0, 112.0, 84.0, 54.0, 29.0, 22.0, 14.0, 12.0, 7.0, 8.0, 7.0, 6.0, 3.0, 4.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-14.171875, -13.8294677734375, -13.487060546875, -13.1446533203125, -12.80224609375, -12.4598388671875, -12.117431640625, -11.7750244140625, -11.4326171875, -11.0902099609375, -10.747802734375, -10.4053955078125, -10.06298828125, -9.7205810546875, -9.378173828125, -9.0357666015625, -8.693359375, -8.3509521484375, -8.008544921875, -7.6661376953125, -7.32373046875, -6.9813232421875, -6.638916015625, -6.2965087890625, -5.9541015625, -5.6116943359375, -5.269287109375, -4.9268798828125, -4.58447265625, -4.2420654296875, -3.899658203125, -3.5572509765625, -3.21484375, -2.8724365234375, -2.530029296875, -2.1876220703125, -1.84521484375, -1.5028076171875, -1.160400390625, -0.8179931640625, -0.4755859375, -0.1331787109375, 0.209228515625, 0.5516357421875, 0.89404296875, 1.2364501953125, 1.578857421875, 1.9212646484375, 2.263671875, 2.6060791015625, 2.948486328125, 3.2908935546875, 3.63330078125, 3.9757080078125, 4.318115234375, 4.6605224609375, 5.0029296875, 5.3453369140625, 5.687744140625, 6.0301513671875, 6.37255859375, 6.7149658203125, 7.057373046875, 7.3997802734375, 7.7421875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 7.0, 14.0, 45.0, 279.0, 473.0, 144.0, 23.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-336.9058837890625, -326.8128662109375, -316.7198486328125, -306.6268615722656, -296.5338439941406, -286.4408264160156, -276.3478088378906, -266.2547912597656, -256.16180419921875, -246.06878662109375, -235.9757843017578, -225.8827667236328, -215.78976440429688, -205.69674682617188, -195.60372924804688, -185.51071166992188, -175.41769409179688, -165.32467651367188, -155.23167419433594, -145.13865661621094, -135.045654296875, -124.95263671875, -114.859619140625, -104.76660919189453, -94.67359924316406, -84.5805892944336, -74.48757934570312, -64.39456176757812, -54.301551818847656, -44.20854187011719, -34.11552810668945, -24.02251434326172, -13.92950439453125, -3.8364925384521484, 6.256519317626953, 16.349531173706055, 26.442543029785156, 36.535552978515625, 46.62856674194336, 56.721580505371094, 66.81459045410156, 76.90760040283203, 87.0006103515625, 97.0936279296875, 107.18663787841797, 117.27964782714844, 127.37266540527344, 137.46566772460938, 147.55868530273438, 157.65170288085938, 167.7447052001953, 177.8377227783203, 187.93072509765625, 198.02374267578125, 208.11676025390625, 218.20977783203125, 228.3027801513672, 238.3957977294922, 248.48880004882812, 258.5818176269531, 268.6748352050781, 278.767822265625, 288.86083984375, 298.953857421875, 309.046875]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 8.0, 5.0, 11.0, 12.0, 20.0, 31.0, 50.0, 44.0, 61.0, 74.0, 84.0, 92.0, 86.0, 83.0, 72.0, 62.0, 49.0, 52.0, 33.0, 27.0, 20.0, 13.0, 9.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.2024383544922, -135.21311950683594, -130.22381591796875, -125.2344970703125, -120.24517822265625, -115.255859375, -110.26654815673828, -105.27723693847656, -100.28791809082031, -95.29859924316406, -90.30928802490234, -85.31997680664062, -80.33065795898438, -75.34133911132812, -70.3520278930664, -65.36271667480469, -60.37339782714844, -55.38408279418945, -50.39476776123047, -45.405452728271484, -40.4161376953125, -35.426822662353516, -30.43750762939453, -25.448192596435547, -20.458877563476562, -15.469562530517578, -10.480247497558594, -5.490932464599609, -0.501617431640625, 4.487697601318359, 9.477012634277344, 14.466327667236328, 19.45562744140625, 24.444942474365234, 29.43425750732422, 34.4235725402832, 39.41288757324219, 44.40220260620117, 49.391517639160156, 54.38083267211914, 59.370147705078125, 64.35946655273438, 69.3487777709961, 74.33808898925781, 79.32740783691406, 84.31672668457031, 89.30603790283203, 94.29534912109375, 99.28466796875, 104.27398681640625, 109.26329803466797, 114.25260925292969, 119.24192810058594, 124.23124694824219, 129.22055053710938, 134.20986938476562, 139.19918823242188, 144.18850708007812, 149.17782592773438, 154.16712951660156, 159.1564483642578, 164.14576721191406, 169.13507080078125, 174.1243896484375, 179.11370849609375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 10.0, 17.0, 49.0, 121.0, 371.0, 12639.0, 4180355.0, 470.0, 141.0, 53.0, 19.0, 13.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.0625, -114.6376953125, -109.212890625, -103.7880859375, -98.36328125, -92.9384765625, -87.513671875, -82.0888671875, -76.6640625, -71.2392578125, -65.814453125, -60.3896484375, -54.96484375, -49.5400390625, -44.115234375, -38.6904296875, -33.265625, -27.8408203125, -22.416015625, -16.9912109375, -11.56640625, -6.1416015625, -0.716796875, 4.7080078125, 10.1328125, 15.5576171875, 20.982421875, 26.4072265625, 31.83203125, 37.2568359375, 42.681640625, 48.1064453125, 53.53125, 58.9560546875, 64.380859375, 69.8056640625, 75.23046875, 80.6552734375, 86.080078125, 91.5048828125, 96.9296875, 102.3544921875, 107.779296875, 113.2041015625, 118.62890625, 124.0537109375, 129.478515625, 134.9033203125, 140.328125, 145.7529296875, 151.177734375, 156.6025390625, 162.02734375, 167.4521484375, 172.876953125, 178.3017578125, 183.7265625, 189.1513671875, 194.576171875, 200.0009765625, 205.42578125, 210.8505859375, 216.275390625, 221.7001953125, 227.125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 13.0, 27.0, 49.0, 72.0, 113.0, 165.0, 208.0, 156.0, 88.0, 51.0, 33.0, 19.0, 9.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.90625, -10.342041015625, -9.77783203125, -9.213623046875, -8.6494140625, -8.085205078125, -7.52099609375, -6.956787109375, -6.392578125, -5.828369140625, -5.26416015625, -4.699951171875, -4.1357421875, -3.571533203125, -3.00732421875, -2.443115234375, -1.87890625, -1.314697265625, -0.75048828125, -0.186279296875, 0.3779296875, 0.942138671875, 1.50634765625, 2.070556640625, 2.634765625, 3.198974609375, 3.76318359375, 4.327392578125, 4.8916015625, 5.455810546875, 6.02001953125, 6.584228515625, 7.1484375, 7.712646484375, 8.27685546875, 8.841064453125, 9.4052734375, 9.969482421875, 10.53369140625, 11.097900390625, 11.662109375, 12.226318359375, 12.79052734375, 13.354736328125, 13.9189453125, 14.483154296875, 15.04736328125, 15.611572265625, 16.17578125, 16.739990234375, 17.30419921875, 17.868408203125, 18.4326171875, 18.996826171875, 19.56103515625, 20.125244140625, 20.689453125, 21.253662109375, 21.81787109375, 22.382080078125, 22.9462890625, 23.510498046875, 24.07470703125, 24.638916015625, 25.203125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 10.0, 10.0, 20.0, 42.0, 84.0, 151.0, 316.0, 630.0, 1380.0, 3545.0, 11533.0, 64347.0, 3049103.0, 1009663.0, 39147.0, 8729.0, 2802.0, 1215.0, 663.0, 371.0, 210.0, 125.0, 63.0, 56.0, 16.0, 12.0, 13.0, 3.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2421875, -7.923583984375, -7.60498046875, -7.286376953125, -6.9677734375, -6.649169921875, -6.33056640625, -6.011962890625, -5.693359375, -5.374755859375, -5.05615234375, -4.737548828125, -4.4189453125, -4.100341796875, -3.78173828125, -3.463134765625, -3.14453125, -2.825927734375, -2.50732421875, -2.188720703125, -1.8701171875, -1.551513671875, -1.23291015625, -0.914306640625, -0.595703125, -0.277099609375, 0.04150390625, 0.360107421875, 0.6787109375, 0.997314453125, 1.31591796875, 1.634521484375, 1.953125, 2.271728515625, 2.59033203125, 2.908935546875, 3.2275390625, 3.546142578125, 3.86474609375, 4.183349609375, 4.501953125, 4.820556640625, 5.13916015625, 5.457763671875, 5.7763671875, 6.094970703125, 6.41357421875, 6.732177734375, 7.05078125, 7.369384765625, 7.68798828125, 8.006591796875, 8.3251953125, 8.643798828125, 8.96240234375, 9.281005859375, 9.599609375, 9.918212890625, 10.23681640625, 10.555419921875, 10.8740234375, 11.192626953125, 11.51123046875, 11.829833984375, 12.1484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 2.0, 2.0, 2.0, 9.0, 6.0, 11.0, 11.0, 20.0, 33.0, 77.0, 174.0, 562.0, 1318.0, 1154.0, 403.0, 125.0, 67.0, 28.0, 18.0, 13.0, 16.0, 6.0, 6.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4609375, -9.079345703125, -8.69775390625, -8.316162109375, -7.9345703125, -7.552978515625, -7.17138671875, -6.789794921875, -6.408203125, -6.026611328125, -5.64501953125, -5.263427734375, -4.8818359375, -4.500244140625, -4.11865234375, -3.737060546875, -3.35546875, -2.973876953125, -2.59228515625, -2.210693359375, -1.8291015625, -1.447509765625, -1.06591796875, -0.684326171875, -0.302734375, 0.078857421875, 0.46044921875, 0.842041015625, 1.2236328125, 1.605224609375, 1.98681640625, 2.368408203125, 2.75, 3.131591796875, 3.51318359375, 3.894775390625, 4.2763671875, 4.657958984375, 5.03955078125, 5.421142578125, 5.802734375, 6.184326171875, 6.56591796875, 6.947509765625, 7.3291015625, 7.710693359375, 8.09228515625, 8.473876953125, 8.85546875, 9.237060546875, 9.61865234375, 10.000244140625, 10.3818359375, 10.763427734375, 11.14501953125, 11.526611328125, 11.908203125, 12.289794921875, 12.67138671875, 13.052978515625, 13.4345703125, 13.816162109375, 14.19775390625, 14.579345703125, 14.9609375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 9.0, 83.0, 348.0, 386.0, 117.0, 35.0, 10.0, 5.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.6655044555664, -79.9333267211914, -75.2011489868164, -70.4689712524414, -65.7367935180664, -61.004615783691406, -56.272438049316406, -51.540260314941406, -46.808082580566406, -42.075904846191406, -37.343727111816406, -32.611549377441406, -27.879371643066406, -23.147193908691406, -18.415016174316406, -13.682838439941406, -8.950660705566406, -4.218482971191406, 0.5136947631835938, 5.245872497558594, 9.978050231933594, 14.710227966308594, 19.442405700683594, 24.174583435058594, 28.906761169433594, 33.638938903808594, 38.371116638183594, 43.103294372558594, 47.835472106933594, 52.567649841308594, 57.299827575683594, 62.032005310058594, 66.76419067382812, 71.49636840820312, 76.22854614257812, 80.96072387695312, 85.69290161132812, 90.42507934570312, 95.15725708007812, 99.88943481445312, 104.62161254882812, 109.35379028320312, 114.08596801757812, 118.81814575195312, 123.55032348632812, 128.28250122070312, 133.01467895507812, 137.74685668945312, 142.47903442382812, 147.21121215820312, 151.94338989257812, 156.67556762695312, 161.40774536132812, 166.13992309570312, 170.87210083007812, 175.60427856445312, 180.33645629882812, 185.06863403320312, 189.80081176757812, 194.53298950195312, 199.26516723632812, 203.99734497070312, 208.72952270507812, 213.46170043945312, 218.19387817382812]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 11.0, 15.0, 22.0, 32.0, 39.0, 62.0, 68.0, 80.0, 86.0, 109.0, 95.0, 76.0, 67.0, 60.0, 47.0, 31.0, 33.0, 25.0, 15.0, 9.0, 2.0, 6.0, 6.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-99.24797821044922, -97.10259246826172, -94.95720672607422, -92.81182098388672, -90.66643524169922, -88.52104949951172, -86.37566375732422, -84.23027801513672, -82.08489227294922, -79.93950653076172, -77.79412078857422, -75.64873504638672, -73.50334930419922, -71.35796356201172, -69.21257781982422, -67.06719207763672, -64.92180633544922, -62.77642059326172, -60.63103485107422, -58.48564910888672, -56.34026336669922, -54.19487762451172, -52.04949188232422, -49.90410614013672, -47.75872039794922, -45.61333465576172, -43.46794891357422, -41.32256317138672, -39.17717742919922, -37.03179168701172, -34.88640594482422, -32.74102020263672, -30.59564208984375, -28.45025634765625, -26.30487060546875, -24.15948486328125, -22.01409912109375, -19.86871337890625, -17.72332763671875, -15.57794189453125, -13.43255615234375, -11.28717041015625, -9.14178466796875, -6.99639892578125, -4.85101318359375, -2.70562744140625, -0.56024169921875, 1.58514404296875, 3.73052978515625, 5.87591552734375, 8.02130126953125, 10.16668701171875, 12.31207275390625, 14.45745849609375, 16.60284423828125, 18.74822998046875, 20.89361572265625, 23.03900146484375, 25.18438720703125, 27.32977294921875, 29.47515869140625, 31.62054443359375, 33.76593017578125, 35.91131591796875, 38.05670166015625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 4.0, 2.0, 4.0, 7.0, 3.0, 10.0, 13.0, 18.0, 32.0, 47.0, 72.0, 160.0, 336.0, 1023.0, 5003.0, 63953.0, 860786.0, 108086.0, 6915.0, 1256.0, 425.0, 153.0, 93.0, 48.0, 24.0, 22.0, 18.0, 13.0, 7.0, 9.0, 2.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.921875, -18.152099609375, -17.38232421875, -16.612548828125, -15.8427734375, -15.072998046875, -14.30322265625, -13.533447265625, -12.763671875, -11.993896484375, -11.22412109375, -10.454345703125, -9.6845703125, -8.914794921875, -8.14501953125, -7.375244140625, -6.60546875, -5.835693359375, -5.06591796875, -4.296142578125, -3.5263671875, -2.756591796875, -1.98681640625, -1.217041015625, -0.447265625, 0.322509765625, 1.09228515625, 1.862060546875, 2.6318359375, 3.401611328125, 4.17138671875, 4.941162109375, 5.7109375, 6.480712890625, 7.25048828125, 8.020263671875, 8.7900390625, 9.559814453125, 10.32958984375, 11.099365234375, 11.869140625, 12.638916015625, 13.40869140625, 14.178466796875, 14.9482421875, 15.718017578125, 16.48779296875, 17.257568359375, 18.02734375, 18.797119140625, 19.56689453125, 20.336669921875, 21.1064453125, 21.876220703125, 22.64599609375, 23.415771484375, 24.185546875, 24.955322265625, 25.72509765625, 26.494873046875, 27.2646484375, 28.034423828125, 28.80419921875, 29.573974609375, 30.34375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 9.0, 13.0, 17.0, 31.0, 31.0, 46.0, 48.0, 73.0, 80.0, 91.0, 113.0, 101.0, 96.0, 76.0, 50.0, 38.0, 18.0, 25.0, 13.0, 14.0, 7.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1171875, -7.82080078125, -7.5244140625, -7.22802734375, -6.931640625, -6.63525390625, -6.3388671875, -6.04248046875, -5.74609375, -5.44970703125, -5.1533203125, -4.85693359375, -4.560546875, -4.26416015625, -3.9677734375, -3.67138671875, -3.375, -3.07861328125, -2.7822265625, -2.48583984375, -2.189453125, -1.89306640625, -1.5966796875, -1.30029296875, -1.00390625, -0.70751953125, -0.4111328125, -0.11474609375, 0.181640625, 0.47802734375, 0.7744140625, 1.07080078125, 1.3671875, 1.66357421875, 1.9599609375, 2.25634765625, 2.552734375, 2.84912109375, 3.1455078125, 3.44189453125, 3.73828125, 4.03466796875, 4.3310546875, 4.62744140625, 4.923828125, 5.22021484375, 5.5166015625, 5.81298828125, 6.109375, 6.40576171875, 6.7021484375, 6.99853515625, 7.294921875, 7.59130859375, 7.8876953125, 8.18408203125, 8.48046875, 8.77685546875, 9.0732421875, 9.36962890625, 9.666015625, 9.96240234375, 10.2587890625, 10.55517578125, 10.8515625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 10.0, 4.0, 8.0, 21.0, 21.0, 31.0, 52.0, 64.0, 79.0, 138.0, 241.0, 503.0, 1069.0, 3317.0, 15610.0, 194783.0, 775559.0, 46981.0, 6580.0, 1847.0, 740.0, 341.0, 164.0, 135.0, 76.0, 54.0, 30.0, 22.0, 15.0, 11.0, 8.0, 9.0, 8.0, 6.0, 5.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.359375, -21.70654296875, -21.0537109375, -20.40087890625, -19.748046875, -19.09521484375, -18.4423828125, -17.78955078125, -17.13671875, -16.48388671875, -15.8310546875, -15.17822265625, -14.525390625, -13.87255859375, -13.2197265625, -12.56689453125, -11.9140625, -11.26123046875, -10.6083984375, -9.95556640625, -9.302734375, -8.64990234375, -7.9970703125, -7.34423828125, -6.69140625, -6.03857421875, -5.3857421875, -4.73291015625, -4.080078125, -3.42724609375, -2.7744140625, -2.12158203125, -1.46875, -0.81591796875, -0.1630859375, 0.48974609375, 1.142578125, 1.79541015625, 2.4482421875, 3.10107421875, 3.75390625, 4.40673828125, 5.0595703125, 5.71240234375, 6.365234375, 7.01806640625, 7.6708984375, 8.32373046875, 8.9765625, 9.62939453125, 10.2822265625, 10.93505859375, 11.587890625, 12.24072265625, 12.8935546875, 13.54638671875, 14.19921875, 14.85205078125, 15.5048828125, 16.15771484375, 16.810546875, 17.46337890625, 18.1162109375, 18.76904296875, 19.421875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 0.0, 1.0, 5.0, 4.0, 6.0, 9.0, 7.0, 16.0, 13.0, 24.0, 27.0, 26.0, 39.0, 50.0, 46.0, 49.0, 50.0, 72.0, 62.0, 75.0, 48.0, 81.0, 62.0, 48.0, 39.0, 24.0, 23.0, 17.0, 21.0, 13.0, 13.0, 9.0, 5.0, 9.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.640625, -21.91064453125, -21.1806640625, -20.45068359375, -19.720703125, -18.99072265625, -18.2607421875, -17.53076171875, -16.80078125, -16.07080078125, -15.3408203125, -14.61083984375, -13.880859375, -13.15087890625, -12.4208984375, -11.69091796875, -10.9609375, -10.23095703125, -9.5009765625, -8.77099609375, -8.041015625, -7.31103515625, -6.5810546875, -5.85107421875, -5.12109375, -4.39111328125, -3.6611328125, -2.93115234375, -2.201171875, -1.47119140625, -0.7412109375, -0.01123046875, 0.71875, 1.44873046875, 2.1787109375, 2.90869140625, 3.638671875, 4.36865234375, 5.0986328125, 5.82861328125, 6.55859375, 7.28857421875, 8.0185546875, 8.74853515625, 9.478515625, 10.20849609375, 10.9384765625, 11.66845703125, 12.3984375, 13.12841796875, 13.8583984375, 14.58837890625, 15.318359375, 16.04833984375, 16.7783203125, 17.50830078125, 18.23828125, 18.96826171875, 19.6982421875, 20.42822265625, 21.158203125, 21.88818359375, 22.6181640625, 23.34814453125, 24.078125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 7.0, 8.0, 3.0, 12.0, 34.0, 44.0, 84.0, 209.0, 685.0, 4051.0, 1029592.0, 12174.0, 1065.0, 338.0, 117.0, 65.0, 24.0, 15.0, 10.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-46.0, -44.3955078125, -42.791015625, -41.1865234375, -39.58203125, -37.9775390625, -36.373046875, -34.7685546875, -33.1640625, -31.5595703125, -29.955078125, -28.3505859375, -26.74609375, -25.1416015625, -23.537109375, -21.9326171875, -20.328125, -18.7236328125, -17.119140625, -15.5146484375, -13.91015625, -12.3056640625, -10.701171875, -9.0966796875, -7.4921875, -5.8876953125, -4.283203125, -2.6787109375, -1.07421875, 0.5302734375, 2.134765625, 3.7392578125, 5.34375, 6.9482421875, 8.552734375, 10.1572265625, 11.76171875, 13.3662109375, 14.970703125, 16.5751953125, 18.1796875, 19.7841796875, 21.388671875, 22.9931640625, 24.59765625, 26.2021484375, 27.806640625, 29.4111328125, 31.015625, 32.6201171875, 34.224609375, 35.8291015625, 37.43359375, 39.0380859375, 40.642578125, 42.2470703125, 43.8515625, 45.4560546875, 47.060546875, 48.6650390625, 50.26953125, 51.8740234375, 53.478515625, 55.0830078125, 56.6875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 1.0, 6.0, 2.0, 7.0, 9.0, 8.0, 10.0, 24.0, 34.0, 58.0, 97.0, 212.0, 224.0, 123.0, 62.0, 39.0, 27.0, 19.0, 12.0, 13.0, 4.0, 8.0, 6.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014371871948242188, -0.0013994872570037842, -0.0013617873191833496, -0.001324087381362915, -0.0012863874435424805, -0.001248687505722046, -0.0012109875679016113, -0.0011732876300811768, -0.0011355876922607422, -0.0010978877544403076, -0.001060187816619873, -0.0010224878787994385, -0.000984787940979004, -0.0009470880031585693, -0.0009093880653381348, -0.0008716881275177002, -0.0008339881896972656, -0.0007962882518768311, -0.0007585883140563965, -0.0007208883762359619, -0.0006831884384155273, -0.0006454885005950928, -0.0006077885627746582, -0.0005700886249542236, -0.0005323886871337891, -0.0004946887493133545, -0.0004569888114929199, -0.00041928887367248535, -0.0003815889358520508, -0.0003438889980316162, -0.00030618906021118164, -0.00026848912239074707, -0.0002307891845703125, -0.00019308924674987793, -0.00015538930892944336, -0.00011768937110900879, -7.998943328857422e-05, -4.228949546813965e-05, -4.589557647705078e-06, 3.311038017272949e-05, 7.081031799316406e-05, 0.00010851025581359863, 0.0001462101936340332, 0.00018391013145446777, 0.00022161006927490234, 0.0002593100070953369, 0.0002970099449157715, 0.00033470988273620605, 0.0003724098205566406, 0.0004101097583770752, 0.00044780969619750977, 0.00048550963401794434, 0.0005232095718383789, 0.0005609095096588135, 0.000598609447479248, 0.0006363093852996826, 0.0006740093231201172, 0.0007117092609405518, 0.0007494091987609863, 0.0007871091365814209, 0.0008248090744018555, 0.00086250901222229, 0.0009002089500427246, 0.0009379088878631592, 0.0009756088256835938]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 4.0, 13.0, 19.0, 27.0, 85.0, 250.0, 865.0, 8015.0, 1008776.0, 28472.0, 1478.0, 321.0, 123.0, 40.0, 27.0, 10.0, 9.0, 2.0, 4.0, 1.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.359375, -19.56591796875, -18.7724609375, -17.97900390625, -17.185546875, -16.39208984375, -15.5986328125, -14.80517578125, -14.01171875, -13.21826171875, -12.4248046875, -11.63134765625, -10.837890625, -10.04443359375, -9.2509765625, -8.45751953125, -7.6640625, -6.87060546875, -6.0771484375, -5.28369140625, -4.490234375, -3.69677734375, -2.9033203125, -2.10986328125, -1.31640625, -0.52294921875, 0.2705078125, 1.06396484375, 1.857421875, 2.65087890625, 3.4443359375, 4.23779296875, 5.03125, 5.82470703125, 6.6181640625, 7.41162109375, 8.205078125, 8.99853515625, 9.7919921875, 10.58544921875, 11.37890625, 12.17236328125, 12.9658203125, 13.75927734375, 14.552734375, 15.34619140625, 16.1396484375, 16.93310546875, 17.7265625, 18.52001953125, 19.3134765625, 20.10693359375, 20.900390625, 21.69384765625, 22.4873046875, 23.28076171875, 24.07421875, 24.86767578125, 25.6611328125, 26.45458984375, 27.248046875, 28.04150390625, 28.8349609375, 29.62841796875, 30.421875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 2.0, 3.0, 4.0, 10.0, 15.0, 25.0, 46.0, 63.0, 137.0, 153.0, 172.0, 141.0, 98.0, 45.0, 26.0, 21.0, 10.0, 10.0, 8.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.3359375, -10.0509033203125, -9.765869140625, -9.4808349609375, -9.19580078125, -8.9107666015625, -8.625732421875, -8.3406982421875, -8.0556640625, -7.7706298828125, -7.485595703125, -7.2005615234375, -6.91552734375, -6.6304931640625, -6.345458984375, -6.0604248046875, -5.775390625, -5.4903564453125, -5.205322265625, -4.9202880859375, -4.63525390625, -4.3502197265625, -4.065185546875, -3.7801513671875, -3.4951171875, -3.2100830078125, -2.925048828125, -2.6400146484375, -2.35498046875, -2.0699462890625, -1.784912109375, -1.4998779296875, -1.21484375, -0.9298095703125, -0.644775390625, -0.3597412109375, -0.07470703125, 0.2103271484375, 0.495361328125, 0.7803955078125, 1.0654296875, 1.3504638671875, 1.635498046875, 1.9205322265625, 2.20556640625, 2.4906005859375, 2.775634765625, 3.0606689453125, 3.345703125, 3.6307373046875, 3.915771484375, 4.2008056640625, 4.48583984375, 4.7708740234375, 5.055908203125, 5.3409423828125, 5.6259765625, 5.9110107421875, 6.196044921875, 6.4810791015625, 6.76611328125, 7.0511474609375, 7.336181640625, 7.6212158203125, 7.90625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 9.0, 14.0, 45.0, 194.0, 431.0, 216.0, 49.0, 17.0, 10.0, 3.0, 3.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-252.65597534179688, -244.66619873046875, -236.67642211914062, -228.6866455078125, -220.69686889648438, -212.70709228515625, -204.71731567382812, -196.7275390625, -188.73776245117188, -180.74798583984375, -172.75820922851562, -164.7684326171875, -156.77865600585938, -148.78887939453125, -140.79910278320312, -132.809326171875, -124.8195571899414, -116.82978057861328, -108.84000396728516, -100.85022735595703, -92.8604507446289, -84.87068176269531, -76.88090515136719, -68.89112854003906, -60.90134811401367, -52.91157150268555, -44.92179489135742, -36.93202209472656, -28.942243576049805, -20.952468872070312, -12.962692260742188, -4.9729156494140625, 3.0168609619140625, 11.006637573242188, 18.996414184570312, 26.986188888549805, 34.97596740722656, 42.96574020385742, 50.95551681518555, 58.94529342651367, 66.93507385253906, 74.92485046386719, 82.91462707519531, 90.90440368652344, 98.89418029785156, 106.88395690917969, 114.87373352050781, 122.86351013183594, 130.853271484375, 138.84304809570312, 146.83282470703125, 154.82260131835938, 162.8123779296875, 170.80215454101562, 178.79193115234375, 186.78170776367188, 194.771484375, 202.76126098632812, 210.75103759765625, 218.74081420898438, 226.7305908203125, 234.72036743164062, 242.71014404296875, 250.69992065429688, 258.689697265625]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 7.0, 4.0, 11.0, 11.0, 9.0, 15.0, 18.0, 30.0, 23.0, 33.0, 20.0, 39.0, 43.0, 41.0, 51.0, 58.0, 67.0, 65.0, 57.0, 41.0, 44.0, 38.0, 35.0, 31.0, 30.0, 26.0, 29.0, 16.0, 17.0, 13.0, 15.0, 10.0, 13.0, 4.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-81.83976745605469, -79.42585754394531, -77.01194763183594, -74.59803771972656, -72.18412780761719, -69.77021026611328, -67.3563003540039, -64.94239044189453, -62.528480529785156, -60.11457061767578, -57.700660705566406, -55.286746978759766, -52.87283706665039, -50.458927154541016, -48.045013427734375, -45.631103515625, -43.217193603515625, -40.80328369140625, -38.389373779296875, -35.975460052490234, -33.56155014038086, -31.147640228271484, -28.733728408813477, -26.31981658935547, -23.905906677246094, -21.49199676513672, -19.07808494567871, -16.664173126220703, -14.250263214111328, -11.836352348327637, -9.422441482543945, -7.0085296630859375, -4.594612121582031, -2.18070125579834, 0.23320960998535156, 2.647120475769043, 5.061031341552734, 7.474942207336426, 9.888853073120117, 12.302764892578125, 14.7166748046875, 17.130584716796875, 19.544496536254883, 21.95840835571289, 24.372318267822266, 26.78622817993164, 29.20013999938965, 31.614051818847656, 34.02796173095703, 36.441871643066406, 38.85578155517578, 41.26969528198242, 43.6836051940918, 46.09751510620117, 48.51142883300781, 50.92533874511719, 53.33924865722656, 55.75315856933594, 58.16706848144531, 60.58098220825195, 62.99489212036133, 65.40880584716797, 67.82271575927734, 70.23662567138672, 72.6505355834961]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 8.0, 22.0, 48.0, 157.0, 948.0, 3749880.0, 442383.0, 604.0, 138.0, 46.0, 20.0, 11.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.09375, -50.22900390625, -48.3642578125, -46.49951171875, -44.634765625, -42.77001953125, -40.9052734375, -39.04052734375, -37.17578125, -35.31103515625, -33.4462890625, -31.58154296875, -29.716796875, -27.85205078125, -25.9873046875, -24.12255859375, -22.2578125, -20.39306640625, -18.5283203125, -16.66357421875, -14.798828125, -12.93408203125, -11.0693359375, -9.20458984375, -7.33984375, -5.47509765625, -3.6103515625, -1.74560546875, 0.119140625, 1.98388671875, 3.8486328125, 5.71337890625, 7.578125, 9.44287109375, 11.3076171875, 13.17236328125, 15.037109375, 16.90185546875, 18.7666015625, 20.63134765625, 22.49609375, 24.36083984375, 26.2255859375, 28.09033203125, 29.955078125, 31.81982421875, 33.6845703125, 35.54931640625, 37.4140625, 39.27880859375, 41.1435546875, 43.00830078125, 44.873046875, 46.73779296875, 48.6025390625, 50.46728515625, 52.33203125, 54.19677734375, 56.0615234375, 57.92626953125, 59.791015625, 61.65576171875, 63.5205078125, 65.38525390625, 67.25]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 3.0, 4.0, 13.0, 12.0, 10.0, 18.0, 25.0, 37.0, 43.0, 48.0, 51.0, 74.0, 74.0, 69.0, 71.0, 74.0, 62.0, 55.0, 56.0, 42.0, 40.0, 38.0, 20.0, 16.0, 17.0, 3.0, 6.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.90234375, -6.7110595703125, -6.519775390625, -6.3284912109375, -6.13720703125, -5.9459228515625, -5.754638671875, -5.5633544921875, -5.3720703125, -5.1807861328125, -4.989501953125, -4.7982177734375, -4.60693359375, -4.4156494140625, -4.224365234375, -4.0330810546875, -3.841796875, -3.6505126953125, -3.459228515625, -3.2679443359375, -3.07666015625, -2.8853759765625, -2.694091796875, -2.5028076171875, -2.3115234375, -2.1202392578125, -1.928955078125, -1.7376708984375, -1.54638671875, -1.3551025390625, -1.163818359375, -0.9725341796875, -0.78125, -0.5899658203125, -0.398681640625, -0.2073974609375, -0.01611328125, 0.1751708984375, 0.366455078125, 0.5577392578125, 0.7490234375, 0.9403076171875, 1.131591796875, 1.3228759765625, 1.51416015625, 1.7054443359375, 1.896728515625, 2.0880126953125, 2.279296875, 2.4705810546875, 2.661865234375, 2.8531494140625, 3.04443359375, 3.2357177734375, 3.427001953125, 3.6182861328125, 3.8095703125, 4.0008544921875, 4.192138671875, 4.3834228515625, 4.57470703125, 4.7659912109375, 4.957275390625, 5.1485595703125, 5.33984375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 11.0, 20.0, 30.0, 40.0, 80.0, 136.0, 225.0, 518.0, 1367.0, 5562.0, 46502.0, 3100804.0, 1003594.0, 29258.0, 4147.0, 1094.0, 373.0, 191.0, 120.0, 73.0, 52.0, 28.0, 17.0, 16.0, 5.0, 7.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.4375, -13.0408935546875, -12.644287109375, -12.2476806640625, -11.85107421875, -11.4544677734375, -11.057861328125, -10.6612548828125, -10.2646484375, -9.8680419921875, -9.471435546875, -9.0748291015625, -8.67822265625, -8.2816162109375, -7.885009765625, -7.4884033203125, -7.091796875, -6.6951904296875, -6.298583984375, -5.9019775390625, -5.50537109375, -5.1087646484375, -4.712158203125, -4.3155517578125, -3.9189453125, -3.5223388671875, -3.125732421875, -2.7291259765625, -2.33251953125, -1.9359130859375, -1.539306640625, -1.1427001953125, -0.74609375, -0.3494873046875, 0.047119140625, 0.4437255859375, 0.84033203125, 1.2369384765625, 1.633544921875, 2.0301513671875, 2.4267578125, 2.8233642578125, 3.219970703125, 3.6165771484375, 4.01318359375, 4.4097900390625, 4.806396484375, 5.2030029296875, 5.599609375, 5.9962158203125, 6.392822265625, 6.7894287109375, 7.18603515625, 7.5826416015625, 7.979248046875, 8.3758544921875, 8.7724609375, 9.1690673828125, 9.565673828125, 9.9622802734375, 10.35888671875, 10.7554931640625, 11.152099609375, 11.5487060546875, 11.9453125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 4.0, 10.0, 13.0, 28.0, 46.0, 82.0, 173.0, 457.0, 1119.0, 1189.0, 495.0, 203.0, 100.0, 49.0, 38.0, 22.0, 17.0, 12.0, 7.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0, -12.5513916015625, -12.102783203125, -11.6541748046875, -11.20556640625, -10.7569580078125, -10.308349609375, -9.8597412109375, -9.4111328125, -8.9625244140625, -8.513916015625, -8.0653076171875, -7.61669921875, -7.1680908203125, -6.719482421875, -6.2708740234375, -5.822265625, -5.3736572265625, -4.925048828125, -4.4764404296875, -4.02783203125, -3.5792236328125, -3.130615234375, -2.6820068359375, -2.2333984375, -1.7847900390625, -1.336181640625, -0.8875732421875, -0.43896484375, 0.0096435546875, 0.458251953125, 0.9068603515625, 1.35546875, 1.8040771484375, 2.252685546875, 2.7012939453125, 3.14990234375, 3.5985107421875, 4.047119140625, 4.4957275390625, 4.9443359375, 5.3929443359375, 5.841552734375, 6.2901611328125, 6.73876953125, 7.1873779296875, 7.635986328125, 8.0845947265625, 8.533203125, 8.9818115234375, 9.430419921875, 9.8790283203125, 10.32763671875, 10.7762451171875, 11.224853515625, 11.6734619140625, 12.1220703125, 12.5706787109375, 13.019287109375, 13.4678955078125, 13.91650390625, 14.3651123046875, 14.813720703125, 15.2623291015625, 15.7109375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 14.0, 44.0, 146.0, 268.0, 223.0, 157.0, 67.0, 30.0, 14.0, 11.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.55770874023438, -77.29863739013672, -74.03956604003906, -70.78050231933594, -67.52143096923828, -64.26235961914062, -61.00328826904297, -57.74422073364258, -54.48515319824219, -51.22608184814453, -47.96701431274414, -44.707942962646484, -41.448875427246094, -38.18980407714844, -34.93073272705078, -31.67166519165039, -28.412593841552734, -25.15352439880371, -21.894454956054688, -18.63538360595703, -15.376315116882324, -12.117244720458984, -8.858175277709961, -5.5991058349609375, -2.340036392211914, 0.9190332889556885, 4.178102970123291, 7.437172889709473, 10.696242332458496, 13.955312728881836, 17.21438217163086, 20.473451614379883, 23.732521057128906, 26.99159049987793, 30.250659942626953, 33.50973129272461, 36.768798828125, 40.027870178222656, 43.28694152832031, 46.5460090637207, 49.805076599121094, 53.06414794921875, 56.32321548461914, 59.5822868347168, 62.84135437011719, 66.10042572021484, 69.3594970703125, 72.61856079101562, 75.87763977050781, 79.13671112060547, 82.39578247070312, 85.65484619140625, 88.9139175415039, 92.17298889160156, 95.43206024169922, 98.69113159179688, 101.9501953125, 105.20926666259766, 108.46833801269531, 111.72740173339844, 114.9864730834961, 118.24554443359375, 121.5046157836914, 124.76368713378906, 128.0227508544922]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 8.0, 16.0, 22.0, 32.0, 36.0, 39.0, 44.0, 53.0, 72.0, 78.0, 68.0, 82.0, 62.0, 56.0, 51.0, 50.0, 38.0, 43.0, 44.0, 28.0, 24.0, 11.0, 7.0, 12.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.06772232055664, -44.183868408203125, -42.300018310546875, -40.41616439819336, -38.53231430053711, -36.648460388183594, -34.764610290527344, -32.88075637817383, -30.996904373168945, -29.113052368164062, -27.22920036315918, -25.345348358154297, -23.46149444580078, -21.57764434814453, -19.693790435791016, -17.809938430786133, -15.92608642578125, -14.042234420776367, -12.158382415771484, -10.274529457092285, -8.390677452087402, -6.5068254470825195, -4.62297248840332, -2.7391204833984375, -0.8552684783935547, 1.0285837650299072, 2.912436008453369, 4.79628849029541, 6.680140495300293, 8.563992500305176, 10.447845458984375, 12.331697463989258, 14.215545654296875, 16.099397659301758, 17.98324966430664, 19.867103576660156, 21.750953674316406, 23.634807586669922, 25.518659591674805, 27.402511596679688, 29.28636360168457, 31.170215606689453, 33.05406951904297, 34.93791961669922, 36.821773529052734, 38.705623626708984, 40.5894775390625, 42.47332763671875, 44.357181549072266, 46.24103546142578, 48.12488555908203, 50.00873947143555, 51.8925895690918, 53.77644348144531, 55.66029357910156, 57.54414749145508, 59.428001403808594, 61.31185531616211, 63.19570541381836, 65.07955932617188, 66.96340942382812, 68.84725952148438, 70.73111724853516, 72.6149673461914, 74.49881744384766]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 13.0, 8.0, 8.0, 6.0, 12.0, 20.0, 22.0, 43.0, 45.0, 55.0, 101.0, 143.0, 273.0, 471.0, 963.0, 2184.0, 6173.0, 23235.0, 114528.0, 515201.0, 306596.0, 58142.0, 13158.0, 3867.0, 1566.0, 678.0, 357.0, 239.0, 124.0, 111.0, 48.0, 30.0, 32.0, 24.0, 16.0, 11.0, 16.0, 5.0, 7.0, 7.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-12.5625, -12.2115478515625, -11.860595703125, -11.5096435546875, -11.15869140625, -10.8077392578125, -10.456787109375, -10.1058349609375, -9.7548828125, -9.4039306640625, -9.052978515625, -8.7020263671875, -8.35107421875, -8.0001220703125, -7.649169921875, -7.2982177734375, -6.947265625, -6.5963134765625, -6.245361328125, -5.8944091796875, -5.54345703125, -5.1925048828125, -4.841552734375, -4.4906005859375, -4.1396484375, -3.7886962890625, -3.437744140625, -3.0867919921875, -2.73583984375, -2.3848876953125, -2.033935546875, -1.6829833984375, -1.33203125, -0.9810791015625, -0.630126953125, -0.2791748046875, 0.07177734375, 0.4227294921875, 0.773681640625, 1.1246337890625, 1.4755859375, 1.8265380859375, 2.177490234375, 2.5284423828125, 2.87939453125, 3.2303466796875, 3.581298828125, 3.9322509765625, 4.283203125, 4.6341552734375, 4.985107421875, 5.3360595703125, 5.68701171875, 6.0379638671875, 6.388916015625, 6.7398681640625, 7.0908203125, 7.4417724609375, 7.792724609375, 8.1436767578125, 8.49462890625, 8.8455810546875, 9.196533203125, 9.5474853515625, 9.8984375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 6.0, 10.0, 17.0, 21.0, 20.0, 25.0, 34.0, 43.0, 49.0, 47.0, 61.0, 38.0, 62.0, 79.0, 71.0, 61.0, 44.0, 48.0, 62.0, 36.0, 31.0, 32.0, 16.0, 18.0, 14.0, 13.0, 7.0, 10.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.72265625, -5.561767578125, -5.40087890625, -5.239990234375, -5.0791015625, -4.918212890625, -4.75732421875, -4.596435546875, -4.435546875, -4.274658203125, -4.11376953125, -3.952880859375, -3.7919921875, -3.631103515625, -3.47021484375, -3.309326171875, -3.1484375, -2.987548828125, -2.82666015625, -2.665771484375, -2.5048828125, -2.343994140625, -2.18310546875, -2.022216796875, -1.861328125, -1.700439453125, -1.53955078125, -1.378662109375, -1.2177734375, -1.056884765625, -0.89599609375, -0.735107421875, -0.57421875, -0.413330078125, -0.25244140625, -0.091552734375, 0.0693359375, 0.230224609375, 0.39111328125, 0.552001953125, 0.712890625, 0.873779296875, 1.03466796875, 1.195556640625, 1.3564453125, 1.517333984375, 1.67822265625, 1.839111328125, 2.0, 2.160888671875, 2.32177734375, 2.482666015625, 2.6435546875, 2.804443359375, 2.96533203125, 3.126220703125, 3.287109375, 3.447998046875, 3.60888671875, 3.769775390625, 3.9306640625, 4.091552734375, 4.25244140625, 4.413330078125, 4.57421875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 6.0, 12.0, 18.0, 24.0, 20.0, 45.0, 77.0, 134.0, 245.0, 581.0, 1851.0, 11224.0, 930430.0, 97729.0, 4198.0, 1098.0, 391.0, 184.0, 85.0, 59.0, 37.0, 28.0, 17.0, 12.0, 8.0, 8.0, 7.0, 4.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.8125, -41.27099609375, -39.7294921875, -38.18798828125, -36.646484375, -35.10498046875, -33.5634765625, -32.02197265625, -30.48046875, -28.93896484375, -27.3974609375, -25.85595703125, -24.314453125, -22.77294921875, -21.2314453125, -19.68994140625, -18.1484375, -16.60693359375, -15.0654296875, -13.52392578125, -11.982421875, -10.44091796875, -8.8994140625, -7.35791015625, -5.81640625, -4.27490234375, -2.7333984375, -1.19189453125, 0.349609375, 1.89111328125, 3.4326171875, 4.97412109375, 6.515625, 8.05712890625, 9.5986328125, 11.14013671875, 12.681640625, 14.22314453125, 15.7646484375, 17.30615234375, 18.84765625, 20.38916015625, 21.9306640625, 23.47216796875, 25.013671875, 26.55517578125, 28.0966796875, 29.63818359375, 31.1796875, 32.72119140625, 34.2626953125, 35.80419921875, 37.345703125, 38.88720703125, 40.4287109375, 41.97021484375, 43.51171875, 45.05322265625, 46.5947265625, 48.13623046875, 49.677734375, 51.21923828125, 52.7607421875, 54.30224609375, 55.84375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 9.0, 12.0, 8.0, 15.0, 15.0, 14.0, 30.0, 38.0, 52.0, 47.0, 60.0, 77.0, 55.0, 73.0, 67.0, 67.0, 54.0, 66.0, 52.0, 48.0, 28.0, 33.0, 19.0, 18.0, 7.0, 7.0, 12.0, 4.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.59375, -24.81298828125, -24.0322265625, -23.25146484375, -22.470703125, -21.68994140625, -20.9091796875, -20.12841796875, -19.34765625, -18.56689453125, -17.7861328125, -17.00537109375, -16.224609375, -15.44384765625, -14.6630859375, -13.88232421875, -13.1015625, -12.32080078125, -11.5400390625, -10.75927734375, -9.978515625, -9.19775390625, -8.4169921875, -7.63623046875, -6.85546875, -6.07470703125, -5.2939453125, -4.51318359375, -3.732421875, -2.95166015625, -2.1708984375, -1.39013671875, -0.609375, 0.17138671875, 0.9521484375, 1.73291015625, 2.513671875, 3.29443359375, 4.0751953125, 4.85595703125, 5.63671875, 6.41748046875, 7.1982421875, 7.97900390625, 8.759765625, 9.54052734375, 10.3212890625, 11.10205078125, 11.8828125, 12.66357421875, 13.4443359375, 14.22509765625, 15.005859375, 15.78662109375, 16.5673828125, 17.34814453125, 18.12890625, 18.90966796875, 19.6904296875, 20.47119140625, 21.251953125, 22.03271484375, 22.8134765625, 23.59423828125, 24.375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 7.0, 13.0, 9.0, 21.0, 25.0, 37.0, 46.0, 94.0, 199.0, 673.0, 6444.0, 974657.0, 63745.0, 1923.0, 331.0, 103.0, 63.0, 40.0, 27.0, 15.0, 10.0, 16.0, 9.0, 9.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.859375, -19.253173828125, -18.64697265625, -18.040771484375, -17.4345703125, -16.828369140625, -16.22216796875, -15.615966796875, -15.009765625, -14.403564453125, -13.79736328125, -13.191162109375, -12.5849609375, -11.978759765625, -11.37255859375, -10.766357421875, -10.16015625, -9.553955078125, -8.94775390625, -8.341552734375, -7.7353515625, -7.129150390625, -6.52294921875, -5.916748046875, -5.310546875, -4.704345703125, -4.09814453125, -3.491943359375, -2.8857421875, -2.279541015625, -1.67333984375, -1.067138671875, -0.4609375, 0.145263671875, 0.75146484375, 1.357666015625, 1.9638671875, 2.570068359375, 3.17626953125, 3.782470703125, 4.388671875, 4.994873046875, 5.60107421875, 6.207275390625, 6.8134765625, 7.419677734375, 8.02587890625, 8.632080078125, 9.23828125, 9.844482421875, 10.45068359375, 11.056884765625, 11.6630859375, 12.269287109375, 12.87548828125, 13.481689453125, 14.087890625, 14.694091796875, 15.30029296875, 15.906494140625, 16.5126953125, 17.118896484375, 17.72509765625, 18.331298828125, 18.9375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 4.0, 7.0, 9.0, 10.0, 9.0, 9.0, 10.0, 11.0, 21.0, 23.0, 21.0, 34.0, 37.0, 39.0, 73.0, 101.0, 140.0, 94.0, 84.0, 50.0, 32.0, 21.0, 22.0, 23.0, 23.0, 13.0, 15.0, 12.0, 10.0, 12.0, 10.0, 3.0, 2.0, 7.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00072479248046875, -0.0007032901048660278, -0.0006817877292633057, -0.0006602853536605835, -0.0006387829780578613, -0.0006172806024551392, -0.000595778226852417, -0.0005742758512496948, -0.0005527734756469727, -0.0005312711000442505, -0.0005097687244415283, -0.00048826634883880615, -0.000466763973236084, -0.0004452615976333618, -0.00042375922203063965, -0.0004022568464279175, -0.0003807544708251953, -0.00035925209522247314, -0.000337749719619751, -0.0003162473440170288, -0.00029474496841430664, -0.00027324259281158447, -0.0002517402172088623, -0.00023023784160614014, -0.00020873546600341797, -0.0001872330904006958, -0.00016573071479797363, -0.00014422833919525146, -0.0001227259635925293, -0.00010122358798980713, -7.972121238708496e-05, -5.821883678436279e-05, -3.6716461181640625e-05, -1.5214085578918457e-05, 6.288290023803711e-06, 2.779066562652588e-05, 4.929304122924805e-05, 7.079541683197021e-05, 9.229779243469238e-05, 0.00011380016803741455, 0.00013530254364013672, 0.0001568049192428589, 0.00017830729484558105, 0.00019980967044830322, 0.0002213120460510254, 0.00024281442165374756, 0.0002643167972564697, 0.0002858191728591919, 0.00030732154846191406, 0.00032882392406463623, 0.0003503262996673584, 0.00037182867527008057, 0.00039333105087280273, 0.0004148334264755249, 0.00043633580207824707, 0.00045783817768096924, 0.0004793405532836914, 0.0005008429288864136, 0.0005223453044891357, 0.0005438476800918579, 0.0005653500556945801, 0.0005868524312973022, 0.0006083548069000244, 0.0006298571825027466, 0.0006513595581054688]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 11.0, 10.0, 12.0, 19.0, 23.0, 31.0, 39.0, 71.0, 105.0, 217.0, 511.0, 1562.0, 7250.0, 259951.0, 765990.0, 9748.0, 1856.0, 584.0, 217.0, 104.0, 73.0, 49.0, 24.0, 21.0, 22.0, 7.0, 9.0, 5.0, 2.0, 5.0, 3.0, 8.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7578125, -13.30029296875, -12.8427734375, -12.38525390625, -11.927734375, -11.47021484375, -11.0126953125, -10.55517578125, -10.09765625, -9.64013671875, -9.1826171875, -8.72509765625, -8.267578125, -7.81005859375, -7.3525390625, -6.89501953125, -6.4375, -5.97998046875, -5.5224609375, -5.06494140625, -4.607421875, -4.14990234375, -3.6923828125, -3.23486328125, -2.77734375, -2.31982421875, -1.8623046875, -1.40478515625, -0.947265625, -0.48974609375, -0.0322265625, 0.42529296875, 0.8828125, 1.34033203125, 1.7978515625, 2.25537109375, 2.712890625, 3.17041015625, 3.6279296875, 4.08544921875, 4.54296875, 5.00048828125, 5.4580078125, 5.91552734375, 6.373046875, 6.83056640625, 7.2880859375, 7.74560546875, 8.203125, 8.66064453125, 9.1181640625, 9.57568359375, 10.033203125, 10.49072265625, 10.9482421875, 11.40576171875, 11.86328125, 12.32080078125, 12.7783203125, 13.23583984375, 13.693359375, 14.15087890625, 14.6083984375, 15.06591796875, 15.5234375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 7.0, 4.0, 8.0, 9.0, 12.0, 25.0, 22.0, 29.0, 45.0, 71.0, 96.0, 127.0, 136.0, 109.0, 79.0, 65.0, 48.0, 37.0, 21.0, 8.0, 10.0, 15.0, 3.0, 4.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.73046875, -6.52178955078125, -6.3131103515625, -6.10443115234375, -5.895751953125, -5.68707275390625, -5.4783935546875, -5.26971435546875, -5.06103515625, -4.85235595703125, -4.6436767578125, -4.43499755859375, -4.226318359375, -4.01763916015625, -3.8089599609375, -3.60028076171875, -3.3916015625, -3.18292236328125, -2.9742431640625, -2.76556396484375, -2.556884765625, -2.34820556640625, -2.1395263671875, -1.93084716796875, -1.72216796875, -1.51348876953125, -1.3048095703125, -1.09613037109375, -0.887451171875, -0.67877197265625, -0.4700927734375, -0.26141357421875, -0.052734375, 0.15594482421875, 0.3646240234375, 0.57330322265625, 0.781982421875, 0.99066162109375, 1.1993408203125, 1.40802001953125, 1.61669921875, 1.82537841796875, 2.0340576171875, 2.24273681640625, 2.451416015625, 2.66009521484375, 2.8687744140625, 3.07745361328125, 3.2861328125, 3.49481201171875, 3.7034912109375, 3.91217041015625, 4.120849609375, 4.32952880859375, 4.5382080078125, 4.74688720703125, 4.95556640625, 5.16424560546875, 5.3729248046875, 5.58160400390625, 5.790283203125, 5.99896240234375, 6.2076416015625, 6.41632080078125, 6.625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 14.0, 35.0, 193.0, 487.0, 214.0, 37.0, 8.0, 5.0, 1.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.3119125366211, -79.03627014160156, -70.76062774658203, -62.484981536865234, -54.2093391418457, -45.93369674682617, -37.658050537109375, -29.382408142089844, -21.106765747070312, -12.831122398376465, -4.555479049682617, 3.720165252685547, 11.995807647705078, 20.27145004272461, 28.547096252441406, 36.82273864746094, 45.09838104248047, 53.3740234375, 61.64966583251953, 69.92530822753906, 78.20095825195312, 86.47659301757812, 94.75224304199219, 103.02788543701172, 111.30352783203125, 119.57917022705078, 127.85481262207031, 136.13046264648438, 144.40609741210938, 152.68174743652344, 160.9573974609375, 169.2330322265625, 177.50869750976562, 185.7843475341797, 194.0599822998047, 202.33563232421875, 210.61126708984375, 218.8869171142578, 227.16256713867188, 235.43820190429688, 243.71383666992188, 251.98948669433594, 260.26513671875, 268.540771484375, 276.81640625, 285.092041015625, 293.3677062988281, 301.6433410644531, 309.91900634765625, 318.19464111328125, 326.4703063964844, 334.7459411621094, 343.0215759277344, 351.2972106933594, 359.5728759765625, 367.8485107421875, 376.1241455078125, 384.3997802734375, 392.6754455566406, 400.9510803222656, 409.2267150878906, 417.5023498535156, 425.77801513671875, 434.05364990234375, 442.32928466796875]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 3.0, 11.0, 19.0, 20.0, 22.0, 18.0, 30.0, 36.0, 40.0, 44.0, 46.0, 68.0, 78.0, 96.0, 83.0, 63.0, 44.0, 46.0, 40.0, 34.0, 26.0, 33.0, 21.0, 22.0, 17.0, 10.0, 9.0, 10.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-120.84520721435547, -117.93478393554688, -115.02435302734375, -112.11392974853516, -109.20350646972656, -106.29308319091797, -103.38265991210938, -100.47222900390625, -97.56180572509766, -94.65138244628906, -91.74095153808594, -88.83052825927734, -85.92010498046875, -83.00968170166016, -80.09925842285156, -77.18882751464844, -74.27840423583984, -71.36798095703125, -68.45755004882812, -65.54712677001953, -62.63670349121094, -59.726280212402344, -56.815853118896484, -53.905426025390625, -50.99500274658203, -48.08457946777344, -45.17415237426758, -42.26372528076172, -39.353302001953125, -36.44287872314453, -33.53245162963867, -30.622026443481445, -27.71160888671875, -24.801183700561523, -21.890758514404297, -18.98033332824707, -16.069908142089844, -13.159482955932617, -10.24905776977539, -7.338632583618164, -4.4282073974609375, -1.517782211303711, 1.3926429748535156, 4.303068161010742, 7.213493347167969, 10.123918533325195, 13.034343719482422, 15.944768905639648, 18.855194091796875, 21.7656192779541, 24.676044464111328, 27.586469650268555, 30.49689483642578, 33.407318115234375, 36.317745208740234, 39.228172302246094, 42.13859558105469, 45.04901885986328, 47.95944595336914, 50.869873046875, 53.780296325683594, 56.69071960449219, 59.60114669799805, 62.511573791503906, 65.4219970703125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 10.0, 11.0, 28.0, 51.0, 73.0, 182.0, 410.0, 1410.0, 8098.0, 612841.0, 3544686.0, 22223.0, 3033.0, 774.0, 227.0, 106.0, 47.0, 30.0, 20.0, 7.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.65625, -13.153564453125, -12.65087890625, -12.148193359375, -11.6455078125, -11.142822265625, -10.64013671875, -10.137451171875, -9.634765625, -9.132080078125, -8.62939453125, -8.126708984375, -7.6240234375, -7.121337890625, -6.61865234375, -6.115966796875, -5.61328125, -5.110595703125, -4.60791015625, -4.105224609375, -3.6025390625, -3.099853515625, -2.59716796875, -2.094482421875, -1.591796875, -1.089111328125, -0.58642578125, -0.083740234375, 0.4189453125, 0.921630859375, 1.42431640625, 1.927001953125, 2.4296875, 2.932373046875, 3.43505859375, 3.937744140625, 4.4404296875, 4.943115234375, 5.44580078125, 5.948486328125, 6.451171875, 6.953857421875, 7.45654296875, 7.959228515625, 8.4619140625, 8.964599609375, 9.46728515625, 9.969970703125, 10.47265625, 10.975341796875, 11.47802734375, 11.980712890625, 12.4833984375, 12.986083984375, 13.48876953125, 13.991455078125, 14.494140625, 14.996826171875, 15.49951171875, 16.002197265625, 16.5048828125, 17.007568359375, 17.51025390625, 18.012939453125, 18.515625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 18.0, 26.0, 39.0, 46.0, 86.0, 119.0, 123.0, 134.0, 107.0, 89.0, 84.0, 40.0, 25.0, 24.0, 12.0, 10.0, 4.0, 2.0, 7.0, 0.0, 1.0, 4.0], "bins": [-15.46875, -15.1546630859375, -14.840576171875, -14.5264892578125, -14.21240234375, -13.8983154296875, -13.584228515625, -13.2701416015625, -12.9560546875, -12.6419677734375, -12.327880859375, -12.0137939453125, -11.69970703125, -11.3856201171875, -11.071533203125, -10.7574462890625, -10.443359375, -10.1292724609375, -9.815185546875, -9.5010986328125, -9.18701171875, -8.8729248046875, -8.558837890625, -8.2447509765625, -7.9306640625, -7.6165771484375, -7.302490234375, -6.9884033203125, -6.67431640625, -6.3602294921875, -6.046142578125, -5.7320556640625, -5.41796875, -5.1038818359375, -4.789794921875, -4.4757080078125, -4.16162109375, -3.8475341796875, -3.533447265625, -3.2193603515625, -2.9052734375, -2.5911865234375, -2.277099609375, -1.9630126953125, -1.64892578125, -1.3348388671875, -1.020751953125, -0.7066650390625, -0.392578125, -0.0784912109375, 0.235595703125, 0.5496826171875, 0.86376953125, 1.1778564453125, 1.491943359375, 1.8060302734375, 2.1201171875, 2.4342041015625, 2.748291015625, 3.0623779296875, 3.37646484375, 3.6905517578125, 4.004638671875, 4.3187255859375, 4.6328125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 5.0, 5.0, 4.0, 10.0, 34.0, 31.0, 67.0, 101.0, 218.0, 460.0, 1064.0, 3570.0, 18515.0, 533441.0, 3573933.0, 51458.0, 7413.0, 2142.0, 820.0, 403.0, 201.0, 128.0, 80.0, 70.0, 38.0, 22.0, 20.0, 8.0, 13.0, 8.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.515625, -11.0921630859375, -10.668701171875, -10.2452392578125, -9.82177734375, -9.3983154296875, -8.974853515625, -8.5513916015625, -8.1279296875, -7.7044677734375, -7.281005859375, -6.8575439453125, -6.43408203125, -6.0106201171875, -5.587158203125, -5.1636962890625, -4.740234375, -4.3167724609375, -3.893310546875, -3.4698486328125, -3.04638671875, -2.6229248046875, -2.199462890625, -1.7760009765625, -1.3525390625, -0.9290771484375, -0.505615234375, -0.0821533203125, 0.34130859375, 0.7647705078125, 1.188232421875, 1.6116943359375, 2.03515625, 2.4586181640625, 2.882080078125, 3.3055419921875, 3.72900390625, 4.1524658203125, 4.575927734375, 4.9993896484375, 5.4228515625, 5.8463134765625, 6.269775390625, 6.6932373046875, 7.11669921875, 7.5401611328125, 7.963623046875, 8.3870849609375, 8.810546875, 9.2340087890625, 9.657470703125, 10.0809326171875, 10.50439453125, 10.9278564453125, 11.351318359375, 11.7747802734375, 12.1982421875, 12.6217041015625, 13.045166015625, 13.4686279296875, 13.89208984375, 14.3155517578125, 14.739013671875, 15.1624755859375, 15.5859375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 5.0, 9.0, 13.0, 15.0, 35.0, 82.0, 292.0, 1088.0, 1620.0, 607.0, 152.0, 56.0, 36.0, 18.0, 16.0, 6.0, 6.0, 6.0, 6.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8984375, -11.3101806640625, -10.721923828125, -10.1336669921875, -9.54541015625, -8.9571533203125, -8.368896484375, -7.7806396484375, -7.1923828125, -6.6041259765625, -6.015869140625, -5.4276123046875, -4.83935546875, -4.2510986328125, -3.662841796875, -3.0745849609375, -2.486328125, -1.8980712890625, -1.309814453125, -0.7215576171875, -0.13330078125, 0.4549560546875, 1.043212890625, 1.6314697265625, 2.2197265625, 2.8079833984375, 3.396240234375, 3.9844970703125, 4.57275390625, 5.1610107421875, 5.749267578125, 6.3375244140625, 6.92578125, 7.5140380859375, 8.102294921875, 8.6905517578125, 9.27880859375, 9.8670654296875, 10.455322265625, 11.0435791015625, 11.6318359375, 12.2200927734375, 12.808349609375, 13.3966064453125, 13.98486328125, 14.5731201171875, 15.161376953125, 15.7496337890625, 16.337890625, 16.9261474609375, 17.514404296875, 18.1026611328125, 18.69091796875, 19.2791748046875, 19.867431640625, 20.4556884765625, 21.0439453125, 21.6322021484375, 22.220458984375, 22.8087158203125, 23.39697265625, 23.9852294921875, 24.573486328125, 25.1617431640625, 25.75]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 12.0, 16.0, 62.0, 139.0, 256.0, 236.0, 148.0, 67.0, 25.0, 8.0, 11.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-99.29754638671875, -96.07888793945312, -92.8602294921875, -89.64157104492188, -86.42291259765625, -83.20425415039062, -79.98558807373047, -76.76692962646484, -73.54827117919922, -70.3296127319336, -67.11095428466797, -63.89229202270508, -60.67363357543945, -57.45497512817383, -54.23631286621094, -51.01765441894531, -47.79899597167969, -44.58033752441406, -41.36167907714844, -38.14301681518555, -34.92435836791992, -31.705699920654297, -28.48703956604004, -25.26837921142578, -22.049720764160156, -18.83106231689453, -15.612401962280273, -12.393742561340332, -9.17508316040039, -5.956424713134766, -2.737764358520508, 0.48089599609375, 3.6995468139648438, 6.918206214904785, 10.136865615844727, 13.355525016784668, 16.57418441772461, 19.792842864990234, 23.011503219604492, 26.23016357421875, 29.448822021484375, 32.66748046875, 35.886138916015625, 39.104801177978516, 42.32345962524414, 45.542118072509766, 48.760780334472656, 51.97943878173828, 55.198097229003906, 58.41675567626953, 61.635414123535156, 64.85407257080078, 68.07273864746094, 71.29139709472656, 74.51005554199219, 77.72871398925781, 80.94737243652344, 84.16603088378906, 87.38468933105469, 90.60334777832031, 93.82200622558594, 97.04066467285156, 100.25933074951172, 103.47798919677734, 106.69664764404297]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 7.0, 16.0, 40.0, 64.0, 89.0, 139.0, 156.0, 136.0, 109.0, 90.0, 64.0, 42.0, 14.0, 15.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.57620239257812, -118.540771484375, -114.50533294677734, -110.46990203857422, -106.43446350097656, -102.39903259277344, -98.36360168457031, -94.32817077636719, -90.29273223876953, -86.2573013305664, -82.22186279296875, -78.18643188476562, -74.1510009765625, -70.11556243896484, -66.08013153076172, -62.04469680786133, -58.00926208496094, -53.97382736206055, -49.938392639160156, -45.90296173095703, -41.86752700805664, -37.83209228515625, -33.796661376953125, -29.761226654052734, -25.725791931152344, -21.690357208251953, -17.654924392700195, -13.619490623474121, -9.584056854248047, -5.548622131347656, -1.5131893157958984, 2.5222434997558594, 6.55767822265625, 10.593111991882324, 14.628545761108398, 18.663978576660156, 22.699413299560547, 26.734848022460938, 30.770280838012695, 34.80571365356445, 38.841148376464844, 42.876583099365234, 46.912017822265625, 50.94744873046875, 54.98288345336914, 59.01831817626953, 63.053749084472656, 67.08918762207031, 71.12461853027344, 75.16004943847656, 79.19548797607422, 83.23091888427734, 87.266357421875, 91.30178833007812, 95.33721923828125, 99.37265014648438, 103.40808868408203, 107.44351959228516, 111.47895812988281, 115.51438903808594, 119.54981994628906, 123.58525848388672, 127.62068939208984, 131.6561279296875, 135.69155883789062]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 10.0, 11.0, 15.0, 23.0, 24.0, 33.0, 47.0, 57.0, 130.0, 236.0, 392.0, 1010.0, 3056.0, 12601.0, 77616.0, 611960.0, 294973.0, 35994.0, 6995.0, 1897.0, 691.0, 324.0, 166.0, 93.0, 62.0, 35.0, 24.0, 27.0, 22.0, 9.0, 4.0, 1.0, 6.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-15.6875, -15.26123046875, -14.8349609375, -14.40869140625, -13.982421875, -13.55615234375, -13.1298828125, -12.70361328125, -12.27734375, -11.85107421875, -11.4248046875, -10.99853515625, -10.572265625, -10.14599609375, -9.7197265625, -9.29345703125, -8.8671875, -8.44091796875, -8.0146484375, -7.58837890625, -7.162109375, -6.73583984375, -6.3095703125, -5.88330078125, -5.45703125, -5.03076171875, -4.6044921875, -4.17822265625, -3.751953125, -3.32568359375, -2.8994140625, -2.47314453125, -2.046875, -1.62060546875, -1.1943359375, -0.76806640625, -0.341796875, 0.08447265625, 0.5107421875, 0.93701171875, 1.36328125, 1.78955078125, 2.2158203125, 2.64208984375, 3.068359375, 3.49462890625, 3.9208984375, 4.34716796875, 4.7734375, 5.19970703125, 5.6259765625, 6.05224609375, 6.478515625, 6.90478515625, 7.3310546875, 7.75732421875, 8.18359375, 8.60986328125, 9.0361328125, 9.46240234375, 9.888671875, 10.31494140625, 10.7412109375, 11.16748046875, 11.59375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 7.0, 1.0, 5.0, 6.0, 8.0, 11.0, 12.0, 21.0, 26.0, 26.0, 45.0, 44.0, 53.0, 63.0, 55.0, 69.0, 69.0, 64.0, 65.0, 58.0, 64.0, 42.0, 41.0, 29.0, 21.0, 23.0, 13.0, 18.0, 14.0, 5.0, 9.0, 4.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.37109375, -5.21221923828125, -5.0533447265625, -4.89447021484375, -4.735595703125, -4.57672119140625, -4.4178466796875, -4.25897216796875, -4.10009765625, -3.94122314453125, -3.7823486328125, -3.62347412109375, -3.464599609375, -3.30572509765625, -3.1468505859375, -2.98797607421875, -2.8291015625, -2.67022705078125, -2.5113525390625, -2.35247802734375, -2.193603515625, -2.03472900390625, -1.8758544921875, -1.71697998046875, -1.55810546875, -1.39923095703125, -1.2403564453125, -1.08148193359375, -0.922607421875, -0.76373291015625, -0.6048583984375, -0.44598388671875, -0.287109375, -0.12823486328125, 0.0306396484375, 0.18951416015625, 0.348388671875, 0.50726318359375, 0.6661376953125, 0.82501220703125, 0.98388671875, 1.14276123046875, 1.3016357421875, 1.46051025390625, 1.619384765625, 1.77825927734375, 1.9371337890625, 2.09600830078125, 2.2548828125, 2.41375732421875, 2.5726318359375, 2.73150634765625, 2.890380859375, 3.04925537109375, 3.2081298828125, 3.36700439453125, 3.52587890625, 3.68475341796875, 3.8436279296875, 4.00250244140625, 4.161376953125, 4.32025146484375, 4.4791259765625, 4.63800048828125, 4.796875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 7.0, 15.0, 29.0, 57.0, 110.0, 311.0, 1237.0, 21303.0, 1017754.0, 6612.0, 720.0, 210.0, 93.0, 50.0, 29.0, 15.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.8125, -63.40625, -61.0, -58.59375, -56.1875, -53.78125, -51.375, -48.96875, -46.5625, -44.15625, -41.75, -39.34375, -36.9375, -34.53125, -32.125, -29.71875, -27.3125, -24.90625, -22.5, -20.09375, -17.6875, -15.28125, -12.875, -10.46875, -8.0625, -5.65625, -3.25, -0.84375, 1.5625, 3.96875, 6.375, 8.78125, 11.1875, 13.59375, 16.0, 18.40625, 20.8125, 23.21875, 25.625, 28.03125, 30.4375, 32.84375, 35.25, 37.65625, 40.0625, 42.46875, 44.875, 47.28125, 49.6875, 52.09375, 54.5, 56.90625, 59.3125, 61.71875, 64.125, 66.53125, 68.9375, 71.34375, 73.75, 76.15625, 78.5625, 80.96875, 83.375, 85.78125, 88.1875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 6.0, 5.0, 6.0, 11.0, 14.0, 20.0, 38.0, 41.0, 57.0, 64.0, 79.0, 85.0, 93.0, 98.0, 97.0, 66.0, 64.0, 46.0, 26.0, 21.0, 16.0, 17.0, 12.0, 9.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.09375, -29.225830078125, -28.35791015625, -27.489990234375, -26.6220703125, -25.754150390625, -24.88623046875, -24.018310546875, -23.150390625, -22.282470703125, -21.41455078125, -20.546630859375, -19.6787109375, -18.810791015625, -17.94287109375, -17.074951171875, -16.20703125, -15.339111328125, -14.47119140625, -13.603271484375, -12.7353515625, -11.867431640625, -10.99951171875, -10.131591796875, -9.263671875, -8.395751953125, -7.52783203125, -6.659912109375, -5.7919921875, -4.924072265625, -4.05615234375, -3.188232421875, -2.3203125, -1.452392578125, -0.58447265625, 0.283447265625, 1.1513671875, 2.019287109375, 2.88720703125, 3.755126953125, 4.623046875, 5.490966796875, 6.35888671875, 7.226806640625, 8.0947265625, 8.962646484375, 9.83056640625, 10.698486328125, 11.56640625, 12.434326171875, 13.30224609375, 14.170166015625, 15.0380859375, 15.906005859375, 16.77392578125, 17.641845703125, 18.509765625, 19.377685546875, 20.24560546875, 21.113525390625, 21.9814453125, 22.849365234375, 23.71728515625, 24.585205078125, 25.453125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 5.0, 5.0, 17.0, 12.0, 18.0, 23.0, 39.0, 68.0, 80.0, 139.0, 268.0, 591.0, 1862.0, 11808.0, 361177.0, 655611.0, 13324.0, 2101.0, 650.0, 277.0, 157.0, 86.0, 62.0, 39.0, 35.0, 22.0, 17.0, 5.0, 6.0, 11.0, 8.0, 5.0, 3.0, 4.0, 0.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.9140625, -11.56396484375, -11.2138671875, -10.86376953125, -10.513671875, -10.16357421875, -9.8134765625, -9.46337890625, -9.11328125, -8.76318359375, -8.4130859375, -8.06298828125, -7.712890625, -7.36279296875, -7.0126953125, -6.66259765625, -6.3125, -5.96240234375, -5.6123046875, -5.26220703125, -4.912109375, -4.56201171875, -4.2119140625, -3.86181640625, -3.51171875, -3.16162109375, -2.8115234375, -2.46142578125, -2.111328125, -1.76123046875, -1.4111328125, -1.06103515625, -0.7109375, -0.36083984375, -0.0107421875, 0.33935546875, 0.689453125, 1.03955078125, 1.3896484375, 1.73974609375, 2.08984375, 2.43994140625, 2.7900390625, 3.14013671875, 3.490234375, 3.84033203125, 4.1904296875, 4.54052734375, 4.890625, 5.24072265625, 5.5908203125, 5.94091796875, 6.291015625, 6.64111328125, 6.9912109375, 7.34130859375, 7.69140625, 8.04150390625, 8.3916015625, 8.74169921875, 9.091796875, 9.44189453125, 9.7919921875, 10.14208984375, 10.4921875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 12.0, 6.0, 16.0, 16.0, 21.0, 30.0, 44.0, 45.0, 102.0, 222.0, 220.0, 89.0, 44.0, 40.0, 20.0, 16.0, 12.0, 10.0, 4.0, 3.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013113021850585938, -0.0012689381837844849, -0.001226574182510376, -0.001184210181236267, -0.0011418461799621582, -0.0010994821786880493, -0.0010571181774139404, -0.0010147541761398315, -0.0009723901748657227, -0.0009300261735916138, -0.0008876621723175049, -0.000845298171043396, -0.0008029341697692871, -0.0007605701684951782, -0.0007182061672210693, -0.0006758421659469604, -0.0006334781646728516, -0.0005911141633987427, -0.0005487501621246338, -0.0005063861608505249, -0.000464022159576416, -0.00042165815830230713, -0.00037929415702819824, -0.00033693015575408936, -0.00029456615447998047, -0.0002522021532058716, -0.0002098381519317627, -0.0001674741506576538, -0.00012511014938354492, -8.274614810943604e-05, -4.038214683532715e-05, 1.9818544387817383e-06, 4.4345855712890625e-05, 8.670985698699951e-05, 0.0001290738582611084, 0.00017143785953521729, 0.00021380186080932617, 0.00025616586208343506, 0.00029852986335754395, 0.00034089386463165283, 0.0003832578659057617, 0.0004256218671798706, 0.0004679858684539795, 0.0005103498697280884, 0.0005527138710021973, 0.0005950778722763062, 0.000637441873550415, 0.0006798058748245239, 0.0007221698760986328, 0.0007645338773727417, 0.0008068978786468506, 0.0008492618799209595, 0.0008916258811950684, 0.0009339898824691772, 0.0009763538837432861, 0.001018717885017395, 0.001061081886291504, 0.0011034458875656128, 0.0011458098888397217, 0.0011881738901138306, 0.0012305378913879395, 0.0012729018926620483, 0.0013152658939361572, 0.0013576298952102661, 0.001399993896484375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 5.0, 7.0, 6.0, 7.0, 9.0, 9.0, 16.0, 25.0, 25.0, 41.0, 55.0, 63.0, 121.0, 139.0, 262.0, 464.0, 871.0, 1975.0, 5546.0, 24670.0, 335739.0, 636657.0, 30710.0, 6649.0, 2246.0, 915.0, 465.0, 266.0, 179.0, 111.0, 82.0, 42.0, 36.0, 33.0, 20.0, 20.0, 19.0, 14.0, 11.0, 7.0, 4.0, 5.0, 7.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.60546875, -6.41705322265625, -6.2286376953125, -6.04022216796875, -5.851806640625, -5.66339111328125, -5.4749755859375, -5.28656005859375, -5.09814453125, -4.90972900390625, -4.7213134765625, -4.53289794921875, -4.344482421875, -4.15606689453125, -3.9676513671875, -3.77923583984375, -3.5908203125, -3.40240478515625, -3.2139892578125, -3.02557373046875, -2.837158203125, -2.64874267578125, -2.4603271484375, -2.27191162109375, -2.08349609375, -1.89508056640625, -1.7066650390625, -1.51824951171875, -1.329833984375, -1.14141845703125, -0.9530029296875, -0.76458740234375, -0.576171875, -0.38775634765625, -0.1993408203125, -0.01092529296875, 0.177490234375, 0.36590576171875, 0.5543212890625, 0.74273681640625, 0.93115234375, 1.11956787109375, 1.3079833984375, 1.49639892578125, 1.684814453125, 1.87322998046875, 2.0616455078125, 2.25006103515625, 2.4384765625, 2.62689208984375, 2.8153076171875, 3.00372314453125, 3.192138671875, 3.38055419921875, 3.5689697265625, 3.75738525390625, 3.94580078125, 4.13421630859375, 4.3226318359375, 4.51104736328125, 4.699462890625, 4.88787841796875, 5.0762939453125, 5.26470947265625, 5.453125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 8.0, 11.0, 10.0, 17.0, 36.0, 56.0, 60.0, 166.0, 210.0, 135.0, 97.0, 43.0, 40.0, 29.0, 14.0, 13.0, 8.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.8203125, -7.6002197265625, -7.380126953125, -7.1600341796875, -6.93994140625, -6.7198486328125, -6.499755859375, -6.2796630859375, -6.0595703125, -5.8394775390625, -5.619384765625, -5.3992919921875, -5.17919921875, -4.9591064453125, -4.739013671875, -4.5189208984375, -4.298828125, -4.0787353515625, -3.858642578125, -3.6385498046875, -3.41845703125, -3.1983642578125, -2.978271484375, -2.7581787109375, -2.5380859375, -2.3179931640625, -2.097900390625, -1.8778076171875, -1.65771484375, -1.4376220703125, -1.217529296875, -0.9974365234375, -0.77734375, -0.5572509765625, -0.337158203125, -0.1170654296875, 0.10302734375, 0.3231201171875, 0.543212890625, 0.7633056640625, 0.9833984375, 1.2034912109375, 1.423583984375, 1.6436767578125, 1.86376953125, 2.0838623046875, 2.303955078125, 2.5240478515625, 2.744140625, 2.9642333984375, 3.184326171875, 3.4044189453125, 3.62451171875, 3.8446044921875, 4.064697265625, 4.2847900390625, 4.5048828125, 4.7249755859375, 4.945068359375, 5.1651611328125, 5.38525390625, 5.6053466796875, 5.825439453125, 6.0455322265625, 6.265625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 6.0, 13.0, 11.0, 20.0, 68.0, 264.0, 443.0, 136.0, 31.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-292.6822509765625, -285.79541015625, -278.9085388183594, -272.0216979980469, -265.13482666015625, -258.24798583984375, -251.3611297607422, -244.47427368164062, -237.58743286132812, -230.70057678222656, -223.813720703125, -216.9268798828125, -210.04002380371094, -203.15316772460938, -196.2663116455078, -189.37945556640625, -182.49261474609375, -175.6057586669922, -168.71890258789062, -161.83206176757812, -154.94520568847656, -148.058349609375, -141.17149353027344, -134.28463745117188, -127.39778137207031, -120.51092529296875, -113.62407684326172, -106.73722076416016, -99.85037231445312, -92.96351623535156, -86.07666015625, -79.18981170654297, -72.30296325683594, -65.41610717773438, -58.529258728027344, -51.64240264892578, -44.75555419921875, -37.86869812011719, -30.98184585571289, -24.094993591308594, -17.208141326904297, -10.3212890625, -3.4344358444213867, 3.4524173736572266, 10.339269638061523, 17.226123809814453, 24.11297607421875, 30.999828338623047, 37.886680603027344, 44.77353286743164, 51.66038513183594, 58.5472412109375, 65.43408966064453, 72.3209457397461, 79.20779418945312, 86.09465026855469, 92.98150634765625, 99.86836242675781, 106.75521087646484, 113.6420669555664, 120.52891540527344, 127.415771484375, 134.30262756347656, 141.18948364257812, 148.07632446289062]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 10.0, 18.0, 19.0, 19.0, 27.0, 25.0, 30.0, 42.0, 41.0, 56.0, 62.0, 80.0, 106.0, 84.0, 62.0, 51.0, 55.0, 25.0, 29.0, 24.0, 27.0, 17.0, 24.0, 13.0, 11.0, 6.0, 9.0, 4.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.449310302734375, -56.087928771972656, -53.7265510559082, -51.36517333984375, -49.00379180908203, -46.64241027832031, -44.28103256225586, -41.919654846191406, -39.55827331542969, -37.19689178466797, -34.835514068603516, -32.47413635253906, -30.112754821777344, -27.751375198364258, -25.389995574951172, -23.028615951538086, -20.667236328125, -18.305856704711914, -15.944477081298828, -13.583097457885742, -11.221717834472656, -8.86033821105957, -6.498958587646484, -4.137578964233398, -1.7761993408203125, 0.5851802825927734, 2.9465599060058594, 5.307939529418945, 7.669319152832031, 10.030698776245117, 12.392078399658203, 14.753458023071289, 17.114837646484375, 19.47621726989746, 21.837596893310547, 24.198976516723633, 26.56035614013672, 28.921735763549805, 31.28311538696289, 33.644493103027344, 36.00587463378906, 38.36725616455078, 40.728633880615234, 43.09001159667969, 45.451393127441406, 47.812774658203125, 50.17415237426758, 52.53553009033203, 54.89691162109375, 57.25829315185547, 59.61967086791992, 61.981048583984375, 64.3424301147461, 66.70381164550781, 69.065185546875, 71.42656707763672, 73.78794860839844, 76.14933013916016, 78.51071166992188, 80.87208557128906, 83.23346710205078, 85.5948486328125, 87.95622253417969, 90.3176040649414, 92.67898559570312]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 13.0, 8.0, 18.0, 48.0, 72.0, 182.0, 542.0, 2458.0, 36556.0, 4103170.0, 47448.0, 2766.0, 617.0, 202.0, 84.0, 46.0, 28.0, 4.0, 12.0, 4.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.5, -22.85693359375, -22.2138671875, -21.57080078125, -20.927734375, -20.28466796875, -19.6416015625, -18.99853515625, -18.35546875, -17.71240234375, -17.0693359375, -16.42626953125, -15.783203125, -15.14013671875, -14.4970703125, -13.85400390625, -13.2109375, -12.56787109375, -11.9248046875, -11.28173828125, -10.638671875, -9.99560546875, -9.3525390625, -8.70947265625, -8.06640625, -7.42333984375, -6.7802734375, -6.13720703125, -5.494140625, -4.85107421875, -4.2080078125, -3.56494140625, -2.921875, -2.27880859375, -1.6357421875, -0.99267578125, -0.349609375, 0.29345703125, 0.9365234375, 1.57958984375, 2.22265625, 2.86572265625, 3.5087890625, 4.15185546875, 4.794921875, 5.43798828125, 6.0810546875, 6.72412109375, 7.3671875, 8.01025390625, 8.6533203125, 9.29638671875, 9.939453125, 10.58251953125, 11.2255859375, 11.86865234375, 12.51171875, 13.15478515625, 13.7978515625, 14.44091796875, 15.083984375, 15.72705078125, 16.3701171875, 17.01318359375, 17.65625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 9.0, 18.0, 28.0, 36.0, 50.0, 83.0, 89.0, 85.0, 110.0, 117.0, 95.0, 86.0, 68.0, 36.0, 25.0, 20.0, 11.0, 5.0, 6.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7109375, -6.4693603515625, -6.227783203125, -5.9862060546875, -5.74462890625, -5.5030517578125, -5.261474609375, -5.0198974609375, -4.7783203125, -4.5367431640625, -4.295166015625, -4.0535888671875, -3.81201171875, -3.5704345703125, -3.328857421875, -3.0872802734375, -2.845703125, -2.6041259765625, -2.362548828125, -2.1209716796875, -1.87939453125, -1.6378173828125, -1.396240234375, -1.1546630859375, -0.9130859375, -0.6715087890625, -0.429931640625, -0.1883544921875, 0.05322265625, 0.2947998046875, 0.536376953125, 0.7779541015625, 1.01953125, 1.2611083984375, 1.502685546875, 1.7442626953125, 1.98583984375, 2.2274169921875, 2.468994140625, 2.7105712890625, 2.9521484375, 3.1937255859375, 3.435302734375, 3.6768798828125, 3.91845703125, 4.1600341796875, 4.401611328125, 4.6431884765625, 4.884765625, 5.1263427734375, 5.367919921875, 5.6094970703125, 5.85107421875, 6.0926513671875, 6.334228515625, 6.5758056640625, 6.8173828125, 7.0589599609375, 7.300537109375, 7.5421142578125, 7.78369140625, 8.0252685546875, 8.266845703125, 8.5084228515625, 8.75]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 8.0, 4.0, 11.0, 10.0, 18.0, 22.0, 53.0, 101.0, 162.0, 386.0, 845.0, 1888.0, 5923.0, 65471.0, 4048603.0, 58564.0, 6811.0, 2622.0, 1279.0, 668.0, 347.0, 178.0, 111.0, 55.0, 39.0, 28.0, 12.0, 16.0, 9.0, 11.0, 7.0, 4.0, 8.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-20.296875, -19.7403564453125, -19.183837890625, -18.6273193359375, -18.07080078125, -17.5142822265625, -16.957763671875, -16.4012451171875, -15.8447265625, -15.2882080078125, -14.731689453125, -14.1751708984375, -13.61865234375, -13.0621337890625, -12.505615234375, -11.9490966796875, -11.392578125, -10.8360595703125, -10.279541015625, -9.7230224609375, -9.16650390625, -8.6099853515625, -8.053466796875, -7.4969482421875, -6.9404296875, -6.3839111328125, -5.827392578125, -5.2708740234375, -4.71435546875, -4.1578369140625, -3.601318359375, -3.0447998046875, -2.48828125, -1.9317626953125, -1.375244140625, -0.8187255859375, -0.26220703125, 0.2943115234375, 0.850830078125, 1.4073486328125, 1.9638671875, 2.5203857421875, 3.076904296875, 3.6334228515625, 4.18994140625, 4.7464599609375, 5.302978515625, 5.8594970703125, 6.416015625, 6.9725341796875, 7.529052734375, 8.0855712890625, 8.64208984375, 9.1986083984375, 9.755126953125, 10.3116455078125, 10.8681640625, 11.4246826171875, 11.981201171875, 12.5377197265625, 13.09423828125, 13.6507568359375, 14.207275390625, 14.7637939453125, 15.3203125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 4.0, 9.0, 11.0, 36.0, 72.0, 255.0, 1131.0, 1812.0, 488.0, 126.0, 41.0, 26.0, 23.0, 12.0, 10.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.359375, -12.80712890625, -12.2548828125, -11.70263671875, -11.150390625, -10.59814453125, -10.0458984375, -9.49365234375, -8.94140625, -8.38916015625, -7.8369140625, -7.28466796875, -6.732421875, -6.18017578125, -5.6279296875, -5.07568359375, -4.5234375, -3.97119140625, -3.4189453125, -2.86669921875, -2.314453125, -1.76220703125, -1.2099609375, -0.65771484375, -0.10546875, 0.44677734375, 0.9990234375, 1.55126953125, 2.103515625, 2.65576171875, 3.2080078125, 3.76025390625, 4.3125, 4.86474609375, 5.4169921875, 5.96923828125, 6.521484375, 7.07373046875, 7.6259765625, 8.17822265625, 8.73046875, 9.28271484375, 9.8349609375, 10.38720703125, 10.939453125, 11.49169921875, 12.0439453125, 12.59619140625, 13.1484375, 13.70068359375, 14.2529296875, 14.80517578125, 15.357421875, 15.90966796875, 16.4619140625, 17.01416015625, 17.56640625, 18.11865234375, 18.6708984375, 19.22314453125, 19.775390625, 20.32763671875, 20.8798828125, 21.43212890625, 21.984375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 12.0, 35.0, 690.0, 234.0, 23.0, 4.0, 6.0, 1.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.16606140136719, -107.79784393310547, -95.42962646484375, -83.06141662597656, -70.69319915771484, -58.324981689453125, -45.95677185058594, -33.58855438232422, -21.2203369140625, -8.852121353149414, 3.516094207763672, 15.884307861328125, 28.252525329589844, 40.62074279785156, 52.98895263671875, 65.35717010498047, 77.72538757324219, 90.0936050415039, 102.46182250976562, 114.83003234863281, 127.19824981689453, 139.56646728515625, 151.93467712402344, 164.30288696289062, 176.67111206054688, 189.03932189941406, 201.4075469970703, 213.7757568359375, 226.14398193359375, 238.51219177246094, 250.88040161132812, 263.2486267089844, 275.6168212890625, 287.98504638671875, 300.3532409667969, 312.7214660644531, 325.0896911621094, 337.4578857421875, 349.82611083984375, 362.1943359375, 374.56256103515625, 386.9307861328125, 399.2989807128906, 411.6672058105469, 424.0354309082031, 436.40362548828125, 448.7718505859375, 461.14007568359375, 473.5082702636719, 485.8764953613281, 498.24468994140625, 510.6129150390625, 522.9811401367188, 535.349365234375, 547.717529296875, 560.0857543945312, 572.4539794921875, 584.8222045898438, 597.1904296875, 609.55859375, 621.9268188476562, 634.2950439453125, 646.6632690429688, 659.031494140625, 671.3997192382812]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 11.0, 12.0, 31.0, 39.0, 60.0, 85.0, 101.0, 103.0, 144.0, 112.0, 87.0, 92.0, 35.0, 31.0, 27.0, 14.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.94977569580078, -119.7951431274414, -116.64051055908203, -113.48587799072266, -110.33124542236328, -107.1766128540039, -104.02198028564453, -100.86734771728516, -97.71271514892578, -94.5580825805664, -91.40345001220703, -88.24881744384766, -85.09418487548828, -81.9395523071289, -78.78491973876953, -75.63028717041016, -72.47566223144531, -69.32102966308594, -66.16639709472656, -63.01176452636719, -59.85713195800781, -56.70249938964844, -53.54786682128906, -50.39323425292969, -47.23860168457031, -44.08396911621094, -40.92933654785156, -37.77470397949219, -34.62007141113281, -31.465438842773438, -28.310808181762695, -25.15617561340332, -22.001541137695312, -18.846908569335938, -15.692276000976562, -12.537644386291504, -9.383011817932129, -6.228379249572754, -3.0737476348876953, 0.08088493347167969, 3.2355175018310547, 6.39015007019043, 9.544782638549805, 12.699414253234863, 15.854046821594238, 19.008678436279297, 22.163311004638672, 25.317943572998047, 28.472576141357422, 31.627208709716797, 34.78184127807617, 37.93647384643555, 41.09110641479492, 44.2457389831543, 47.400367736816406, 50.55500030517578, 53.709632873535156, 56.86426544189453, 60.018898010253906, 63.17353057861328, 66.32816314697266, 69.48279571533203, 72.6374282836914, 75.79206085205078, 78.94669342041016]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 10.0, 7.0, 11.0, 9.0, 16.0, 18.0, 39.0, 41.0, 74.0, 88.0, 134.0, 228.0, 323.0, 667.0, 1446.0, 3754.0, 12474.0, 57509.0, 342642.0, 503645.0, 97033.0, 19311.0, 5257.0, 1859.0, 791.0, 414.0, 237.0, 147.0, 99.0, 72.0, 55.0, 31.0, 31.0, 21.0, 15.0, 12.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.40625, -8.144775390625, -7.88330078125, -7.621826171875, -7.3603515625, -7.098876953125, -6.83740234375, -6.575927734375, -6.314453125, -6.052978515625, -5.79150390625, -5.530029296875, -5.2685546875, -5.007080078125, -4.74560546875, -4.484130859375, -4.22265625, -3.961181640625, -3.69970703125, -3.438232421875, -3.1767578125, -2.915283203125, -2.65380859375, -2.392333984375, -2.130859375, -1.869384765625, -1.60791015625, -1.346435546875, -1.0849609375, -0.823486328125, -0.56201171875, -0.300537109375, -0.0390625, 0.222412109375, 0.48388671875, 0.745361328125, 1.0068359375, 1.268310546875, 1.52978515625, 1.791259765625, 2.052734375, 2.314208984375, 2.57568359375, 2.837158203125, 3.0986328125, 3.360107421875, 3.62158203125, 3.883056640625, 4.14453125, 4.406005859375, 4.66748046875, 4.928955078125, 5.1904296875, 5.451904296875, 5.71337890625, 5.974853515625, 6.236328125, 6.497802734375, 6.75927734375, 7.020751953125, 7.2822265625, 7.543701171875, 7.80517578125, 8.066650390625, 8.328125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 6.0, 13.0, 17.0, 26.0, 29.0, 54.0, 77.0, 91.0, 96.0, 89.0, 116.0, 102.0, 86.0, 72.0, 43.0, 23.0, 21.0, 11.0, 11.0, 10.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.6015625, -8.35443115234375, -8.1072998046875, -7.86016845703125, -7.613037109375, -7.36590576171875, -7.1187744140625, -6.87164306640625, -6.62451171875, -6.37738037109375, -6.1302490234375, -5.88311767578125, -5.635986328125, -5.38885498046875, -5.1417236328125, -4.89459228515625, -4.6474609375, -4.40032958984375, -4.1531982421875, -3.90606689453125, -3.658935546875, -3.41180419921875, -3.1646728515625, -2.91754150390625, -2.67041015625, -2.42327880859375, -2.1761474609375, -1.92901611328125, -1.681884765625, -1.43475341796875, -1.1876220703125, -0.94049072265625, -0.693359375, -0.44622802734375, -0.1990966796875, 0.04803466796875, 0.295166015625, 0.54229736328125, 0.7894287109375, 1.03656005859375, 1.28369140625, 1.53082275390625, 1.7779541015625, 2.02508544921875, 2.272216796875, 2.51934814453125, 2.7664794921875, 3.01361083984375, 3.2607421875, 3.50787353515625, 3.7550048828125, 4.00213623046875, 4.249267578125, 4.49639892578125, 4.7435302734375, 4.99066162109375, 5.23779296875, 5.48492431640625, 5.7320556640625, 5.97918701171875, 6.226318359375, 6.47344970703125, 6.7205810546875, 6.96771240234375, 7.21484375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 8.0, 11.0, 12.0, 28.0, 32.0, 40.0, 45.0, 84.0, 115.0, 209.0, 423.0, 934.0, 2435.0, 7972.0, 38905.0, 334281.0, 596095.0, 51898.0, 9843.0, 2960.0, 1103.0, 473.0, 245.0, 139.0, 85.0, 52.0, 25.0, 15.0, 15.0, 19.0, 6.0, 9.0, 8.0, 5.0, 3.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.421875, -11.086669921875, -10.75146484375, -10.416259765625, -10.0810546875, -9.745849609375, -9.41064453125, -9.075439453125, -8.740234375, -8.405029296875, -8.06982421875, -7.734619140625, -7.3994140625, -7.064208984375, -6.72900390625, -6.393798828125, -6.05859375, -5.723388671875, -5.38818359375, -5.052978515625, -4.7177734375, -4.382568359375, -4.04736328125, -3.712158203125, -3.376953125, -3.041748046875, -2.70654296875, -2.371337890625, -2.0361328125, -1.700927734375, -1.36572265625, -1.030517578125, -0.6953125, -0.360107421875, -0.02490234375, 0.310302734375, 0.6455078125, 0.980712890625, 1.31591796875, 1.651123046875, 1.986328125, 2.321533203125, 2.65673828125, 2.991943359375, 3.3271484375, 3.662353515625, 3.99755859375, 4.332763671875, 4.66796875, 5.003173828125, 5.33837890625, 5.673583984375, 6.0087890625, 6.343994140625, 6.67919921875, 7.014404296875, 7.349609375, 7.684814453125, 8.02001953125, 8.355224609375, 8.6904296875, 9.025634765625, 9.36083984375, 9.696044921875, 10.03125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 6.0, 10.0, 12.0, 15.0, 18.0, 30.0, 17.0, 22.0, 26.0, 38.0, 44.0, 38.0, 44.0, 55.0, 48.0, 57.0, 55.0, 63.0, 48.0, 61.0, 51.0, 38.0, 36.0, 29.0, 20.0, 19.0, 17.0, 11.0, 15.0, 14.0, 7.0, 5.0, 8.0, 6.0, 5.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.9296875, -15.4771728515625, -15.024658203125, -14.5721435546875, -14.11962890625, -13.6671142578125, -13.214599609375, -12.7620849609375, -12.3095703125, -11.8570556640625, -11.404541015625, -10.9520263671875, -10.49951171875, -10.0469970703125, -9.594482421875, -9.1419677734375, -8.689453125, -8.2369384765625, -7.784423828125, -7.3319091796875, -6.87939453125, -6.4268798828125, -5.974365234375, -5.5218505859375, -5.0693359375, -4.6168212890625, -4.164306640625, -3.7117919921875, -3.25927734375, -2.8067626953125, -2.354248046875, -1.9017333984375, -1.44921875, -0.9967041015625, -0.544189453125, -0.0916748046875, 0.36083984375, 0.8133544921875, 1.265869140625, 1.7183837890625, 2.1708984375, 2.6234130859375, 3.075927734375, 3.5284423828125, 3.98095703125, 4.4334716796875, 4.885986328125, 5.3385009765625, 5.791015625, 6.2435302734375, 6.696044921875, 7.1485595703125, 7.60107421875, 8.0535888671875, 8.506103515625, 8.9586181640625, 9.4111328125, 9.8636474609375, 10.316162109375, 10.7686767578125, 11.22119140625, 11.6737060546875, 12.126220703125, 12.5787353515625, 13.03125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 8.0, 9.0, 34.0, 52.0, 109.0, 234.0, 575.0, 1631.0, 5670.0, 29481.0, 605832.0, 370717.0, 26198.0, 5401.0, 1602.0, 554.0, 253.0, 83.0, 47.0, 17.0, 17.0, 5.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7734375, -4.628662109375, -4.48388671875, -4.339111328125, -4.1943359375, -4.049560546875, -3.90478515625, -3.760009765625, -3.615234375, -3.470458984375, -3.32568359375, -3.180908203125, -3.0361328125, -2.891357421875, -2.74658203125, -2.601806640625, -2.45703125, -2.312255859375, -2.16748046875, -2.022705078125, -1.8779296875, -1.733154296875, -1.58837890625, -1.443603515625, -1.298828125, -1.154052734375, -1.00927734375, -0.864501953125, -0.7197265625, -0.574951171875, -0.43017578125, -0.285400390625, -0.140625, 0.004150390625, 0.14892578125, 0.293701171875, 0.4384765625, 0.583251953125, 0.72802734375, 0.872802734375, 1.017578125, 1.162353515625, 1.30712890625, 1.451904296875, 1.5966796875, 1.741455078125, 1.88623046875, 2.031005859375, 2.17578125, 2.320556640625, 2.46533203125, 2.610107421875, 2.7548828125, 2.899658203125, 3.04443359375, 3.189208984375, 3.333984375, 3.478759765625, 3.62353515625, 3.768310546875, 3.9130859375, 4.057861328125, 4.20263671875, 4.347412109375, 4.4921875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 6.0, 15.0, 20.0, 43.0, 91.0, 237.0, 311.0, 158.0, 46.0, 25.0, 14.0, 8.0, 8.0, 5.0, 7.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0016460418701171875, -0.0016018599271774292, -0.001557677984237671, -0.0015134960412979126, -0.0014693140983581543, -0.001425132155418396, -0.0013809502124786377, -0.0013367682695388794, -0.001292586326599121, -0.0012484043836593628, -0.0012042224407196045, -0.0011600404977798462, -0.0011158585548400879, -0.0010716766119003296, -0.0010274946689605713, -0.000983312726020813, -0.0009391307830810547, -0.0008949488401412964, -0.0008507668972015381, -0.0008065849542617798, -0.0007624030113220215, -0.0007182210683822632, -0.0006740391254425049, -0.0006298571825027466, -0.0005856752395629883, -0.00054149329662323, -0.0004973113536834717, -0.0004531294107437134, -0.0004089474678039551, -0.0003647655248641968, -0.0003205835819244385, -0.0002764016389846802, -0.00023221969604492188, -0.00018803775310516357, -0.00014385581016540527, -9.967386722564697e-05, -5.549192428588867e-05, -1.1309981346130371e-05, 3.287196159362793e-05, 7.705390453338623e-05, 0.00012123584747314453, 0.00016541779041290283, 0.00020959973335266113, 0.00025378167629241943, 0.00029796361923217773, 0.00034214556217193604, 0.00038632750511169434, 0.00043050944805145264, 0.00047469139099121094, 0.0005188733339309692, 0.0005630552768707275, 0.0006072372198104858, 0.0006514191627502441, 0.0006956011056900024, 0.0007397830486297607, 0.000783964991569519, 0.0008281469345092773, 0.0008723288774490356, 0.0009165108203887939, 0.0009606927633285522, 0.0010048747062683105, 0.0010490566492080688, 0.0010932385921478271, 0.0011374205350875854, 0.0011816024780273438]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 6.0, 8.0, 9.0, 13.0, 10.0, 24.0, 29.0, 35.0, 65.0, 106.0, 190.0, 359.0, 708.0, 1628.0, 3747.0, 10218.0, 33402.0, 161661.0, 672420.0, 122101.0, 26956.0, 8719.0, 3254.0, 1409.0, 645.0, 353.0, 175.0, 107.0, 52.0, 44.0, 26.0, 25.0, 13.0, 13.0, 8.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.23046875, -2.142730712890625, -2.05499267578125, -1.967254638671875, -1.8795166015625, -1.791778564453125, -1.70404052734375, -1.616302490234375, -1.528564453125, -1.440826416015625, -1.35308837890625, -1.265350341796875, -1.1776123046875, -1.089874267578125, -1.00213623046875, -0.914398193359375, -0.82666015625, -0.738922119140625, -0.65118408203125, -0.563446044921875, -0.4757080078125, -0.387969970703125, -0.30023193359375, -0.212493896484375, -0.124755859375, -0.037017822265625, 0.05072021484375, 0.138458251953125, 0.2261962890625, 0.313934326171875, 0.40167236328125, 0.489410400390625, 0.5771484375, 0.664886474609375, 0.75262451171875, 0.840362548828125, 0.9281005859375, 1.015838623046875, 1.10357666015625, 1.191314697265625, 1.279052734375, 1.366790771484375, 1.45452880859375, 1.542266845703125, 1.6300048828125, 1.717742919921875, 1.80548095703125, 1.893218994140625, 1.98095703125, 2.068695068359375, 2.15643310546875, 2.244171142578125, 2.3319091796875, 2.419647216796875, 2.50738525390625, 2.595123291015625, 2.682861328125, 2.770599365234375, 2.85833740234375, 2.946075439453125, 3.0338134765625, 3.121551513671875, 3.20928955078125, 3.297027587890625, 3.384765625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 8.0, 12.0, 12.0, 6.0, 10.0, 22.0, 35.0, 44.0, 71.0, 98.0, 110.0, 108.0, 115.0, 94.0, 70.0, 49.0, 37.0, 28.0, 23.0, 15.0, 10.0, 4.0, 5.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.06640625, -2.958984375, -2.8515625, -2.744140625, -2.63671875, -2.529296875, -2.421875, -2.314453125, -2.20703125, -2.099609375, -1.9921875, -1.884765625, -1.77734375, -1.669921875, -1.5625, -1.455078125, -1.34765625, -1.240234375, -1.1328125, -1.025390625, -0.91796875, -0.810546875, -0.703125, -0.595703125, -0.48828125, -0.380859375, -0.2734375, -0.166015625, -0.05859375, 0.048828125, 0.15625, 0.263671875, 0.37109375, 0.478515625, 0.5859375, 0.693359375, 0.80078125, 0.908203125, 1.015625, 1.123046875, 1.23046875, 1.337890625, 1.4453125, 1.552734375, 1.66015625, 1.767578125, 1.875, 1.982421875, 2.08984375, 2.197265625, 2.3046875, 2.412109375, 2.51953125, 2.626953125, 2.734375, 2.841796875, 2.94921875, 3.056640625, 3.1640625, 3.271484375, 3.37890625, 3.486328125, 3.59375, 3.701171875, 3.80859375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 13.0, 34.0, 138.0, 515.0, 213.0, 51.0, 16.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-241.558837890625, -236.14993286132812, -230.7410430908203, -225.33213806152344, -219.92324829101562, -214.51434326171875, -209.10543823242188, -203.69654846191406, -198.2876434326172, -192.8787384033203, -187.4698486328125, -182.06094360351562, -176.6520538330078, -171.24314880371094, -165.83425903320312, -160.42535400390625, -155.01644897460938, -149.6075439453125, -144.1986541748047, -138.7897491455078, -133.380859375, -127.97195434570312, -122.56305694580078, -117.15415954589844, -111.74526977539062, -106.33637237548828, -100.92747497558594, -95.51856994628906, -90.10967254638672, -84.70077514648438, -79.29187774658203, -73.88298034667969, -68.47406768798828, -63.06517028808594, -57.65626907348633, -52.247371673583984, -46.838470458984375, -41.42957305908203, -36.02067565917969, -30.611774444580078, -25.202877044677734, -19.793977737426758, -14.385079383850098, -8.976181030273438, -3.567281723022461, 1.8416175842285156, 7.250514984130859, 12.659416198730469, 18.068313598632812, 23.47721290588379, 28.886112213134766, 34.29500961303711, 39.70391082763672, 45.11280822753906, 50.521705627441406, 55.930606842041016, 61.33950424194336, 66.74840545654297, 72.15730285644531, 77.56620025634766, 82.97509765625, 88.38400268554688, 93.79289245605469, 99.20179748535156, 104.6106948852539]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 9.0, 5.0, 13.0, 18.0, 17.0, 24.0, 34.0, 32.0, 37.0, 34.0, 47.0, 64.0, 73.0, 127.0, 93.0, 49.0, 50.0, 43.0, 51.0, 34.0, 31.0, 22.0, 22.0, 21.0, 13.0, 9.0, 11.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-71.80262756347656, -69.66513061523438, -67.52763366699219, -65.39014434814453, -63.252647399902344, -61.115150451660156, -58.977657318115234, -56.84016418457031, -54.702667236328125, -52.56517028808594, -50.427677154541016, -48.290184020996094, -46.152687072753906, -44.01519012451172, -41.8776969909668, -39.740203857421875, -37.60270690917969, -35.4652099609375, -33.32771682739258, -31.190221786499023, -29.05272674560547, -26.915231704711914, -24.77773666381836, -22.640241622924805, -20.50274658203125, -18.365251541137695, -16.22775650024414, -14.090261459350586, -11.952766418457031, -9.815271377563477, -7.677776336669922, -5.540281295776367, -3.4027862548828125, -1.2652912139892578, 0.8722038269042969, 3.0096988677978516, 5.147193908691406, 7.284688949584961, 9.422183990478516, 11.55967903137207, 13.697174072265625, 15.83466911315918, 17.972164154052734, 20.10965919494629, 22.247154235839844, 24.3846492767334, 26.522144317626953, 28.659639358520508, 30.797134399414062, 32.93463134765625, 35.07212448120117, 37.209617614746094, 39.34711456298828, 41.48461151123047, 43.62210464477539, 45.75959777832031, 47.8970947265625, 50.03459167480469, 52.17208480834961, 54.30957794189453, 56.44707489013672, 58.584571838378906, 60.72206497192383, 62.85955810546875, 64.99705505371094]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 7.0, 2.0, 6.0, 9.0, 10.0, 14.0, 25.0, 36.0, 61.0, 108.0, 150.0, 258.0, 514.0, 951.0, 2455.0, 8576.0, 66569.0, 1535252.0, 2460844.0, 99975.0, 12007.0, 3432.0, 1438.0, 662.0, 346.0, 209.0, 106.0, 90.0, 53.0, 32.0, 25.0, 21.0, 8.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.2421875, -7.04150390625, -6.8408203125, -6.64013671875, -6.439453125, -6.23876953125, -6.0380859375, -5.83740234375, -5.63671875, -5.43603515625, -5.2353515625, -5.03466796875, -4.833984375, -4.63330078125, -4.4326171875, -4.23193359375, -4.03125, -3.83056640625, -3.6298828125, -3.42919921875, -3.228515625, -3.02783203125, -2.8271484375, -2.62646484375, -2.42578125, -2.22509765625, -2.0244140625, -1.82373046875, -1.623046875, -1.42236328125, -1.2216796875, -1.02099609375, -0.8203125, -0.61962890625, -0.4189453125, -0.21826171875, -0.017578125, 0.18310546875, 0.3837890625, 0.58447265625, 0.78515625, 0.98583984375, 1.1865234375, 1.38720703125, 1.587890625, 1.78857421875, 1.9892578125, 2.18994140625, 2.390625, 2.59130859375, 2.7919921875, 2.99267578125, 3.193359375, 3.39404296875, 3.5947265625, 3.79541015625, 3.99609375, 4.19677734375, 4.3974609375, 4.59814453125, 4.798828125, 4.99951171875, 5.2001953125, 5.40087890625, 5.6015625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 8.0, 5.0, 12.0, 8.0, 17.0, 22.0, 41.0, 39.0, 72.0, 63.0, 70.0, 83.0, 72.0, 70.0, 93.0, 73.0, 60.0, 46.0, 31.0, 27.0, 21.0, 30.0, 9.0, 5.0, 14.0, 3.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.3671875, -6.18450927734375, -6.0018310546875, -5.81915283203125, -5.636474609375, -5.45379638671875, -5.2711181640625, -5.08843994140625, -4.90576171875, -4.72308349609375, -4.5404052734375, -4.35772705078125, -4.175048828125, -3.99237060546875, -3.8096923828125, -3.62701416015625, -3.4443359375, -3.26165771484375, -3.0789794921875, -2.89630126953125, -2.713623046875, -2.53094482421875, -2.3482666015625, -2.16558837890625, -1.98291015625, -1.80023193359375, -1.6175537109375, -1.43487548828125, -1.252197265625, -1.06951904296875, -0.8868408203125, -0.70416259765625, -0.521484375, -0.33880615234375, -0.1561279296875, 0.02655029296875, 0.209228515625, 0.39190673828125, 0.5745849609375, 0.75726318359375, 0.93994140625, 1.12261962890625, 1.3052978515625, 1.48797607421875, 1.670654296875, 1.85333251953125, 2.0360107421875, 2.21868896484375, 2.4013671875, 2.58404541015625, 2.7667236328125, 2.94940185546875, 3.132080078125, 3.31475830078125, 3.4974365234375, 3.68011474609375, 3.86279296875, 4.04547119140625, 4.2281494140625, 4.41082763671875, 4.593505859375, 4.77618408203125, 4.9588623046875, 5.14154052734375, 5.32421875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 7.0, 11.0, 26.0, 58.0, 167.0, 505.0, 1970.0, 39627.0, 4127314.0, 22358.0, 1564.0, 412.0, 145.0, 54.0, 35.0, 18.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.4375, -20.776611328125, -20.11572265625, -19.454833984375, -18.7939453125, -18.133056640625, -17.47216796875, -16.811279296875, -16.150390625, -15.489501953125, -14.82861328125, -14.167724609375, -13.5068359375, -12.845947265625, -12.18505859375, -11.524169921875, -10.86328125, -10.202392578125, -9.54150390625, -8.880615234375, -8.2197265625, -7.558837890625, -6.89794921875, -6.237060546875, -5.576171875, -4.915283203125, -4.25439453125, -3.593505859375, -2.9326171875, -2.271728515625, -1.61083984375, -0.949951171875, -0.2890625, 0.371826171875, 1.03271484375, 1.693603515625, 2.3544921875, 3.015380859375, 3.67626953125, 4.337158203125, 4.998046875, 5.658935546875, 6.31982421875, 6.980712890625, 7.6416015625, 8.302490234375, 8.96337890625, 9.624267578125, 10.28515625, 10.946044921875, 11.60693359375, 12.267822265625, 12.9287109375, 13.589599609375, 14.25048828125, 14.911376953125, 15.572265625, 16.233154296875, 16.89404296875, 17.554931640625, 18.2158203125, 18.876708984375, 19.53759765625, 20.198486328125, 20.859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 10.0, 8.0, 14.0, 41.0, 51.0, 112.0, 255.0, 535.0, 968.0, 1053.0, 531.0, 248.0, 104.0, 53.0, 21.0, 28.0, 11.0, 8.0, 6.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.84765625, -6.56231689453125, -6.2769775390625, -5.99163818359375, -5.706298828125, -5.42095947265625, -5.1356201171875, -4.85028076171875, -4.56494140625, -4.27960205078125, -3.9942626953125, -3.70892333984375, -3.423583984375, -3.13824462890625, -2.8529052734375, -2.56756591796875, -2.2822265625, -1.99688720703125, -1.7115478515625, -1.42620849609375, -1.140869140625, -0.85552978515625, -0.5701904296875, -0.28485107421875, 0.00048828125, 0.28582763671875, 0.5711669921875, 0.85650634765625, 1.141845703125, 1.42718505859375, 1.7125244140625, 1.99786376953125, 2.283203125, 2.56854248046875, 2.8538818359375, 3.13922119140625, 3.424560546875, 3.70989990234375, 3.9952392578125, 4.28057861328125, 4.56591796875, 4.85125732421875, 5.1365966796875, 5.42193603515625, 5.707275390625, 5.99261474609375, 6.2779541015625, 6.56329345703125, 6.8486328125, 7.13397216796875, 7.4193115234375, 7.70465087890625, 7.989990234375, 8.27532958984375, 8.5606689453125, 8.84600830078125, 9.13134765625, 9.41668701171875, 9.7020263671875, 9.98736572265625, 10.272705078125, 10.55804443359375, 10.8433837890625, 11.12872314453125, 11.4140625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 6.0, 26.0, 51.0, 134.0, 252.0, 262.0, 151.0, 66.0, 28.0, 11.0, 7.0, 8.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.0130615234375, -61.362998962402344, -58.71293640136719, -56.06287384033203, -53.41280746459961, -50.76274490356445, -48.1126823425293, -45.462615966796875, -42.81255340576172, -40.16249084472656, -37.512428283691406, -34.86236572265625, -32.21229934692383, -29.562236785888672, -26.912174224853516, -24.262109756469727, -21.612049102783203, -18.961986541748047, -16.311922073364258, -13.661859512329102, -11.011795997619629, -8.361732482910156, -5.711669921875, -3.061605453491211, -0.4115428924560547, 2.238520383834839, 4.888583660125732, 7.538646697998047, 10.18871021270752, 12.838773727416992, 15.488836288452148, 18.138900756835938, 20.788963317871094, 23.43902587890625, 26.08909034729004, 28.739152908325195, 31.389217376708984, 34.03927993774414, 36.6893424987793, 39.33940887451172, 41.989471435546875, 44.63953399658203, 47.28959655761719, 49.939659118652344, 52.589725494384766, 55.23978805541992, 57.88985061645508, 60.5399169921875, 63.18997573852539, 65.84004211425781, 68.49010467529297, 71.14016723632812, 73.79022979736328, 76.44029235839844, 79.0903549194336, 81.74041748046875, 84.3904800415039, 87.04054260253906, 89.69060516357422, 92.34066772460938, 94.99073028564453, 97.64079284667969, 100.29086303710938, 102.94092559814453, 105.59098815917969]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 9.0, 4.0, 15.0, 11.0, 20.0, 17.0, 26.0, 30.0, 33.0, 33.0, 39.0, 46.0, 50.0, 62.0, 47.0, 58.0, 54.0, 58.0, 58.0, 44.0, 40.0, 46.0, 39.0, 35.0, 19.0, 16.0, 24.0, 20.0, 17.0, 11.0, 6.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.986772537231445, -28.023006439208984, -27.05923843383789, -26.09547233581543, -25.131704330444336, -24.167938232421875, -23.20417022705078, -22.24040412902832, -21.27663803100586, -20.3128719329834, -19.349103927612305, -18.385337829589844, -17.42156982421875, -16.45780372619629, -15.494036674499512, -14.530269622802734, -13.56650161743164, -12.602734565734863, -11.638967514038086, -10.675201416015625, -9.711433410644531, -8.74766731262207, -7.783900260925293, -6.820133209228516, -5.856366157531738, -4.892599105834961, -3.9288322925567627, -2.9650654792785645, -2.001298427581787, -1.0375313758850098, -0.07376480102539062, 0.8900022506713867, 1.8537712097167969, 2.817538261413574, 3.7813050746917725, 4.745071887969971, 5.708838939666748, 6.672605991363525, 7.6363725662231445, 8.600139617919922, 9.5639066696167, 10.527673721313477, 11.491440773010254, 12.455207824707031, 13.418973922729492, 14.382741928100586, 15.346508026123047, 16.31027603149414, 17.2740421295166, 18.237808227539062, 19.201576232910156, 20.165342330932617, 21.12911033630371, 22.092876434326172, 23.056644439697266, 24.020410537719727, 24.984176635742188, 25.94794273376465, 26.911710739135742, 27.875476837158203, 28.839244842529297, 29.803010940551758, 30.76677703857422, 31.730545043945312, 32.694313049316406]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 14.0, 10.0, 20.0, 25.0, 36.0, 45.0, 67.0, 130.0, 235.0, 527.0, 1194.0, 3330.0, 11682.0, 55776.0, 366165.0, 504530.0, 81539.0, 16225.0, 4250.0, 1464.0, 569.0, 307.0, 138.0, 90.0, 57.0, 33.0, 30.0, 18.0, 13.0, 12.0, 6.0, 8.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.65625, -8.4024658203125, -8.148681640625, -7.8948974609375, -7.64111328125, -7.3873291015625, -7.133544921875, -6.8797607421875, -6.6259765625, -6.3721923828125, -6.118408203125, -5.8646240234375, -5.61083984375, -5.3570556640625, -5.103271484375, -4.8494873046875, -4.595703125, -4.3419189453125, -4.088134765625, -3.8343505859375, -3.58056640625, -3.3267822265625, -3.072998046875, -2.8192138671875, -2.5654296875, -2.3116455078125, -2.057861328125, -1.8040771484375, -1.55029296875, -1.2965087890625, -1.042724609375, -0.7889404296875, -0.53515625, -0.2813720703125, -0.027587890625, 0.2261962890625, 0.47998046875, 0.7337646484375, 0.987548828125, 1.2413330078125, 1.4951171875, 1.7489013671875, 2.002685546875, 2.2564697265625, 2.51025390625, 2.7640380859375, 3.017822265625, 3.2716064453125, 3.525390625, 3.7791748046875, 4.032958984375, 4.2867431640625, 4.54052734375, 4.7943115234375, 5.048095703125, 5.3018798828125, 5.5556640625, 5.8094482421875, 6.063232421875, 6.3170166015625, 6.57080078125, 6.8245849609375, 7.078369140625, 7.3321533203125, 7.5859375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 8.0, 9.0, 9.0, 15.0, 21.0, 20.0, 28.0, 45.0, 47.0, 62.0, 81.0, 91.0, 61.0, 75.0, 74.0, 75.0, 57.0, 45.0, 38.0, 39.0, 30.0, 19.0, 17.0, 13.0, 8.0, 4.0, 8.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.39453125, -6.21209716796875, -6.0296630859375, -5.84722900390625, -5.664794921875, -5.48236083984375, -5.2999267578125, -5.11749267578125, -4.93505859375, -4.75262451171875, -4.5701904296875, -4.38775634765625, -4.205322265625, -4.02288818359375, -3.8404541015625, -3.65802001953125, -3.4755859375, -3.29315185546875, -3.1107177734375, -2.92828369140625, -2.745849609375, -2.56341552734375, -2.3809814453125, -2.19854736328125, -2.01611328125, -1.83367919921875, -1.6512451171875, -1.46881103515625, -1.286376953125, -1.10394287109375, -0.9215087890625, -0.73907470703125, -0.556640625, -0.37420654296875, -0.1917724609375, -0.00933837890625, 0.173095703125, 0.35552978515625, 0.5379638671875, 0.72039794921875, 0.90283203125, 1.08526611328125, 1.2677001953125, 1.45013427734375, 1.632568359375, 1.81500244140625, 1.9974365234375, 2.17987060546875, 2.3623046875, 2.54473876953125, 2.7271728515625, 2.90960693359375, 3.092041015625, 3.27447509765625, 3.4569091796875, 3.63934326171875, 3.82177734375, 4.00421142578125, 4.1866455078125, 4.36907958984375, 4.551513671875, 4.73394775390625, 4.9163818359375, 5.09881591796875, 5.28125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 1.0, 5.0, 10.0, 6.0, 21.0, 30.0, 36.0, 54.0, 64.0, 111.0, 211.0, 336.0, 699.0, 1688.0, 6829.0, 60592.0, 852073.0, 111961.0, 9916.0, 2171.0, 759.0, 330.0, 223.0, 124.0, 91.0, 64.0, 45.0, 26.0, 19.0, 15.0, 15.0, 5.0, 6.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7421875, -14.2900390625, -13.837890625, -13.3857421875, -12.93359375, -12.4814453125, -12.029296875, -11.5771484375, -11.125, -10.6728515625, -10.220703125, -9.7685546875, -9.31640625, -8.8642578125, -8.412109375, -7.9599609375, -7.5078125, -7.0556640625, -6.603515625, -6.1513671875, -5.69921875, -5.2470703125, -4.794921875, -4.3427734375, -3.890625, -3.4384765625, -2.986328125, -2.5341796875, -2.08203125, -1.6298828125, -1.177734375, -0.7255859375, -0.2734375, 0.1787109375, 0.630859375, 1.0830078125, 1.53515625, 1.9873046875, 2.439453125, 2.8916015625, 3.34375, 3.7958984375, 4.248046875, 4.7001953125, 5.15234375, 5.6044921875, 6.056640625, 6.5087890625, 6.9609375, 7.4130859375, 7.865234375, 8.3173828125, 8.76953125, 9.2216796875, 9.673828125, 10.1259765625, 10.578125, 11.0302734375, 11.482421875, 11.9345703125, 12.38671875, 12.8388671875, 13.291015625, 13.7431640625, 14.1953125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 8.0, 8.0, 7.0, 10.0, 14.0, 17.0, 22.0, 20.0, 19.0, 32.0, 43.0, 45.0, 48.0, 37.0, 39.0, 53.0, 57.0, 50.0, 52.0, 49.0, 55.0, 42.0, 53.0, 45.0, 27.0, 29.0, 27.0, 20.0, 21.0, 11.0, 10.0, 7.0, 7.0, 6.0, 4.0, 5.0, 0.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.96875, -13.511474609375, -13.05419921875, -12.596923828125, -12.1396484375, -11.682373046875, -11.22509765625, -10.767822265625, -10.310546875, -9.853271484375, -9.39599609375, -8.938720703125, -8.4814453125, -8.024169921875, -7.56689453125, -7.109619140625, -6.65234375, -6.195068359375, -5.73779296875, -5.280517578125, -4.8232421875, -4.365966796875, -3.90869140625, -3.451416015625, -2.994140625, -2.536865234375, -2.07958984375, -1.622314453125, -1.1650390625, -0.707763671875, -0.25048828125, 0.206787109375, 0.6640625, 1.121337890625, 1.57861328125, 2.035888671875, 2.4931640625, 2.950439453125, 3.40771484375, 3.864990234375, 4.322265625, 4.779541015625, 5.23681640625, 5.694091796875, 6.1513671875, 6.608642578125, 7.06591796875, 7.523193359375, 7.98046875, 8.437744140625, 8.89501953125, 9.352294921875, 9.8095703125, 10.266845703125, 10.72412109375, 11.181396484375, 11.638671875, 12.095947265625, 12.55322265625, 13.010498046875, 13.4677734375, 13.925048828125, 14.38232421875, 14.839599609375, 15.296875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 5.0, 8.0, 12.0, 7.0, 16.0, 17.0, 31.0, 56.0, 95.0, 154.0, 303.0, 682.0, 1504.0, 3981.0, 12561.0, 54763.0, 762196.0, 173890.0, 26453.0, 7202.0, 2567.0, 1022.0, 463.0, 224.0, 131.0, 69.0, 41.0, 31.0, 12.0, 8.0, 5.0, 8.0, 3.0, 3.0, 6.0, 5.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.27734375, -3.1741943359375, -3.071044921875, -2.9678955078125, -2.86474609375, -2.7615966796875, -2.658447265625, -2.5552978515625, -2.4521484375, -2.3489990234375, -2.245849609375, -2.1427001953125, -2.03955078125, -1.9364013671875, -1.833251953125, -1.7301025390625, -1.626953125, -1.5238037109375, -1.420654296875, -1.3175048828125, -1.21435546875, -1.1112060546875, -1.008056640625, -0.9049072265625, -0.8017578125, -0.6986083984375, -0.595458984375, -0.4923095703125, -0.38916015625, -0.2860107421875, -0.182861328125, -0.0797119140625, 0.0234375, 0.1265869140625, 0.229736328125, 0.3328857421875, 0.43603515625, 0.5391845703125, 0.642333984375, 0.7454833984375, 0.8486328125, 0.9517822265625, 1.054931640625, 1.1580810546875, 1.26123046875, 1.3643798828125, 1.467529296875, 1.5706787109375, 1.673828125, 1.7769775390625, 1.880126953125, 1.9832763671875, 2.08642578125, 2.1895751953125, 2.292724609375, 2.3958740234375, 2.4990234375, 2.6021728515625, 2.705322265625, 2.8084716796875, 2.91162109375, 3.0147705078125, 3.117919921875, 3.2210693359375, 3.32421875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 1.0, 4.0, 4.0, 5.0, 8.0, 8.0, 11.0, 16.0, 18.0, 26.0, 44.0, 73.0, 96.0, 173.0, 194.0, 120.0, 67.0, 45.0, 28.0, 13.0, 13.0, 8.0, 7.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0009832382202148438, -0.0009593069553375244, -0.0009353756904602051, -0.0009114444255828857, -0.0008875131607055664, -0.0008635818958282471, -0.0008396506309509277, -0.0008157193660736084, -0.0007917881011962891, -0.0007678568363189697, -0.0007439255714416504, -0.0007199943065643311, -0.0006960630416870117, -0.0006721317768096924, -0.000648200511932373, -0.0006242692470550537, -0.0006003379821777344, -0.000576406717300415, -0.0005524754524230957, -0.0005285441875457764, -0.000504612922668457, -0.0004806816577911377, -0.00045675039291381836, -0.000432819128036499, -0.0004088878631591797, -0.00038495659828186035, -0.000361025333404541, -0.0003370940685272217, -0.00031316280364990234, -0.000289231538772583, -0.00026530027389526367, -0.00024136900901794434, -0.000217437744140625, -0.00019350647926330566, -0.00016957521438598633, -0.000145643949508667, -0.00012171268463134766, -9.778141975402832e-05, -7.385015487670898e-05, -4.991888999938965e-05, -2.5987625122070312e-05, -2.0563602447509766e-06, 2.187490463256836e-05, 4.5806169509887695e-05, 6.973743438720703e-05, 9.366869926452637e-05, 0.0001175999641418457, 0.00014153122901916504, 0.00016546249389648438, 0.0001893937587738037, 0.00021332502365112305, 0.00023725628852844238, 0.0002611875534057617, 0.00028511881828308105, 0.0003090500831604004, 0.0003329813480377197, 0.00035691261291503906, 0.0003808438777923584, 0.00040477514266967773, 0.00042870640754699707, 0.0004526376724243164, 0.00047656893730163574, 0.0005005002021789551, 0.0005244314670562744, 0.0005483627319335938]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 1.0, 5.0, 9.0, 24.0, 52.0, 58.0, 93.0, 181.0, 387.0, 982.0, 3653.0, 24109.0, 789944.0, 211657.0, 13540.0, 2465.0, 745.0, 303.0, 171.0, 84.0, 36.0, 29.0, 8.0, 7.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87109375, -5.70269775390625, -5.5343017578125, -5.36590576171875, -5.197509765625, -5.02911376953125, -4.8607177734375, -4.69232177734375, -4.52392578125, -4.35552978515625, -4.1871337890625, -4.01873779296875, -3.850341796875, -3.68194580078125, -3.5135498046875, -3.34515380859375, -3.1767578125, -3.00836181640625, -2.8399658203125, -2.67156982421875, -2.503173828125, -2.33477783203125, -2.1663818359375, -1.99798583984375, -1.82958984375, -1.66119384765625, -1.4927978515625, -1.32440185546875, -1.156005859375, -0.98760986328125, -0.8192138671875, -0.65081787109375, -0.482421875, -0.31402587890625, -0.1456298828125, 0.02276611328125, 0.191162109375, 0.35955810546875, 0.5279541015625, 0.69635009765625, 0.86474609375, 1.03314208984375, 1.2015380859375, 1.36993408203125, 1.538330078125, 1.70672607421875, 1.8751220703125, 2.04351806640625, 2.2119140625, 2.38031005859375, 2.5487060546875, 2.71710205078125, 2.885498046875, 3.05389404296875, 3.2222900390625, 3.39068603515625, 3.55908203125, 3.72747802734375, 3.8958740234375, 4.06427001953125, 4.232666015625, 4.40106201171875, 4.5694580078125, 4.73785400390625, 4.90625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 4.0, 11.0, 7.0, 10.0, 17.0, 18.0, 31.0, 50.0, 84.0, 145.0, 215.0, 152.0, 90.0, 53.0, 30.0, 18.0, 18.0, 12.0, 12.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.26953125, -4.142425537109375, -4.01531982421875, -3.888214111328125, -3.7611083984375, -3.634002685546875, -3.50689697265625, -3.379791259765625, -3.252685546875, -3.125579833984375, -2.99847412109375, -2.871368408203125, -2.7442626953125, -2.617156982421875, -2.49005126953125, -2.362945556640625, -2.23583984375, -2.108734130859375, -1.98162841796875, -1.854522705078125, -1.7274169921875, -1.600311279296875, -1.47320556640625, -1.346099853515625, -1.218994140625, -1.091888427734375, -0.96478271484375, -0.837677001953125, -0.7105712890625, -0.583465576171875, -0.45635986328125, -0.329254150390625, -0.2021484375, -0.075042724609375, 0.05206298828125, 0.179168701171875, 0.3062744140625, 0.433380126953125, 0.56048583984375, 0.687591552734375, 0.814697265625, 0.941802978515625, 1.06890869140625, 1.196014404296875, 1.3231201171875, 1.450225830078125, 1.57733154296875, 1.704437255859375, 1.83154296875, 1.958648681640625, 2.08575439453125, 2.212860107421875, 2.3399658203125, 2.467071533203125, 2.59417724609375, 2.721282958984375, 2.848388671875, 2.975494384765625, 3.10260009765625, 3.229705810546875, 3.3568115234375, 3.483917236328125, 3.61102294921875, 3.738128662109375, 3.865234375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 6.0, 18.0, 67.0, 200.0, 489.0, 159.0, 30.0, 14.0, 10.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.41334533691406, -133.06146240234375, -128.7095947265625, -124.35771179199219, -120.0058364868164, -115.65396118164062, -111.30208587646484, -106.95021057128906, -102.59832763671875, -98.24645233154297, -93.89457702636719, -89.54269409179688, -85.1908187866211, -80.83894348144531, -76.48706817626953, -72.13519287109375, -67.78331756591797, -63.43144226074219, -59.07956314086914, -54.72768783569336, -50.37580871582031, -46.02393341064453, -41.67205810546875, -37.32018280029297, -32.96830368041992, -28.616426467895508, -24.264549255371094, -19.912673950195312, -15.560796737670898, -11.208919525146484, -6.857044219970703, -2.505167007446289, 1.846710205078125, 6.198586940765381, 10.550463676452637, 14.902339935302734, 19.25421714782715, 23.606094360351562, 27.957969665527344, 32.309844970703125, 36.66172409057617, 41.01359939575195, 45.365478515625, 49.71735382080078, 54.06922912597656, 58.42110824584961, 62.77298355102539, 67.12486267089844, 71.47673797607422, 75.82861328125, 80.18048858642578, 84.53236389160156, 88.88424682617188, 93.23612213134766, 97.58799743652344, 101.93987274169922, 106.291748046875, 110.64362335205078, 114.99549865722656, 119.34738159179688, 123.69925689697266, 128.05113220214844, 132.40301513671875, 136.7548828125, 141.1067657470703]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 3.0, 8.0, 8.0, 14.0, 12.0, 12.0, 25.0, 26.0, 25.0, 23.0, 36.0, 25.0, 28.0, 29.0, 36.0, 71.0, 91.0, 112.0, 69.0, 63.0, 39.0, 36.0, 22.0, 29.0, 24.0, 20.0, 16.0, 21.0, 14.0, 18.0, 8.0, 7.0, 6.0, 2.0, 7.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.932708740234375, -41.35111618041992, -39.7695198059082, -38.18792724609375, -36.60633087158203, -35.02473831176758, -33.443145751953125, -31.861549377441406, -30.279956817626953, -28.698362350463867, -27.11676788330078, -25.535175323486328, -23.953580856323242, -22.371986389160156, -20.79039192199707, -19.208797454833984, -17.6272029876709, -16.045608520507812, -14.464015007019043, -12.882420539855957, -11.300827026367188, -9.719232559204102, -8.137638092041016, -6.556044578552246, -4.97445011138916, -3.3928561210632324, -1.8112618923187256, -0.22966766357421875, 1.351926326751709, 2.9335203170776367, 4.515114784240723, 6.096708297729492, 7.678302764892578, 9.259897232055664, 10.841490745544434, 12.42308521270752, 14.004678726196289, 15.586273193359375, 17.16786766052246, 18.749462127685547, 20.3310546875, 21.912649154663086, 23.494243621826172, 25.075836181640625, 26.65743064880371, 28.239025115966797, 29.820619583129883, 31.40221405029297, 32.98381042480469, 34.56540298461914, 36.14699935913086, 37.72859191894531, 39.31018829345703, 40.891780853271484, 42.47337341308594, 44.054969787597656, 45.63656234741211, 47.21815490722656, 48.79975128173828, 50.381343841552734, 51.96294021606445, 53.544532775878906, 55.126129150390625, 56.70772171020508, 58.28931427001953]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 8.0, 7.0, 18.0, 32.0, 44.0, 59.0, 104.0, 162.0, 252.0, 515.0, 877.0, 2242.0, 7167.0, 36529.0, 319556.0, 2545792.0, 1150631.0, 103546.0, 17450.0, 5139.0, 2032.0, 926.0, 482.0, 272.0, 155.0, 75.0, 56.0, 47.0, 26.0, 20.0, 13.0, 10.0, 9.0, 6.0, 5.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.5625, -5.39776611328125, -5.2330322265625, -5.06829833984375, -4.903564453125, -4.73883056640625, -4.5740966796875, -4.40936279296875, -4.24462890625, -4.07989501953125, -3.9151611328125, -3.75042724609375, -3.585693359375, -3.42095947265625, -3.2562255859375, -3.09149169921875, -2.9267578125, -2.76202392578125, -2.5972900390625, -2.43255615234375, -2.267822265625, -2.10308837890625, -1.9383544921875, -1.77362060546875, -1.60888671875, -1.44415283203125, -1.2794189453125, -1.11468505859375, -0.949951171875, -0.78521728515625, -0.6204833984375, -0.45574951171875, -0.291015625, -0.12628173828125, 0.0384521484375, 0.20318603515625, 0.367919921875, 0.53265380859375, 0.6973876953125, 0.86212158203125, 1.02685546875, 1.19158935546875, 1.3563232421875, 1.52105712890625, 1.685791015625, 1.85052490234375, 2.0152587890625, 2.17999267578125, 2.3447265625, 2.50946044921875, 2.6741943359375, 2.83892822265625, 3.003662109375, 3.16839599609375, 3.3331298828125, 3.49786376953125, 3.66259765625, 3.82733154296875, 3.9920654296875, 4.15679931640625, 4.321533203125, 4.48626708984375, 4.6510009765625, 4.81573486328125, 4.98046875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 10.0, 3.0, 9.0, 7.0, 8.0, 16.0, 18.0, 24.0, 44.0, 40.0, 55.0, 57.0, 59.0, 67.0, 66.0, 51.0, 58.0, 74.0, 59.0, 62.0, 40.0, 31.0, 33.0, 25.0, 23.0, 19.0, 12.0, 6.0, 10.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0], "bins": [-6.13671875, -5.98052978515625, -5.8243408203125, -5.66815185546875, -5.511962890625, -5.35577392578125, -5.1995849609375, -5.04339599609375, -4.88720703125, -4.73101806640625, -4.5748291015625, -4.41864013671875, -4.262451171875, -4.10626220703125, -3.9500732421875, -3.79388427734375, -3.6376953125, -3.48150634765625, -3.3253173828125, -3.16912841796875, -3.012939453125, -2.85675048828125, -2.7005615234375, -2.54437255859375, -2.38818359375, -2.23199462890625, -2.0758056640625, -1.91961669921875, -1.763427734375, -1.60723876953125, -1.4510498046875, -1.29486083984375, -1.138671875, -0.98248291015625, -0.8262939453125, -0.67010498046875, -0.513916015625, -0.35772705078125, -0.2015380859375, -0.04534912109375, 0.11083984375, 0.26702880859375, 0.4232177734375, 0.57940673828125, 0.735595703125, 0.89178466796875, 1.0479736328125, 1.20416259765625, 1.3603515625, 1.51654052734375, 1.6727294921875, 1.82891845703125, 1.985107421875, 2.14129638671875, 2.2974853515625, 2.45367431640625, 2.60986328125, 2.76605224609375, 2.9222412109375, 3.07843017578125, 3.234619140625, 3.39080810546875, 3.5469970703125, 3.70318603515625, 3.859375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 13.0, 24.0, 27.0, 50.0, 95.0, 121.0, 268.0, 630.0, 2183.0, 19814.0, 3615868.0, 544635.0, 8311.0, 1290.0, 474.0, 219.0, 111.0, 72.0, 29.0, 21.0, 10.0, 7.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.84375, -12.365234375, -11.88671875, -11.408203125, -10.9296875, -10.451171875, -9.97265625, -9.494140625, -9.015625, -8.537109375, -8.05859375, -7.580078125, -7.1015625, -6.623046875, -6.14453125, -5.666015625, -5.1875, -4.708984375, -4.23046875, -3.751953125, -3.2734375, -2.794921875, -2.31640625, -1.837890625, -1.359375, -0.880859375, -0.40234375, 0.076171875, 0.5546875, 1.033203125, 1.51171875, 1.990234375, 2.46875, 2.947265625, 3.42578125, 3.904296875, 4.3828125, 4.861328125, 5.33984375, 5.818359375, 6.296875, 6.775390625, 7.25390625, 7.732421875, 8.2109375, 8.689453125, 9.16796875, 9.646484375, 10.125, 10.603515625, 11.08203125, 11.560546875, 12.0390625, 12.517578125, 12.99609375, 13.474609375, 13.953125, 14.431640625, 14.91015625, 15.388671875, 15.8671875, 16.345703125, 16.82421875, 17.302734375, 17.78125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 9.0, 9.0, 18.0, 41.0, 44.0, 106.0, 254.0, 406.0, 722.0, 927.0, 692.0, 380.0, 198.0, 104.0, 65.0, 30.0, 17.0, 14.0, 14.0, 6.0, 9.0, 8.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.7421875, -11.45208740234375, -11.1619873046875, -10.87188720703125, -10.581787109375, -10.29168701171875, -10.0015869140625, -9.71148681640625, -9.42138671875, -9.13128662109375, -8.8411865234375, -8.55108642578125, -8.260986328125, -7.97088623046875, -7.6807861328125, -7.39068603515625, -7.1005859375, -6.81048583984375, -6.5203857421875, -6.23028564453125, -5.940185546875, -5.65008544921875, -5.3599853515625, -5.06988525390625, -4.77978515625, -4.48968505859375, -4.1995849609375, -3.90948486328125, -3.619384765625, -3.32928466796875, -3.0391845703125, -2.74908447265625, -2.458984375, -2.16888427734375, -1.8787841796875, -1.58868408203125, -1.298583984375, -1.00848388671875, -0.7183837890625, -0.42828369140625, -0.13818359375, 0.15191650390625, 0.4420166015625, 0.73211669921875, 1.022216796875, 1.31231689453125, 1.6024169921875, 1.89251708984375, 2.1826171875, 2.47271728515625, 2.7628173828125, 3.05291748046875, 3.343017578125, 3.63311767578125, 3.9232177734375, 4.21331787109375, 4.50341796875, 4.79351806640625, 5.0836181640625, 5.37371826171875, 5.663818359375, 5.95391845703125, 6.2440185546875, 6.53411865234375, 6.82421875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 12.0, 12.0, 21.0, 39.0, 62.0, 83.0, 125.0, 156.0, 168.0, 95.0, 68.0, 56.0, 43.0, 22.0, 13.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-44.372467041015625, -42.71300506591797, -41.05354309082031, -39.394081115722656, -37.734622955322266, -36.07516098022461, -34.41569900512695, -32.7562370300293, -31.096776962280273, -29.437314987182617, -27.777854919433594, -26.118392944335938, -24.45893096923828, -22.799470901489258, -21.1400089263916, -19.480548858642578, -17.821086883544922, -16.161624908447266, -14.502164840698242, -12.842702865600586, -11.183241844177246, -9.523780822753906, -7.86431884765625, -6.20485782623291, -4.54539680480957, -2.8859355449676514, -1.2264742851257324, 0.4329872131347656, 2.0924482345581055, 3.7519092559814453, 5.411371231079102, 7.070832252502441, 8.730289459228516, 10.389750480651855, 12.049211502075195, 13.708673477172852, 15.368134498596191, 17.02759552001953, 18.687057495117188, 20.346519470214844, 22.005979537963867, 23.665441513061523, 25.324901580810547, 26.984363555908203, 28.64382553100586, 30.303285598754883, 31.96274757385254, 33.62220764160156, 35.28166961669922, 36.941131591796875, 38.60059356689453, 40.26005554199219, 41.91951370239258, 43.578975677490234, 45.23843765258789, 46.89789962768555, 48.55735778808594, 50.216819763183594, 51.87628173828125, 53.535743713378906, 55.1952018737793, 56.85466384887695, 58.51412582397461, 60.173587799072266, 61.83304977416992]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 3.0, 0.0, 6.0, 3.0, 4.0, 6.0, 5.0, 6.0, 12.0, 8.0, 7.0, 12.0, 13.0, 19.0, 15.0, 14.0, 18.0, 29.0, 30.0, 29.0, 29.0, 24.0, 43.0, 45.0, 33.0, 49.0, 46.0, 48.0, 41.0, 39.0, 34.0, 36.0, 27.0, 28.0, 25.0, 24.0, 23.0, 26.0, 17.0, 25.0, 12.0, 21.0, 13.0, 9.0, 13.0, 5.0, 9.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-22.030427932739258, -21.3128604888916, -20.595293045043945, -19.87772560119629, -19.160158157348633, -18.442590713500977, -17.725025177001953, -17.007457733154297, -16.28989028930664, -15.572322845458984, -14.854755401611328, -14.137187957763672, -13.419620513916016, -12.70205307006836, -11.98448657989502, -11.266919136047363, -10.54935073852539, -9.831783294677734, -9.114215850830078, -8.396648406982422, -7.679081439971924, -6.961513996124268, -6.2439470291137695, -5.526379585266113, -4.808812141418457, -4.091244697570801, -3.3736774921417236, -2.6561102867126465, -1.9385428428649902, -1.220975399017334, -0.5034084320068359, 0.2141590118408203, 0.9317245483398438, 1.6492918729782104, 2.366859197616577, 3.0844264030456543, 3.8019938468933105, 4.519561290740967, 5.237128257751465, 5.954695701599121, 6.672263145446777, 7.389830589294434, 8.10739803314209, 8.82496452331543, 9.542531967163086, 10.260099411010742, 10.977666854858398, 11.695234298706055, 12.412801742553711, 13.130369186401367, 13.847936630249023, 14.56550407409668, 15.283071517944336, 16.000638961791992, 16.718204498291016, 17.435771942138672, 18.153339385986328, 18.870906829833984, 19.58847427368164, 20.306041717529297, 21.023609161376953, 21.74117660522461, 22.458744049072266, 23.176311492919922, 23.893878936767578]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 15.0, 35.0, 65.0, 148.0, 274.0, 708.0, 1980.0, 7307.0, 38744.0, 337800.0, 577728.0, 67984.0, 11477.0, 2713.0, 895.0, 355.0, 153.0, 67.0, 39.0, 19.0, 6.0, 7.0, 4.0, 6.0, 8.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.7265625, -12.3839111328125, -12.041259765625, -11.6986083984375, -11.35595703125, -11.0133056640625, -10.670654296875, -10.3280029296875, -9.9853515625, -9.6427001953125, -9.300048828125, -8.9573974609375, -8.61474609375, -8.2720947265625, -7.929443359375, -7.5867919921875, -7.244140625, -6.9014892578125, -6.558837890625, -6.2161865234375, -5.87353515625, -5.5308837890625, -5.188232421875, -4.8455810546875, -4.5029296875, -4.1602783203125, -3.817626953125, -3.4749755859375, -3.13232421875, -2.7896728515625, -2.447021484375, -2.1043701171875, -1.76171875, -1.4190673828125, -1.076416015625, -0.7337646484375, -0.39111328125, -0.0484619140625, 0.294189453125, 0.6368408203125, 0.9794921875, 1.3221435546875, 1.664794921875, 2.0074462890625, 2.35009765625, 2.6927490234375, 3.035400390625, 3.3780517578125, 3.720703125, 4.0633544921875, 4.406005859375, 4.7486572265625, 5.09130859375, 5.4339599609375, 5.776611328125, 6.1192626953125, 6.4619140625, 6.8045654296875, 7.147216796875, 7.4898681640625, 7.83251953125, 8.1751708984375, 8.517822265625, 8.8604736328125, 9.203125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 6.0, 3.0, 7.0, 9.0, 11.0, 13.0, 20.0, 20.0, 38.0, 30.0, 43.0, 43.0, 45.0, 79.0, 60.0, 59.0, 80.0, 58.0, 49.0, 57.0, 53.0, 49.0, 34.0, 22.0, 24.0, 16.0, 19.0, 12.0, 8.0, 9.0, 8.0, 7.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0], "bins": [-6.203125, -6.04840087890625, -5.8936767578125, -5.73895263671875, -5.584228515625, -5.42950439453125, -5.2747802734375, -5.12005615234375, -4.96533203125, -4.81060791015625, -4.6558837890625, -4.50115966796875, -4.346435546875, -4.19171142578125, -4.0369873046875, -3.88226318359375, -3.7275390625, -3.57281494140625, -3.4180908203125, -3.26336669921875, -3.108642578125, -2.95391845703125, -2.7991943359375, -2.64447021484375, -2.48974609375, -2.33502197265625, -2.1802978515625, -2.02557373046875, -1.870849609375, -1.71612548828125, -1.5614013671875, -1.40667724609375, -1.251953125, -1.09722900390625, -0.9425048828125, -0.78778076171875, -0.633056640625, -0.47833251953125, -0.3236083984375, -0.16888427734375, -0.01416015625, 0.14056396484375, 0.2952880859375, 0.45001220703125, 0.604736328125, 0.75946044921875, 0.9141845703125, 1.06890869140625, 1.2236328125, 1.37835693359375, 1.5330810546875, 1.68780517578125, 1.842529296875, 1.99725341796875, 2.1519775390625, 2.30670166015625, 2.46142578125, 2.61614990234375, 2.7708740234375, 2.92559814453125, 3.080322265625, 3.23504638671875, 3.3897705078125, 3.54449462890625, 3.69921875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 1.0, 5.0, 8.0, 4.0, 11.0, 21.0, 29.0, 26.0, 53.0, 65.0, 88.0, 117.0, 194.0, 296.0, 460.0, 809.0, 1474.0, 3885.0, 15590.0, 173056.0, 799862.0, 40824.0, 6696.0, 2267.0, 1032.0, 549.0, 359.0, 220.0, 165.0, 98.0, 72.0, 51.0, 45.0, 25.0, 24.0, 18.0, 10.0, 8.0, 11.0, 2.0, 6.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-12.890625, -12.4779052734375, -12.065185546875, -11.6524658203125, -11.23974609375, -10.8270263671875, -10.414306640625, -10.0015869140625, -9.5888671875, -9.1761474609375, -8.763427734375, -8.3507080078125, -7.93798828125, -7.5252685546875, -7.112548828125, -6.6998291015625, -6.287109375, -5.8743896484375, -5.461669921875, -5.0489501953125, -4.63623046875, -4.2235107421875, -3.810791015625, -3.3980712890625, -2.9853515625, -2.5726318359375, -2.159912109375, -1.7471923828125, -1.33447265625, -0.9217529296875, -0.509033203125, -0.0963134765625, 0.31640625, 0.7291259765625, 1.141845703125, 1.5545654296875, 1.96728515625, 2.3800048828125, 2.792724609375, 3.2054443359375, 3.6181640625, 4.0308837890625, 4.443603515625, 4.8563232421875, 5.26904296875, 5.6817626953125, 6.094482421875, 6.5072021484375, 6.919921875, 7.3326416015625, 7.745361328125, 8.1580810546875, 8.57080078125, 8.9835205078125, 9.396240234375, 9.8089599609375, 10.2216796875, 10.6343994140625, 11.047119140625, 11.4598388671875, 11.87255859375, 12.2852783203125, 12.697998046875, 13.1107177734375, 13.5234375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 4.0, 6.0, 7.0, 5.0, 11.0, 10.0, 14.0, 12.0, 21.0, 34.0, 29.0, 47.0, 49.0, 53.0, 69.0, 65.0, 55.0, 50.0, 51.0, 62.0, 53.0, 57.0, 45.0, 40.0, 21.0, 28.0, 21.0, 20.0, 15.0, 9.0, 9.0, 4.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.7890625, -13.2635498046875, -12.738037109375, -12.2125244140625, -11.68701171875, -11.1614990234375, -10.635986328125, -10.1104736328125, -9.5849609375, -9.0594482421875, -8.533935546875, -8.0084228515625, -7.48291015625, -6.9573974609375, -6.431884765625, -5.9063720703125, -5.380859375, -4.8553466796875, -4.329833984375, -3.8043212890625, -3.27880859375, -2.7532958984375, -2.227783203125, -1.7022705078125, -1.1767578125, -0.6512451171875, -0.125732421875, 0.3997802734375, 0.92529296875, 1.4508056640625, 1.976318359375, 2.5018310546875, 3.02734375, 3.5528564453125, 4.078369140625, 4.6038818359375, 5.12939453125, 5.6549072265625, 6.180419921875, 6.7059326171875, 7.2314453125, 7.7569580078125, 8.282470703125, 8.8079833984375, 9.33349609375, 9.8590087890625, 10.384521484375, 10.9100341796875, 11.435546875, 11.9610595703125, 12.486572265625, 13.0120849609375, 13.53759765625, 14.0631103515625, 14.588623046875, 15.1141357421875, 15.6396484375, 16.1651611328125, 16.690673828125, 17.2161865234375, 17.74169921875, 18.2672119140625, 18.792724609375, 19.3182373046875, 19.84375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 6.0, 7.0, 10.0, 5.0, 6.0, 15.0, 12.0, 27.0, 39.0, 45.0, 82.0, 187.0, 359.0, 1123.0, 4976.0, 54284.0, 957767.0, 24615.0, 3401.0, 883.0, 320.0, 134.0, 72.0, 56.0, 37.0, 17.0, 16.0, 16.0, 9.0, 9.0, 8.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.7890625, -5.60455322265625, -5.4200439453125, -5.23553466796875, -5.051025390625, -4.86651611328125, -4.6820068359375, -4.49749755859375, -4.31298828125, -4.12847900390625, -3.9439697265625, -3.75946044921875, -3.574951171875, -3.39044189453125, -3.2059326171875, -3.02142333984375, -2.8369140625, -2.65240478515625, -2.4678955078125, -2.28338623046875, -2.098876953125, -1.91436767578125, -1.7298583984375, -1.54534912109375, -1.36083984375, -1.17633056640625, -0.9918212890625, -0.80731201171875, -0.622802734375, -0.43829345703125, -0.2537841796875, -0.06927490234375, 0.115234375, 0.29974365234375, 0.4842529296875, 0.66876220703125, 0.853271484375, 1.03778076171875, 1.2222900390625, 1.40679931640625, 1.59130859375, 1.77581787109375, 1.9603271484375, 2.14483642578125, 2.329345703125, 2.51385498046875, 2.6983642578125, 2.88287353515625, 3.0673828125, 3.25189208984375, 3.4364013671875, 3.62091064453125, 3.805419921875, 3.98992919921875, 4.1744384765625, 4.35894775390625, 4.54345703125, 4.72796630859375, 4.9124755859375, 5.09698486328125, 5.281494140625, 5.46600341796875, 5.6505126953125, 5.83502197265625, 6.01953125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 6.0, 0.0, 3.0, 2.0, 12.0, 13.0, 12.0, 18.0, 29.0, 67.0, 92.0, 182.0, 221.0, 146.0, 71.0, 40.0, 16.0, 13.0, 9.0, 10.0, 8.0, 6.0, 2.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005631446838378906, -0.0005399361252784729, -0.0005167275667190552, -0.0004935190081596375, -0.0004703104496002197, -0.000447101891040802, -0.0004238933324813843, -0.00040068477392196655, -0.00037747621536254883, -0.0003542676568031311, -0.0003310590982437134, -0.00030785053968429565, -0.00028464198112487793, -0.0002614334225654602, -0.00023822486400604248, -0.00021501630544662476, -0.00019180774688720703, -0.0001685991883277893, -0.00014539062976837158, -0.00012218207120895386, -9.897351264953613e-05, -7.576495409011841e-05, -5.2556395530700684e-05, -2.934783697128296e-05, -6.139278411865234e-06, 1.706928014755249e-05, 4.0277838706970215e-05, 6.348639726638794e-05, 8.669495582580566e-05, 0.00010990351438522339, 0.0001331120729446411, 0.00015632063150405884, 0.00017952919006347656, 0.0002027377486228943, 0.000225946307182312, 0.00024915486574172974, 0.00027236342430114746, 0.0002955719828605652, 0.0003187805414199829, 0.00034198909997940063, 0.00036519765853881836, 0.0003884062170982361, 0.0004116147756576538, 0.00043482333421707153, 0.00045803189277648926, 0.000481240451335907, 0.0005044490098953247, 0.0005276575684547424, 0.0005508661270141602, 0.0005740746855735779, 0.0005972832441329956, 0.0006204918026924133, 0.0006437003612518311, 0.0006669089198112488, 0.0006901174783706665, 0.0007133260369300842, 0.000736534595489502, 0.0007597431540489197, 0.0007829517126083374, 0.0008061602711677551, 0.0008293688297271729, 0.0008525773882865906, 0.0008757859468460083, 0.000898994505405426, 0.0009222030639648438]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 1.0, 7.0, 8.0, 11.0, 21.0, 22.0, 41.0, 41.0, 48.0, 85.0, 131.0, 210.0, 350.0, 685.0, 1444.0, 3229.0, 8987.0, 33808.0, 288535.0, 652581.0, 40892.0, 10425.0, 3688.0, 1445.0, 743.0, 421.0, 252.0, 152.0, 90.0, 58.0, 48.0, 28.0, 24.0, 12.0, 11.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.861328125, -2.7747802734375, -2.688232421875, -2.6016845703125, -2.51513671875, -2.4285888671875, -2.342041015625, -2.2554931640625, -2.1689453125, -2.0823974609375, -1.995849609375, -1.9093017578125, -1.82275390625, -1.7362060546875, -1.649658203125, -1.5631103515625, -1.4765625, -1.3900146484375, -1.303466796875, -1.2169189453125, -1.13037109375, -1.0438232421875, -0.957275390625, -0.8707275390625, -0.7841796875, -0.6976318359375, -0.611083984375, -0.5245361328125, -0.43798828125, -0.3514404296875, -0.264892578125, -0.1783447265625, -0.091796875, -0.0052490234375, 0.081298828125, 0.1678466796875, 0.25439453125, 0.3409423828125, 0.427490234375, 0.5140380859375, 0.6005859375, 0.6871337890625, 0.773681640625, 0.8602294921875, 0.94677734375, 1.0333251953125, 1.119873046875, 1.2064208984375, 1.29296875, 1.3795166015625, 1.466064453125, 1.5526123046875, 1.63916015625, 1.7257080078125, 1.812255859375, 1.8988037109375, 1.9853515625, 2.0718994140625, 2.158447265625, 2.2449951171875, 2.33154296875, 2.4180908203125, 2.504638671875, 2.5911865234375, 2.677734375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 4.0, 9.0, 5.0, 6.0, 11.0, 9.0, 17.0, 17.0, 24.0, 30.0, 40.0, 49.0, 74.0, 85.0, 114.0, 90.0, 88.0, 69.0, 61.0, 46.0, 31.0, 26.0, 16.0, 9.0, 16.0, 11.0, 7.0, 6.0, 5.0, 4.0, 4.0, 4.0, 4.0, 4.0, 4.0, 0.0, 4.0, 1.0], "bins": [-2.859375, -2.7896881103515625, -2.720001220703125, -2.6503143310546875, -2.58062744140625, -2.5109405517578125, -2.441253662109375, -2.3715667724609375, -2.3018798828125, -2.2321929931640625, -2.162506103515625, -2.0928192138671875, -2.02313232421875, -1.9534454345703125, -1.883758544921875, -1.8140716552734375, -1.744384765625, -1.6746978759765625, -1.605010986328125, -1.5353240966796875, -1.46563720703125, -1.3959503173828125, -1.326263427734375, -1.2565765380859375, -1.1868896484375, -1.1172027587890625, -1.047515869140625, -0.9778289794921875, -0.90814208984375, -0.8384552001953125, -0.768768310546875, -0.6990814208984375, -0.62939453125, -0.5597076416015625, -0.490020751953125, -0.4203338623046875, -0.35064697265625, -0.2809600830078125, -0.211273193359375, -0.1415863037109375, -0.0718994140625, -0.0022125244140625, 0.067474365234375, 0.1371612548828125, 0.20684814453125, 0.2765350341796875, 0.346221923828125, 0.4159088134765625, 0.485595703125, 0.5552825927734375, 0.624969482421875, 0.6946563720703125, 0.76434326171875, 0.8340301513671875, 0.903717041015625, 0.9734039306640625, 1.0430908203125, 1.1127777099609375, 1.182464599609375, 1.2521514892578125, 1.32183837890625, 1.3915252685546875, 1.461212158203125, 1.5308990478515625, 1.6005859375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 15.0, 91.0, 745.0, 136.0, 13.0, 7.0, 0.0, 2.0], "bins": [-590.990478515625, -580.9139404296875, -570.8373413085938, -560.7608032226562, -550.6842651367188, -540.6077270507812, -530.5311279296875, -520.45458984375, -510.3780517578125, -500.3014831542969, -490.2249450683594, -480.14837646484375, -470.07183837890625, -459.9952697753906, -449.9187316894531, -439.8421630859375, -429.7655944824219, -419.68902587890625, -409.61248779296875, -399.5359191894531, -389.4593811035156, -379.3828125, -369.3062744140625, -359.2297058105469, -349.15313720703125, -339.0765686035156, -329.0000305175781, -318.9234619140625, -308.846923828125, -298.7703552246094, -288.6938171386719, -278.61724853515625, -268.54071044921875, -258.4641418457031, -248.38760375976562, -238.31105041503906, -228.2344970703125, -218.15792846679688, -208.0813751220703, -198.00482177734375, -187.9282684326172, -177.85171508789062, -167.77516174316406, -157.6986083984375, -147.62203979492188, -137.54550170898438, -127.46893310546875, -117.39237976074219, -107.31582641601562, -97.23927307128906, -87.1627197265625, -77.0861587524414, -67.00960540771484, -56.93305206298828, -46.85649490356445, -36.779937744140625, -26.703388214111328, -16.626832962036133, -6.5502777099609375, 3.526277542114258, 13.602832794189453, 23.679386138916016, 33.755943298339844, 43.83250045776367, 53.909053802490234]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 9.0, 14.0, 13.0, 18.0, 24.0, 32.0, 40.0, 43.0, 66.0, 85.0, 245.0, 139.0, 63.0, 50.0, 50.0, 22.0, 25.0, 25.0, 10.0, 9.0, 7.0, 5.0, 4.0, 2.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.17686462402344, -129.00241088867188, -125.82795715332031, -122.65351104736328, -119.47905731201172, -116.30460357666016, -113.1301498413086, -109.95570373535156, -106.78125, -103.60679626464844, -100.43234252929688, -97.25789642333984, -94.08344268798828, -90.90898895263672, -87.73453521728516, -84.56008911132812, -81.38563537597656, -78.211181640625, -75.03672790527344, -71.8622817993164, -68.68782806396484, -65.51337432861328, -62.33892059326172, -59.16447067260742, -55.990013122558594, -52.81555938720703, -49.641109466552734, -46.46665573120117, -43.292205810546875, -40.11775207519531, -36.94329833984375, -33.76884841918945, -30.594398498535156, -27.419946670532227, -24.245494842529297, -21.071041107177734, -17.896591186523438, -14.722138404846191, -11.547685623168945, -8.373233795166016, -5.198781967163086, -2.024329900741577, 1.1501221656799316, 4.3245744705200195, 7.499026298522949, 10.673478126525879, 13.847930908203125, 17.022382736206055, 20.196834564208984, 23.371286392211914, 26.545738220214844, 29.720191955566406, 32.8946418762207, 36.069095611572266, 39.24354553222656, 42.417999267578125, 45.59245300292969, 48.76690673828125, 51.94135665893555, 55.11581039428711, 58.290260314941406, 61.46471405029297, 64.63916778564453, 67.81361389160156, 70.98806762695312]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 8.0, 6.0, 9.0, 21.0, 50.0, 76.0, 210.0, 608.0, 2603.0, 26452.0, 2780137.0, 1362306.0, 16662.0, 3440.0, 1240.0, 315.0, 83.0, 34.0, 13.0, 9.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.375, -23.8553466796875, -23.335693359375, -22.8160400390625, -22.29638671875, -21.7767333984375, -21.257080078125, -20.7374267578125, -20.2177734375, -19.6981201171875, -19.178466796875, -18.6588134765625, -18.13916015625, -17.6195068359375, -17.099853515625, -16.5802001953125, -16.060546875, -15.5408935546875, -15.021240234375, -14.5015869140625, -13.98193359375, -13.4622802734375, -12.942626953125, -12.4229736328125, -11.9033203125, -11.3836669921875, -10.864013671875, -10.3443603515625, -9.82470703125, -9.3050537109375, -8.785400390625, -8.2657470703125, -7.74609375, -7.2264404296875, -6.706787109375, -6.1871337890625, -5.66748046875, -5.1478271484375, -4.628173828125, -4.1085205078125, -3.5888671875, -3.0692138671875, -2.549560546875, -2.0299072265625, -1.51025390625, -0.9906005859375, -0.470947265625, 0.0487060546875, 0.568359375, 1.0880126953125, 1.607666015625, 2.1273193359375, 2.64697265625, 3.1666259765625, 3.686279296875, 4.2059326171875, 4.7255859375, 5.2452392578125, 5.764892578125, 6.2845458984375, 6.80419921875, 7.3238525390625, 7.843505859375, 8.3631591796875, 8.8828125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 2.0, 5.0, 18.0, 20.0, 45.0, 60.0, 92.0, 91.0, 124.0, 105.0, 98.0, 100.0, 68.0, 50.0, 51.0, 32.0, 19.0, 6.0, 7.0, 4.0, 4.0, 2.0, 3.0, 2.0], "bins": [-13.1171875, -12.852142333984375, -12.58709716796875, -12.322052001953125, -12.0570068359375, -11.791961669921875, -11.52691650390625, -11.261871337890625, -10.996826171875, -10.731781005859375, -10.46673583984375, -10.201690673828125, -9.9366455078125, -9.671600341796875, -9.40655517578125, -9.141510009765625, -8.87646484375, -8.611419677734375, -8.34637451171875, -8.081329345703125, -7.8162841796875, -7.551239013671875, -7.28619384765625, -7.021148681640625, -6.756103515625, -6.491058349609375, -6.22601318359375, -5.960968017578125, -5.6959228515625, -5.430877685546875, -5.16583251953125, -4.900787353515625, -4.6357421875, -4.370697021484375, -4.10565185546875, -3.840606689453125, -3.5755615234375, -3.310516357421875, -3.04547119140625, -2.780426025390625, -2.515380859375, -2.250335693359375, -1.98529052734375, -1.720245361328125, -1.4552001953125, -1.190155029296875, -0.92510986328125, -0.660064697265625, -0.39501953125, -0.129974365234375, 0.13507080078125, 0.400115966796875, 0.6651611328125, 0.930206298828125, 1.19525146484375, 1.460296630859375, 1.725341796875, 1.990386962890625, 2.25543212890625, 2.520477294921875, 2.7855224609375, 3.050567626953125, 3.31561279296875, 3.580657958984375, 3.845703125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 10.0, 6.0, 9.0, 25.0, 28.0, 35.0, 73.0, 86.0, 192.0, 356.0, 691.0, 1643.0, 9326.0, 3788890.0, 384719.0, 5508.0, 1375.0, 574.0, 293.0, 172.0, 92.0, 73.0, 28.0, 33.0, 9.0, 14.0, 6.0, 8.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.0, -31.996337890625, -30.99267578125, -29.989013671875, -28.9853515625, -27.981689453125, -26.97802734375, -25.974365234375, -24.970703125, -23.967041015625, -22.96337890625, -21.959716796875, -20.9560546875, -19.952392578125, -18.94873046875, -17.945068359375, -16.94140625, -15.937744140625, -14.93408203125, -13.930419921875, -12.9267578125, -11.923095703125, -10.91943359375, -9.915771484375, -8.912109375, -7.908447265625, -6.90478515625, -5.901123046875, -4.8974609375, -3.893798828125, -2.89013671875, -1.886474609375, -0.8828125, 0.120849609375, 1.12451171875, 2.128173828125, 3.1318359375, 4.135498046875, 5.13916015625, 6.142822265625, 7.146484375, 8.150146484375, 9.15380859375, 10.157470703125, 11.1611328125, 12.164794921875, 13.16845703125, 14.172119140625, 15.17578125, 16.179443359375, 17.18310546875, 18.186767578125, 19.1904296875, 20.194091796875, 21.19775390625, 22.201416015625, 23.205078125, 24.208740234375, 25.21240234375, 26.216064453125, 27.2197265625, 28.223388671875, 29.22705078125, 30.230712890625, 31.234375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 11.0, 5.0, 7.0, 14.0, 24.0, 37.0, 66.0, 133.0, 258.0, 628.0, 1078.0, 908.0, 417.0, 204.0, 111.0, 56.0, 41.0, 26.0, 19.0, 10.0, 9.0, 4.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0, -12.428466796875, -11.85693359375, -11.285400390625, -10.7138671875, -10.142333984375, -9.57080078125, -8.999267578125, -8.427734375, -7.856201171875, -7.28466796875, -6.713134765625, -6.1416015625, -5.570068359375, -4.99853515625, -4.427001953125, -3.85546875, -3.283935546875, -2.71240234375, -2.140869140625, -1.5693359375, -0.997802734375, -0.42626953125, 0.145263671875, 0.716796875, 1.288330078125, 1.85986328125, 2.431396484375, 3.0029296875, 3.574462890625, 4.14599609375, 4.717529296875, 5.2890625, 5.860595703125, 6.43212890625, 7.003662109375, 7.5751953125, 8.146728515625, 8.71826171875, 9.289794921875, 9.861328125, 10.432861328125, 11.00439453125, 11.575927734375, 12.1474609375, 12.718994140625, 13.29052734375, 13.862060546875, 14.43359375, 15.005126953125, 15.57666015625, 16.148193359375, 16.7197265625, 17.291259765625, 17.86279296875, 18.434326171875, 19.005859375, 19.577392578125, 20.14892578125, 20.720458984375, 21.2919921875, 21.863525390625, 22.43505859375, 23.006591796875, 23.578125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 7.0, 5.0, 9.0, 14.0, 30.0, 48.0, 109.0, 245.0, 235.0, 121.0, 84.0, 43.0, 18.0, 9.0, 8.0, 4.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-210.55014038085938, -205.1578826904297, -199.765625, -194.37335205078125, -188.98109436035156, -183.58883666992188, -178.1965789794922, -172.8043212890625, -167.41204833984375, -162.01979064941406, -156.62753295898438, -151.23526000976562, -145.84300231933594, -140.45074462890625, -135.05848693847656, -129.66622924804688, -124.27397155761719, -118.8817138671875, -113.48944854736328, -108.0971908569336, -102.70492553710938, -97.31266784667969, -91.92041015625, -86.52815246582031, -81.1358871459961, -75.7436294555664, -70.35136413574219, -64.9591064453125, -59.56684494018555, -54.174583435058594, -48.782325744628906, -43.39006423950195, -37.99778747558594, -32.605525970458984, -27.213266372680664, -21.821006774902344, -16.42874526977539, -11.036483764648438, -5.64422607421875, -0.2519645690917969, 5.140296936035156, 10.532557487487793, 15.92481803894043, 21.31707763671875, 26.709339141845703, 32.101600646972656, 37.493858337402344, 42.8861198425293, 48.27838134765625, 53.6706428527832, 59.062904357910156, 64.45516204833984, 69.84742736816406, 75.23968505859375, 80.63194274902344, 86.02420043945312, 91.41646575927734, 96.80872344970703, 102.20098876953125, 107.59324645996094, 112.98550415039062, 118.37776947021484, 123.77002716064453, 129.16229248046875, 134.55455017089844]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 4.0, 0.0, 3.0, 0.0, 5.0, 3.0, 6.0, 12.0, 16.0, 18.0, 27.0, 32.0, 37.0, 40.0, 52.0, 67.0, 60.0, 81.0, 99.0, 82.0, 61.0, 61.0, 54.0, 47.0, 36.0, 33.0, 18.0, 15.0, 15.0, 6.0, 4.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.45579528808594, -87.58548736572266, -84.7151870727539, -81.84487915039062, -78.97457122802734, -76.10426330566406, -73.23396301269531, -70.36365509033203, -67.49334716796875, -64.62303924560547, -61.75273513793945, -58.88243103027344, -56.012123107910156, -53.14181900024414, -50.271514892578125, -47.401206970214844, -44.53090286254883, -41.66059875488281, -38.79029083251953, -35.919986724853516, -33.049678802490234, -30.17937469482422, -27.30906867980957, -24.438762664794922, -21.568456649780273, -18.698150634765625, -15.827844619750977, -12.957539558410645, -10.087233543395996, -7.216927528381348, -4.346622467041016, -1.4763164520263672, 1.3939895629882812, 4.26429557800293, 7.13460111618042, 10.00490665435791, 12.875212669372559, 15.745518684387207, 18.61582374572754, 21.486129760742188, 24.356435775756836, 27.226741790771484, 30.097047805786133, 32.96735382080078, 35.8376579284668, 38.70796585083008, 41.578269958496094, 44.448577880859375, 47.31888198852539, 50.189186096191406, 53.05949401855469, 55.9297981262207, 58.800106048583984, 61.67041015625, 64.54071807861328, 67.41102600097656, 70.28132629394531, 73.1516342163086, 76.02193450927734, 78.89224243164062, 81.7625503540039, 84.63285827636719, 87.50315856933594, 90.37346649169922, 93.2437744140625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 13.0, 24.0, 18.0, 41.0, 100.0, 181.0, 433.0, 1420.0, 5915.0, 51776.0, 822397.0, 151200.0, 11477.0, 2349.0, 646.0, 263.0, 142.0, 59.0, 29.0, 21.0, 14.0, 12.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4375, -12.9847412109375, -12.531982421875, -12.0792236328125, -11.62646484375, -11.1737060546875, -10.720947265625, -10.2681884765625, -9.8154296875, -9.3626708984375, -8.909912109375, -8.4571533203125, -8.00439453125, -7.5516357421875, -7.098876953125, -6.6461181640625, -6.193359375, -5.7406005859375, -5.287841796875, -4.8350830078125, -4.38232421875, -3.9295654296875, -3.476806640625, -3.0240478515625, -2.5712890625, -2.1185302734375, -1.665771484375, -1.2130126953125, -0.76025390625, -0.3074951171875, 0.145263671875, 0.5980224609375, 1.05078125, 1.5035400390625, 1.956298828125, 2.4090576171875, 2.86181640625, 3.3145751953125, 3.767333984375, 4.2200927734375, 4.6728515625, 5.1256103515625, 5.578369140625, 6.0311279296875, 6.48388671875, 6.9366455078125, 7.389404296875, 7.8421630859375, 8.294921875, 8.7476806640625, 9.200439453125, 9.6531982421875, 10.10595703125, 10.5587158203125, 11.011474609375, 11.4642333984375, 11.9169921875, 12.3697509765625, 12.822509765625, 13.2752685546875, 13.72802734375, 14.1807861328125, 14.633544921875, 15.0863037109375, 15.5390625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 8.0, 24.0, 22.0, 39.0, 52.0, 69.0, 89.0, 103.0, 97.0, 89.0, 89.0, 84.0, 61.0, 57.0, 44.0, 32.0, 15.0, 10.0, 8.0, 3.0, 5.0, 2.0, 1.0, 2.0], "bins": [-13.6328125, -13.35430908203125, -13.0758056640625, -12.79730224609375, -12.518798828125, -12.24029541015625, -11.9617919921875, -11.68328857421875, -11.40478515625, -11.12628173828125, -10.8477783203125, -10.56927490234375, -10.290771484375, -10.01226806640625, -9.7337646484375, -9.45526123046875, -9.1767578125, -8.89825439453125, -8.6197509765625, -8.34124755859375, -8.062744140625, -7.78424072265625, -7.5057373046875, -7.22723388671875, -6.94873046875, -6.67022705078125, -6.3917236328125, -6.11322021484375, -5.834716796875, -5.55621337890625, -5.2777099609375, -4.99920654296875, -4.720703125, -4.44219970703125, -4.1636962890625, -3.88519287109375, -3.606689453125, -3.32818603515625, -3.0496826171875, -2.77117919921875, -2.49267578125, -2.21417236328125, -1.9356689453125, -1.65716552734375, -1.378662109375, -1.10015869140625, -0.8216552734375, -0.54315185546875, -0.2646484375, 0.01385498046875, 0.2923583984375, 0.57086181640625, 0.849365234375, 1.12786865234375, 1.4063720703125, 1.68487548828125, 1.96337890625, 2.24188232421875, 2.5203857421875, 2.79888916015625, 3.077392578125, 3.35589599609375, 3.6343994140625, 3.91290283203125, 4.19140625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 7.0, 11.0, 7.0, 15.0, 19.0, 27.0, 28.0, 49.0, 64.0, 76.0, 118.0, 182.0, 270.0, 552.0, 1169.0, 3485.0, 18481.0, 463567.0, 534557.0, 19509.0, 3705.0, 1169.0, 556.0, 288.0, 187.0, 127.0, 85.0, 61.0, 40.0, 43.0, 38.0, 14.0, 14.0, 11.0, 6.0, 7.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.2109375, -8.8934326171875, -8.575927734375, -8.2584228515625, -7.94091796875, -7.6234130859375, -7.305908203125, -6.9884033203125, -6.6708984375, -6.3533935546875, -6.035888671875, -5.7183837890625, -5.40087890625, -5.0833740234375, -4.765869140625, -4.4483642578125, -4.130859375, -3.8133544921875, -3.495849609375, -3.1783447265625, -2.86083984375, -2.5433349609375, -2.225830078125, -1.9083251953125, -1.5908203125, -1.2733154296875, -0.955810546875, -0.6383056640625, -0.32080078125, -0.0032958984375, 0.314208984375, 0.6317138671875, 0.94921875, 1.2667236328125, 1.584228515625, 1.9017333984375, 2.21923828125, 2.5367431640625, 2.854248046875, 3.1717529296875, 3.4892578125, 3.8067626953125, 4.124267578125, 4.4417724609375, 4.75927734375, 5.0767822265625, 5.394287109375, 5.7117919921875, 6.029296875, 6.3468017578125, 6.664306640625, 6.9818115234375, 7.29931640625, 7.6168212890625, 7.934326171875, 8.2518310546875, 8.5693359375, 8.8868408203125, 9.204345703125, 9.5218505859375, 9.83935546875, 10.1568603515625, 10.474365234375, 10.7918701171875, 11.109375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 8.0, 10.0, 9.0, 16.0, 14.0, 20.0, 28.0, 28.0, 33.0, 68.0, 65.0, 105.0, 100.0, 105.0, 64.0, 79.0, 51.0, 46.0, 26.0, 35.0, 24.0, 19.0, 15.0, 14.0, 6.0, 4.0, 6.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.59375, -23.746337890625, -22.89892578125, -22.051513671875, -21.2041015625, -20.356689453125, -19.50927734375, -18.661865234375, -17.814453125, -16.967041015625, -16.11962890625, -15.272216796875, -14.4248046875, -13.577392578125, -12.72998046875, -11.882568359375, -11.03515625, -10.187744140625, -9.34033203125, -8.492919921875, -7.6455078125, -6.798095703125, -5.95068359375, -5.103271484375, -4.255859375, -3.408447265625, -2.56103515625, -1.713623046875, -0.8662109375, -0.018798828125, 0.82861328125, 1.676025390625, 2.5234375, 3.370849609375, 4.21826171875, 5.065673828125, 5.9130859375, 6.760498046875, 7.60791015625, 8.455322265625, 9.302734375, 10.150146484375, 10.99755859375, 11.844970703125, 12.6923828125, 13.539794921875, 14.38720703125, 15.234619140625, 16.08203125, 16.929443359375, 17.77685546875, 18.624267578125, 19.4716796875, 20.319091796875, 21.16650390625, 22.013916015625, 22.861328125, 23.708740234375, 24.55615234375, 25.403564453125, 26.2509765625, 27.098388671875, 27.94580078125, 28.793212890625, 29.640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 3.0, 5.0, 6.0, 6.0, 15.0, 32.0, 34.0, 74.0, 109.0, 230.0, 565.0, 2175.0, 16923.0, 970712.0, 51926.0, 4187.0, 907.0, 286.0, 142.0, 75.0, 43.0, 31.0, 14.0, 9.0, 7.0, 4.0, 2.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.478515625, -2.397735595703125, -2.31695556640625, -2.236175537109375, -2.1553955078125, -2.074615478515625, -1.99383544921875, -1.913055419921875, -1.832275390625, -1.751495361328125, -1.67071533203125, -1.589935302734375, -1.5091552734375, -1.428375244140625, -1.34759521484375, -1.266815185546875, -1.18603515625, -1.105255126953125, -1.02447509765625, -0.943695068359375, -0.8629150390625, -0.782135009765625, -0.70135498046875, -0.620574951171875, -0.539794921875, -0.459014892578125, -0.37823486328125, -0.297454833984375, -0.2166748046875, -0.135894775390625, -0.05511474609375, 0.025665283203125, 0.1064453125, 0.187225341796875, 0.26800537109375, 0.348785400390625, 0.4295654296875, 0.510345458984375, 0.59112548828125, 0.671905517578125, 0.752685546875, 0.833465576171875, 0.91424560546875, 0.995025634765625, 1.0758056640625, 1.156585693359375, 1.23736572265625, 1.318145751953125, 1.39892578125, 1.479705810546875, 1.56048583984375, 1.641265869140625, 1.7220458984375, 1.802825927734375, 1.88360595703125, 1.964385986328125, 2.045166015625, 2.125946044921875, 2.20672607421875, 2.287506103515625, 2.3682861328125, 2.449066162109375, 2.52984619140625, 2.610626220703125, 2.69140625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 5.0, 2.0, 7.0, 5.0, 8.0, 10.0, 13.0, 23.0, 24.0, 47.0, 57.0, 113.0, 173.0, 169.0, 110.0, 68.0, 37.0, 32.0, 14.0, 18.0, 10.0, 12.0, 10.0, 7.0, 3.0, 1.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.0005292892456054688, -0.0005163699388504028, -0.0005034506320953369, -0.000490531325340271, -0.0004776120185852051, -0.00046469271183013916, -0.00045177340507507324, -0.0004388540983200073, -0.0004259347915649414, -0.0004130154848098755, -0.00040009617805480957, -0.00038717687129974365, -0.00037425756454467773, -0.0003613382577896118, -0.0003484189510345459, -0.00033549964427948, -0.00032258033752441406, -0.00030966103076934814, -0.0002967417240142822, -0.0002838224172592163, -0.0002709031105041504, -0.00025798380374908447, -0.00024506449699401855, -0.00023214519023895264, -0.00021922588348388672, -0.0002063065767288208, -0.00019338726997375488, -0.00018046796321868896, -0.00016754865646362305, -0.00015462934970855713, -0.0001417100429534912, -0.0001287907361984253, -0.00011587142944335938, -0.00010295212268829346, -9.003281593322754e-05, -7.711350917816162e-05, -6.41942024230957e-05, -5.1274895668029785e-05, -3.835558891296387e-05, -2.543628215789795e-05, -1.2516975402832031e-05, 4.023313522338867e-07, 1.3321638107299805e-05, 2.6240944862365723e-05, 3.916025161743164e-05, 5.207955837249756e-05, 6.499886512756348e-05, 7.79181718826294e-05, 9.083747863769531e-05, 0.00010375678539276123, 0.00011667609214782715, 0.00012959539890289307, 0.00014251470565795898, 0.0001554340124130249, 0.00016835331916809082, 0.00018127262592315674, 0.00019419193267822266, 0.00020711123943328857, 0.0002200305461883545, 0.0002329498529434204, 0.00024586915969848633, 0.00025878846645355225, 0.00027170777320861816, 0.0002846270799636841, 0.00029754638671875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 9.0, 6.0, 11.0, 22.0, 30.0, 33.0, 43.0, 87.0, 110.0, 187.0, 263.0, 435.0, 676.0, 1170.0, 1972.0, 3984.0, 8255.0, 19751.0, 62704.0, 727457.0, 162889.0, 33478.0, 12682.0, 5623.0, 2827.0, 1498.0, 896.0, 521.0, 278.0, 197.0, 144.0, 96.0, 61.0, 50.0, 31.0, 20.0, 14.0, 4.0, 8.0, 4.0, 1.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.94091796875, -0.9130401611328125, -0.885162353515625, -0.8572845458984375, -0.82940673828125, -0.8015289306640625, -0.773651123046875, -0.7457733154296875, -0.7178955078125, -0.6900177001953125, -0.662139892578125, -0.6342620849609375, -0.60638427734375, -0.5785064697265625, -0.550628662109375, -0.5227508544921875, -0.494873046875, -0.4669952392578125, -0.439117431640625, -0.4112396240234375, -0.38336181640625, -0.3554840087890625, -0.327606201171875, -0.2997283935546875, -0.2718505859375, -0.2439727783203125, -0.216094970703125, -0.1882171630859375, -0.16033935546875, -0.1324615478515625, -0.104583740234375, -0.0767059326171875, -0.048828125, -0.0209503173828125, 0.006927490234375, 0.0348052978515625, 0.06268310546875, 0.0905609130859375, 0.118438720703125, 0.1463165283203125, 0.1741943359375, 0.2020721435546875, 0.229949951171875, 0.2578277587890625, 0.28570556640625, 0.3135833740234375, 0.341461181640625, 0.3693389892578125, 0.397216796875, 0.4250946044921875, 0.452972412109375, 0.4808502197265625, 0.50872802734375, 0.5366058349609375, 0.564483642578125, 0.5923614501953125, 0.6202392578125, 0.6481170654296875, 0.675994873046875, 0.7038726806640625, 0.73175048828125, 0.7596282958984375, 0.787506103515625, 0.8153839111328125, 0.84326171875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 2.0, 6.0, 2.0, 6.0, 8.0, 5.0, 10.0, 8.0, 7.0, 13.0, 25.0, 23.0, 29.0, 57.0, 91.0, 155.0, 181.0, 147.0, 74.0, 40.0, 27.0, 11.0, 10.0, 13.0, 12.0, 5.0, 7.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.69921875, -1.6465301513671875, -1.593841552734375, -1.5411529541015625, -1.48846435546875, -1.4357757568359375, -1.383087158203125, -1.3303985595703125, -1.2777099609375, -1.2250213623046875, -1.172332763671875, -1.1196441650390625, -1.06695556640625, -1.0142669677734375, -0.961578369140625, -0.9088897705078125, -0.856201171875, -0.8035125732421875, -0.750823974609375, -0.6981353759765625, -0.64544677734375, -0.5927581787109375, -0.540069580078125, -0.4873809814453125, -0.4346923828125, -0.3820037841796875, -0.329315185546875, -0.2766265869140625, -0.22393798828125, -0.1712493896484375, -0.118560791015625, -0.0658721923828125, -0.01318359375, 0.0395050048828125, 0.092193603515625, 0.1448822021484375, 0.19757080078125, 0.2502593994140625, 0.302947998046875, 0.3556365966796875, 0.4083251953125, 0.4610137939453125, 0.513702392578125, 0.5663909912109375, 0.61907958984375, 0.6717681884765625, 0.724456787109375, 0.7771453857421875, 0.829833984375, 0.8825225830078125, 0.935211181640625, 0.9878997802734375, 1.04058837890625, 1.0932769775390625, 1.145965576171875, 1.1986541748046875, 1.2513427734375, 1.3040313720703125, 1.356719970703125, 1.4094085693359375, 1.46209716796875, 1.5147857666015625, 1.567474365234375, 1.6201629638671875, 1.6728515625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 12.0, 30.0, 123.0, 695.0, 90.0, 37.0, 18.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.58871459960938, -92.2748794555664, -86.9610366821289, -81.64720153808594, -76.33335876464844, -71.01952362060547, -65.7056884765625, -60.391845703125, -55.078006744384766, -49.76416778564453, -44.4503288269043, -39.13648986816406, -33.822654724121094, -28.508813858032227, -23.194976806640625, -17.88113784790039, -12.567298889160156, -7.25346040725708, -1.939621925354004, 3.374216079711914, 8.688055038452148, 14.001893997192383, 19.315731048583984, 24.62957000732422, 29.943408966064453, 35.25724792480469, 40.57108688354492, 45.884925842285156, 51.198760986328125, 56.512603759765625, 61.826438903808594, 67.14027404785156, 72.45411682128906, 77.76795196533203, 83.08179473876953, 88.3956298828125, 93.70947265625, 99.02330780029297, 104.33714294433594, 109.65098571777344, 114.96482849121094, 120.2786636352539, 125.5925064086914, 130.90634155273438, 136.22018432617188, 141.53402709960938, 146.8478546142578, 152.1616973876953, 157.47552490234375, 162.78936767578125, 168.1031951904297, 173.4170379638672, 178.7308807373047, 184.0447235107422, 189.35855102539062, 194.67239379882812, 199.98623657226562, 205.30007934570312, 210.61390686035156, 215.92774963378906, 221.24159240722656, 226.55543518066406, 231.8692626953125, 237.18310546875, 242.4969482421875]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 17.0, 28.0, 37.0, 45.0, 68.0, 314.0, 269.0, 59.0, 54.0, 48.0, 29.0, 22.0, 15.0, 3.0, 1.0, 0.0, 1.0], "bins": [-264.7650146484375, -259.7561950683594, -254.74737548828125, -249.7385711669922, -244.72975158691406, -239.72093200683594, -234.7121124267578, -229.7032928466797, -224.69448852539062, -219.6856689453125, -214.67684936523438, -209.6680450439453, -204.6592254638672, -199.65040588378906, -194.64158630371094, -189.6327667236328, -184.6239471435547, -179.61512756347656, -174.60630798339844, -169.59750366210938, -164.58868408203125, -159.57986450195312, -154.571044921875, -149.56222534179688, -144.55340576171875, -139.54458618164062, -134.5357666015625, -129.52696228027344, -124.51814270019531, -119.50932312011719, -114.50050354003906, -109.49168395996094, -104.48286437988281, -99.47404479980469, -94.4652328491211, -89.45641326904297, -84.44760131835938, -79.43878173828125, -74.42996215820312, -69.421142578125, -64.41233825683594, -59.40352249145508, -54.39470672607422, -49.385887145996094, -44.377071380615234, -39.368255615234375, -34.35943603515625, -29.35062026977539, -24.341800689697266, -19.332984924316406, -14.324167251586914, -9.315350532531738, -4.3065338134765625, 0.7022819519042969, 5.711099624633789, 10.719917297363281, 15.72873306274414, 20.737548828125, 25.746366500854492, 30.755184173583984, 35.763999938964844, 40.7728157043457, 45.78163146972656, 50.79045104980469, 55.79926681518555]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 6.0, 6.0, 13.0, 32.0, 38.0, 62.0, 107.0, 410.0, 90.0, 61.0, 61.0, 38.0, 33.0, 21.0, 11.0, 7.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.375, -14.03607177734375, -13.6971435546875, -13.35821533203125, -13.019287109375, -12.68035888671875, -12.3414306640625, -12.00250244140625, -11.66357421875, -11.32464599609375, -10.9857177734375, -10.64678955078125, -10.307861328125, -9.96893310546875, -9.6300048828125, -9.29107666015625, -8.9521484375, -8.61322021484375, -8.2742919921875, -7.93536376953125, -7.596435546875, -7.25750732421875, -6.9185791015625, -6.57965087890625, -6.24072265625, -5.90179443359375, -5.5628662109375, -5.22393798828125, -4.885009765625, -4.54608154296875, -4.2071533203125, -3.86822509765625, -3.529296875, -3.19036865234375, -2.8514404296875, -2.51251220703125, -2.173583984375, -1.83465576171875, -1.4957275390625, -1.15679931640625, -0.81787109375, -0.47894287109375, -0.1400146484375, 0.19891357421875, 0.537841796875, 0.87677001953125, 1.2156982421875, 1.55462646484375, 1.8935546875, 2.23248291015625, 2.5714111328125, 2.91033935546875, 3.249267578125, 3.58819580078125, 3.9271240234375, 4.26605224609375, 4.60498046875, 4.94390869140625, 5.2828369140625, 5.62176513671875, 5.960693359375, 6.29962158203125, 6.6385498046875, 6.97747802734375, 7.31640625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 9.0, 6.0, 10.0, 23.0, 42.0, 127.0, 541.0, 7873719.0, 513313.0, 577.0, 101.0, 52.0, 29.0, 7.0, 2.0, 0.0, 5.0, 1.0, 8.0, 10.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-210.20782470703125, -202.95790100097656, -195.70797729492188, -188.45803833007812, -181.20811462402344, -173.95819091796875, -166.70826721191406, -159.45834350585938, -152.20840454101562, -144.95848083496094, -137.70855712890625, -130.4586181640625, -123.20869445800781, -115.95877075195312, -108.70884704589844, -101.45892333984375, -94.20899963378906, -86.95907592773438, -79.70914459228516, -72.45922088623047, -65.20928955078125, -57.95936584472656, -50.709442138671875, -43.45951461791992, -36.20958709716797, -28.959659576416016, -21.709733963012695, -14.459808349609375, -7.209880828857422, 0.04004669189453125, 7.289970397949219, 14.539897918701172, 21.789840698242188, 29.03976821899414, 36.289695739746094, 43.53961944580078, 50.789546966552734, 58.03947448730469, 65.28939819335938, 72.53932189941406, 79.78925323486328, 87.03917694091797, 94.28910827636719, 101.53903198242188, 108.78895568847656, 116.03888702392578, 123.28881072998047, 130.5387420654297, 137.78866577148438, 145.03858947753906, 152.28851318359375, 159.5384521484375, 166.7883758544922, 174.03829956054688, 181.28822326660156, 188.53814697265625, 195.7880859375, 203.0380096435547, 210.28793334960938, 217.53787231445312, 224.7877960205078, 232.0377197265625, 239.2876434326172, 246.53756713867188, 253.78749084472656]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 0.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 2.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.9244270324707, -47.16679382324219, -44.40916442871094, -41.65153503417969, -38.89390182495117, -36.136268615722656, -33.378639221191406, -30.621007919311523, -27.86337661743164, -25.105745315551758, -22.348114013671875, -19.590482711791992, -16.83285140991211, -14.075220108032227, -11.317588806152344, -8.559957504272461, -5.802326202392578, -3.0446949005126953, -0.2870635986328125, 2.4705677032470703, 5.228199005126953, 7.985830307006836, 10.743461608886719, 13.501092910766602, 16.258724212646484, 19.016355514526367, 21.77398681640625, 24.531618118286133, 27.289249420166016, 30.0468807220459, 32.80451202392578, 35.56214141845703, 38.31977081298828, 41.07740020751953, 43.83503341674805, 46.59266662597656, 49.35029602050781, 52.10792541503906, 54.86555862426758, 57.623191833496094, 60.380821228027344, 63.138450622558594, 65.89608764648438, 68.65371704101562, 71.41134643554688, 74.16897583007812, 76.92660522460938, 79.68424224853516, 82.4418716430664, 85.19950103759766, 87.95713806152344, 90.71476745605469, 93.47239685058594, 96.23002624511719, 98.98765563964844, 101.74529266357422, 104.50292205810547, 107.26055145263672, 110.0181884765625, 112.77581787109375, 115.533447265625, 118.29107666015625, 121.0487060546875, 123.80634307861328, 126.56397247314453]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 4.0, 10.0, 13.0, 10.0, 15.0, 24.0, 35.0, 50.0, 70.0, 86.0, 116.0, 180.0, 270.0, 448.0, 735.0, 1360.0, 2493.0, 5591.0, 13805.0, 38096.0, 113793.0, 200153.0, 94522.0, 31687.0, 11498.0, 4576.0, 2013.0, 1009.0, 642.0, 337.0, 210.0, 151.0, 87.0, 48.0, 31.0, 24.0, 19.0, 17.0, 10.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.59375, -29.58837890625, -28.5830078125, -27.57763671875, -26.572265625, -25.56689453125, -24.5615234375, -23.55615234375, -22.55078125, -21.54541015625, -20.5400390625, -19.53466796875, -18.529296875, -17.52392578125, -16.5185546875, -15.51318359375, -14.5078125, -13.50244140625, -12.4970703125, -11.49169921875, -10.486328125, -9.48095703125, -8.4755859375, -7.47021484375, -6.46484375, -5.45947265625, -4.4541015625, -3.44873046875, -2.443359375, -1.43798828125, -0.4326171875, 0.57275390625, 1.578125, 2.58349609375, 3.5888671875, 4.59423828125, 5.599609375, 6.60498046875, 7.6103515625, 8.61572265625, 9.62109375, 10.62646484375, 11.6318359375, 12.63720703125, 13.642578125, 14.64794921875, 15.6533203125, 16.65869140625, 17.6640625, 18.66943359375, 19.6748046875, 20.68017578125, 21.685546875, 22.69091796875, 23.6962890625, 24.70166015625, 25.70703125, 26.71240234375, 27.7177734375, 28.72314453125, 29.728515625, 30.73388671875, 31.7392578125, 32.74462890625, 33.75]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 2.0, 7.0, 6.0, 17.0, 26.0, 29.0, 39.0, 74.0, 95.0, 106.0, 118.0, 122.0, 111.0, 81.0, 58.0, 46.0, 31.0, 23.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.9453125, -15.62030029296875, -15.2952880859375, -14.97027587890625, -14.645263671875, -14.32025146484375, -13.9952392578125, -13.67022705078125, -13.34521484375, -13.02020263671875, -12.6951904296875, -12.37017822265625, -12.045166015625, -11.72015380859375, -11.3951416015625, -11.07012939453125, -10.7451171875, -10.42010498046875, -10.0950927734375, -9.77008056640625, -9.445068359375, -9.12005615234375, -8.7950439453125, -8.47003173828125, -8.14501953125, -7.82000732421875, -7.4949951171875, -7.16998291015625, -6.844970703125, -6.51995849609375, -6.1949462890625, -5.86993408203125, -5.544921875, -5.21990966796875, -4.8948974609375, -4.56988525390625, -4.244873046875, -3.91986083984375, -3.5948486328125, -3.26983642578125, -2.94482421875, -2.61981201171875, -2.2947998046875, -1.96978759765625, -1.644775390625, -1.31976318359375, -0.9947509765625, -0.66973876953125, -0.3447265625, -0.01971435546875, 0.3052978515625, 0.63031005859375, 0.955322265625, 1.28033447265625, 1.6053466796875, 1.93035888671875, 2.25537109375, 2.58038330078125, 2.9053955078125, 3.23040771484375, 3.555419921875, 3.88043212890625, 4.2054443359375, 4.53045654296875, 4.85546875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 7.0, 10.0, 10.0, 15.0, 30.0, 57.0, 67.0, 60.0, 65.0, 54.0, 29.0, 21.0, 10.0, 16.0, 14.0, 4.0, 9.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.34465408325195, -30.872949600219727, -29.4012451171875, -27.929540634155273, -26.457836151123047, -24.98613166809082, -23.514427185058594, -22.042722702026367, -20.57101821899414, -19.099313735961914, -17.627609252929688, -16.15590476989746, -14.684200286865234, -13.212495803833008, -11.740791320800781, -10.269086837768555, -8.797382354736328, -7.325677871704102, -5.853973388671875, -4.382268905639648, -2.910564422607422, -1.4388599395751953, 0.03284454345703125, 1.5045490264892578, 2.9762535095214844, 4.447957992553711, 5.9196624755859375, 7.391366958618164, 8.86307144165039, 10.334775924682617, 11.806480407714844, 13.27818489074707, 14.749885559082031, 16.221590042114258, 17.693294525146484, 19.16499900817871, 20.636703491210938, 22.108407974243164, 23.58011245727539, 25.051816940307617, 26.523521423339844, 27.99522590637207, 29.466930389404297, 30.938634872436523, 32.41033935546875, 33.882041931152344, 35.3537483215332, 36.82545471191406, 38.297157287597656, 39.76885986328125, 41.24056625366211, 42.71227264404297, 44.18397521972656, 45.655677795410156, 47.127384185791016, 48.599090576171875, 50.07079315185547, 51.54249572753906, 53.01420211791992, 54.48590850830078, 55.957611083984375, 57.42931365966797, 58.90102005004883, 60.37272644042969, 61.84442901611328]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 7.0, 7.0, 13.0, 17.0, 24.0, 23.0, 47.0, 58.0, 51.0, 46.0, 44.0, 42.0, 29.0, 20.0, 9.0, 8.0, 9.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.21632957458496, -27.327625274658203, -26.438922882080078, -25.550220489501953, -24.661516189575195, -23.772811889648438, -22.884109497070312, -21.995407104492188, -21.10670280456543, -20.217998504638672, -19.329296112060547, -18.440593719482422, -17.551889419555664, -16.663185119628906, -15.774482727050781, -14.88577938079834, -13.997076034545898, -13.108372688293457, -12.219669342041016, -11.330965995788574, -10.442262649536133, -9.553559303283691, -8.66485595703125, -7.776152610778809, -6.887449264526367, -5.998745918273926, -5.110042572021484, -4.221339225769043, -3.3326358795166016, -2.44393253326416, -1.5552291870117188, -0.6665258407592773, 0.22217750549316406, 1.1108808517456055, 1.9995841979980469, 2.8882875442504883, 3.7769908905029297, 4.665694236755371, 5.5543975830078125, 6.443100929260254, 7.331804275512695, 8.220507621765137, 9.109210968017578, 9.99791431427002, 10.886617660522461, 11.775321006774902, 12.664024353027344, 13.552727699279785, 14.441431045532227, 15.330134391784668, 16.21883773803711, 17.107540130615234, 17.996244430541992, 18.88494873046875, 19.773651123046875, 20.662353515625, 21.551057815551758, 22.439762115478516, 23.32846450805664, 24.217166900634766, 25.105871200561523, 25.99457550048828, 26.883277893066406, 27.77198028564453, 28.66068458557129]}, "eval/loss": 2.062474012374878, "eval/wer": 0.3362752875842919, "eval/runtime": 841.7974, "eval/samples_per_second": 3.139, "eval/steps_per_second": 0.393} \ No newline at end of file +{"train/loss": 0.407, "train/learning_rate": 5.068289786223278e-06, "train/epoch": 16.82, "train/global_step": 15000, "_runtime": 91322, "_timestamp": 1647465864, "_step": 15009, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 5.0, 6.0, 8.0, 8.0, 6.0, 10.0, 12.0, 12.0, 15.0, 13.0, 20.0, 16.0, 17.0, 20.0, 26.0, 33.0, 38.0, 35.0, 47.0, 34.0, 38.0, 30.0, 56.0, 54.0, 39.0, 44.0, 38.0, 32.0, 33.0, 29.0, 33.0, 26.0, 23.0, 20.0, 16.0, 33.0, 19.0, 16.0, 8.0, 9.0, 4.0, 11.0, 7.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0], "bins": [-28.95673179626465, -28.36270523071289, -27.768680572509766, -27.174654006958008, -26.58062744140625, -25.986602783203125, -25.392576217651367, -24.79854965209961, -24.204524993896484, -23.610498428344727, -23.0164737701416, -22.422447204589844, -21.82842254638672, -21.23439598083496, -20.640369415283203, -20.046344757080078, -19.45231819152832, -18.858291625976562, -18.264266967773438, -17.67024040222168, -17.076213836669922, -16.482189178466797, -15.888162612915039, -15.294137001037598, -14.700111389160156, -14.106085777282715, -13.512060165405273, -12.918033599853516, -12.324007987976074, -11.729982376098633, -11.135955810546875, -10.541930198669434, -9.94790267944336, -9.353877067565918, -8.759851455688477, -8.165824890136719, -7.571799278259277, -6.977773666381836, -6.383747577667236, -5.789721488952637, -5.195695877075195, -4.601670265197754, -4.007644176483154, -3.413618326187134, -2.8195924758911133, -2.2255666255950928, -1.6315407752990723, -1.0375146865844727, -0.44348907470703125, 0.15053677558898926, 0.7445626258850098, 1.3385884761810303, 1.9326143264770508, 2.5266401767730713, 3.120666027069092, 3.7146921157836914, 4.308717727661133, 4.902743339538574, 5.496769428253174, 6.090795516967773, 6.684821128845215, 7.278846740722656, 7.872872829437256, 8.466898918151855, 9.060924530029297]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 1.0, 3.0, 10.0, 9.0, 17.0, 18.0, 19.0, 24.0, 31.0, 38.0, 29.0, 31.0, 30.0, 46.0, 37.0, 34.0, 49.0, 47.0, 43.0, 51.0, 48.0, 48.0, 35.0, 48.0, 34.0, 29.0, 44.0, 21.0, 17.0, 28.0, 17.0, 12.0, 17.0, 10.0, 4.0, 5.0, 8.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.945802688598633, -20.255102157592773, -19.56439971923828, -18.873699188232422, -18.182998657226562, -17.492298126220703, -16.80159568786621, -16.11089515686035, -15.420193672180176, -14.7294921875, -14.03879165649414, -13.348090171813965, -12.657388687133789, -11.96668815612793, -11.275986671447754, -10.585285186767578, -9.894584655761719, -9.203883171081543, -8.513182640075684, -7.822481155395508, -7.13178014755249, -6.441079139709473, -5.750377655029297, -5.059676647186279, -4.368975639343262, -3.678274631500244, -2.9875733852386475, -2.296872138977051, -1.6061711311340332, -0.9154701232910156, -0.22476863861083984, 0.46593236923217773, 1.1566352844238281, 1.8473364114761353, 2.5380375385284424, 3.228738784790039, 3.9194397926330566, 4.610140800476074, 5.30084228515625, 5.991543292999268, 6.682244300842285, 7.372945308685303, 8.06364631652832, 8.754347801208496, 9.445049285888672, 10.135749816894531, 10.826451301574707, 11.517152786254883, 12.207853317260742, 12.898554801940918, 13.589255332946777, 14.279956817626953, 14.970657348632812, 15.661358833312988, 16.352060317993164, 17.042760848999023, 17.733463287353516, 18.424163818359375, 19.114866256713867, 19.805566787719727, 20.496267318725586, 21.186969757080078, 21.877670288085938, 22.568370819091797, 23.259071350097656]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 9.0, 25.0, 27.0, 27.0, 47.0, 69.0, 119.0, 210.0, 354.0, 554.0, 817.0, 1277.0, 2081.0, 3226.0, 5063.0, 7985.0, 12982.0, 20665.0, 32723.0, 50968.0, 79661.0, 122164.0, 184971.0, 269876.0, 374009.0, 481122.0, 542440.0, 528671.0, 444904.0, 336738.0, 237256.0, 161762.0, 105898.0, 68870.0, 43319.0, 27443.0, 17293.0, 10880.0, 6669.0, 4241.0, 2566.0, 1655.0, 1030.0, 593.0, 446.0, 233.0, 160.0, 78.0, 41.0, 31.0, 15.0, 12.0, 5.0, 2.0, 4.0, 3.0, 2.0], "bins": [-35.09375, -34.05615234375, -33.0185546875, -31.98095703125, -30.943359375, -29.90576171875, -28.8681640625, -27.83056640625, -26.79296875, -25.75537109375, -24.7177734375, -23.68017578125, -22.642578125, -21.60498046875, -20.5673828125, -19.52978515625, -18.4921875, -17.45458984375, -16.4169921875, -15.37939453125, -14.341796875, -13.30419921875, -12.2666015625, -11.22900390625, -10.19140625, -9.15380859375, -8.1162109375, -7.07861328125, -6.041015625, -5.00341796875, -3.9658203125, -2.92822265625, -1.890625, -0.85302734375, 0.1845703125, 1.22216796875, 2.259765625, 3.29736328125, 4.3349609375, 5.37255859375, 6.41015625, 7.44775390625, 8.4853515625, 9.52294921875, 10.560546875, 11.59814453125, 12.6357421875, 13.67333984375, 14.7109375, 15.74853515625, 16.7861328125, 17.82373046875, 18.861328125, 19.89892578125, 20.9365234375, 21.97412109375, 23.01171875, 24.04931640625, 25.0869140625, 26.12451171875, 27.162109375, 28.19970703125, 29.2373046875, 30.27490234375, 31.3125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 8.0, 11.0, 16.0, 16.0, 16.0, 24.0, 33.0, 28.0, 23.0, 40.0, 25.0, 34.0, 41.0, 43.0, 42.0, 41.0, 47.0, 35.0, 50.0, 45.0, 44.0, 44.0, 44.0, 22.0, 38.0, 34.0, 29.0, 21.0, 24.0, 11.0, 19.0, 6.0, 11.0, 9.0, 6.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-24.078125, -23.328857421875, -22.57958984375, -21.830322265625, -21.0810546875, -20.331787109375, -19.58251953125, -18.833251953125, -18.083984375, -17.334716796875, -16.58544921875, -15.836181640625, -15.0869140625, -14.337646484375, -13.58837890625, -12.839111328125, -12.08984375, -11.340576171875, -10.59130859375, -9.842041015625, -9.0927734375, -8.343505859375, -7.59423828125, -6.844970703125, -6.095703125, -5.346435546875, -4.59716796875, -3.847900390625, -3.0986328125, -2.349365234375, -1.60009765625, -0.850830078125, -0.1015625, 0.647705078125, 1.39697265625, 2.146240234375, 2.8955078125, 3.644775390625, 4.39404296875, 5.143310546875, 5.892578125, 6.641845703125, 7.39111328125, 8.140380859375, 8.8896484375, 9.638916015625, 10.38818359375, 11.137451171875, 11.88671875, 12.635986328125, 13.38525390625, 14.134521484375, 14.8837890625, 15.633056640625, 16.38232421875, 17.131591796875, 17.880859375, 18.630126953125, 19.37939453125, 20.128662109375, 20.8779296875, 21.627197265625, 22.37646484375, 23.125732421875, 23.875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 7.0, 7.0, 9.0, 25.0, 31.0, 61.0, 106.0, 165.0, 316.0, 478.0, 760.0, 1139.0, 1980.0, 3118.0, 5040.0, 7906.0, 12632.0, 19650.0, 30312.0, 46414.0, 69647.0, 101415.0, 146392.0, 202362.0, 268835.0, 337960.0, 397390.0, 433418.0, 434615.0, 399124.0, 340668.0, 271133.0, 204819.0, 148003.0, 104393.0, 71290.0, 47536.0, 30513.0, 20039.0, 12926.0, 8146.0, 5080.0, 3190.0, 2060.0, 1251.0, 745.0, 463.0, 300.0, 164.0, 105.0, 63.0, 32.0, 32.0, 10.0, 7.0, 8.0, 4.0, 0.0, 0.0, 2.0], "bins": [-22.546875, -21.8427734375, -21.138671875, -20.4345703125, -19.73046875, -19.0263671875, -18.322265625, -17.6181640625, -16.9140625, -16.2099609375, -15.505859375, -14.8017578125, -14.09765625, -13.3935546875, -12.689453125, -11.9853515625, -11.28125, -10.5771484375, -9.873046875, -9.1689453125, -8.46484375, -7.7607421875, -7.056640625, -6.3525390625, -5.6484375, -4.9443359375, -4.240234375, -3.5361328125, -2.83203125, -2.1279296875, -1.423828125, -0.7197265625, -0.015625, 0.6884765625, 1.392578125, 2.0966796875, 2.80078125, 3.5048828125, 4.208984375, 4.9130859375, 5.6171875, 6.3212890625, 7.025390625, 7.7294921875, 8.43359375, 9.1376953125, 9.841796875, 10.5458984375, 11.25, 11.9541015625, 12.658203125, 13.3623046875, 14.06640625, 14.7705078125, 15.474609375, 16.1787109375, 16.8828125, 17.5869140625, 18.291015625, 18.9951171875, 19.69921875, 20.4033203125, 21.107421875, 21.8115234375, 22.515625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 4.0, 17.0, 17.0, 21.0, 20.0, 22.0, 57.0, 43.0, 36.0, 59.0, 77.0, 90.0, 103.0, 109.0, 136.0, 125.0, 162.0, 161.0, 163.0, 202.0, 193.0, 207.0, 208.0, 176.0, 189.0, 192.0, 186.0, 155.0, 127.0, 134.0, 121.0, 87.0, 85.0, 55.0, 67.0, 46.0, 44.0, 34.0, 31.0, 22.0, 15.0, 20.0, 18.0, 10.0, 7.0, 3.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0], "bins": [-12.2421875, -11.8797607421875, -11.517333984375, -11.1549072265625, -10.79248046875, -10.4300537109375, -10.067626953125, -9.7052001953125, -9.3427734375, -8.9803466796875, -8.617919921875, -8.2554931640625, -7.89306640625, -7.5306396484375, -7.168212890625, -6.8057861328125, -6.443359375, -6.0809326171875, -5.718505859375, -5.3560791015625, -4.99365234375, -4.6312255859375, -4.268798828125, -3.9063720703125, -3.5439453125, -3.1815185546875, -2.819091796875, -2.4566650390625, -2.09423828125, -1.7318115234375, -1.369384765625, -1.0069580078125, -0.64453125, -0.2821044921875, 0.080322265625, 0.4427490234375, 0.80517578125, 1.1676025390625, 1.530029296875, 1.8924560546875, 2.2548828125, 2.6173095703125, 2.979736328125, 3.3421630859375, 3.70458984375, 4.0670166015625, 4.429443359375, 4.7918701171875, 5.154296875, 5.5167236328125, 5.879150390625, 6.2415771484375, 6.60400390625, 6.9664306640625, 7.328857421875, 7.6912841796875, 8.0537109375, 8.4161376953125, 8.778564453125, 9.1409912109375, 9.50341796875, 9.8658447265625, 10.228271484375, 10.5906982421875, 10.953125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 4.0, 5.0, 4.0, 3.0, 10.0, 7.0, 10.0, 15.0, 11.0, 14.0, 26.0, 27.0, 34.0, 29.0, 19.0, 26.0, 42.0, 36.0, 33.0, 40.0, 53.0, 34.0, 44.0, 38.0, 43.0, 32.0, 39.0, 38.0, 30.0, 30.0, 30.0, 31.0, 19.0, 22.0, 18.0, 15.0, 18.0, 17.0, 9.0, 11.0, 10.0, 2.0, 11.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.393644332885742, -23.595495223999023, -22.797346115112305, -21.999197006225586, -21.201047897338867, -20.40289878845215, -19.604747772216797, -18.806598663330078, -18.00844955444336, -17.21030044555664, -16.412151336669922, -15.614002227783203, -14.815853118896484, -14.017704010009766, -13.21955394744873, -12.421404838562012, -11.62325668334961, -10.82510757446289, -10.026958465576172, -9.228809356689453, -8.430660247802734, -7.632510662078857, -6.8343610763549805, -6.036211967468262, -5.238062858581543, -4.439913749694824, -3.6417644023895264, -2.8436150550842285, -2.0454659461975098, -1.247316837310791, -0.44916725158691406, 0.3489818572998047, 1.1471309661865234, 1.9452801942825317, 2.74342942237854, 3.541578769683838, 4.339727878570557, 5.137876987457275, 5.936026573181152, 6.734175682067871, 7.53232479095459, 8.330473899841309, 9.128623008728027, 9.926773071289062, 10.724922180175781, 11.5230712890625, 12.321220397949219, 13.119369506835938, 13.917518615722656, 14.715667724609375, 15.513816833496094, 16.311965942382812, 17.11011505126953, 17.90826416015625, 18.70641326904297, 19.504562377929688, 20.302711486816406, 21.100860595703125, 21.899009704589844, 22.697158813476562, 23.49530792236328, 24.29345703125, 25.09160614013672, 25.889755249023438, 26.68790626525879]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 3.0, 6.0, 7.0, 15.0, 13.0, 14.0, 17.0, 31.0, 23.0, 26.0, 28.0, 27.0, 43.0, 23.0, 39.0, 51.0, 34.0, 46.0, 56.0, 48.0, 47.0, 51.0, 38.0, 42.0, 41.0, 27.0, 32.0, 37.0, 25.0, 23.0, 14.0, 13.0, 13.0, 15.0, 7.0, 4.0, 5.0, 6.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.80069923400879, -27.835338592529297, -26.869979858398438, -25.904619216918945, -24.939258575439453, -23.973899841308594, -23.0085391998291, -22.04317855834961, -21.07781982421875, -20.112459182739258, -19.1471004486084, -18.181739807128906, -17.216379165649414, -16.251018524169922, -15.285659790039062, -14.32029914855957, -13.354938507080078, -12.389578819274902, -11.42421817779541, -10.458858489990234, -9.493497848510742, -8.528138160705566, -7.562778472900391, -6.597418308258057, -5.632058143615723, -4.666697978973389, -3.701338052749634, -2.735978126525879, -1.770617961883545, -0.8052577972412109, 0.16010189056396484, 1.1254620552062988, 2.0908241271972656, 3.0561842918395996, 4.021544456481934, 4.986904144287109, 5.952264308929443, 6.917624473571777, 7.882984161376953, 8.848344802856445, 9.813704490661621, 10.779064178466797, 11.744424819946289, 12.709784507751465, 13.67514419555664, 14.640504837036133, 15.605864524841309, 16.571224212646484, 17.536584854125977, 18.50194549560547, 19.467304229736328, 20.43266487121582, 21.398025512695312, 22.363384246826172, 23.328744888305664, 24.294105529785156, 25.259464263916016, 26.224824905395508, 27.190183639526367, 28.15554428100586, 29.12090492248535, 30.086265563964844, 31.051624298095703, 32.01698303222656, 32.98234558105469]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 5.0, 18.0, 23.0, 27.0, 47.0, 65.0, 105.0, 160.0, 254.0, 419.0, 654.0, 1072.0, 1639.0, 2761.0, 4585.0, 7591.0, 12383.0, 20590.0, 34119.0, 54869.0, 84448.0, 119540.0, 147340.0, 151990.0, 132365.0, 98700.0, 66229.0, 41995.0, 25246.0, 15586.0, 9248.0, 5606.0, 3347.0, 2013.0, 1311.0, 801.0, 496.0, 315.0, 215.0, 125.0, 94.0, 52.0, 30.0, 22.0, 10.0, 15.0, 10.0, 11.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-11.984375, -11.634033203125, -11.28369140625, -10.933349609375, -10.5830078125, -10.232666015625, -9.88232421875, -9.531982421875, -9.181640625, -8.831298828125, -8.48095703125, -8.130615234375, -7.7802734375, -7.429931640625, -7.07958984375, -6.729248046875, -6.37890625, -6.028564453125, -5.67822265625, -5.327880859375, -4.9775390625, -4.627197265625, -4.27685546875, -3.926513671875, -3.576171875, -3.225830078125, -2.87548828125, -2.525146484375, -2.1748046875, -1.824462890625, -1.47412109375, -1.123779296875, -0.7734375, -0.423095703125, -0.07275390625, 0.277587890625, 0.6279296875, 0.978271484375, 1.32861328125, 1.678955078125, 2.029296875, 2.379638671875, 2.72998046875, 3.080322265625, 3.4306640625, 3.781005859375, 4.13134765625, 4.481689453125, 4.83203125, 5.182373046875, 5.53271484375, 5.883056640625, 6.2333984375, 6.583740234375, 6.93408203125, 7.284423828125, 7.634765625, 7.985107421875, 8.33544921875, 8.685791015625, 9.0361328125, 9.386474609375, 9.73681640625, 10.087158203125, 10.4375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 3.0, 4.0, 7.0, 6.0, 14.0, 12.0, 17.0, 19.0, 31.0, 19.0, 26.0, 32.0, 26.0, 40.0, 30.0, 40.0, 50.0, 35.0, 36.0, 63.0, 45.0, 56.0, 43.0, 41.0, 37.0, 41.0, 28.0, 34.0, 33.0, 24.0, 21.0, 20.0, 15.0, 12.0, 10.0, 7.0, 6.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.34375, -28.359375, -27.375, -26.390625, -25.40625, -24.421875, -23.4375, -22.453125, -21.46875, -20.484375, -19.5, -18.515625, -17.53125, -16.546875, -15.5625, -14.578125, -13.59375, -12.609375, -11.625, -10.640625, -9.65625, -8.671875, -7.6875, -6.703125, -5.71875, -4.734375, -3.75, -2.765625, -1.78125, -0.796875, 0.1875, 1.171875, 2.15625, 3.140625, 4.125, 5.109375, 6.09375, 7.078125, 8.0625, 9.046875, 10.03125, 11.015625, 12.0, 12.984375, 13.96875, 14.953125, 15.9375, 16.921875, 17.90625, 18.890625, 19.875, 20.859375, 21.84375, 22.828125, 23.8125, 24.796875, 25.78125, 26.765625, 27.75, 28.734375, 29.71875, 30.703125, 31.6875, 32.671875, 33.65625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 7.0, 15.0, 13.0, 31.0, 58.0, 84.0, 161.0, 270.0, 511.0, 873.0, 1688.0, 3458.0, 7187.0, 15107.0, 36929.0, 864868.0, 74524.0, 22471.0, 10326.0, 4833.0, 2374.0, 1205.0, 690.0, 347.0, 194.0, 132.0, 67.0, 46.0, 37.0, 13.0, 12.0, 8.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.625, -32.53125, -31.4375, -30.34375, -29.25, -28.15625, -27.0625, -25.96875, -24.875, -23.78125, -22.6875, -21.59375, -20.5, -19.40625, -18.3125, -17.21875, -16.125, -15.03125, -13.9375, -12.84375, -11.75, -10.65625, -9.5625, -8.46875, -7.375, -6.28125, -5.1875, -4.09375, -3.0, -1.90625, -0.8125, 0.28125, 1.375, 2.46875, 3.5625, 4.65625, 5.75, 6.84375, 7.9375, 9.03125, 10.125, 11.21875, 12.3125, 13.40625, 14.5, 15.59375, 16.6875, 17.78125, 18.875, 19.96875, 21.0625, 22.15625, 23.25, 24.34375, 25.4375, 26.53125, 27.625, 28.71875, 29.8125, 30.90625, 32.0, 33.09375, 34.1875, 35.28125, 36.375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 0.0, 0.0, 8.0, 2.0, 5.0, 8.0, 10.0, 12.0, 7.0, 13.0, 17.0, 17.0, 22.0, 32.0, 29.0, 17.0, 39.0, 30.0, 44.0, 34.0, 36.0, 40.0, 55.0, 42.0, 48.0, 49.0, 43.0, 40.0, 42.0, 34.0, 34.0, 26.0, 25.0, 22.0, 18.0, 12.0, 13.0, 17.0, 14.0, 15.0, 11.0, 5.0, 4.0, 6.0, 1.0, 6.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.40625, -18.760498046875, -18.11474609375, -17.468994140625, -16.8232421875, -16.177490234375, -15.53173828125, -14.885986328125, -14.240234375, -13.594482421875, -12.94873046875, -12.302978515625, -11.6572265625, -11.011474609375, -10.36572265625, -9.719970703125, -9.07421875, -8.428466796875, -7.78271484375, -7.136962890625, -6.4912109375, -5.845458984375, -5.19970703125, -4.553955078125, -3.908203125, -3.262451171875, -2.61669921875, -1.970947265625, -1.3251953125, -0.679443359375, -0.03369140625, 0.612060546875, 1.2578125, 1.903564453125, 2.54931640625, 3.195068359375, 3.8408203125, 4.486572265625, 5.13232421875, 5.778076171875, 6.423828125, 7.069580078125, 7.71533203125, 8.361083984375, 9.0068359375, 9.652587890625, 10.29833984375, 10.944091796875, 11.58984375, 12.235595703125, 12.88134765625, 13.527099609375, 14.1728515625, 14.818603515625, 15.46435546875, 16.110107421875, 16.755859375, 17.401611328125, 18.04736328125, 18.693115234375, 19.3388671875, 19.984619140625, 20.63037109375, 21.276123046875, 21.921875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 13.0, 8.0, 11.0, 8.0, 20.0, 33.0, 44.0, 67.0, 147.0, 224.0, 385.0, 731.0, 1412.0, 2903.0, 6059.0, 14453.0, 37534.0, 868771.0, 77039.0, 21681.0, 8808.0, 3922.0, 1997.0, 991.0, 525.0, 275.0, 180.0, 109.0, 60.0, 43.0, 29.0, 21.0, 11.0, 11.0, 8.0, 7.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.876953125, -2.786285400390625, -2.69561767578125, -2.604949951171875, -2.5142822265625, -2.423614501953125, -2.33294677734375, -2.242279052734375, -2.151611328125, -2.060943603515625, -1.97027587890625, -1.879608154296875, -1.7889404296875, -1.698272705078125, -1.60760498046875, -1.516937255859375, -1.42626953125, -1.335601806640625, -1.24493408203125, -1.154266357421875, -1.0635986328125, -0.972930908203125, -0.88226318359375, -0.791595458984375, -0.700927734375, -0.610260009765625, -0.51959228515625, -0.428924560546875, -0.3382568359375, -0.247589111328125, -0.15692138671875, -0.066253662109375, 0.0244140625, 0.115081787109375, 0.20574951171875, 0.296417236328125, 0.3870849609375, 0.477752685546875, 0.56842041015625, 0.659088134765625, 0.749755859375, 0.840423583984375, 0.93109130859375, 1.021759033203125, 1.1124267578125, 1.203094482421875, 1.29376220703125, 1.384429931640625, 1.47509765625, 1.565765380859375, 1.65643310546875, 1.747100830078125, 1.8377685546875, 1.928436279296875, 2.01910400390625, 2.109771728515625, 2.200439453125, 2.291107177734375, 2.38177490234375, 2.472442626953125, 2.5631103515625, 2.653778076171875, 2.74444580078125, 2.835113525390625, 2.92578125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 7.0, 7.0, 11.0, 15.0, 18.0, 19.0, 35.0, 44.0, 65.0, 70.0, 105.0, 110.0, 104.0, 98.0, 84.0, 52.0, 53.0, 28.0, 25.0, 17.0, 12.0, 10.0, 4.0, 4.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020039081573486328, -0.0001936890184879303, -0.00018698722124099731, -0.00018028542399406433, -0.00017358362674713135, -0.00016688182950019836, -0.00016018003225326538, -0.0001534782350063324, -0.00014677643775939941, -0.00014007464051246643, -0.00013337284326553345, -0.00012667104601860046, -0.00011996924877166748, -0.0001132674515247345, -0.00010656565427780151, -9.986385703086853e-05, -9.316205978393555e-05, -8.646026253700256e-05, -7.975846529006958e-05, -7.30566680431366e-05, -6.635487079620361e-05, -5.965307354927063e-05, -5.2951276302337646e-05, -4.624947905540466e-05, -3.954768180847168e-05, -3.2845884561538696e-05, -2.6144087314605713e-05, -1.944229006767273e-05, -1.2740492820739746e-05, -6.038695573806763e-06, 6.631016731262207e-07, 7.364898920059204e-06, 1.4066696166992188e-05, 2.076849341392517e-05, 2.7470290660858154e-05, 3.417208790779114e-05, 4.087388515472412e-05, 4.7575682401657104e-05, 5.427747964859009e-05, 6.097927689552307e-05, 6.768107414245605e-05, 7.438287138938904e-05, 8.108466863632202e-05, 8.7786465883255e-05, 9.448826313018799e-05, 0.00010119006037712097, 0.00010789185762405396, 0.00011459365487098694, 0.00012129545211791992, 0.0001279972493648529, 0.0001346990466117859, 0.00014140084385871887, 0.00014810264110565186, 0.00015480443835258484, 0.00016150623559951782, 0.0001682080328464508, 0.0001749098300933838, 0.00018161162734031677, 0.00018831342458724976, 0.00019501522183418274, 0.00020171701908111572, 0.0002084188163280487, 0.0002151206135749817, 0.00022182241082191467, 0.00022852420806884766]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 4.0, 4.0, 16.0, 11.0, 10.0, 12.0, 21.0, 29.0, 38.0, 60.0, 72.0, 116.0, 160.0, 228.0, 440.0, 779.0, 1410.0, 2660.0, 5482.0, 11064.0, 22973.0, 46387.0, 87527.0, 148946.0, 206704.0, 202582.0, 141717.0, 83115.0, 43266.0, 21508.0, 10531.0, 4967.0, 2528.0, 1263.0, 698.0, 437.0, 256.0, 142.0, 96.0, 71.0, 55.0, 29.0, 33.0, 21.0, 19.0, 16.0, 12.0, 8.0, 8.0, 5.0, 3.0, 7.0, 4.0, 2.0, 0.0, 1.0, 3.0], "bins": [-2.564453125, -2.48419189453125, -2.4039306640625, -2.32366943359375, -2.243408203125, -2.16314697265625, -2.0828857421875, -2.00262451171875, -1.92236328125, -1.84210205078125, -1.7618408203125, -1.68157958984375, -1.601318359375, -1.52105712890625, -1.4407958984375, -1.36053466796875, -1.2802734375, -1.20001220703125, -1.1197509765625, -1.03948974609375, -0.959228515625, -0.87896728515625, -0.7987060546875, -0.71844482421875, -0.63818359375, -0.55792236328125, -0.4776611328125, -0.39739990234375, -0.317138671875, -0.23687744140625, -0.1566162109375, -0.07635498046875, 0.00390625, 0.08416748046875, 0.1644287109375, 0.24468994140625, 0.324951171875, 0.40521240234375, 0.4854736328125, 0.56573486328125, 0.64599609375, 0.72625732421875, 0.8065185546875, 0.88677978515625, 0.967041015625, 1.04730224609375, 1.1275634765625, 1.20782470703125, 1.2880859375, 1.36834716796875, 1.4486083984375, 1.52886962890625, 1.609130859375, 1.68939208984375, 1.7696533203125, 1.84991455078125, 1.93017578125, 2.01043701171875, 2.0906982421875, 2.17095947265625, 2.251220703125, 2.33148193359375, 2.4117431640625, 2.49200439453125, 2.572265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 9.0, 10.0, 13.0, 10.0, 13.0, 19.0, 26.0, 35.0, 47.0, 57.0, 58.0, 86.0, 74.0, 96.0, 82.0, 69.0, 55.0, 56.0, 45.0, 40.0, 32.0, 17.0, 19.0, 12.0, 9.0, 4.0, 6.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.115234375, -1.079681396484375, -1.04412841796875, -1.008575439453125, -0.9730224609375, -0.937469482421875, -0.90191650390625, -0.866363525390625, -0.830810546875, -0.795257568359375, -0.75970458984375, -0.724151611328125, -0.6885986328125, -0.653045654296875, -0.61749267578125, -0.581939697265625, -0.54638671875, -0.510833740234375, -0.47528076171875, -0.439727783203125, -0.4041748046875, -0.368621826171875, -0.33306884765625, -0.297515869140625, -0.261962890625, -0.226409912109375, -0.19085693359375, -0.155303955078125, -0.1197509765625, -0.084197998046875, -0.04864501953125, -0.013092041015625, 0.0224609375, 0.058013916015625, 0.09356689453125, 0.129119873046875, 0.1646728515625, 0.200225830078125, 0.23577880859375, 0.271331787109375, 0.306884765625, 0.342437744140625, 0.37799072265625, 0.413543701171875, 0.4490966796875, 0.484649658203125, 0.52020263671875, 0.555755615234375, 0.59130859375, 0.626861572265625, 0.66241455078125, 0.697967529296875, 0.7335205078125, 0.769073486328125, 0.80462646484375, 0.840179443359375, 0.875732421875, 0.911285400390625, 0.94683837890625, 0.982391357421875, 1.0179443359375, 1.053497314453125, 1.08905029296875, 1.124603271484375, 1.16015625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 7.0, 3.0, 6.0, 6.0, 12.0, 7.0, 12.0, 15.0, 16.0, 25.0, 30.0, 29.0, 26.0, 28.0, 31.0, 24.0, 37.0, 49.0, 37.0, 31.0, 38.0, 42.0, 41.0, 36.0, 46.0, 37.0, 36.0, 36.0, 32.0, 26.0, 18.0, 26.0, 19.0, 25.0, 20.0, 17.0, 16.0, 8.0, 14.0, 6.0, 4.0, 8.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.033145904541016, -23.22198486328125, -22.410825729370117, -21.59966468811035, -20.788503646850586, -19.977344512939453, -19.166183471679688, -18.355022430419922, -17.54386329650879, -16.732702255249023, -15.921542167663574, -15.110382080078125, -14.299221992492676, -13.488061904907227, -12.676900863647461, -11.865740776062012, -11.054579734802246, -10.243419647216797, -9.432258605957031, -8.621098518371582, -7.809938430786133, -6.998777866363525, -6.187617301940918, -5.376457214355469, -4.565296649932861, -3.754136323928833, -2.9429759979248047, -2.1318154335021973, -1.320655107498169, -0.5094947814941406, 0.3016657829284668, 1.112825870513916, 1.9239864349365234, 2.7351467609405518, 3.54630708694458, 4.3574676513671875, 5.168627738952637, 5.979788303375244, 6.790948867797852, 7.602108955383301, 8.41326904296875, 9.2244291305542, 10.035590171813965, 10.846750259399414, 11.657910346984863, 12.469070434570312, 13.280231475830078, 14.091391563415527, 14.902552604675293, 15.713712692260742, 16.524873733520508, 17.33603286743164, 18.147193908691406, 18.958354949951172, 19.769515991210938, 20.58067512512207, 21.391836166381836, 22.2029972076416, 23.014156341552734, 23.8253173828125, 24.636478424072266, 25.4476375579834, 26.258798599243164, 27.069957733154297, 27.881118774414062]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 3.0, 4.0, 7.0, 14.0, 11.0, 18.0, 13.0, 28.0, 21.0, 28.0, 32.0, 20.0, 40.0, 36.0, 35.0, 48.0, 34.0, 40.0, 54.0, 57.0, 48.0, 45.0, 49.0, 30.0, 46.0, 28.0, 36.0, 32.0, 27.0, 19.0, 25.0, 14.0, 12.0, 10.0, 11.0, 4.0, 6.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.725088119506836, -28.738977432250977, -27.752866744995117, -26.766756057739258, -25.7806453704834, -24.79453468322754, -23.808422088623047, -22.822311401367188, -21.836200714111328, -20.85009002685547, -19.86397933959961, -18.87786865234375, -17.89175796508789, -16.90564727783203, -15.919535636901855, -14.933424949645996, -13.947315216064453, -12.961204528808594, -11.975093841552734, -10.988983154296875, -10.002872467041016, -9.016761779785156, -8.03065013885498, -7.044539451599121, -6.058428764343262, -5.072318077087402, -4.086207389831543, -3.1000962257385254, -2.113985538482666, -1.1278748512268066, -0.14176368713378906, 0.8443470001220703, 1.8304595947265625, 2.816570281982422, 3.8026812076568604, 4.788792133331299, 5.774902820587158, 6.761013507843018, 7.747124671936035, 8.733235359191895, 9.719346046447754, 10.705456733703613, 11.691567420959473, 12.677679061889648, 13.663789749145508, 14.649900436401367, 15.636011123657227, 16.622121810913086, 17.608232498168945, 18.594343185424805, 19.580453872680664, 20.566564559936523, 21.552675247192383, 22.538785934448242, 23.524898529052734, 24.511009216308594, 25.497119903564453, 26.483230590820312, 27.469341278076172, 28.45545196533203, 29.44156265258789, 30.42767333984375, 31.41378402709961, 32.39989471435547, 33.38600540161133]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 9.0, 10.0, 15.0, 35.0, 29.0, 56.0, 79.0, 133.0, 198.0, 306.0, 482.0, 778.0, 1216.0, 1890.0, 2983.0, 4700.0, 6992.0, 10813.0, 15434.0, 22852.0, 31581.0, 42774.0, 56053.0, 70127.0, 83473.0, 92837.0, 98470.0, 95830.0, 89366.0, 78191.0, 64383.0, 50612.0, 38540.0, 27998.0, 19730.0, 13468.0, 8980.0, 6082.0, 3936.0, 2608.0, 1635.0, 1053.0, 648.0, 407.0, 265.0, 178.0, 111.0, 68.0, 56.0, 39.0, 21.0, 16.0, 5.0, 5.0, 5.0, 3.0, 3.0], "bins": [-21.0625, -20.439453125, -19.81640625, -19.193359375, -18.5703125, -17.947265625, -17.32421875, -16.701171875, -16.078125, -15.455078125, -14.83203125, -14.208984375, -13.5859375, -12.962890625, -12.33984375, -11.716796875, -11.09375, -10.470703125, -9.84765625, -9.224609375, -8.6015625, -7.978515625, -7.35546875, -6.732421875, -6.109375, -5.486328125, -4.86328125, -4.240234375, -3.6171875, -2.994140625, -2.37109375, -1.748046875, -1.125, -0.501953125, 0.12109375, 0.744140625, 1.3671875, 1.990234375, 2.61328125, 3.236328125, 3.859375, 4.482421875, 5.10546875, 5.728515625, 6.3515625, 6.974609375, 7.59765625, 8.220703125, 8.84375, 9.466796875, 10.08984375, 10.712890625, 11.3359375, 11.958984375, 12.58203125, 13.205078125, 13.828125, 14.451171875, 15.07421875, 15.697265625, 16.3203125, 16.943359375, 17.56640625, 18.189453125, 18.8125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 6.0, 5.0, 16.0, 12.0, 16.0, 14.0, 23.0, 30.0, 24.0, 29.0, 23.0, 42.0, 29.0, 40.0, 42.0, 39.0, 43.0, 43.0, 59.0, 45.0, 49.0, 47.0, 40.0, 35.0, 35.0, 31.0, 35.0, 29.0, 18.0, 24.0, 15.0, 13.0, 10.0, 8.0, 7.0, 6.0, 1.0, 8.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.546875, -28.567626953125, -27.58837890625, -26.609130859375, -25.6298828125, -24.650634765625, -23.67138671875, -22.692138671875, -21.712890625, -20.733642578125, -19.75439453125, -18.775146484375, -17.7958984375, -16.816650390625, -15.83740234375, -14.858154296875, -13.87890625, -12.899658203125, -11.92041015625, -10.941162109375, -9.9619140625, -8.982666015625, -8.00341796875, -7.024169921875, -6.044921875, -5.065673828125, -4.08642578125, -3.107177734375, -2.1279296875, -1.148681640625, -0.16943359375, 0.809814453125, 1.7890625, 2.768310546875, 3.74755859375, 4.726806640625, 5.7060546875, 6.685302734375, 7.66455078125, 8.643798828125, 9.623046875, 10.602294921875, 11.58154296875, 12.560791015625, 13.5400390625, 14.519287109375, 15.49853515625, 16.477783203125, 17.45703125, 18.436279296875, 19.41552734375, 20.394775390625, 21.3740234375, 22.353271484375, 23.33251953125, 24.311767578125, 25.291015625, 26.270263671875, 27.24951171875, 28.228759765625, 29.2080078125, 30.187255859375, 31.16650390625, 32.145751953125, 33.125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 7.0, 8.0, 12.0, 21.0, 35.0, 47.0, 73.0, 90.0, 136.0, 186.0, 310.0, 446.0, 650.0, 1053.0, 1600.0, 2299.0, 3562.0, 5496.0, 8508.0, 12833.0, 19346.0, 28522.0, 40919.0, 55647.0, 73776.0, 90783.0, 103894.0, 110428.0, 107053.0, 96284.0, 80001.0, 62000.0, 45588.0, 32265.0, 21956.0, 14725.0, 9582.0, 6335.0, 4225.0, 2651.0, 1731.0, 1132.0, 750.0, 561.0, 343.0, 233.0, 152.0, 104.0, 68.0, 55.0, 29.0, 20.0, 12.0, 10.0, 7.0, 5.0, 4.0, 0.0, 2.0], "bins": [-25.609375, -24.825439453125, -24.04150390625, -23.257568359375, -22.4736328125, -21.689697265625, -20.90576171875, -20.121826171875, -19.337890625, -18.553955078125, -17.77001953125, -16.986083984375, -16.2021484375, -15.418212890625, -14.63427734375, -13.850341796875, -13.06640625, -12.282470703125, -11.49853515625, -10.714599609375, -9.9306640625, -9.146728515625, -8.36279296875, -7.578857421875, -6.794921875, -6.010986328125, -5.22705078125, -4.443115234375, -3.6591796875, -2.875244140625, -2.09130859375, -1.307373046875, -0.5234375, 0.260498046875, 1.04443359375, 1.828369140625, 2.6123046875, 3.396240234375, 4.18017578125, 4.964111328125, 5.748046875, 6.531982421875, 7.31591796875, 8.099853515625, 8.8837890625, 9.667724609375, 10.45166015625, 11.235595703125, 12.01953125, 12.803466796875, 13.58740234375, 14.371337890625, 15.1552734375, 15.939208984375, 16.72314453125, 17.507080078125, 18.291015625, 19.074951171875, 19.85888671875, 20.642822265625, 21.4267578125, 22.210693359375, 22.99462890625, 23.778564453125, 24.5625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 8.0, 5.0, 9.0, 4.0, 9.0, 10.0, 20.0, 18.0, 17.0, 18.0, 22.0, 23.0, 28.0, 26.0, 24.0, 31.0, 46.0, 23.0, 41.0, 25.0, 28.0, 37.0, 28.0, 40.0, 42.0, 48.0, 23.0, 30.0, 34.0, 32.0, 16.0, 25.0, 35.0, 29.0, 21.0, 19.0, 13.0, 15.0, 17.0, 11.0, 3.0, 13.0, 4.0, 4.0, 6.0, 3.0, 4.0, 4.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-17.421875, -16.87841796875, -16.3349609375, -15.79150390625, -15.248046875, -14.70458984375, -14.1611328125, -13.61767578125, -13.07421875, -12.53076171875, -11.9873046875, -11.44384765625, -10.900390625, -10.35693359375, -9.8134765625, -9.27001953125, -8.7265625, -8.18310546875, -7.6396484375, -7.09619140625, -6.552734375, -6.00927734375, -5.4658203125, -4.92236328125, -4.37890625, -3.83544921875, -3.2919921875, -2.74853515625, -2.205078125, -1.66162109375, -1.1181640625, -0.57470703125, -0.03125, 0.51220703125, 1.0556640625, 1.59912109375, 2.142578125, 2.68603515625, 3.2294921875, 3.77294921875, 4.31640625, 4.85986328125, 5.4033203125, 5.94677734375, 6.490234375, 7.03369140625, 7.5771484375, 8.12060546875, 8.6640625, 9.20751953125, 9.7509765625, 10.29443359375, 10.837890625, 11.38134765625, 11.9248046875, 12.46826171875, 13.01171875, 13.55517578125, 14.0986328125, 14.64208984375, 15.185546875, 15.72900390625, 16.2724609375, 16.81591796875, 17.359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 12.0, 6.0, 9.0, 15.0, 35.0, 38.0, 74.0, 85.0, 145.0, 280.0, 427.0, 647.0, 1022.0, 1808.0, 3053.0, 5005.0, 8555.0, 14324.0, 24290.0, 39172.0, 61055.0, 88820.0, 118469.0, 139126.0, 141581.0, 124997.0, 96453.0, 67609.0, 43364.0, 27210.0, 16703.0, 9772.0, 5934.0, 3359.0, 1992.0, 1176.0, 728.0, 432.0, 286.0, 195.0, 120.0, 66.0, 34.0, 28.0, 22.0, 9.0, 9.0, 8.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.8828125, -8.62249755859375, -8.3621826171875, -8.10186767578125, -7.841552734375, -7.58123779296875, -7.3209228515625, -7.06060791015625, -6.80029296875, -6.53997802734375, -6.2796630859375, -6.01934814453125, -5.759033203125, -5.49871826171875, -5.2384033203125, -4.97808837890625, -4.7177734375, -4.45745849609375, -4.1971435546875, -3.93682861328125, -3.676513671875, -3.41619873046875, -3.1558837890625, -2.89556884765625, -2.63525390625, -2.37493896484375, -2.1146240234375, -1.85430908203125, -1.593994140625, -1.33367919921875, -1.0733642578125, -0.81304931640625, -0.552734375, -0.29241943359375, -0.0321044921875, 0.22821044921875, 0.488525390625, 0.74884033203125, 1.0091552734375, 1.26947021484375, 1.52978515625, 1.79010009765625, 2.0504150390625, 2.31072998046875, 2.571044921875, 2.83135986328125, 3.0916748046875, 3.35198974609375, 3.6123046875, 3.87261962890625, 4.1329345703125, 4.39324951171875, 4.653564453125, 4.91387939453125, 5.1741943359375, 5.43450927734375, 5.69482421875, 5.95513916015625, 6.2154541015625, 6.47576904296875, 6.736083984375, 6.99639892578125, 7.2567138671875, 7.51702880859375, 7.77734375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 8.0, 5.0, 14.0, 14.0, 15.0, 20.0, 22.0, 26.0, 33.0, 48.0, 43.0, 55.0, 69.0, 64.0, 69.0, 51.0, 60.0, 51.0, 39.0, 44.0, 36.0, 45.0, 28.0, 21.0, 18.0, 29.0, 19.0, 15.0, 9.0, 6.0, 5.0, 5.0, 4.0, 1.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012407302856445312, -0.001207977533340454, -0.001175224781036377, -0.0011424720287322998, -0.0011097192764282227, -0.0010769665241241455, -0.0010442137718200684, -0.0010114610195159912, -0.000978708267211914, -0.0009459555149078369, -0.0009132027626037598, -0.0008804500102996826, -0.0008476972579956055, -0.0008149445056915283, -0.0007821917533874512, -0.000749439001083374, -0.0007166862487792969, -0.0006839334964752197, -0.0006511807441711426, -0.0006184279918670654, -0.0005856752395629883, -0.0005529224872589111, -0.000520169734954834, -0.00048741698265075684, -0.0004546642303466797, -0.00042191147804260254, -0.0003891587257385254, -0.00035640597343444824, -0.0003236532211303711, -0.00029090046882629395, -0.0002581477165222168, -0.00022539496421813965, -0.0001926422119140625, -0.00015988945960998535, -0.0001271367073059082, -9.438395500183105e-05, -6.16312026977539e-05, -2.8878450393676758e-05, 3.874301910400391e-06, 3.662705421447754e-05, 6.937980651855469e-05, 0.00010213255882263184, 0.00013488531112670898, 0.00016763806343078613, 0.00020039081573486328, 0.00023314356803894043, 0.0002658963203430176, 0.0002986490726470947, 0.0003314018249511719, 0.000364154577255249, 0.00039690732955932617, 0.0004296600818634033, 0.00046241283416748047, 0.0004951655864715576, 0.0005279183387756348, 0.0005606710910797119, 0.0005934238433837891, 0.0006261765956878662, 0.0006589293479919434, 0.0006916821002960205, 0.0007244348526000977, 0.0007571876049041748, 0.000789940357208252, 0.0008226931095123291, 0.0008554458618164062]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 6.0, 6.0, 11.0, 16.0, 21.0, 43.0, 67.0, 117.0, 127.0, 279.0, 354.0, 603.0, 853.0, 1323.0, 2038.0, 3075.0, 4847.0, 7316.0, 11497.0, 17062.0, 25524.0, 37508.0, 53119.0, 70952.0, 89490.0, 105351.0, 113172.0, 110526.0, 100477.0, 83511.0, 64384.0, 46852.0, 32910.0, 22472.0, 14755.0, 9708.0, 6445.0, 4146.0, 2709.0, 1704.0, 1050.0, 764.0, 483.0, 301.0, 197.0, 153.0, 84.0, 53.0, 33.0, 25.0, 17.0, 8.0, 3.0, 11.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.4921875, -6.28155517578125, -6.0709228515625, -5.86029052734375, -5.649658203125, -5.43902587890625, -5.2283935546875, -5.01776123046875, -4.80712890625, -4.59649658203125, -4.3858642578125, -4.17523193359375, -3.964599609375, -3.75396728515625, -3.5433349609375, -3.33270263671875, -3.1220703125, -2.91143798828125, -2.7008056640625, -2.49017333984375, -2.279541015625, -2.06890869140625, -1.8582763671875, -1.64764404296875, -1.43701171875, -1.22637939453125, -1.0157470703125, -0.80511474609375, -0.594482421875, -0.38385009765625, -0.1732177734375, 0.03741455078125, 0.248046875, 0.45867919921875, 0.6693115234375, 0.87994384765625, 1.090576171875, 1.30120849609375, 1.5118408203125, 1.72247314453125, 1.93310546875, 2.14373779296875, 2.3543701171875, 2.56500244140625, 2.775634765625, 2.98626708984375, 3.1968994140625, 3.40753173828125, 3.6181640625, 3.82879638671875, 4.0394287109375, 4.25006103515625, 4.460693359375, 4.67132568359375, 4.8819580078125, 5.09259033203125, 5.30322265625, 5.51385498046875, 5.7244873046875, 5.93511962890625, 6.145751953125, 6.35638427734375, 6.5670166015625, 6.77764892578125, 6.98828125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 2.0, 6.0, 7.0, 5.0, 15.0, 5.0, 10.0, 15.0, 17.0, 28.0, 27.0, 33.0, 34.0, 43.0, 41.0, 45.0, 43.0, 35.0, 52.0, 67.0, 49.0, 53.0, 51.0, 56.0, 41.0, 42.0, 35.0, 28.0, 27.0, 16.0, 10.0, 15.0, 9.0, 14.0, 8.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.162109375, -3.05987548828125, -2.9576416015625, -2.85540771484375, -2.753173828125, -2.65093994140625, -2.5487060546875, -2.44647216796875, -2.34423828125, -2.24200439453125, -2.1397705078125, -2.03753662109375, -1.935302734375, -1.83306884765625, -1.7308349609375, -1.62860107421875, -1.5263671875, -1.42413330078125, -1.3218994140625, -1.21966552734375, -1.117431640625, -1.01519775390625, -0.9129638671875, -0.81072998046875, -0.70849609375, -0.60626220703125, -0.5040283203125, -0.40179443359375, -0.299560546875, -0.19732666015625, -0.0950927734375, 0.00714111328125, 0.109375, 0.21160888671875, 0.3138427734375, 0.41607666015625, 0.518310546875, 0.62054443359375, 0.7227783203125, 0.82501220703125, 0.92724609375, 1.02947998046875, 1.1317138671875, 1.23394775390625, 1.336181640625, 1.43841552734375, 1.5406494140625, 1.64288330078125, 1.7451171875, 1.84735107421875, 1.9495849609375, 2.05181884765625, 2.154052734375, 2.25628662109375, 2.3585205078125, 2.46075439453125, 2.56298828125, 2.66522216796875, 2.7674560546875, 2.86968994140625, 2.971923828125, 3.07415771484375, 3.1763916015625, 3.27862548828125, 3.380859375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 7.0, 1.0, 3.0, 7.0, 8.0, 7.0, 14.0, 17.0, 13.0, 17.0, 26.0, 20.0, 17.0, 39.0, 53.0, 35.0, 29.0, 48.0, 39.0, 38.0, 34.0, 48.0, 41.0, 51.0, 52.0, 38.0, 31.0, 28.0, 32.0, 25.0, 28.0, 25.0, 27.0, 17.0, 17.0, 14.0, 11.0, 8.0, 7.0, 11.0, 10.0, 3.0, 3.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.159210205078125, -29.23592185974121, -28.312631607055664, -27.38934326171875, -26.466054916381836, -25.542766571044922, -24.619476318359375, -23.69618797302246, -22.772899627685547, -21.849611282348633, -20.926321029663086, -20.003032684326172, -19.079744338989258, -18.156455993652344, -17.233165740966797, -16.309877395629883, -15.386587142944336, -14.463297843933105, -13.540009498596191, -12.616720199584961, -11.693431854248047, -10.770142555236816, -9.846853256225586, -8.923564910888672, -8.000275611877441, -7.076986789703369, -6.153697967529297, -5.230408668518066, -4.307119846343994, -3.383831024169922, -2.4605417251586914, -1.5372529029846191, -0.6139621734619141, 0.30932676792144775, 1.2326157093048096, 2.155904769897461, 3.079193592071533, 4.0024824142456055, 4.925771713256836, 5.849060535430908, 6.7723493576049805, 7.695638179779053, 8.618927001953125, 9.542216300964355, 10.465505599975586, 11.3887939453125, 12.31208324432373, 13.235372543334961, 14.158660888671875, 15.081950187683105, 16.005239486694336, 16.92852783203125, 17.851816177368164, 18.775104522705078, 19.698394775390625, 20.62168312072754, 21.544971466064453, 22.468259811401367, 23.391550064086914, 24.314838409423828, 25.238126754760742, 26.161415100097656, 27.084705352783203, 28.007993698120117, 28.931283950805664]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 5.0, 8.0, 15.0, 12.0, 19.0, 22.0, 22.0, 20.0, 29.0, 43.0, 29.0, 56.0, 36.0, 54.0, 41.0, 51.0, 60.0, 37.0, 52.0, 43.0, 40.0, 40.0, 39.0, 42.0, 37.0, 32.0, 17.0, 21.0, 12.0, 16.0, 8.0, 10.0, 11.0, 9.0, 3.0, 7.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.4459342956543, -32.32765197753906, -31.209365844726562, -30.091083526611328, -28.97279930114746, -27.854515075683594, -26.736230850219727, -25.61794662475586, -24.499664306640625, -23.381380081176758, -22.26309585571289, -21.144813537597656, -20.02652931213379, -18.908245086669922, -17.789960861206055, -16.671676635742188, -15.55339241027832, -14.435108184814453, -13.316824913024902, -12.198540687561035, -11.080257415771484, -9.961973190307617, -8.84368896484375, -7.725405216217041, -6.607121467590332, -5.488837718963623, -4.370553970336914, -3.252269744873047, -2.133985996246338, -1.015702247619629, 0.10258197784423828, 1.2208657264709473, 2.3391494750976562, 3.4574332237243652, 4.575716972351074, 5.694001197814941, 6.81228494644165, 7.930568695068359, 9.048852920532227, 10.167137145996094, 11.285420417785645, 12.403704643249512, 13.521987915039062, 14.64027214050293, 15.758556365966797, 16.87683868408203, 17.99512481689453, 19.113407135009766, 20.231691360473633, 21.3499755859375, 22.468259811401367, 23.586544036865234, 24.70482635498047, 25.823110580444336, 26.941394805908203, 28.05967903137207, 29.177963256835938, 30.296247482299805, 31.414531707763672, 32.532814025878906, 33.651100158691406, 34.76938247680664, 35.887664794921875, 37.005950927734375, 38.12423324584961]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 13.0, 21.0, 40.0, 44.0, 70.0, 119.0, 185.0, 297.0, 454.0, 712.0, 1155.0, 1933.0, 2891.0, 4681.0, 7386.0, 12225.0, 18959.0, 29887.0, 46752.0, 73340.0, 112611.0, 170066.0, 247752.0, 345250.0, 440354.0, 508453.0, 517783.0, 462795.0, 371197.0, 271495.0, 188599.0, 127389.0, 82890.0, 53694.0, 33891.0, 21667.0, 13564.0, 8647.0, 5559.0, 3388.0, 2246.0, 1372.0, 861.0, 572.0, 351.0, 233.0, 147.0, 114.0, 76.0, 31.0, 30.0, 16.0, 13.0, 11.0, 2.0, 2.0, 3.0, 1.0], "bins": [-26.890625, -26.053955078125, -25.21728515625, -24.380615234375, -23.5439453125, -22.707275390625, -21.87060546875, -21.033935546875, -20.197265625, -19.360595703125, -18.52392578125, -17.687255859375, -16.8505859375, -16.013916015625, -15.17724609375, -14.340576171875, -13.50390625, -12.667236328125, -11.83056640625, -10.993896484375, -10.1572265625, -9.320556640625, -8.48388671875, -7.647216796875, -6.810546875, -5.973876953125, -5.13720703125, -4.300537109375, -3.4638671875, -2.627197265625, -1.79052734375, -0.953857421875, -0.1171875, 0.719482421875, 1.55615234375, 2.392822265625, 3.2294921875, 4.066162109375, 4.90283203125, 5.739501953125, 6.576171875, 7.412841796875, 8.24951171875, 9.086181640625, 9.9228515625, 10.759521484375, 11.59619140625, 12.432861328125, 13.26953125, 14.106201171875, 14.94287109375, 15.779541015625, 16.6162109375, 17.452880859375, 18.28955078125, 19.126220703125, 19.962890625, 20.799560546875, 21.63623046875, 22.472900390625, 23.3095703125, 24.146240234375, 24.98291015625, 25.819580078125, 26.65625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 6.0, 2.0, 10.0, 12.0, 14.0, 18.0, 17.0, 27.0, 22.0, 29.0, 35.0, 38.0, 48.0, 43.0, 47.0, 52.0, 53.0, 53.0, 49.0, 44.0, 47.0, 38.0, 39.0, 37.0, 42.0, 33.0, 34.0, 21.0, 17.0, 13.0, 16.0, 10.0, 11.0, 6.0, 10.0, 3.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.390625, -27.436767578125, -26.48291015625, -25.529052734375, -24.5751953125, -23.621337890625, -22.66748046875, -21.713623046875, -20.759765625, -19.805908203125, -18.85205078125, -17.898193359375, -16.9443359375, -15.990478515625, -15.03662109375, -14.082763671875, -13.12890625, -12.175048828125, -11.22119140625, -10.267333984375, -9.3134765625, -8.359619140625, -7.40576171875, -6.451904296875, -5.498046875, -4.544189453125, -3.59033203125, -2.636474609375, -1.6826171875, -0.728759765625, 0.22509765625, 1.178955078125, 2.1328125, 3.086669921875, 4.04052734375, 4.994384765625, 5.9482421875, 6.902099609375, 7.85595703125, 8.809814453125, 9.763671875, 10.717529296875, 11.67138671875, 12.625244140625, 13.5791015625, 14.532958984375, 15.48681640625, 16.440673828125, 17.39453125, 18.348388671875, 19.30224609375, 20.256103515625, 21.2099609375, 22.163818359375, 23.11767578125, 24.071533203125, 25.025390625, 25.979248046875, 26.93310546875, 27.886962890625, 28.8408203125, 29.794677734375, 30.74853515625, 31.702392578125, 32.65625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 12.0, 10.0, 20.0, 37.0, 58.0, 94.0, 155.0, 274.0, 437.0, 782.0, 1332.0, 2179.0, 3905.0, 6546.0, 11407.0, 19437.0, 32906.0, 54772.0, 89017.0, 140960.0, 214750.0, 308743.0, 411134.0, 497266.0, 533758.0, 506366.0, 422580.0, 321667.0, 225451.0, 149868.0, 94673.0, 58678.0, 35147.0, 20663.0, 12203.0, 7148.0, 4145.0, 2358.0, 1384.0, 827.0, 466.0, 274.0, 163.0, 96.0, 53.0, 25.0, 30.0, 13.0, 10.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-28.5, -27.65087890625, -26.8017578125, -25.95263671875, -25.103515625, -24.25439453125, -23.4052734375, -22.55615234375, -21.70703125, -20.85791015625, -20.0087890625, -19.15966796875, -18.310546875, -17.46142578125, -16.6123046875, -15.76318359375, -14.9140625, -14.06494140625, -13.2158203125, -12.36669921875, -11.517578125, -10.66845703125, -9.8193359375, -8.97021484375, -8.12109375, -7.27197265625, -6.4228515625, -5.57373046875, -4.724609375, -3.87548828125, -3.0263671875, -2.17724609375, -1.328125, -0.47900390625, 0.3701171875, 1.21923828125, 2.068359375, 2.91748046875, 3.7666015625, 4.61572265625, 5.46484375, 6.31396484375, 7.1630859375, 8.01220703125, 8.861328125, 9.71044921875, 10.5595703125, 11.40869140625, 12.2578125, 13.10693359375, 13.9560546875, 14.80517578125, 15.654296875, 16.50341796875, 17.3525390625, 18.20166015625, 19.05078125, 19.89990234375, 20.7490234375, 21.59814453125, 22.447265625, 23.29638671875, 24.1455078125, 24.99462890625, 25.84375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 4.0, 11.0, 18.0, 17.0, 17.0, 26.0, 36.0, 51.0, 65.0, 65.0, 90.0, 117.0, 153.0, 152.0, 164.0, 171.0, 186.0, 213.0, 229.0, 242.0, 244.0, 234.0, 207.0, 204.0, 171.0, 143.0, 156.0, 127.0, 121.0, 98.0, 74.0, 50.0, 39.0, 44.0, 31.0, 26.0, 21.0, 20.0, 12.0, 8.0, 6.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.390625, -12.96875, -12.546875, -12.125, -11.703125, -11.28125, -10.859375, -10.4375, -10.015625, -9.59375, -9.171875, -8.75, -8.328125, -7.90625, -7.484375, -7.0625, -6.640625, -6.21875, -5.796875, -5.375, -4.953125, -4.53125, -4.109375, -3.6875, -3.265625, -2.84375, -2.421875, -2.0, -1.578125, -1.15625, -0.734375, -0.3125, 0.109375, 0.53125, 0.953125, 1.375, 1.796875, 2.21875, 2.640625, 3.0625, 3.484375, 3.90625, 4.328125, 4.75, 5.171875, 5.59375, 6.015625, 6.4375, 6.859375, 7.28125, 7.703125, 8.125, 8.546875, 8.96875, 9.390625, 9.8125, 10.234375, 10.65625, 11.078125, 11.5, 11.921875, 12.34375, 12.765625, 13.1875, 13.609375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 7.0, 13.0, 6.0, 4.0, 9.0, 17.0, 17.0, 22.0, 18.0, 24.0, 33.0, 21.0, 41.0, 29.0, 37.0, 32.0, 54.0, 29.0, 35.0, 47.0, 51.0, 48.0, 36.0, 28.0, 26.0, 37.0, 36.0, 31.0, 32.0, 25.0, 18.0, 17.0, 20.0, 13.0, 13.0, 12.0, 17.0, 2.0, 6.0, 7.0, 8.0, 6.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-27.767608642578125, -26.920015335083008, -26.07242202758789, -25.224830627441406, -24.37723731994629, -23.529644012451172, -22.682050704956055, -21.834457397460938, -20.986865997314453, -20.139272689819336, -19.29167938232422, -18.444087982177734, -17.596494674682617, -16.7489013671875, -15.901308059692383, -15.053715705871582, -14.206122398376465, -13.358529090881348, -12.510936737060547, -11.66334342956543, -10.815751075744629, -9.968157768249512, -9.120565414428711, -8.272972106933594, -7.425379276275635, -6.577786445617676, -5.730193614959717, -4.882600784301758, -4.035007476806641, -3.1874146461486816, -2.3398218154907227, -1.4922289848327637, -0.6446361541748047, 0.20295673608779907, 1.0505496263504028, 1.8981425762176514, 2.7457354068756104, 3.5933284759521484, 4.440921306610107, 5.288514137268066, 6.136106967926025, 6.983699798583984, 7.831292629241943, 8.678885459899902, 9.52647876739502, 10.37407112121582, 11.221664428710938, 12.069257736206055, 12.916850090026855, 13.764443397521973, 14.612035751342773, 15.45962905883789, 16.307222366333008, 17.154815673828125, 18.00240707397461, 18.850000381469727, 19.697593688964844, 20.54518699645996, 21.392780303955078, 22.240371704101562, 23.08796501159668, 23.935558319091797, 24.783151626586914, 25.63074493408203, 26.478336334228516]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 1.0, 4.0, 6.0, 8.0, 9.0, 10.0, 10.0, 19.0, 14.0, 13.0, 30.0, 23.0, 27.0, 32.0, 40.0, 44.0, 33.0, 38.0, 47.0, 43.0, 50.0, 37.0, 42.0, 42.0, 36.0, 43.0, 43.0, 31.0, 26.0, 35.0, 29.0, 21.0, 22.0, 26.0, 10.0, 13.0, 8.0, 11.0, 3.0, 7.0, 6.0, 1.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.27320671081543, -28.30241584777832, -27.33162498474121, -26.3608341217041, -25.390043258666992, -24.419252395629883, -23.448461532592773, -22.477670669555664, -21.506879806518555, -20.536088943481445, -19.565298080444336, -18.594507217407227, -17.623716354370117, -16.652925491333008, -15.682134628295898, -14.711343765258789, -13.74055290222168, -12.76976203918457, -11.798971176147461, -10.828180313110352, -9.857389450073242, -8.886598587036133, -7.915807723999023, -6.945016860961914, -5.974225997924805, -5.003435134887695, -4.032644271850586, -3.0618534088134766, -2.091062545776367, -1.1202716827392578, -0.14948081970214844, 0.8213100433349609, 1.7921028137207031, 2.7628936767578125, 3.733684539794922, 4.704475402832031, 5.675266265869141, 6.64605712890625, 7.616847991943359, 8.587638854980469, 9.558429718017578, 10.529220581054688, 11.500011444091797, 12.470802307128906, 13.441593170166016, 14.412384033203125, 15.383174896240234, 16.353965759277344, 17.324756622314453, 18.295547485351562, 19.266338348388672, 20.23712921142578, 21.20792007446289, 22.1787109375, 23.14950180053711, 24.12029266357422, 25.091083526611328, 26.061874389648438, 27.032665252685547, 28.003456115722656, 28.974246978759766, 29.945037841796875, 30.915828704833984, 31.886619567871094, 32.8574104309082]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 5.0, 11.0, 10.0, 13.0, 19.0, 38.0, 49.0, 77.0, 135.0, 181.0, 272.0, 415.0, 632.0, 992.0, 1588.0, 2411.0, 3747.0, 5593.0, 8448.0, 12401.0, 18197.0, 26233.0, 36433.0, 48948.0, 62993.0, 76365.0, 89038.0, 97186.0, 99138.0, 94673.0, 85237.0, 71749.0, 57663.0, 44059.0, 32208.0, 23108.0, 16168.0, 10987.0, 7291.0, 4726.0, 3162.0, 2077.0, 1347.0, 913.0, 577.0, 359.0, 241.0, 173.0, 113.0, 71.0, 41.0, 16.0, 14.0, 8.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-11.7109375, -11.3370361328125, -10.963134765625, -10.5892333984375, -10.21533203125, -9.8414306640625, -9.467529296875, -9.0936279296875, -8.7197265625, -8.3458251953125, -7.971923828125, -7.5980224609375, -7.22412109375, -6.8502197265625, -6.476318359375, -6.1024169921875, -5.728515625, -5.3546142578125, -4.980712890625, -4.6068115234375, -4.23291015625, -3.8590087890625, -3.485107421875, -3.1112060546875, -2.7373046875, -2.3634033203125, -1.989501953125, -1.6156005859375, -1.24169921875, -0.8677978515625, -0.493896484375, -0.1199951171875, 0.25390625, 0.6278076171875, 1.001708984375, 1.3756103515625, 1.74951171875, 2.1234130859375, 2.497314453125, 2.8712158203125, 3.2451171875, 3.6190185546875, 3.992919921875, 4.3668212890625, 4.74072265625, 5.1146240234375, 5.488525390625, 5.8624267578125, 6.236328125, 6.6102294921875, 6.984130859375, 7.3580322265625, 7.73193359375, 8.1058349609375, 8.479736328125, 8.8536376953125, 9.2275390625, 9.6014404296875, 9.975341796875, 10.3492431640625, 10.72314453125, 11.0970458984375, 11.470947265625, 11.8448486328125, 12.21875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 3.0, 7.0, 2.0, 9.0, 9.0, 10.0, 12.0, 15.0, 14.0, 17.0, 19.0, 26.0, 32.0, 36.0, 37.0, 38.0, 37.0, 40.0, 45.0, 42.0, 59.0, 41.0, 40.0, 31.0, 42.0, 41.0, 42.0, 37.0, 24.0, 37.0, 22.0, 25.0, 22.0, 20.0, 13.0, 11.0, 10.0, 8.0, 8.0, 6.0, 4.0, 2.0, 6.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.609375, -28.624267578125, -27.63916015625, -26.654052734375, -25.6689453125, -24.683837890625, -23.69873046875, -22.713623046875, -21.728515625, -20.743408203125, -19.75830078125, -18.773193359375, -17.7880859375, -16.802978515625, -15.81787109375, -14.832763671875, -13.84765625, -12.862548828125, -11.87744140625, -10.892333984375, -9.9072265625, -8.922119140625, -7.93701171875, -6.951904296875, -5.966796875, -4.981689453125, -3.99658203125, -3.011474609375, -2.0263671875, -1.041259765625, -0.05615234375, 0.928955078125, 1.9140625, 2.899169921875, 3.88427734375, 4.869384765625, 5.8544921875, 6.839599609375, 7.82470703125, 8.809814453125, 9.794921875, 10.780029296875, 11.76513671875, 12.750244140625, 13.7353515625, 14.720458984375, 15.70556640625, 16.690673828125, 17.67578125, 18.660888671875, 19.64599609375, 20.631103515625, 21.6162109375, 22.601318359375, 23.58642578125, 24.571533203125, 25.556640625, 26.541748046875, 27.52685546875, 28.511962890625, 29.4970703125, 30.482177734375, 31.46728515625, 32.452392578125, 33.4375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 2.0, 11.0, 17.0, 36.0, 34.0, 41.0, 63.0, 96.0, 142.0, 202.0, 287.0, 484.0, 678.0, 1022.0, 1555.0, 2320.0, 3403.0, 5215.0, 7754.0, 11475.0, 17832.0, 28782.0, 222954.0, 647239.0, 36159.0, 20589.0, 13375.0, 8776.0, 5989.0, 3947.0, 2708.0, 1785.0, 1205.0, 778.0, 484.0, 341.0, 251.0, 174.0, 124.0, 74.0, 46.0, 41.0, 27.0, 20.0, 13.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.703125, -23.856201171875, -23.00927734375, -22.162353515625, -21.3154296875, -20.468505859375, -19.62158203125, -18.774658203125, -17.927734375, -17.080810546875, -16.23388671875, -15.386962890625, -14.5400390625, -13.693115234375, -12.84619140625, -11.999267578125, -11.15234375, -10.305419921875, -9.45849609375, -8.611572265625, -7.7646484375, -6.917724609375, -6.07080078125, -5.223876953125, -4.376953125, -3.530029296875, -2.68310546875, -1.836181640625, -0.9892578125, -0.142333984375, 0.70458984375, 1.551513671875, 2.3984375, 3.245361328125, 4.09228515625, 4.939208984375, 5.7861328125, 6.633056640625, 7.47998046875, 8.326904296875, 9.173828125, 10.020751953125, 10.86767578125, 11.714599609375, 12.5615234375, 13.408447265625, 14.25537109375, 15.102294921875, 15.94921875, 16.796142578125, 17.64306640625, 18.489990234375, 19.3369140625, 20.183837890625, 21.03076171875, 21.877685546875, 22.724609375, 23.571533203125, 24.41845703125, 25.265380859375, 26.1123046875, 26.959228515625, 27.80615234375, 28.653076171875, 29.5]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 10.0, 6.0, 12.0, 10.0, 16.0, 13.0, 19.0, 28.0, 21.0, 19.0, 29.0, 24.0, 46.0, 42.0, 41.0, 39.0, 30.0, 44.0, 33.0, 48.0, 39.0, 43.0, 40.0, 42.0, 40.0, 29.0, 26.0, 28.0, 25.0, 25.0, 26.0, 14.0, 14.0, 13.0, 10.0, 8.0, 10.0, 6.0, 7.0, 6.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.265625, -19.58837890625, -18.9111328125, -18.23388671875, -17.556640625, -16.87939453125, -16.2021484375, -15.52490234375, -14.84765625, -14.17041015625, -13.4931640625, -12.81591796875, -12.138671875, -11.46142578125, -10.7841796875, -10.10693359375, -9.4296875, -8.75244140625, -8.0751953125, -7.39794921875, -6.720703125, -6.04345703125, -5.3662109375, -4.68896484375, -4.01171875, -3.33447265625, -2.6572265625, -1.97998046875, -1.302734375, -0.62548828125, 0.0517578125, 0.72900390625, 1.40625, 2.08349609375, 2.7607421875, 3.43798828125, 4.115234375, 4.79248046875, 5.4697265625, 6.14697265625, 6.82421875, 7.50146484375, 8.1787109375, 8.85595703125, 9.533203125, 10.21044921875, 10.8876953125, 11.56494140625, 12.2421875, 12.91943359375, 13.5966796875, 14.27392578125, 14.951171875, 15.62841796875, 16.3056640625, 16.98291015625, 17.66015625, 18.33740234375, 19.0146484375, 19.69189453125, 20.369140625, 21.04638671875, 21.7236328125, 22.40087890625, 23.078125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 5.0, 7.0, 11.0, 15.0, 23.0, 39.0, 57.0, 74.0, 98.0, 183.0, 246.0, 313.0, 468.0, 691.0, 990.0, 1502.0, 2331.0, 3406.0, 4989.0, 7671.0, 12044.0, 19632.0, 39954.0, 533336.0, 335929.0, 33845.0, 17852.0, 11138.0, 7319.0, 4715.0, 3057.0, 2152.0, 1420.0, 957.0, 647.0, 421.0, 325.0, 228.0, 127.0, 104.0, 78.0, 52.0, 39.0, 20.0, 15.0, 12.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.298828125, -2.231048583984375, -2.16326904296875, -2.095489501953125, -2.0277099609375, -1.959930419921875, -1.89215087890625, -1.824371337890625, -1.756591796875, -1.688812255859375, -1.62103271484375, -1.553253173828125, -1.4854736328125, -1.417694091796875, -1.34991455078125, -1.282135009765625, -1.21435546875, -1.146575927734375, -1.07879638671875, -1.011016845703125, -0.9432373046875, -0.875457763671875, -0.80767822265625, -0.739898681640625, -0.672119140625, -0.604339599609375, -0.53656005859375, -0.468780517578125, -0.4010009765625, -0.333221435546875, -0.26544189453125, -0.197662353515625, -0.1298828125, -0.062103271484375, 0.00567626953125, 0.073455810546875, 0.1412353515625, 0.209014892578125, 0.27679443359375, 0.344573974609375, 0.412353515625, 0.480133056640625, 0.54791259765625, 0.615692138671875, 0.6834716796875, 0.751251220703125, 0.81903076171875, 0.886810302734375, 0.95458984375, 1.022369384765625, 1.09014892578125, 1.157928466796875, 1.2257080078125, 1.293487548828125, 1.36126708984375, 1.429046630859375, 1.496826171875, 1.564605712890625, 1.63238525390625, 1.700164794921875, 1.7679443359375, 1.835723876953125, 1.90350341796875, 1.971282958984375, 2.0390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 8.0, 8.0, 7.0, 10.0, 14.0, 22.0, 18.0, 32.0, 46.0, 36.0, 52.0, 67.0, 53.0, 74.0, 68.0, 61.0, 65.0, 57.0, 56.0, 62.0, 34.0, 38.0, 25.0, 23.0, 21.0, 12.0, 7.0, 2.0, 3.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007786750793457031, -0.0007539913058280945, -0.0007293075323104858, -0.0007046237587928772, -0.0006799399852752686, -0.0006552562117576599, -0.0006305724382400513, -0.0006058886647224426, -0.000581204891204834, -0.0005565211176872253, -0.0005318373441696167, -0.0005071535706520081, -0.0004824697971343994, -0.00045778602361679077, -0.00043310225009918213, -0.0004084184765815735, -0.00038373470306396484, -0.0003590509295463562, -0.00033436715602874756, -0.0003096833825111389, -0.0002849996089935303, -0.00026031583547592163, -0.000235632061958313, -0.00021094828844070435, -0.0001862645149230957, -0.00016158074140548706, -0.00013689696788787842, -0.00011221319437026978, -8.752942085266113e-05, -6.284564733505249e-05, -3.816187381744385e-05, -1.3478100299835205e-05, 1.1205673217773438e-05, 3.588944673538208e-05, 6.057322025299072e-05, 8.525699377059937e-05, 0.00010994076728820801, 0.00013462454080581665, 0.0001593083143234253, 0.00018399208784103394, 0.00020867586135864258, 0.00023335963487625122, 0.00025804340839385986, 0.0002827271819114685, 0.00030741095542907715, 0.0003320947289466858, 0.00035677850246429443, 0.0003814622759819031, 0.0004061460494995117, 0.00043082982301712036, 0.000455513596534729, 0.00048019737005233765, 0.0005048811435699463, 0.0005295649170875549, 0.0005542486906051636, 0.0005789324641227722, 0.0006036162376403809, 0.0006283000111579895, 0.0006529837846755981, 0.0006776675581932068, 0.0007023513317108154, 0.0007270351052284241, 0.0007517188787460327, 0.0007764026522636414, 0.00080108642578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 10.0, 12.0, 25.0, 40.0, 50.0, 63.0, 127.0, 176.0, 288.0, 454.0, 690.0, 1063.0, 1716.0, 2656.0, 4320.0, 6824.0, 10951.0, 18351.0, 30795.0, 51046.0, 82249.0, 119914.0, 152483.0, 159828.0, 138109.0, 100530.0, 65255.0, 39623.0, 23569.0, 14038.0, 8737.0, 5337.0, 3340.0, 2122.0, 1293.0, 894.0, 591.0, 333.0, 213.0, 137.0, 118.0, 54.0, 50.0, 22.0, 22.0, 11.0, 6.0, 2.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.09375, -1.058746337890625, -1.02374267578125, -0.988739013671875, -0.9537353515625, -0.918731689453125, -0.88372802734375, -0.848724365234375, -0.813720703125, -0.778717041015625, -0.74371337890625, -0.708709716796875, -0.6737060546875, -0.638702392578125, -0.60369873046875, -0.568695068359375, -0.53369140625, -0.498687744140625, -0.46368408203125, -0.428680419921875, -0.3936767578125, -0.358673095703125, -0.32366943359375, -0.288665771484375, -0.253662109375, -0.218658447265625, -0.18365478515625, -0.148651123046875, -0.1136474609375, -0.078643798828125, -0.04364013671875, -0.008636474609375, 0.0263671875, 0.061370849609375, 0.09637451171875, 0.131378173828125, 0.1663818359375, 0.201385498046875, 0.23638916015625, 0.271392822265625, 0.306396484375, 0.341400146484375, 0.37640380859375, 0.411407470703125, 0.4464111328125, 0.481414794921875, 0.51641845703125, 0.551422119140625, 0.58642578125, 0.621429443359375, 0.65643310546875, 0.691436767578125, 0.7264404296875, 0.761444091796875, 0.79644775390625, 0.831451416015625, 0.866455078125, 0.901458740234375, 0.93646240234375, 0.971466064453125, 1.0064697265625, 1.041473388671875, 1.07647705078125, 1.111480712890625, 1.146484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 5.0, 4.0, 11.0, 12.0, 12.0, 11.0, 19.0, 20.0, 19.0, 37.0, 50.0, 42.0, 60.0, 57.0, 79.0, 82.0, 66.0, 76.0, 67.0, 41.0, 42.0, 36.0, 43.0, 28.0, 17.0, 13.0, 10.0, 11.0, 6.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.54736328125, -0.5319862365722656, -0.5166091918945312, -0.5012321472167969, -0.4858551025390625, -0.4704780578613281, -0.45510101318359375, -0.4397239685058594, -0.424346923828125, -0.4089698791503906, -0.39359283447265625, -0.3782157897949219, -0.3628387451171875, -0.3474617004394531, -0.33208465576171875, -0.3167076110839844, -0.30133056640625, -0.2859535217285156, -0.27057647705078125, -0.2551994323730469, -0.2398223876953125, -0.22444534301757812, -0.20906829833984375, -0.19369125366210938, -0.178314208984375, -0.16293716430664062, -0.14756011962890625, -0.13218307495117188, -0.1168060302734375, -0.10142898559570312, -0.08605194091796875, -0.07067489624023438, -0.0552978515625, -0.039920806884765625, -0.02454376220703125, -0.009166717529296875, 0.0062103271484375, 0.021587371826171875, 0.03696441650390625, 0.052341461181640625, 0.067718505859375, 0.08309555053710938, 0.09847259521484375, 0.11384963989257812, 0.1292266845703125, 0.14460372924804688, 0.15998077392578125, 0.17535781860351562, 0.19073486328125, 0.20611190795898438, 0.22148895263671875, 0.23686599731445312, 0.2522430419921875, 0.2676200866699219, 0.28299713134765625, 0.2983741760253906, 0.313751220703125, 0.3291282653808594, 0.34450531005859375, 0.3598823547363281, 0.3752593994140625, 0.3906364440917969, 0.40601348876953125, 0.4213905334472656, 0.436767578125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 8.0, 4.0, 2.0, 7.0, 9.0, 17.0, 12.0, 14.0, 22.0, 20.0, 30.0, 24.0, 26.0, 37.0, 37.0, 34.0, 32.0, 36.0, 38.0, 49.0, 41.0, 41.0, 43.0, 44.0, 39.0, 37.0, 35.0, 28.0, 39.0, 29.0, 27.0, 24.0, 22.0, 12.0, 14.0, 13.0, 9.0, 6.0, 9.0, 5.0, 5.0, 10.0, 4.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-28.42294692993164, -27.53778076171875, -26.65261459350586, -25.76744842529297, -24.882282257080078, -23.997116088867188, -23.111949920654297, -22.226783752441406, -21.341617584228516, -20.456451416015625, -19.571285247802734, -18.686119079589844, -17.800952911376953, -16.915786743164062, -16.030620574951172, -15.145454406738281, -14.26028823852539, -13.3751220703125, -12.48995590209961, -11.604789733886719, -10.719623565673828, -9.834457397460938, -8.949291229248047, -8.064125061035156, -7.178958892822266, -6.293792724609375, -5.408626556396484, -4.523460388183594, -3.638294219970703, -2.7531280517578125, -1.8679618835449219, -0.9827957153320312, -0.09762954711914062, 0.78753662109375, 1.6727027893066406, 2.5578689575195312, 3.443035125732422, 4.3282012939453125, 5.213367462158203, 6.098533630371094, 6.983699798583984, 7.868865966796875, 8.754032135009766, 9.639198303222656, 10.524364471435547, 11.409530639648438, 12.294696807861328, 13.179862976074219, 14.06502914428711, 14.9501953125, 15.83536148071289, 16.72052764892578, 17.605693817138672, 18.490859985351562, 19.376026153564453, 20.261192321777344, 21.146358489990234, 22.031524658203125, 22.916690826416016, 23.801856994628906, 24.687023162841797, 25.572189331054688, 26.457355499267578, 27.34252166748047, 28.22768783569336]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 3.0, 7.0, 6.0, 8.0, 15.0, 9.0, 18.0, 11.0, 18.0, 25.0, 26.0, 28.0, 45.0, 37.0, 38.0, 34.0, 39.0, 41.0, 54.0, 47.0, 38.0, 40.0, 32.0, 44.0, 36.0, 45.0, 33.0, 34.0, 21.0, 29.0, 24.0, 19.0, 21.0, 16.0, 10.0, 8.0, 7.0, 9.0, 4.0, 6.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.991809844970703, -28.021595001220703, -27.05137825012207, -26.08116340637207, -25.11094856262207, -24.140731811523438, -23.170516967773438, -22.200302124023438, -21.230087280273438, -20.259872436523438, -19.289655685424805, -18.319440841674805, -17.349225997924805, -16.379009246826172, -15.408794403076172, -14.438579559326172, -13.468363761901855, -12.498147964477539, -11.527933120727539, -10.557717323303223, -9.587502479553223, -8.617286682128906, -7.647071361541748, -6.67685604095459, -5.706640720367432, -4.736425399780273, -3.7662100791931152, -2.795994520187378, -1.8257791996002197, -0.8555636405944824, 0.11465167999267578, 1.084867000579834, 2.055082321166992, 3.0252976417541504, 3.9955129623413086, 4.965728759765625, 5.935943603515625, 6.906159400939941, 7.8763747215271, 8.846590042114258, 9.816804885864258, 10.787020683288574, 11.757235527038574, 12.72745132446289, 13.69766616821289, 14.667881965637207, 15.638097763061523, 16.608312606811523, 17.578529357910156, 18.548744201660156, 19.51896095275879, 20.48917579650879, 21.45939064025879, 22.429607391357422, 23.399822235107422, 24.370037078857422, 25.340251922607422, 26.310466766357422, 27.280683517456055, 28.250898361206055, 29.221113204956055, 30.191329956054688, 31.161544799804688, 32.13175964355469, 33.10197448730469]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 2.0, 13.0, 14.0, 27.0, 47.0, 70.0, 82.0, 134.0, 194.0, 318.0, 505.0, 824.0, 1304.0, 2279.0, 3598.0, 6395.0, 10563.0, 17569.0, 28438.0, 43827.0, 65573.0, 89347.0, 113194.0, 129325.0, 130132.0, 116772.0, 93695.0, 69043.0, 47045.0, 30310.0, 18891.0, 11273.0, 7062.0, 4111.0, 2570.0, 1477.0, 957.0, 545.0, 343.0, 260.0, 150.0, 85.0, 67.0, 40.0, 28.0, 16.0, 17.0, 7.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0], "bins": [-28.0, -27.178466796875, -26.35693359375, -25.535400390625, -24.7138671875, -23.892333984375, -23.07080078125, -22.249267578125, -21.427734375, -20.606201171875, -19.78466796875, -18.963134765625, -18.1416015625, -17.320068359375, -16.49853515625, -15.677001953125, -14.85546875, -14.033935546875, -13.21240234375, -12.390869140625, -11.5693359375, -10.747802734375, -9.92626953125, -9.104736328125, -8.283203125, -7.461669921875, -6.64013671875, -5.818603515625, -4.9970703125, -4.175537109375, -3.35400390625, -2.532470703125, -1.7109375, -0.889404296875, -0.06787109375, 0.753662109375, 1.5751953125, 2.396728515625, 3.21826171875, 4.039794921875, 4.861328125, 5.682861328125, 6.50439453125, 7.325927734375, 8.1474609375, 8.968994140625, 9.79052734375, 10.612060546875, 11.43359375, 12.255126953125, 13.07666015625, 13.898193359375, 14.7197265625, 15.541259765625, 16.36279296875, 17.184326171875, 18.005859375, 18.827392578125, 19.64892578125, 20.470458984375, 21.2919921875, 22.113525390625, 22.93505859375, 23.756591796875, 24.578125]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 9.0, 7.0, 9.0, 9.0, 7.0, 19.0, 19.0, 13.0, 21.0, 25.0, 33.0, 33.0, 36.0, 37.0, 35.0, 34.0, 48.0, 38.0, 49.0, 42.0, 38.0, 40.0, 40.0, 38.0, 41.0, 37.0, 31.0, 29.0, 28.0, 28.0, 17.0, 26.0, 15.0, 15.0, 10.0, 10.0, 8.0, 3.0, 5.0, 4.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.296875, -26.39892578125, -25.5009765625, -24.60302734375, -23.705078125, -22.80712890625, -21.9091796875, -21.01123046875, -20.11328125, -19.21533203125, -18.3173828125, -17.41943359375, -16.521484375, -15.62353515625, -14.7255859375, -13.82763671875, -12.9296875, -12.03173828125, -11.1337890625, -10.23583984375, -9.337890625, -8.43994140625, -7.5419921875, -6.64404296875, -5.74609375, -4.84814453125, -3.9501953125, -3.05224609375, -2.154296875, -1.25634765625, -0.3583984375, 0.53955078125, 1.4375, 2.33544921875, 3.2333984375, 4.13134765625, 5.029296875, 5.92724609375, 6.8251953125, 7.72314453125, 8.62109375, 9.51904296875, 10.4169921875, 11.31494140625, 12.212890625, 13.11083984375, 14.0087890625, 14.90673828125, 15.8046875, 16.70263671875, 17.6005859375, 18.49853515625, 19.396484375, 20.29443359375, 21.1923828125, 22.09033203125, 22.98828125, 23.88623046875, 24.7841796875, 25.68212890625, 26.580078125, 27.47802734375, 28.3759765625, 29.27392578125, 30.171875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 14.0, 19.0, 25.0, 32.0, 54.0, 55.0, 125.0, 146.0, 261.0, 430.0, 604.0, 970.0, 1529.0, 2575.0, 4091.0, 6296.0, 10422.0, 16760.0, 26510.0, 40557.0, 60309.0, 83426.0, 106841.0, 124626.0, 128980.0, 118153.0, 97888.0, 73185.0, 51217.0, 34065.0, 21876.0, 13838.0, 8447.0, 5310.0, 3283.0, 2061.0, 1275.0, 794.0, 505.0, 335.0, 229.0, 148.0, 86.0, 69.0, 34.0, 32.0, 23.0, 16.0, 13.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-27.90625, -27.0419921875, -26.177734375, -25.3134765625, -24.44921875, -23.5849609375, -22.720703125, -21.8564453125, -20.9921875, -20.1279296875, -19.263671875, -18.3994140625, -17.53515625, -16.6708984375, -15.806640625, -14.9423828125, -14.078125, -13.2138671875, -12.349609375, -11.4853515625, -10.62109375, -9.7568359375, -8.892578125, -8.0283203125, -7.1640625, -6.2998046875, -5.435546875, -4.5712890625, -3.70703125, -2.8427734375, -1.978515625, -1.1142578125, -0.25, 0.6142578125, 1.478515625, 2.3427734375, 3.20703125, 4.0712890625, 4.935546875, 5.7998046875, 6.6640625, 7.5283203125, 8.392578125, 9.2568359375, 10.12109375, 10.9853515625, 11.849609375, 12.7138671875, 13.578125, 14.4423828125, 15.306640625, 16.1708984375, 17.03515625, 17.8994140625, 18.763671875, 19.6279296875, 20.4921875, 21.3564453125, 22.220703125, 23.0849609375, 23.94921875, 24.8134765625, 25.677734375, 26.5419921875, 27.40625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 8.0, 8.0, 3.0, 5.0, 9.0, 9.0, 10.0, 8.0, 8.0, 21.0, 19.0, 17.0, 29.0, 24.0, 31.0, 34.0, 34.0, 32.0, 37.0, 37.0, 36.0, 31.0, 35.0, 38.0, 37.0, 39.0, 40.0, 29.0, 39.0, 27.0, 38.0, 31.0, 25.0, 22.0, 16.0, 19.0, 15.0, 19.0, 14.0, 11.0, 13.0, 11.0, 10.0, 7.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0], "bins": [-16.75, -16.22802734375, -15.7060546875, -15.18408203125, -14.662109375, -14.14013671875, -13.6181640625, -13.09619140625, -12.57421875, -12.05224609375, -11.5302734375, -11.00830078125, -10.486328125, -9.96435546875, -9.4423828125, -8.92041015625, -8.3984375, -7.87646484375, -7.3544921875, -6.83251953125, -6.310546875, -5.78857421875, -5.2666015625, -4.74462890625, -4.22265625, -3.70068359375, -3.1787109375, -2.65673828125, -2.134765625, -1.61279296875, -1.0908203125, -0.56884765625, -0.046875, 0.47509765625, 0.9970703125, 1.51904296875, 2.041015625, 2.56298828125, 3.0849609375, 3.60693359375, 4.12890625, 4.65087890625, 5.1728515625, 5.69482421875, 6.216796875, 6.73876953125, 7.2607421875, 7.78271484375, 8.3046875, 8.82666015625, 9.3486328125, 9.87060546875, 10.392578125, 10.91455078125, 11.4365234375, 11.95849609375, 12.48046875, 13.00244140625, 13.5244140625, 14.04638671875, 14.568359375, 15.09033203125, 15.6123046875, 16.13427734375, 16.65625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 4.0, 9.0, 6.0, 9.0, 35.0, 41.0, 58.0, 96.0, 179.0, 325.0, 520.0, 918.0, 1613.0, 3051.0, 5992.0, 11286.0, 21632.0, 41844.0, 77068.0, 128370.0, 177132.0, 190317.0, 157766.0, 104455.0, 59905.0, 31452.0, 16165.0, 8446.0, 4486.0, 2415.0, 1250.0, 693.0, 411.0, 244.0, 140.0, 80.0, 57.0, 33.0, 16.0, 11.0, 7.0, 5.0, 7.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6484375, -11.28759765625, -10.9267578125, -10.56591796875, -10.205078125, -9.84423828125, -9.4833984375, -9.12255859375, -8.76171875, -8.40087890625, -8.0400390625, -7.67919921875, -7.318359375, -6.95751953125, -6.5966796875, -6.23583984375, -5.875, -5.51416015625, -5.1533203125, -4.79248046875, -4.431640625, -4.07080078125, -3.7099609375, -3.34912109375, -2.98828125, -2.62744140625, -2.2666015625, -1.90576171875, -1.544921875, -1.18408203125, -0.8232421875, -0.46240234375, -0.1015625, 0.25927734375, 0.6201171875, 0.98095703125, 1.341796875, 1.70263671875, 2.0634765625, 2.42431640625, 2.78515625, 3.14599609375, 3.5068359375, 3.86767578125, 4.228515625, 4.58935546875, 4.9501953125, 5.31103515625, 5.671875, 6.03271484375, 6.3935546875, 6.75439453125, 7.115234375, 7.47607421875, 7.8369140625, 8.19775390625, 8.55859375, 8.91943359375, 9.2802734375, 9.64111328125, 10.001953125, 10.36279296875, 10.7236328125, 11.08447265625, 11.4453125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 4.0, 7.0, 9.0, 12.0, 22.0, 23.0, 22.0, 30.0, 36.0, 46.0, 49.0, 61.0, 62.0, 60.0, 69.0, 70.0, 60.0, 65.0, 53.0, 48.0, 52.0, 24.0, 22.0, 26.0, 11.0, 16.0, 12.0, 11.0, 8.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010309219360351562, -0.000993773341178894, -0.0009566247463226318, -0.0009194761514663696, -0.0008823275566101074, -0.0008451789617538452, -0.000808030366897583, -0.0007708817720413208, -0.0007337331771850586, -0.0006965845823287964, -0.0006594359874725342, -0.000622287392616272, -0.0005851387977600098, -0.0005479902029037476, -0.0005108416080474854, -0.00047369301319122314, -0.00043654441833496094, -0.00039939582347869873, -0.0003622472286224365, -0.0003250986337661743, -0.0002879500389099121, -0.0002508014440536499, -0.0002136528491973877, -0.0001765042543411255, -0.00013935565948486328, -0.00010220706462860107, -6.505846977233887e-05, -2.790987491607666e-05, 9.238719940185547e-06, 4.6387314796447754e-05, 8.353590965270996e-05, 0.00012068450450897217, 0.00015783309936523438, 0.00019498169422149658, 0.0002321302890777588, 0.000269278883934021, 0.0003064274787902832, 0.0003435760736465454, 0.0003807246685028076, 0.0004178732633590698, 0.00045502185821533203, 0.0004921704530715942, 0.0005293190479278564, 0.0005664676427841187, 0.0006036162376403809, 0.0006407648324966431, 0.0006779134273529053, 0.0007150620222091675, 0.0007522106170654297, 0.0007893592119216919, 0.0008265078067779541, 0.0008636564016342163, 0.0009008049964904785, 0.0009379535913467407, 0.0009751021862030029, 0.0010122507810592651, 0.0010493993759155273, 0.0010865479707717896, 0.0011236965656280518, 0.001160845160484314, 0.0011979937553405762, 0.0012351423501968384, 0.0012722909450531006, 0.0013094395399093628, 0.001346588134765625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 15.0, 17.0, 17.0, 31.0, 35.0, 58.0, 95.0, 109.0, 181.0, 225.0, 375.0, 516.0, 803.0, 1302.0, 1987.0, 3101.0, 5144.0, 8441.0, 13692.0, 22152.0, 35510.0, 54679.0, 78506.0, 105706.0, 126267.0, 134888.0, 126456.0, 104996.0, 77970.0, 53764.0, 34498.0, 21726.0, 13470.0, 8065.0, 5013.0, 3120.0, 1910.0, 1236.0, 811.0, 538.0, 371.0, 250.0, 173.0, 113.0, 83.0, 48.0, 30.0, 24.0, 13.0, 15.0, 9.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.75, -7.4957275390625, -7.241455078125, -6.9871826171875, -6.73291015625, -6.4786376953125, -6.224365234375, -5.9700927734375, -5.7158203125, -5.4615478515625, -5.207275390625, -4.9530029296875, -4.69873046875, -4.4444580078125, -4.190185546875, -3.9359130859375, -3.681640625, -3.4273681640625, -3.173095703125, -2.9188232421875, -2.66455078125, -2.4102783203125, -2.156005859375, -1.9017333984375, -1.6474609375, -1.3931884765625, -1.138916015625, -0.8846435546875, -0.63037109375, -0.3760986328125, -0.121826171875, 0.1324462890625, 0.38671875, 0.6409912109375, 0.895263671875, 1.1495361328125, 1.40380859375, 1.6580810546875, 1.912353515625, 2.1666259765625, 2.4208984375, 2.6751708984375, 2.929443359375, 3.1837158203125, 3.43798828125, 3.6922607421875, 3.946533203125, 4.2008056640625, 4.455078125, 4.7093505859375, 4.963623046875, 5.2178955078125, 5.47216796875, 5.7264404296875, 5.980712890625, 6.2349853515625, 6.4892578125, 6.7435302734375, 6.997802734375, 7.2520751953125, 7.50634765625, 7.7606201171875, 8.014892578125, 8.2691650390625, 8.5234375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 7.0, 0.0, 11.0, 17.0, 19.0, 34.0, 28.0, 28.0, 49.0, 38.0, 50.0, 58.0, 77.0, 80.0, 57.0, 59.0, 60.0, 48.0, 63.0, 42.0, 40.0, 15.0, 28.0, 20.0, 15.0, 17.0, 7.0, 8.0, 7.0, 6.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.322265625, -3.191192626953125, -3.06011962890625, -2.929046630859375, -2.7979736328125, -2.666900634765625, -2.53582763671875, -2.404754638671875, -2.273681640625, -2.142608642578125, -2.01153564453125, -1.880462646484375, -1.7493896484375, -1.618316650390625, -1.48724365234375, -1.356170654296875, -1.22509765625, -1.094024658203125, -0.96295166015625, -0.831878662109375, -0.7008056640625, -0.569732666015625, -0.43865966796875, -0.307586669921875, -0.176513671875, -0.045440673828125, 0.08563232421875, 0.216705322265625, 0.3477783203125, 0.478851318359375, 0.60992431640625, 0.740997314453125, 0.8720703125, 1.003143310546875, 1.13421630859375, 1.265289306640625, 1.3963623046875, 1.527435302734375, 1.65850830078125, 1.789581298828125, 1.920654296875, 2.051727294921875, 2.18280029296875, 2.313873291015625, 2.4449462890625, 2.576019287109375, 2.70709228515625, 2.838165283203125, 2.96923828125, 3.100311279296875, 3.23138427734375, 3.362457275390625, 3.4935302734375, 3.624603271484375, 3.75567626953125, 3.886749267578125, 4.017822265625, 4.148895263671875, 4.27996826171875, 4.411041259765625, 4.5421142578125, 4.673187255859375, 4.80426025390625, 4.935333251953125, 5.06640625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 5.0, 6.0, 12.0, 6.0, 9.0, 12.0, 10.0, 12.0, 19.0, 14.0, 19.0, 22.0, 30.0, 33.0, 31.0, 25.0, 28.0, 41.0, 30.0, 30.0, 39.0, 45.0, 35.0, 51.0, 39.0, 35.0, 29.0, 30.0, 32.0, 27.0, 32.0, 25.0, 30.0, 22.0, 23.0, 14.0, 14.0, 12.0, 12.0, 15.0, 10.0, 7.0, 5.0, 3.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0], "bins": [-24.755844116210938, -23.971595764160156, -23.187349319458008, -22.403100967407227, -21.618854522705078, -20.834606170654297, -20.05035972595215, -19.266111373901367, -18.48186492919922, -17.697616577148438, -16.91337013244629, -16.129121780395508, -15.34487533569336, -14.560627937316895, -13.77638053894043, -12.992132186889648, -12.207884788513184, -11.423637390136719, -10.639389991760254, -9.855142593383789, -9.070895195007324, -8.28664779663086, -7.502399921417236, -6.7181525230407715, -5.933905124664307, -5.149657726287842, -4.365410327911377, -3.581162691116333, -2.796915292739868, -2.0126678943634033, -1.2284202575683594, -0.44417285919189453, 0.3400745391845703, 1.1243219375610352, 1.9085694551467896, 2.692816972732544, 3.477064371109009, 4.2613115310668945, 5.045559406280518, 5.829806804656982, 6.614054203033447, 7.398301601409912, 8.182549476623535, 8.966796875, 9.751044273376465, 10.53529167175293, 11.319539070129395, 12.10378646850586, 12.888033866882324, 13.672281265258789, 14.456528663635254, 15.240776062011719, 16.0250244140625, 16.80927085876465, 17.59351921081543, 18.377765655517578, 19.16201400756836, 19.94626235961914, 20.73050880432129, 21.51475715637207, 22.29900360107422, 23.083251953125, 23.86749839782715, 24.65174674987793, 25.435993194580078]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 6.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 7.0, 11.0, 7.0, 9.0, 6.0, 14.0, 26.0, 36.0, 31.0, 21.0, 29.0, 34.0, 33.0, 41.0, 45.0, 46.0, 53.0, 34.0, 37.0, 42.0, 44.0, 42.0, 23.0, 34.0, 35.0, 37.0, 25.0, 30.0, 24.0, 26.0, 11.0, 14.0, 6.0, 15.0, 13.0, 9.0, 9.0, 7.0, 6.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.704984664916992, -25.78809356689453, -24.871200561523438, -23.954309463500977, -23.037416458129883, -22.120525360107422, -21.203632354736328, -20.286741256713867, -19.369850158691406, -18.452959060668945, -17.53606605529785, -16.61917495727539, -15.702281951904297, -14.785390853881836, -13.868498802185059, -12.951606750488281, -12.034713745117188, -11.11782169342041, -10.200929641723633, -9.284038543701172, -8.367145538330078, -7.450253963470459, -6.53336238861084, -5.6164703369140625, -4.699578285217285, -3.782686233520508, -2.8657944202423096, -1.9489026069641113, -1.032010555267334, -0.11511850357055664, 0.8017730712890625, 1.7186651229858398, 2.6355552673339844, 3.5524473190307617, 4.469339370727539, 5.386230945587158, 6.3031229972839355, 7.220015048980713, 8.136906623840332, 9.05379867553711, 9.970690727233887, 10.887582778930664, 11.804474830627441, 12.721366882324219, 13.63825798034668, 14.555150985717773, 15.472042083740234, 16.388935089111328, 17.30582618713379, 18.22271728515625, 19.139610290527344, 20.056501388549805, 20.9733943939209, 21.89028549194336, 22.807178497314453, 23.724069595336914, 24.640960693359375, 25.557851791381836, 26.47474479675293, 27.39163589477539, 28.308528900146484, 29.225419998168945, 30.142311096191406, 31.0592041015625, 31.976097106933594]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 7.0, 6.0, 18.0, 27.0, 43.0, 72.0, 166.0, 286.0, 457.0, 860.0, 1508.0, 2704.0, 4870.0, 8510.0, 14644.0, 25044.0, 42855.0, 71963.0, 117802.0, 188237.0, 286544.0, 403132.0, 514820.0, 570492.0, 546734.0, 455319.0, 336007.0, 228504.0, 146440.0, 91054.0, 55301.0, 33115.0, 19526.0, 11279.0, 6641.0, 3824.0, 2337.0, 1353.0, 771.0, 415.0, 263.0, 135.0, 85.0, 50.0, 34.0, 14.0, 10.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.453125, -21.61328125, -20.7734375, -19.93359375, -19.09375, -18.25390625, -17.4140625, -16.57421875, -15.734375, -14.89453125, -14.0546875, -13.21484375, -12.375, -11.53515625, -10.6953125, -9.85546875, -9.015625, -8.17578125, -7.3359375, -6.49609375, -5.65625, -4.81640625, -3.9765625, -3.13671875, -2.296875, -1.45703125, -0.6171875, 0.22265625, 1.0625, 1.90234375, 2.7421875, 3.58203125, 4.421875, 5.26171875, 6.1015625, 6.94140625, 7.78125, 8.62109375, 9.4609375, 10.30078125, 11.140625, 11.98046875, 12.8203125, 13.66015625, 14.5, 15.33984375, 16.1796875, 17.01953125, 17.859375, 18.69921875, 19.5390625, 20.37890625, 21.21875, 22.05859375, 22.8984375, 23.73828125, 24.578125, 25.41796875, 26.2578125, 27.09765625, 27.9375, 28.77734375, 29.6171875, 30.45703125, 31.296875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 8.0, 3.0, 11.0, 10.0, 12.0, 7.0, 16.0, 19.0, 23.0, 28.0, 27.0, 31.0, 30.0, 31.0, 40.0, 37.0, 52.0, 43.0, 42.0, 42.0, 40.0, 35.0, 41.0, 34.0, 33.0, 34.0, 32.0, 32.0, 32.0, 21.0, 24.0, 19.0, 20.0, 6.0, 14.0, 12.0, 20.0, 6.0, 8.0, 3.0, 5.0, 2.0, 1.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.546875, -21.762451171875, -20.97802734375, -20.193603515625, -19.4091796875, -18.624755859375, -17.84033203125, -17.055908203125, -16.271484375, -15.487060546875, -14.70263671875, -13.918212890625, -13.1337890625, -12.349365234375, -11.56494140625, -10.780517578125, -9.99609375, -9.211669921875, -8.42724609375, -7.642822265625, -6.8583984375, -6.073974609375, -5.28955078125, -4.505126953125, -3.720703125, -2.936279296875, -2.15185546875, -1.367431640625, -0.5830078125, 0.201416015625, 0.98583984375, 1.770263671875, 2.5546875, 3.339111328125, 4.12353515625, 4.907958984375, 5.6923828125, 6.476806640625, 7.26123046875, 8.045654296875, 8.830078125, 9.614501953125, 10.39892578125, 11.183349609375, 11.9677734375, 12.752197265625, 13.53662109375, 14.321044921875, 15.10546875, 15.889892578125, 16.67431640625, 17.458740234375, 18.2431640625, 19.027587890625, 19.81201171875, 20.596435546875, 21.380859375, 22.165283203125, 22.94970703125, 23.734130859375, 24.5185546875, 25.302978515625, 26.08740234375, 26.871826171875, 27.65625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 9.0, 17.0, 22.0, 35.0, 69.0, 109.0, 168.0, 305.0, 513.0, 852.0, 1486.0, 2489.0, 4044.0, 6688.0, 10799.0, 17815.0, 28743.0, 45480.0, 70870.0, 108335.0, 159319.0, 226969.0, 303958.0, 382302.0, 446099.0, 471342.0, 453657.0, 396314.0, 320030.0, 240478.0, 170108.0, 116642.0, 77495.0, 49602.0, 31569.0, 19479.0, 11627.0, 7406.0, 4394.0, 2620.0, 1600.0, 979.0, 556.0, 362.0, 198.0, 123.0, 78.0, 56.0, 39.0, 23.0, 8.0, 7.0, 2.0, 1.0, 3.0, 3.0], "bins": [-25.1875, -24.437744140625, -23.68798828125, -22.938232421875, -22.1884765625, -21.438720703125, -20.68896484375, -19.939208984375, -19.189453125, -18.439697265625, -17.68994140625, -16.940185546875, -16.1904296875, -15.440673828125, -14.69091796875, -13.941162109375, -13.19140625, -12.441650390625, -11.69189453125, -10.942138671875, -10.1923828125, -9.442626953125, -8.69287109375, -7.943115234375, -7.193359375, -6.443603515625, -5.69384765625, -4.944091796875, -4.1943359375, -3.444580078125, -2.69482421875, -1.945068359375, -1.1953125, -0.445556640625, 0.30419921875, 1.053955078125, 1.8037109375, 2.553466796875, 3.30322265625, 4.052978515625, 4.802734375, 5.552490234375, 6.30224609375, 7.052001953125, 7.8017578125, 8.551513671875, 9.30126953125, 10.051025390625, 10.80078125, 11.550537109375, 12.30029296875, 13.050048828125, 13.7998046875, 14.549560546875, 15.29931640625, 16.049072265625, 16.798828125, 17.548583984375, 18.29833984375, 19.048095703125, 19.7978515625, 20.547607421875, 21.29736328125, 22.047119140625, 22.796875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 7.0, 12.0, 17.0, 28.0, 20.0, 39.0, 29.0, 39.0, 65.0, 74.0, 85.0, 107.0, 99.0, 120.0, 157.0, 172.0, 167.0, 191.0, 208.0, 228.0, 207.0, 211.0, 203.0, 191.0, 194.0, 174.0, 158.0, 139.0, 129.0, 115.0, 97.0, 79.0, 61.0, 44.0, 36.0, 35.0, 31.0, 26.0, 21.0, 17.0, 13.0, 7.0, 5.0, 4.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-12.5703125, -12.184326171875, -11.79833984375, -11.412353515625, -11.0263671875, -10.640380859375, -10.25439453125, -9.868408203125, -9.482421875, -9.096435546875, -8.71044921875, -8.324462890625, -7.9384765625, -7.552490234375, -7.16650390625, -6.780517578125, -6.39453125, -6.008544921875, -5.62255859375, -5.236572265625, -4.8505859375, -4.464599609375, -4.07861328125, -3.692626953125, -3.306640625, -2.920654296875, -2.53466796875, -2.148681640625, -1.7626953125, -1.376708984375, -0.99072265625, -0.604736328125, -0.21875, 0.167236328125, 0.55322265625, 0.939208984375, 1.3251953125, 1.711181640625, 2.09716796875, 2.483154296875, 2.869140625, 3.255126953125, 3.64111328125, 4.027099609375, 4.4130859375, 4.799072265625, 5.18505859375, 5.571044921875, 5.95703125, 6.343017578125, 6.72900390625, 7.114990234375, 7.5009765625, 7.886962890625, 8.27294921875, 8.658935546875, 9.044921875, 9.430908203125, 9.81689453125, 10.202880859375, 10.5888671875, 10.974853515625, 11.36083984375, 11.746826171875, 12.1328125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 5.0, 6.0, 8.0, 7.0, 10.0, 9.0, 17.0, 16.0, 18.0, 18.0, 19.0, 28.0, 24.0, 21.0, 35.0, 40.0, 30.0, 35.0, 27.0, 39.0, 38.0, 46.0, 43.0, 35.0, 37.0, 41.0, 43.0, 39.0, 32.0, 31.0, 28.0, 18.0, 25.0, 18.0, 26.0, 22.0, 12.0, 12.0, 15.0, 6.0, 1.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-25.224323272705078, -24.37598991394043, -23.527658462524414, -22.679325103759766, -21.83099365234375, -20.9826602935791, -20.134326934814453, -19.285995483398438, -18.43766212463379, -17.58932876586914, -16.740997314453125, -15.892663955688477, -15.044331550598145, -14.195999145507812, -13.34766674041748, -12.499334335327148, -11.651001930236816, -10.802669525146484, -9.954337120056152, -9.10600471496582, -8.257671356201172, -7.40933895111084, -6.561006546020508, -5.712673664093018, -4.8643412590026855, -4.0160088539123535, -3.1676759719848633, -2.3193435668945312, -1.4710109233856201, -0.622678279876709, 0.22565412521362305, 1.0739870071411133, 1.9223194122314453, 2.7706520557403564, 3.6189846992492676, 4.4673171043396, 5.31564998626709, 6.163982391357422, 7.012314796447754, 7.860647678375244, 8.708980560302734, 9.557312965393066, 10.405645370483398, 11.253978729248047, 12.102311134338379, 12.950643539428711, 13.798975944519043, 14.647308349609375, 15.495640754699707, 16.34397315979004, 17.192306518554688, 18.040637969970703, 18.88897132873535, 19.7373046875, 20.585636138916016, 21.433969497680664, 22.28230094909668, 23.130634307861328, 23.978965759277344, 24.827299118041992, 25.675630569458008, 26.523963928222656, 27.372295379638672, 28.22062873840332, 29.06896209716797]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 8.0, 4.0, 6.0, 5.0, 8.0, 6.0, 15.0, 16.0, 16.0, 13.0, 20.0, 26.0, 23.0, 22.0, 32.0, 33.0, 31.0, 26.0, 45.0, 42.0, 42.0, 33.0, 42.0, 31.0, 44.0, 39.0, 34.0, 26.0, 31.0, 31.0, 25.0, 30.0, 32.0, 27.0, 24.0, 17.0, 17.0, 8.0, 14.0, 13.0, 9.0, 3.0, 6.0, 7.0, 5.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-26.389484405517578, -25.511083602905273, -24.632680892944336, -23.75428009033203, -22.875879287719727, -21.997478485107422, -21.119075775146484, -20.24067497253418, -19.362274169921875, -18.48387336730957, -17.605470657348633, -16.727069854736328, -15.848669052124023, -14.970267295837402, -14.091865539550781, -13.213464736938477, -12.335062026977539, -11.456660270690918, -10.578259468078613, -9.699857711791992, -8.821456909179688, -7.943055152893066, -7.064653396606445, -6.186252117156982, -5.3078508377075195, -4.429449558258057, -3.5510480403900146, -2.6726465225219727, -1.7942452430725098, -0.9158439636230469, -0.03744220733642578, 0.8409590721130371, 1.7193622589111328, 2.5977635383605957, 3.4761650562286377, 4.35456657409668, 5.232967853546143, 6.1113691329956055, 6.989770889282227, 7.8681721687316895, 8.746573448181152, 9.624975204467773, 10.503376007080078, 11.3817777633667, 12.26017951965332, 13.138580322265625, 14.016982078552246, 14.895383834838867, 15.773784637451172, 16.652185440063477, 17.530588150024414, 18.40898895263672, 19.287389755249023, 20.165790557861328, 21.044193267822266, 21.92259407043457, 22.800994873046875, 23.67939567565918, 24.557798385620117, 25.436199188232422, 26.314599990844727, 27.19300079345703, 28.07140350341797, 28.949804306030273, 29.82820701599121]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 4.0, 5.0, 2.0, 11.0, 12.0, 23.0, 25.0, 52.0, 73.0, 112.0, 179.0, 261.0, 450.0, 624.0, 1003.0, 1581.0, 2331.0, 3468.0, 5092.0, 7598.0, 11000.0, 15430.0, 21885.0, 29690.0, 39283.0, 50577.0, 62543.0, 74154.0, 83168.0, 89418.0, 90533.0, 87238.0, 78929.0, 68994.0, 56863.0, 45537.0, 34686.0, 25790.0, 18474.0, 13426.0, 9156.0, 6298.0, 4253.0, 2833.0, 1920.0, 1298.0, 804.0, 520.0, 354.0, 230.0, 138.0, 92.0, 56.0, 25.0, 26.0, 16.0, 10.0, 8.0, 5.0, 1.0, 2.0], "bins": [-12.21875, -11.8514404296875, -11.484130859375, -11.1168212890625, -10.74951171875, -10.3822021484375, -10.014892578125, -9.6475830078125, -9.2802734375, -8.9129638671875, -8.545654296875, -8.1783447265625, -7.81103515625, -7.4437255859375, -7.076416015625, -6.7091064453125, -6.341796875, -5.9744873046875, -5.607177734375, -5.2398681640625, -4.87255859375, -4.5052490234375, -4.137939453125, -3.7706298828125, -3.4033203125, -3.0360107421875, -2.668701171875, -2.3013916015625, -1.93408203125, -1.5667724609375, -1.199462890625, -0.8321533203125, -0.46484375, -0.0975341796875, 0.269775390625, 0.6370849609375, 1.00439453125, 1.3717041015625, 1.739013671875, 2.1063232421875, 2.4736328125, 2.8409423828125, 3.208251953125, 3.5755615234375, 3.94287109375, 4.3101806640625, 4.677490234375, 5.0447998046875, 5.412109375, 5.7794189453125, 6.146728515625, 6.5140380859375, 6.88134765625, 7.2486572265625, 7.615966796875, 7.9832763671875, 8.3505859375, 8.7178955078125, 9.085205078125, 9.4525146484375, 9.81982421875, 10.1871337890625, 10.554443359375, 10.9217529296875, 11.2890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 2.0, 10.0, 3.0, 5.0, 6.0, 6.0, 8.0, 17.0, 14.0, 16.0, 14.0, 22.0, 22.0, 25.0, 26.0, 33.0, 28.0, 33.0, 33.0, 41.0, 40.0, 39.0, 41.0, 38.0, 35.0, 46.0, 36.0, 29.0, 28.0, 36.0, 28.0, 23.0, 33.0, 27.0, 32.0, 20.0, 17.0, 16.0, 6.0, 14.0, 13.0, 7.0, 3.0, 8.0, 8.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-26.234375, -25.345703125, -24.45703125, -23.568359375, -22.6796875, -21.791015625, -20.90234375, -20.013671875, -19.125, -18.236328125, -17.34765625, -16.458984375, -15.5703125, -14.681640625, -13.79296875, -12.904296875, -12.015625, -11.126953125, -10.23828125, -9.349609375, -8.4609375, -7.572265625, -6.68359375, -5.794921875, -4.90625, -4.017578125, -3.12890625, -2.240234375, -1.3515625, -0.462890625, 0.42578125, 1.314453125, 2.203125, 3.091796875, 3.98046875, 4.869140625, 5.7578125, 6.646484375, 7.53515625, 8.423828125, 9.3125, 10.201171875, 11.08984375, 11.978515625, 12.8671875, 13.755859375, 14.64453125, 15.533203125, 16.421875, 17.310546875, 18.19921875, 19.087890625, 19.9765625, 20.865234375, 21.75390625, 22.642578125, 23.53125, 24.419921875, 25.30859375, 26.197265625, 27.0859375, 27.974609375, 28.86328125, 29.751953125, 30.640625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 7.0, 7.0, 9.0, 20.0, 24.0, 36.0, 51.0, 69.0, 91.0, 158.0, 208.0, 336.0, 485.0, 725.0, 998.0, 1580.0, 2377.0, 3426.0, 4775.0, 7047.0, 10258.0, 15028.0, 23004.0, 49735.0, 724288.0, 124549.0, 26271.0, 16816.0, 11383.0, 7787.0, 5226.0, 3699.0, 2592.0, 1755.0, 1181.0, 856.0, 558.0, 366.0, 249.0, 158.0, 113.0, 82.0, 65.0, 27.0, 33.0, 16.0, 15.0, 8.0, 8.0, 3.0, 2.0, 2.0, 1.0, 3.0], "bins": [-29.53125, -28.67919921875, -27.8271484375, -26.97509765625, -26.123046875, -25.27099609375, -24.4189453125, -23.56689453125, -22.71484375, -21.86279296875, -21.0107421875, -20.15869140625, -19.306640625, -18.45458984375, -17.6025390625, -16.75048828125, -15.8984375, -15.04638671875, -14.1943359375, -13.34228515625, -12.490234375, -11.63818359375, -10.7861328125, -9.93408203125, -9.08203125, -8.22998046875, -7.3779296875, -6.52587890625, -5.673828125, -4.82177734375, -3.9697265625, -3.11767578125, -2.265625, -1.41357421875, -0.5615234375, 0.29052734375, 1.142578125, 1.99462890625, 2.8466796875, 3.69873046875, 4.55078125, 5.40283203125, 6.2548828125, 7.10693359375, 7.958984375, 8.81103515625, 9.6630859375, 10.51513671875, 11.3671875, 12.21923828125, 13.0712890625, 13.92333984375, 14.775390625, 15.62744140625, 16.4794921875, 17.33154296875, 18.18359375, 19.03564453125, 19.8876953125, 20.73974609375, 21.591796875, 22.44384765625, 23.2958984375, 24.14794921875, 25.0]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 4.0, 5.0, 0.0, 0.0, 8.0, 9.0, 11.0, 15.0, 14.0, 25.0, 16.0, 25.0, 20.0, 28.0, 28.0, 29.0, 35.0, 35.0, 37.0, 26.0, 40.0, 46.0, 38.0, 46.0, 44.0, 35.0, 39.0, 43.0, 33.0, 32.0, 35.0, 35.0, 36.0, 22.0, 22.0, 12.0, 17.0, 11.0, 9.0, 5.0, 8.0, 4.0, 3.0, 5.0, 6.0, 5.0, 1.0, 5.0, 0.0, 2.0], "bins": [-27.828125, -27.073486328125, -26.31884765625, -25.564208984375, -24.8095703125, -24.054931640625, -23.30029296875, -22.545654296875, -21.791015625, -21.036376953125, -20.28173828125, -19.527099609375, -18.7724609375, -18.017822265625, -17.26318359375, -16.508544921875, -15.75390625, -14.999267578125, -14.24462890625, -13.489990234375, -12.7353515625, -11.980712890625, -11.22607421875, -10.471435546875, -9.716796875, -8.962158203125, -8.20751953125, -7.452880859375, -6.6982421875, -5.943603515625, -5.18896484375, -4.434326171875, -3.6796875, -2.925048828125, -2.17041015625, -1.415771484375, -0.6611328125, 0.093505859375, 0.84814453125, 1.602783203125, 2.357421875, 3.112060546875, 3.86669921875, 4.621337890625, 5.3759765625, 6.130615234375, 6.88525390625, 7.639892578125, 8.39453125, 9.149169921875, 9.90380859375, 10.658447265625, 11.4130859375, 12.167724609375, 12.92236328125, 13.677001953125, 14.431640625, 15.186279296875, 15.94091796875, 16.695556640625, 17.4501953125, 18.204833984375, 18.95947265625, 19.714111328125, 20.46875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 8.0, 6.0, 4.0, 6.0, 17.0, 31.0, 47.0, 58.0, 107.0, 195.0, 342.0, 683.0, 1516.0, 3250.0, 7381.0, 18714.0, 75678.0, 873453.0, 42864.0, 13726.0, 5560.0, 2514.0, 1123.0, 559.0, 267.0, 168.0, 82.0, 67.0, 33.0, 40.0, 11.0, 18.0, 8.0, 4.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.015625, -7.79510498046875, -7.5745849609375, -7.35406494140625, -7.133544921875, -6.91302490234375, -6.6925048828125, -6.47198486328125, -6.25146484375, -6.03094482421875, -5.8104248046875, -5.58990478515625, -5.369384765625, -5.14886474609375, -4.9283447265625, -4.70782470703125, -4.4873046875, -4.26678466796875, -4.0462646484375, -3.82574462890625, -3.605224609375, -3.38470458984375, -3.1641845703125, -2.94366455078125, -2.72314453125, -2.50262451171875, -2.2821044921875, -2.06158447265625, -1.841064453125, -1.62054443359375, -1.4000244140625, -1.17950439453125, -0.958984375, -0.73846435546875, -0.5179443359375, -0.29742431640625, -0.076904296875, 0.14361572265625, 0.3641357421875, 0.58465576171875, 0.80517578125, 1.02569580078125, 1.2462158203125, 1.46673583984375, 1.687255859375, 1.90777587890625, 2.1282958984375, 2.34881591796875, 2.5693359375, 2.78985595703125, 3.0103759765625, 3.23089599609375, 3.451416015625, 3.67193603515625, 3.8924560546875, 4.11297607421875, 4.33349609375, 4.55401611328125, 4.7745361328125, 4.99505615234375, 5.215576171875, 5.43609619140625, 5.6566162109375, 5.87713623046875, 6.09765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 9.0, 16.0, 26.0, 54.0, 103.0, 182.0, 192.0, 185.0, 115.0, 67.0, 27.0, 11.0, 10.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003265380859375, -0.0031554102897644043, -0.0030454397201538086, -0.002935469150543213, -0.002825498580932617, -0.0027155280113220215, -0.0026055574417114258, -0.00249558687210083, -0.0023856163024902344, -0.0022756457328796387, -0.002165675163269043, -0.0020557045936584473, -0.0019457340240478516, -0.0018357634544372559, -0.0017257928848266602, -0.0016158223152160645, -0.0015058517456054688, -0.001395881175994873, -0.0012859106063842773, -0.0011759400367736816, -0.001065969467163086, -0.0009559988975524902, -0.0008460283279418945, -0.0007360577583312988, -0.0006260871887207031, -0.0005161166191101074, -0.0004061460494995117, -0.000296175479888916, -0.0001862049102783203, -7.623434066772461e-05, 3.3736228942871094e-05, 0.0001437067985534668, 0.0002536773681640625, 0.0003636479377746582, 0.0004736185073852539, 0.0005835890769958496, 0.0006935596466064453, 0.000803530216217041, 0.0009135007858276367, 0.0010234713554382324, 0.0011334419250488281, 0.0012434124946594238, 0.0013533830642700195, 0.0014633536338806152, 0.001573324203491211, 0.0016832947731018066, 0.0017932653427124023, 0.001903235912322998, 0.0020132064819335938, 0.0021231770515441895, 0.002233147621154785, 0.002343118190765381, 0.0024530887603759766, 0.0025630593299865723, 0.002673029899597168, 0.0027830004692077637, 0.0028929710388183594, 0.003002941608428955, 0.0031129121780395508, 0.0032228827476501465, 0.003332853317260742, 0.003442823886871338, 0.0035527944564819336, 0.0036627650260925293, 0.003772735595703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 12.0, 19.0, 25.0, 31.0, 35.0, 49.0, 66.0, 107.0, 135.0, 201.0, 292.0, 453.0, 641.0, 998.0, 1517.0, 2306.0, 3825.0, 6159.0, 10429.0, 17507.0, 29016.0, 47899.0, 75097.0, 113992.0, 149515.0, 163497.0, 142487.0, 104980.0, 68319.0, 42849.0, 25924.0, 15658.0, 9327.0, 5509.0, 3429.0, 2152.0, 1313.0, 808.0, 616.0, 402.0, 286.0, 185.0, 151.0, 103.0, 62.0, 51.0, 35.0, 21.0, 19.0, 17.0, 9.0, 3.0, 13.0, 5.0, 3.0], "bins": [-1.455078125, -1.4127655029296875, -1.370452880859375, -1.3281402587890625, -1.28582763671875, -1.2435150146484375, -1.201202392578125, -1.1588897705078125, -1.1165771484375, -1.0742645263671875, -1.031951904296875, -0.9896392822265625, -0.94732666015625, -0.9050140380859375, -0.862701416015625, -0.8203887939453125, -0.778076171875, -0.7357635498046875, -0.693450927734375, -0.6511383056640625, -0.60882568359375, -0.5665130615234375, -0.524200439453125, -0.4818878173828125, -0.4395751953125, -0.3972625732421875, -0.354949951171875, -0.3126373291015625, -0.27032470703125, -0.2280120849609375, -0.185699462890625, -0.1433868408203125, -0.10107421875, -0.0587615966796875, -0.016448974609375, 0.0258636474609375, 0.06817626953125, 0.1104888916015625, 0.152801513671875, 0.1951141357421875, 0.2374267578125, 0.2797393798828125, 0.322052001953125, 0.3643646240234375, 0.40667724609375, 0.4489898681640625, 0.491302490234375, 0.5336151123046875, 0.575927734375, 0.6182403564453125, 0.660552978515625, 0.7028656005859375, 0.74517822265625, 0.7874908447265625, 0.829803466796875, 0.8721160888671875, 0.9144287109375, 0.9567413330078125, 0.999053955078125, 1.0413665771484375, 1.08367919921875, 1.1259918212890625, 1.168304443359375, 1.2106170654296875, 1.2529296875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 7.0, 6.0, 2.0, 5.0, 9.0, 9.0, 20.0, 16.0, 23.0, 26.0, 24.0, 31.0, 31.0, 55.0, 75.0, 70.0, 84.0, 66.0, 60.0, 60.0, 42.0, 41.0, 41.0, 29.0, 18.0, 25.0, 22.0, 16.0, 8.0, 18.0, 6.0, 11.0, 12.0, 8.0, 5.0, 5.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.53271484375, -0.5171966552734375, -0.501678466796875, -0.4861602783203125, -0.47064208984375, -0.4551239013671875, -0.439605712890625, -0.4240875244140625, -0.4085693359375, -0.3930511474609375, -0.377532958984375, -0.3620147705078125, -0.34649658203125, -0.3309783935546875, -0.315460205078125, -0.2999420166015625, -0.284423828125, -0.2689056396484375, -0.253387451171875, -0.2378692626953125, -0.22235107421875, -0.2068328857421875, -0.191314697265625, -0.1757965087890625, -0.1602783203125, -0.1447601318359375, -0.129241943359375, -0.1137237548828125, -0.09820556640625, -0.0826873779296875, -0.067169189453125, -0.0516510009765625, -0.0361328125, -0.0206146240234375, -0.005096435546875, 0.0104217529296875, 0.02593994140625, 0.0414581298828125, 0.056976318359375, 0.0724945068359375, 0.0880126953125, 0.1035308837890625, 0.119049072265625, 0.1345672607421875, 0.15008544921875, 0.1656036376953125, 0.181121826171875, 0.1966400146484375, 0.212158203125, 0.2276763916015625, 0.243194580078125, 0.2587127685546875, 0.27423095703125, 0.2897491455078125, 0.305267333984375, 0.3207855224609375, 0.3363037109375, 0.3518218994140625, 0.367340087890625, 0.3828582763671875, 0.39837646484375, 0.4138946533203125, 0.429412841796875, 0.4449310302734375, 0.46044921875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 6.0, 3.0, 2.0, 2.0, 6.0, 6.0, 6.0, 9.0, 12.0, 7.0, 10.0, 17.0, 13.0, 20.0, 27.0, 21.0, 33.0, 21.0, 30.0, 37.0, 32.0, 37.0, 38.0, 37.0, 34.0, 42.0, 44.0, 40.0, 37.0, 42.0, 37.0, 47.0, 24.0, 32.0, 26.0, 30.0, 25.0, 27.0, 13.0, 14.0, 12.0, 16.0, 6.0, 13.0, 8.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-24.963294982910156, -24.102270126342773, -23.24124526977539, -22.380220413208008, -21.519195556640625, -20.658170700073242, -19.79714584350586, -18.93612289428711, -18.075096130371094, -17.21407127380371, -16.353046417236328, -15.492021560668945, -14.630996704101562, -13.76997184753418, -12.908947944641113, -12.04792308807373, -11.186899185180664, -10.325874328613281, -9.464849472045898, -8.603824615478516, -7.742800235748291, -6.881775379180908, -6.020750999450684, -5.159726142883301, -4.298701286315918, -3.437676429748535, -2.5766518115997314, -1.7156271934509277, -0.8546023368835449, 0.006422519683837891, 0.8674468994140625, 1.7284717559814453, 2.5894947052001953, 3.450519561767578, 4.311544418334961, 5.1725687980651855, 6.033593654632568, 6.894618511199951, 7.755642890930176, 8.616667747497559, 9.477692604064941, 10.338717460632324, 11.199742317199707, 12.060766220092773, 12.921791076660156, 13.782815933227539, 14.643840789794922, 15.504865646362305, 16.365890502929688, 17.22691535949707, 18.087940216064453, 18.948965072631836, 19.80998992919922, 20.6710147857666, 21.532039642333984, 22.393062591552734, 23.25408935546875, 24.115114212036133, 24.976139068603516, 25.8371639251709, 26.69818878173828, 27.559213638305664, 28.420238494873047, 29.281261444091797, 30.14228630065918]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 5.0, 7.0, 6.0, 6.0, 3.0, 10.0, 12.0, 14.0, 18.0, 13.0, 19.0, 24.0, 27.0, 19.0, 36.0, 28.0, 33.0, 27.0, 46.0, 42.0, 34.0, 43.0, 40.0, 37.0, 39.0, 39.0, 31.0, 32.0, 33.0, 31.0, 28.0, 25.0, 29.0, 32.0, 23.0, 15.0, 17.0, 8.0, 12.0, 15.0, 9.0, 3.0, 7.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-26.57605743408203, -25.684240341186523, -24.792423248291016, -23.900606155395508, -23.0087890625, -22.116971969604492, -21.225154876708984, -20.333337783813477, -19.44152069091797, -18.54970359802246, -17.657886505126953, -16.766069412231445, -15.874252319335938, -14.98243522644043, -14.090618133544922, -13.198801040649414, -12.306983947753906, -11.415166854858398, -10.52334976196289, -9.631532669067383, -8.739715576171875, -7.847898483276367, -6.956081390380859, -6.064264297485352, -5.172447204589844, -4.280630111694336, -3.388813018798828, -2.4969959259033203, -1.6051788330078125, -0.7133617401123047, 0.17845535278320312, 1.070272445678711, 1.9620895385742188, 2.8539066314697266, 3.7457237243652344, 4.637540817260742, 5.52935791015625, 6.421175003051758, 7.312992095947266, 8.204809188842773, 9.096626281738281, 9.988443374633789, 10.880260467529297, 11.772077560424805, 12.663894653320312, 13.55571174621582, 14.447528839111328, 15.339345932006836, 16.231163024902344, 17.12298011779785, 18.01479721069336, 18.906614303588867, 19.798431396484375, 20.690248489379883, 21.58206558227539, 22.4738826751709, 23.365699768066406, 24.257516860961914, 25.149333953857422, 26.04115104675293, 26.932968139648438, 27.824785232543945, 28.716602325439453, 29.60841941833496, 30.50023651123047]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 6.0, 9.0, 16.0, 33.0, 33.0, 52.0, 71.0, 129.0, 227.0, 370.0, 627.0, 1079.0, 1779.0, 3070.0, 5161.0, 8674.0, 14130.0, 22316.0, 34371.0, 51025.0, 71536.0, 93356.0, 111857.0, 123451.0, 121004.0, 106865.0, 86716.0, 65296.0, 45232.0, 30193.0, 19361.0, 12114.0, 7407.0, 4511.0, 2633.0, 1525.0, 893.0, 551.0, 346.0, 205.0, 113.0, 78.0, 47.0, 35.0, 21.0, 15.0, 8.0, 4.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.640625, -19.871826171875, -19.10302734375, -18.334228515625, -17.5654296875, -16.796630859375, -16.02783203125, -15.259033203125, -14.490234375, -13.721435546875, -12.95263671875, -12.183837890625, -11.4150390625, -10.646240234375, -9.87744140625, -9.108642578125, -8.33984375, -7.571044921875, -6.80224609375, -6.033447265625, -5.2646484375, -4.495849609375, -3.72705078125, -2.958251953125, -2.189453125, -1.420654296875, -0.65185546875, 0.116943359375, 0.8857421875, 1.654541015625, 2.42333984375, 3.192138671875, 3.9609375, 4.729736328125, 5.49853515625, 6.267333984375, 7.0361328125, 7.804931640625, 8.57373046875, 9.342529296875, 10.111328125, 10.880126953125, 11.64892578125, 12.417724609375, 13.1865234375, 13.955322265625, 14.72412109375, 15.492919921875, 16.26171875, 17.030517578125, 17.79931640625, 18.568115234375, 19.3369140625, 20.105712890625, 20.87451171875, 21.643310546875, 22.412109375, 23.180908203125, 23.94970703125, 24.718505859375, 25.4873046875, 26.256103515625, 27.02490234375, 27.793701171875, 28.5625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 4.0, 4.0, 9.0, 6.0, 3.0, 7.0, 6.0, 16.0, 15.0, 16.0, 17.0, 17.0, 25.0, 30.0, 20.0, 26.0, 32.0, 35.0, 26.0, 47.0, 41.0, 31.0, 44.0, 41.0, 44.0, 33.0, 45.0, 30.0, 25.0, 35.0, 24.0, 34.0, 31.0, 31.0, 25.0, 23.0, 18.0, 15.0, 5.0, 14.0, 13.0, 7.0, 8.0, 4.0, 7.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0], "bins": [-25.5625, -24.72900390625, -23.8955078125, -23.06201171875, -22.228515625, -21.39501953125, -20.5615234375, -19.72802734375, -18.89453125, -18.06103515625, -17.2275390625, -16.39404296875, -15.560546875, -14.72705078125, -13.8935546875, -13.06005859375, -12.2265625, -11.39306640625, -10.5595703125, -9.72607421875, -8.892578125, -8.05908203125, -7.2255859375, -6.39208984375, -5.55859375, -4.72509765625, -3.8916015625, -3.05810546875, -2.224609375, -1.39111328125, -0.5576171875, 0.27587890625, 1.109375, 1.94287109375, 2.7763671875, 3.60986328125, 4.443359375, 5.27685546875, 6.1103515625, 6.94384765625, 7.77734375, 8.61083984375, 9.4443359375, 10.27783203125, 11.111328125, 11.94482421875, 12.7783203125, 13.61181640625, 14.4453125, 15.27880859375, 16.1123046875, 16.94580078125, 17.779296875, 18.61279296875, 19.4462890625, 20.27978515625, 21.11328125, 21.94677734375, 22.7802734375, 23.61376953125, 24.447265625, 25.28076171875, 26.1142578125, 26.94775390625, 27.78125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 8.0, 7.0, 8.0, 21.0, 24.0, 40.0, 51.0, 98.0, 173.0, 303.0, 564.0, 1047.0, 1874.0, 3359.0, 6462.0, 11597.0, 21770.0, 38322.0, 64255.0, 98621.0, 134199.0, 156467.0, 153735.0, 127637.0, 91900.0, 58634.0, 34844.0, 19350.0, 10622.0, 5699.0, 3016.0, 1651.0, 943.0, 519.0, 298.0, 177.0, 107.0, 52.0, 34.0, 28.0, 19.0, 8.0, 4.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.8125, -31.7841796875, -30.755859375, -29.7275390625, -28.69921875, -27.6708984375, -26.642578125, -25.6142578125, -24.5859375, -23.5576171875, -22.529296875, -21.5009765625, -20.47265625, -19.4443359375, -18.416015625, -17.3876953125, -16.359375, -15.3310546875, -14.302734375, -13.2744140625, -12.24609375, -11.2177734375, -10.189453125, -9.1611328125, -8.1328125, -7.1044921875, -6.076171875, -5.0478515625, -4.01953125, -2.9912109375, -1.962890625, -0.9345703125, 0.09375, 1.1220703125, 2.150390625, 3.1787109375, 4.20703125, 5.2353515625, 6.263671875, 7.2919921875, 8.3203125, 9.3486328125, 10.376953125, 11.4052734375, 12.43359375, 13.4619140625, 14.490234375, 15.5185546875, 16.546875, 17.5751953125, 18.603515625, 19.6318359375, 20.66015625, 21.6884765625, 22.716796875, 23.7451171875, 24.7734375, 25.8017578125, 26.830078125, 27.8583984375, 28.88671875, 29.9150390625, 30.943359375, 31.9716796875, 33.0]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 8.0, 5.0, 11.0, 22.0, 17.0, 19.0, 22.0, 27.0, 20.0, 27.0, 25.0, 42.0, 38.0, 34.0, 45.0, 37.0, 49.0, 54.0, 42.0, 50.0, 46.0, 37.0, 40.0, 42.0, 38.0, 34.0, 16.0, 31.0, 20.0, 20.0, 13.0, 8.0, 15.0, 8.0, 9.0, 9.0, 3.0, 1.0, 5.0, 4.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.28125, -17.653564453125, -17.02587890625, -16.398193359375, -15.7705078125, -15.142822265625, -14.51513671875, -13.887451171875, -13.259765625, -12.632080078125, -12.00439453125, -11.376708984375, -10.7490234375, -10.121337890625, -9.49365234375, -8.865966796875, -8.23828125, -7.610595703125, -6.98291015625, -6.355224609375, -5.7275390625, -5.099853515625, -4.47216796875, -3.844482421875, -3.216796875, -2.589111328125, -1.96142578125, -1.333740234375, -0.7060546875, -0.078369140625, 0.54931640625, 1.177001953125, 1.8046875, 2.432373046875, 3.06005859375, 3.687744140625, 4.3154296875, 4.943115234375, 5.57080078125, 6.198486328125, 6.826171875, 7.453857421875, 8.08154296875, 8.709228515625, 9.3369140625, 9.964599609375, 10.59228515625, 11.219970703125, 11.84765625, 12.475341796875, 13.10302734375, 13.730712890625, 14.3583984375, 14.986083984375, 15.61376953125, 16.241455078125, 16.869140625, 17.496826171875, 18.12451171875, 18.752197265625, 19.3798828125, 20.007568359375, 20.63525390625, 21.262939453125, 21.890625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 5.0, 4.0, 3.0, 5.0, 8.0, 16.0, 20.0, 36.0, 40.0, 75.0, 112.0, 174.0, 298.0, 608.0, 1070.0, 2254.0, 4961.0, 11598.0, 29128.0, 75173.0, 179362.0, 287956.0, 247854.0, 124961.0, 49158.0, 19059.0, 7741.0, 3381.0, 1592.0, 778.0, 454.0, 253.0, 151.0, 105.0, 53.0, 32.0, 26.0, 17.0, 13.0, 9.0, 9.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.5, -22.782958984375, -22.06591796875, -21.348876953125, -20.6318359375, -19.914794921875, -19.19775390625, -18.480712890625, -17.763671875, -17.046630859375, -16.32958984375, -15.612548828125, -14.8955078125, -14.178466796875, -13.46142578125, -12.744384765625, -12.02734375, -11.310302734375, -10.59326171875, -9.876220703125, -9.1591796875, -8.442138671875, -7.72509765625, -7.008056640625, -6.291015625, -5.573974609375, -4.85693359375, -4.139892578125, -3.4228515625, -2.705810546875, -1.98876953125, -1.271728515625, -0.5546875, 0.162353515625, 0.87939453125, 1.596435546875, 2.3134765625, 3.030517578125, 3.74755859375, 4.464599609375, 5.181640625, 5.898681640625, 6.61572265625, 7.332763671875, 8.0498046875, 8.766845703125, 9.48388671875, 10.200927734375, 10.91796875, 11.635009765625, 12.35205078125, 13.069091796875, 13.7861328125, 14.503173828125, 15.22021484375, 15.937255859375, 16.654296875, 17.371337890625, 18.08837890625, 18.805419921875, 19.5224609375, 20.239501953125, 20.95654296875, 21.673583984375, 22.390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 5.0, 4.0, 5.0, 5.0, 6.0, 13.0, 9.0, 22.0, 19.0, 24.0, 28.0, 38.0, 34.0, 27.0, 40.0, 46.0, 39.0, 39.0, 58.0, 47.0, 46.0, 45.0, 45.0, 49.0, 36.0, 36.0, 30.0, 25.0, 23.0, 25.0, 29.0, 19.0, 14.0, 10.0, 10.0, 7.0, 6.0, 6.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.001071929931640625, -0.0010370910167694092, -0.0010022521018981934, -0.0009674131870269775, -0.0009325742721557617, -0.0008977353572845459, -0.0008628964424133301, -0.0008280575275421143, -0.0007932186126708984, -0.0007583796977996826, -0.0007235407829284668, -0.000688701868057251, -0.0006538629531860352, -0.0006190240383148193, -0.0005841851234436035, -0.0005493462085723877, -0.0005145072937011719, -0.00047966837882995605, -0.00044482946395874023, -0.0004099905490875244, -0.0003751516342163086, -0.0003403127193450928, -0.00030547380447387695, -0.00027063488960266113, -0.0002357959747314453, -0.0002009570598602295, -0.00016611814498901367, -0.00013127923011779785, -9.644031524658203e-05, -6.160140037536621e-05, -2.676248550415039e-05, 8.07642936706543e-06, 4.291534423828125e-05, 7.775425910949707e-05, 0.00011259317398071289, 0.0001474320888519287, 0.00018227100372314453, 0.00021710991859436035, 0.00025194883346557617, 0.000286787748336792, 0.0003216266632080078, 0.00035646557807922363, 0.00039130449295043945, 0.0004261434078216553, 0.0004609823226928711, 0.0004958212375640869, 0.0005306601524353027, 0.0005654990673065186, 0.0006003379821777344, 0.0006351768970489502, 0.000670015811920166, 0.0007048547267913818, 0.0007396936416625977, 0.0007745325565338135, 0.0008093714714050293, 0.0008442103862762451, 0.0008790493011474609, 0.0009138882160186768, 0.0009487271308898926, 0.0009835660457611084, 0.0010184049606323242, 0.00105324387550354, 0.0010880827903747559, 0.0011229217052459717, 0.0011577606201171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 12.0, 17.0, 22.0, 36.0, 48.0, 58.0, 107.0, 139.0, 207.0, 266.0, 441.0, 642.0, 859.0, 1271.0, 1948.0, 3043.0, 4371.0, 6954.0, 10436.0, 16362.0, 24804.0, 37423.0, 55015.0, 76248.0, 99323.0, 118410.0, 125708.0, 119251.0, 100804.0, 77365.0, 55533.0, 37996.0, 25242.0, 16731.0, 10713.0, 6936.0, 4640.0, 2958.0, 2013.0, 1389.0, 906.0, 613.0, 408.0, 301.0, 180.0, 133.0, 87.0, 68.0, 41.0, 27.0, 19.0, 15.0, 13.0, 6.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.2734375, -8.9696044921875, -8.665771484375, -8.3619384765625, -8.05810546875, -7.7542724609375, -7.450439453125, -7.1466064453125, -6.8427734375, -6.5389404296875, -6.235107421875, -5.9312744140625, -5.62744140625, -5.3236083984375, -5.019775390625, -4.7159423828125, -4.412109375, -4.1082763671875, -3.804443359375, -3.5006103515625, -3.19677734375, -2.8929443359375, -2.589111328125, -2.2852783203125, -1.9814453125, -1.6776123046875, -1.373779296875, -1.0699462890625, -0.76611328125, -0.4622802734375, -0.158447265625, 0.1453857421875, 0.44921875, 0.7530517578125, 1.056884765625, 1.3607177734375, 1.66455078125, 1.9683837890625, 2.272216796875, 2.5760498046875, 2.8798828125, 3.1837158203125, 3.487548828125, 3.7913818359375, 4.09521484375, 4.3990478515625, 4.702880859375, 5.0067138671875, 5.310546875, 5.6143798828125, 5.918212890625, 6.2220458984375, 6.52587890625, 6.8297119140625, 7.133544921875, 7.4373779296875, 7.7412109375, 8.0450439453125, 8.348876953125, 8.6527099609375, 8.95654296875, 9.2603759765625, 9.564208984375, 9.8680419921875, 10.171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 2.0, 4.0, 1.0, 4.0, 10.0, 11.0, 11.0, 7.0, 22.0, 27.0, 20.0, 23.0, 22.0, 35.0, 35.0, 47.0, 47.0, 56.0, 65.0, 58.0, 44.0, 63.0, 50.0, 55.0, 48.0, 30.0, 47.0, 27.0, 17.0, 22.0, 18.0, 13.0, 15.0, 4.0, 9.0, 3.0, 10.0, 2.0, 5.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.10546875, -4.94921875, -4.79296875, -4.63671875, -4.48046875, -4.32421875, -4.16796875, -4.01171875, -3.85546875, -3.69921875, -3.54296875, -3.38671875, -3.23046875, -3.07421875, -2.91796875, -2.76171875, -2.60546875, -2.44921875, -2.29296875, -2.13671875, -1.98046875, -1.82421875, -1.66796875, -1.51171875, -1.35546875, -1.19921875, -1.04296875, -0.88671875, -0.73046875, -0.57421875, -0.41796875, -0.26171875, -0.10546875, 0.05078125, 0.20703125, 0.36328125, 0.51953125, 0.67578125, 0.83203125, 0.98828125, 1.14453125, 1.30078125, 1.45703125, 1.61328125, 1.76953125, 1.92578125, 2.08203125, 2.23828125, 2.39453125, 2.55078125, 2.70703125, 2.86328125, 3.01953125, 3.17578125, 3.33203125, 3.48828125, 3.64453125, 3.80078125, 3.95703125, 4.11328125, 4.26953125, 4.42578125, 4.58203125, 4.73828125, 4.89453125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 3.0, 10.0, 10.0, 6.0, 10.0, 15.0, 13.0, 22.0, 16.0, 23.0, 33.0, 37.0, 21.0, 29.0, 39.0, 34.0, 41.0, 30.0, 37.0, 39.0, 43.0, 44.0, 37.0, 32.0, 32.0, 40.0, 26.0, 30.0, 35.0, 38.0, 24.0, 17.0, 25.0, 16.0, 17.0, 15.0, 7.0, 8.0, 5.0, 2.0, 8.0, 6.0, 5.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.53798484802246, -23.73561668395996, -22.93324851989746, -22.130878448486328, -21.328510284423828, -20.526142120361328, -19.723773956298828, -18.921405792236328, -18.119037628173828, -17.316669464111328, -16.514301300048828, -15.711932182312012, -14.909563064575195, -14.107194900512695, -13.304826736450195, -12.502458572387695, -11.700088500976562, -10.897720336914062, -10.095351219177246, -9.292983055114746, -8.49061393737793, -7.68824577331543, -6.88587760925293, -6.0835089683532715, -5.281140327453613, -4.478771686553955, -3.676403284072876, -2.874034881591797, -2.0716662406921387, -1.2692975997924805, -0.46692943572998047, 0.33543920516967773, 1.1378097534179688, 1.9401782751083374, 2.742546796798706, 3.544915199279785, 4.347283840179443, 5.149652481079102, 5.952020645141602, 6.75438928604126, 7.556757926940918, 8.359126091003418, 9.161495208740234, 9.963863372802734, 10.766231536865234, 11.56860065460205, 12.37096881866455, 13.173337936401367, 13.975706100463867, 14.778074264526367, 15.580443382263184, 16.3828125, 17.1851806640625, 17.987548828125, 18.7899169921875, 19.59228515625, 20.3946533203125, 21.197021484375, 21.9993896484375, 22.8017578125, 23.604127883911133, 24.406496047973633, 25.208864212036133, 26.011232376098633, 26.813602447509766]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 2.0, 7.0, 6.0, 8.0, 8.0, 14.0, 18.0, 15.0, 14.0, 23.0, 26.0, 19.0, 24.0, 32.0, 27.0, 28.0, 46.0, 35.0, 49.0, 37.0, 36.0, 38.0, 39.0, 39.0, 44.0, 42.0, 38.0, 44.0, 32.0, 31.0, 24.0, 26.0, 22.0, 12.0, 17.0, 10.0, 19.0, 5.0, 5.0, 8.0, 6.0, 11.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-29.367952346801758, -28.423612594604492, -27.479272842407227, -26.534934997558594, -25.590595245361328, -24.646255493164062, -23.701915740966797, -22.75757598876953, -21.813236236572266, -20.868896484375, -19.924556732177734, -18.98021697998047, -18.035879135131836, -17.09153938293457, -16.147199630737305, -15.202859878540039, -14.258522033691406, -13.31418228149414, -12.369843482971191, -11.425503730773926, -10.481164932250977, -9.536825180053711, -8.592485427856445, -7.648146152496338, -6.7038068771362305, -5.759467601776123, -4.815128326416016, -3.87078857421875, -2.9264492988586426, -1.9821100234985352, -1.0377702713012695, -0.09343099594116211, 0.8509063720703125, 1.7952457666397095, 2.7395851612091064, 3.683924674987793, 4.6282639503479, 5.572603225708008, 6.516942977905273, 7.461282253265381, 8.405621528625488, 9.349961280822754, 10.294300079345703, 11.238639831542969, 12.182979583740234, 13.127318382263184, 14.07165813446045, 15.015996932983398, 15.960336685180664, 16.90467643737793, 17.849016189575195, 18.793354034423828, 19.737693786621094, 20.68203353881836, 21.626373291015625, 22.57071304321289, 23.515052795410156, 24.459392547607422, 25.403732299804688, 26.348072052001953, 27.292409896850586, 28.23674964904785, 29.181089401245117, 30.125429153442383, 31.069766998291016]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [3.0, 5.0, 6.0, 8.0, 14.0, 20.0, 32.0, 45.0, 94.0, 155.0, 243.0, 434.0, 622.0, 1079.0, 1727.0, 2867.0, 4564.0, 7634.0, 11909.0, 18935.0, 30597.0, 48404.0, 75706.0, 115644.0, 172381.0, 245769.0, 332018.0, 413289.0, 472904.0, 486253.0, 450528.0, 378725.0, 292919.0, 211883.0, 146957.0, 97261.0, 63464.0, 40596.0, 25500.0, 15995.0, 10175.0, 6375.0, 4065.0, 2422.0, 1529.0, 954.0, 620.0, 371.0, 246.0, 137.0, 78.0, 58.0, 24.0, 26.0, 13.0, 10.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.453125, -18.7890625, -18.125, -17.4609375, -16.796875, -16.1328125, -15.46875, -14.8046875, -14.140625, -13.4765625, -12.8125, -12.1484375, -11.484375, -10.8203125, -10.15625, -9.4921875, -8.828125, -8.1640625, -7.5, -6.8359375, -6.171875, -5.5078125, -4.84375, -4.1796875, -3.515625, -2.8515625, -2.1875, -1.5234375, -0.859375, -0.1953125, 0.46875, 1.1328125, 1.796875, 2.4609375, 3.125, 3.7890625, 4.453125, 5.1171875, 5.78125, 6.4453125, 7.109375, 7.7734375, 8.4375, 9.1015625, 9.765625, 10.4296875, 11.09375, 11.7578125, 12.421875, 13.0859375, 13.75, 14.4140625, 15.078125, 15.7421875, 16.40625, 17.0703125, 17.734375, 18.3984375, 19.0625, 19.7265625, 20.390625, 21.0546875, 21.71875, 22.3828125, 23.046875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 8.0, 4.0, 4.0, 7.0, 9.0, 5.0, 16.0, 15.0, 18.0, 16.0, 18.0, 23.0, 23.0, 23.0, 27.0, 31.0, 30.0, 44.0, 35.0, 39.0, 40.0, 42.0, 31.0, 35.0, 41.0, 48.0, 39.0, 39.0, 38.0, 33.0, 37.0, 21.0, 39.0, 14.0, 14.0, 13.0, 16.0, 18.0, 9.0, 5.0, 8.0, 10.0, 4.0, 6.0, 2.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-25.828125, -25.010009765625, -24.19189453125, -23.373779296875, -22.5556640625, -21.737548828125, -20.91943359375, -20.101318359375, -19.283203125, -18.465087890625, -17.64697265625, -16.828857421875, -16.0107421875, -15.192626953125, -14.37451171875, -13.556396484375, -12.73828125, -11.920166015625, -11.10205078125, -10.283935546875, -9.4658203125, -8.647705078125, -7.82958984375, -7.011474609375, -6.193359375, -5.375244140625, -4.55712890625, -3.739013671875, -2.9208984375, -2.102783203125, -1.28466796875, -0.466552734375, 0.3515625, 1.169677734375, 1.98779296875, 2.805908203125, 3.6240234375, 4.442138671875, 5.26025390625, 6.078369140625, 6.896484375, 7.714599609375, 8.53271484375, 9.350830078125, 10.1689453125, 10.987060546875, 11.80517578125, 12.623291015625, 13.44140625, 14.259521484375, 15.07763671875, 15.895751953125, 16.7138671875, 17.531982421875, 18.35009765625, 19.168212890625, 19.986328125, 20.804443359375, 21.62255859375, 22.440673828125, 23.2587890625, 24.076904296875, 24.89501953125, 25.713134765625, 26.53125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 3.0, 13.0, 15.0, 29.0, 43.0, 54.0, 101.0, 202.0, 319.0, 455.0, 764.0, 1194.0, 1815.0, 2957.0, 4817.0, 7563.0, 11780.0, 17837.0, 27354.0, 41352.0, 61123.0, 89111.0, 126481.0, 173623.0, 229938.0, 290603.0, 348406.0, 393284.0, 412053.0, 400801.0, 363880.0, 308116.0, 247138.0, 189834.0, 139400.0, 99577.0, 68748.0, 46463.0, 30895.0, 19994.0, 12974.0, 8470.0, 5538.0, 3367.0, 2151.0, 1371.0, 871.0, 487.0, 368.0, 211.0, 121.0, 81.0, 56.0, 31.0, 28.0, 16.0, 8.0, 4.0, 6.0, 3.0], "bins": [-20.90625, -20.265869140625, -19.62548828125, -18.985107421875, -18.3447265625, -17.704345703125, -17.06396484375, -16.423583984375, -15.783203125, -15.142822265625, -14.50244140625, -13.862060546875, -13.2216796875, -12.581298828125, -11.94091796875, -11.300537109375, -10.66015625, -10.019775390625, -9.37939453125, -8.739013671875, -8.0986328125, -7.458251953125, -6.81787109375, -6.177490234375, -5.537109375, -4.896728515625, -4.25634765625, -3.615966796875, -2.9755859375, -2.335205078125, -1.69482421875, -1.054443359375, -0.4140625, 0.226318359375, 0.86669921875, 1.507080078125, 2.1474609375, 2.787841796875, 3.42822265625, 4.068603515625, 4.708984375, 5.349365234375, 5.98974609375, 6.630126953125, 7.2705078125, 7.910888671875, 8.55126953125, 9.191650390625, 9.83203125, 10.472412109375, 11.11279296875, 11.753173828125, 12.3935546875, 13.033935546875, 13.67431640625, 14.314697265625, 14.955078125, 15.595458984375, 16.23583984375, 16.876220703125, 17.5166015625, 18.156982421875, 18.79736328125, 19.437744140625, 20.078125]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 4.0, 12.0, 17.0, 16.0, 15.0, 20.0, 26.0, 42.0, 42.0, 59.0, 50.0, 62.0, 85.0, 108.0, 115.0, 129.0, 147.0, 141.0, 168.0, 170.0, 168.0, 212.0, 192.0, 199.0, 177.0, 195.0, 173.0, 173.0, 154.0, 143.0, 124.0, 134.0, 108.0, 89.0, 68.0, 75.0, 54.0, 38.0, 41.0, 29.0, 23.0, 18.0, 15.0, 4.0, 10.0, 7.0, 6.0, 6.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.3515625, -10.0076904296875, -9.663818359375, -9.3199462890625, -8.97607421875, -8.6322021484375, -8.288330078125, -7.9444580078125, -7.6005859375, -7.2567138671875, -6.912841796875, -6.5689697265625, -6.22509765625, -5.8812255859375, -5.537353515625, -5.1934814453125, -4.849609375, -4.5057373046875, -4.161865234375, -3.8179931640625, -3.47412109375, -3.1302490234375, -2.786376953125, -2.4425048828125, -2.0986328125, -1.7547607421875, -1.410888671875, -1.0670166015625, -0.72314453125, -0.3792724609375, -0.035400390625, 0.3084716796875, 0.65234375, 0.9962158203125, 1.340087890625, 1.6839599609375, 2.02783203125, 2.3717041015625, 2.715576171875, 3.0594482421875, 3.4033203125, 3.7471923828125, 4.091064453125, 4.4349365234375, 4.77880859375, 5.1226806640625, 5.466552734375, 5.8104248046875, 6.154296875, 6.4981689453125, 6.842041015625, 7.1859130859375, 7.52978515625, 7.8736572265625, 8.217529296875, 8.5614013671875, 8.9052734375, 9.2491455078125, 9.593017578125, 9.9368896484375, 10.28076171875, 10.6246337890625, 10.968505859375, 11.3123779296875, 11.65625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 3.0, 3.0, 10.0, 3.0, 7.0, 8.0, 10.0, 16.0, 12.0, 19.0, 27.0, 22.0, 35.0, 33.0, 26.0, 31.0, 31.0, 29.0, 49.0, 34.0, 32.0, 44.0, 34.0, 46.0, 36.0, 38.0, 43.0, 29.0, 29.0, 31.0, 22.0, 27.0, 17.0, 22.0, 21.0, 20.0, 20.0, 14.0, 13.0, 11.0, 9.0, 10.0, 5.0, 6.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-24.437240600585938, -23.615877151489258, -22.794513702392578, -21.9731502532959, -21.15178680419922, -20.330421447753906, -19.50905990600586, -18.687694549560547, -17.866331100463867, -17.044967651367188, -16.223604202270508, -15.402240753173828, -14.580876350402832, -13.759512901306152, -12.938149452209473, -12.116785049438477, -11.295422554016113, -10.474059104919434, -9.652695655822754, -8.831331253051758, -8.009967803955078, -7.188604354858398, -6.367240905761719, -5.545876979827881, -4.724513530731201, -3.9031498432159424, -3.0817861557006836, -2.260422706604004, -1.4390590190887451, -0.6176953315734863, 0.20366811752319336, 1.0250320434570312, 1.846395492553711, 2.6677591800689697, 3.4891228675842285, 4.310486316680908, 5.131850242614746, 5.953213691711426, 6.7745771408081055, 7.595941066741943, 8.417304992675781, 9.238668441772461, 10.06003189086914, 10.88139533996582, 11.702759742736816, 12.524123191833496, 13.345486640930176, 14.166851043701172, 14.988213539123535, 15.809576988220215, 16.63094139099121, 17.45230484008789, 18.27366828918457, 19.09503173828125, 19.91639518737793, 20.73775863647461, 21.55912208557129, 22.38048553466797, 23.20184898376465, 24.023212432861328, 24.844575881958008, 25.665939331054688, 26.4873046875, 27.30866813659668, 28.13003158569336]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 8.0, 8.0, 17.0, 11.0, 15.0, 20.0, 26.0, 20.0, 26.0, 15.0, 31.0, 31.0, 28.0, 31.0, 38.0, 36.0, 39.0, 43.0, 42.0, 38.0, 42.0, 39.0, 42.0, 44.0, 35.0, 29.0, 24.0, 44.0, 21.0, 29.0, 14.0, 15.0, 17.0, 18.0, 7.0, 10.0, 7.0, 9.0, 9.0, 7.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0], "bins": [-32.672080993652344, -31.711727142333984, -30.751371383666992, -29.791015625, -28.83066177368164, -27.87030792236328, -26.90995216369629, -25.949596405029297, -24.989242553710938, -24.028888702392578, -23.068532943725586, -22.108177185058594, -21.147823333740234, -20.187469482421875, -19.227113723754883, -18.26675796508789, -17.30640411376953, -16.346050262451172, -15.38569450378418, -14.425339698791504, -13.464984893798828, -12.504630088806152, -11.544275283813477, -10.5839204788208, -9.623565673828125, -8.66321086883545, -7.702856063842773, -6.742501258850098, -5.782146453857422, -4.821791648864746, -3.8614368438720703, -2.9010820388793945, -1.940725326538086, -0.9803705215454102, -0.020015716552734375, 0.9403390884399414, 1.9006938934326172, 2.861048698425293, 3.8214035034179688, 4.7817583084106445, 5.74211311340332, 6.702467918395996, 7.662822723388672, 8.623177528381348, 9.583532333374023, 10.5438871383667, 11.504241943359375, 12.46459674835205, 13.424951553344727, 14.385306358337402, 15.345661163330078, 16.306015014648438, 17.26637077331543, 18.226726531982422, 19.18708038330078, 20.14743423461914, 21.107789993286133, 22.068145751953125, 23.028499603271484, 23.988853454589844, 24.949209213256836, 25.909564971923828, 26.869918823242188, 27.830272674560547, 28.79062843322754]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 12.0, 17.0, 31.0, 27.0, 42.0, 101.0, 155.0, 252.0, 398.0, 624.0, 959.0, 1490.0, 2442.0, 3955.0, 6150.0, 9253.0, 13943.0, 21093.0, 29706.0, 41433.0, 55192.0, 70207.0, 85181.0, 95777.0, 101429.0, 100276.0, 93204.0, 80332.0, 65464.0, 50881.0, 37789.0, 26646.0, 18753.0, 12426.0, 8275.0, 5328.0, 3465.0, 2213.0, 1357.0, 826.0, 548.0, 325.0, 218.0, 126.0, 83.0, 64.0, 36.0, 16.0, 13.0, 11.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.484375, -12.0924072265625, -11.700439453125, -11.3084716796875, -10.91650390625, -10.5245361328125, -10.132568359375, -9.7406005859375, -9.3486328125, -8.9566650390625, -8.564697265625, -8.1727294921875, -7.78076171875, -7.3887939453125, -6.996826171875, -6.6048583984375, -6.212890625, -5.8209228515625, -5.428955078125, -5.0369873046875, -4.64501953125, -4.2530517578125, -3.861083984375, -3.4691162109375, -3.0771484375, -2.6851806640625, -2.293212890625, -1.9012451171875, -1.50927734375, -1.1173095703125, -0.725341796875, -0.3333740234375, 0.05859375, 0.4505615234375, 0.842529296875, 1.2344970703125, 1.62646484375, 2.0184326171875, 2.410400390625, 2.8023681640625, 3.1943359375, 3.5863037109375, 3.978271484375, 4.3702392578125, 4.76220703125, 5.1541748046875, 5.546142578125, 5.9381103515625, 6.330078125, 6.7220458984375, 7.114013671875, 7.5059814453125, 7.89794921875, 8.2899169921875, 8.681884765625, 9.0738525390625, 9.4658203125, 9.8577880859375, 10.249755859375, 10.6417236328125, 11.03369140625, 11.4256591796875, 11.817626953125, 12.2095947265625, 12.6015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 4.0, 7.0, 14.0, 11.0, 12.0, 19.0, 15.0, 27.0, 20.0, 26.0, 16.0, 30.0, 33.0, 30.0, 30.0, 39.0, 31.0, 44.0, 45.0, 40.0, 42.0, 37.0, 36.0, 49.0, 40.0, 30.0, 30.0, 24.0, 44.0, 22.0, 25.0, 18.0, 13.0, 19.0, 15.0, 10.0, 9.0, 7.0, 9.0, 7.0, 8.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0], "bins": [-33.1875, -32.213623046875, -31.23974609375, -30.265869140625, -29.2919921875, -28.318115234375, -27.34423828125, -26.370361328125, -25.396484375, -24.422607421875, -23.44873046875, -22.474853515625, -21.5009765625, -20.527099609375, -19.55322265625, -18.579345703125, -17.60546875, -16.631591796875, -15.65771484375, -14.683837890625, -13.7099609375, -12.736083984375, -11.76220703125, -10.788330078125, -9.814453125, -8.840576171875, -7.86669921875, -6.892822265625, -5.9189453125, -4.945068359375, -3.97119140625, -2.997314453125, -2.0234375, -1.049560546875, -0.07568359375, 0.898193359375, 1.8720703125, 2.845947265625, 3.81982421875, 4.793701171875, 5.767578125, 6.741455078125, 7.71533203125, 8.689208984375, 9.6630859375, 10.636962890625, 11.61083984375, 12.584716796875, 13.55859375, 14.532470703125, 15.50634765625, 16.480224609375, 17.4541015625, 18.427978515625, 19.40185546875, 20.375732421875, 21.349609375, 22.323486328125, 23.29736328125, 24.271240234375, 25.2451171875, 26.218994140625, 27.19287109375, 28.166748046875, 29.140625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 5.0, 4.0, 8.0, 15.0, 24.0, 35.0, 52.0, 57.0, 79.0, 138.0, 178.0, 225.0, 364.0, 512.0, 719.0, 1011.0, 1449.0, 2012.0, 2807.0, 3810.0, 5203.0, 7425.0, 10504.0, 15220.0, 22478.0, 50332.0, 697550.0, 141392.0, 26057.0, 17335.0, 11811.0, 8472.0, 6174.0, 4334.0, 3267.0, 2188.0, 1622.0, 1098.0, 819.0, 525.0, 358.0, 272.0, 174.0, 138.0, 87.0, 61.0, 37.0, 37.0, 25.0, 17.0, 17.0, 13.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-22.71875, -21.953125, -21.1875, -20.421875, -19.65625, -18.890625, -18.125, -17.359375, -16.59375, -15.828125, -15.0625, -14.296875, -13.53125, -12.765625, -12.0, -11.234375, -10.46875, -9.703125, -8.9375, -8.171875, -7.40625, -6.640625, -5.875, -5.109375, -4.34375, -3.578125, -2.8125, -2.046875, -1.28125, -0.515625, 0.25, 1.015625, 1.78125, 2.546875, 3.3125, 4.078125, 4.84375, 5.609375, 6.375, 7.140625, 7.90625, 8.671875, 9.4375, 10.203125, 10.96875, 11.734375, 12.5, 13.265625, 14.03125, 14.796875, 15.5625, 16.328125, 17.09375, 17.859375, 18.625, 19.390625, 20.15625, 20.921875, 21.6875, 22.453125, 23.21875, 23.984375, 24.75, 25.515625, 26.28125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 3.0, 9.0, 6.0, 7.0, 14.0, 16.0, 18.0, 20.0, 26.0, 24.0, 28.0, 21.0, 31.0, 32.0, 36.0, 37.0, 50.0, 38.0, 52.0, 42.0, 41.0, 39.0, 39.0, 38.0, 37.0, 28.0, 34.0, 32.0, 25.0, 27.0, 21.0, 27.0, 18.0, 17.0, 16.0, 9.0, 10.0, 7.0, 3.0, 5.0, 6.0, 1.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.015625, -25.239501953125, -24.46337890625, -23.687255859375, -22.9111328125, -22.135009765625, -21.35888671875, -20.582763671875, -19.806640625, -19.030517578125, -18.25439453125, -17.478271484375, -16.7021484375, -15.926025390625, -15.14990234375, -14.373779296875, -13.59765625, -12.821533203125, -12.04541015625, -11.269287109375, -10.4931640625, -9.717041015625, -8.94091796875, -8.164794921875, -7.388671875, -6.612548828125, -5.83642578125, -5.060302734375, -4.2841796875, -3.508056640625, -2.73193359375, -1.955810546875, -1.1796875, -0.403564453125, 0.37255859375, 1.148681640625, 1.9248046875, 2.700927734375, 3.47705078125, 4.253173828125, 5.029296875, 5.805419921875, 6.58154296875, 7.357666015625, 8.1337890625, 8.909912109375, 9.68603515625, 10.462158203125, 11.23828125, 12.014404296875, 12.79052734375, 13.566650390625, 14.3427734375, 15.118896484375, 15.89501953125, 16.671142578125, 17.447265625, 18.223388671875, 18.99951171875, 19.775634765625, 20.5517578125, 21.327880859375, 22.10400390625, 22.880126953125, 23.65625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 7.0, 7.0, 5.0, 15.0, 17.0, 29.0, 33.0, 61.0, 81.0, 119.0, 178.0, 264.0, 396.0, 626.0, 995.0, 1580.0, 2662.0, 4509.0, 7827.0, 14427.0, 27845.0, 185090.0, 718093.0, 40987.0, 18184.0, 9945.0, 5665.0, 3359.0, 2041.0, 1233.0, 736.0, 504.0, 332.0, 207.0, 156.0, 113.0, 65.0, 50.0, 36.0, 24.0, 15.0, 9.0, 13.0, 6.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.48046875, -3.37237548828125, -3.2642822265625, -3.15618896484375, -3.048095703125, -2.94000244140625, -2.8319091796875, -2.72381591796875, -2.61572265625, -2.50762939453125, -2.3995361328125, -2.29144287109375, -2.183349609375, -2.07525634765625, -1.9671630859375, -1.85906982421875, -1.7509765625, -1.64288330078125, -1.5347900390625, -1.42669677734375, -1.318603515625, -1.21051025390625, -1.1024169921875, -0.99432373046875, -0.88623046875, -0.77813720703125, -0.6700439453125, -0.56195068359375, -0.453857421875, -0.34576416015625, -0.2376708984375, -0.12957763671875, -0.021484375, 0.08660888671875, 0.1947021484375, 0.30279541015625, 0.410888671875, 0.51898193359375, 0.6270751953125, 0.73516845703125, 0.84326171875, 0.95135498046875, 1.0594482421875, 1.16754150390625, 1.275634765625, 1.38372802734375, 1.4918212890625, 1.59991455078125, 1.7080078125, 1.81610107421875, 1.9241943359375, 2.03228759765625, 2.140380859375, 2.24847412109375, 2.3565673828125, 2.46466064453125, 2.57275390625, 2.68084716796875, 2.7889404296875, 2.89703369140625, 3.005126953125, 3.11322021484375, 3.2213134765625, 3.32940673828125, 3.4375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 8.0, 11.0, 14.0, 10.0, 16.0, 18.0, 15.0, 29.0, 33.0, 42.0, 41.0, 47.0, 63.0, 63.0, 70.0, 62.0, 76.0, 50.0, 53.0, 44.0, 43.0, 40.0, 32.0, 22.0, 15.0, 14.0, 19.0, 10.0, 14.0, 6.0, 5.0, 0.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0009069442749023438, -0.0008811578154563904, -0.000855371356010437, -0.0008295848965644836, -0.0008037984371185303, -0.0007780119776725769, -0.0007522255182266235, -0.0007264390587806702, -0.0007006525993347168, -0.0006748661398887634, -0.0006490796804428101, -0.0006232932209968567, -0.0005975067615509033, -0.00057172030210495, -0.0005459338426589966, -0.0005201473832130432, -0.0004943609237670898, -0.0004685744643211365, -0.0004427880048751831, -0.00041700154542922974, -0.00039121508598327637, -0.000365428626537323, -0.00033964216709136963, -0.00031385570764541626, -0.0002880692481994629, -0.0002622827887535095, -0.00023649632930755615, -0.00021070986986160278, -0.00018492341041564941, -0.00015913695096969604, -0.00013335049152374268, -0.0001075640320777893, -8.177757263183594e-05, -5.599111318588257e-05, -3.02046537399292e-05, -4.41819429397583e-06, 2.136826515197754e-05, 4.715472459793091e-05, 7.294118404388428e-05, 9.872764348983765e-05, 0.00012451410293579102, 0.00015030056238174438, 0.00017608702182769775, 0.00020187348127365112, 0.0002276599407196045, 0.00025344640016555786, 0.00027923285961151123, 0.0003050193190574646, 0.00033080577850341797, 0.00035659223794937134, 0.0003823786973953247, 0.0004081651568412781, 0.00043395161628723145, 0.0004597380757331848, 0.0004855245351791382, 0.0005113109946250916, 0.0005370974540710449, 0.0005628839135169983, 0.0005886703729629517, 0.000614456832408905, 0.0006402432918548584, 0.0006660297513008118, 0.0006918162107467651, 0.0007176026701927185, 0.0007433891296386719]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 3.0, 10.0, 13.0, 17.0, 35.0, 34.0, 75.0, 95.0, 114.0, 174.0, 290.0, 386.0, 590.0, 791.0, 1178.0, 1726.0, 2630.0, 3992.0, 6271.0, 10221.0, 17631.0, 31343.0, 55264.0, 97434.0, 151737.0, 190671.0, 176140.0, 124327.0, 73818.0, 41640.0, 23513.0, 13335.0, 7971.0, 5115.0, 3193.0, 2118.0, 1483.0, 947.0, 690.0, 478.0, 322.0, 253.0, 164.0, 99.0, 75.0, 58.0, 33.0, 24.0, 17.0, 8.0, 7.0, 4.0, 4.0, 0.0, 2.0], "bins": [-1.6279296875, -1.581085205078125, -1.53424072265625, -1.487396240234375, -1.4405517578125, -1.393707275390625, -1.34686279296875, -1.300018310546875, -1.253173828125, -1.206329345703125, -1.15948486328125, -1.112640380859375, -1.0657958984375, -1.018951416015625, -0.97210693359375, -0.925262451171875, -0.87841796875, -0.831573486328125, -0.78472900390625, -0.737884521484375, -0.6910400390625, -0.644195556640625, -0.59735107421875, -0.550506591796875, -0.503662109375, -0.456817626953125, -0.40997314453125, -0.363128662109375, -0.3162841796875, -0.269439697265625, -0.22259521484375, -0.175750732421875, -0.12890625, -0.082061767578125, -0.03521728515625, 0.011627197265625, 0.0584716796875, 0.105316162109375, 0.15216064453125, 0.199005126953125, 0.245849609375, 0.292694091796875, 0.33953857421875, 0.386383056640625, 0.4332275390625, 0.480072021484375, 0.52691650390625, 0.573760986328125, 0.62060546875, 0.667449951171875, 0.71429443359375, 0.761138916015625, 0.8079833984375, 0.854827880859375, 0.90167236328125, 0.948516845703125, 0.995361328125, 1.042205810546875, 1.08905029296875, 1.135894775390625, 1.1827392578125, 1.229583740234375, 1.27642822265625, 1.323272705078125, 1.3701171875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 7.0, 8.0, 13.0, 13.0, 13.0, 10.0, 21.0, 28.0, 26.0, 22.0, 42.0, 45.0, 57.0, 66.0, 66.0, 50.0, 66.0, 68.0, 49.0, 48.0, 46.0, 45.0, 30.0, 28.0, 21.0, 14.0, 20.0, 15.0, 4.0, 10.0, 7.0, 6.0, 2.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5263671875, -0.5099639892578125, -0.493560791015625, -0.4771575927734375, -0.46075439453125, -0.4443511962890625, -0.427947998046875, -0.4115447998046875, -0.3951416015625, -0.3787384033203125, -0.362335205078125, -0.3459320068359375, -0.32952880859375, -0.3131256103515625, -0.296722412109375, -0.2803192138671875, -0.263916015625, -0.2475128173828125, -0.231109619140625, -0.2147064208984375, -0.19830322265625, -0.1819000244140625, -0.165496826171875, -0.1490936279296875, -0.1326904296875, -0.1162872314453125, -0.099884033203125, -0.0834808349609375, -0.06707763671875, -0.0506744384765625, -0.034271240234375, -0.0178680419921875, -0.00146484375, 0.0149383544921875, 0.031341552734375, 0.0477447509765625, 0.06414794921875, 0.0805511474609375, 0.096954345703125, 0.1133575439453125, 0.1297607421875, 0.1461639404296875, 0.162567138671875, 0.1789703369140625, 0.19537353515625, 0.2117767333984375, 0.228179931640625, 0.2445831298828125, 0.260986328125, 0.2773895263671875, 0.293792724609375, 0.3101959228515625, 0.32659912109375, 0.3430023193359375, 0.359405517578125, 0.3758087158203125, 0.3922119140625, 0.4086151123046875, 0.425018310546875, 0.4414215087890625, 0.45782470703125, 0.4742279052734375, 0.490631103515625, 0.5070343017578125, 0.5234375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 7.0, 5.0, 1.0, 4.0, 13.0, 18.0, 12.0, 11.0, 20.0, 19.0, 34.0, 22.0, 30.0, 30.0, 24.0, 33.0, 33.0, 41.0, 46.0, 45.0, 33.0, 42.0, 38.0, 46.0, 52.0, 28.0, 40.0, 30.0, 28.0, 31.0, 27.0, 14.0, 20.0, 15.0, 24.0, 19.0, 15.0, 8.0, 9.0, 12.0, 10.0, 6.0, 3.0, 3.0, 0.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.495849609375, -23.61009979248047, -22.72435188293457, -21.83860206604004, -20.952852249145508, -20.06710433959961, -19.181354522705078, -18.295604705810547, -17.409854888916016, -16.524105072021484, -15.63835620880127, -14.752607345581055, -13.866857528686523, -12.981108665466309, -12.095359802246094, -11.209609985351562, -10.323861122131348, -9.438112258911133, -8.552362442016602, -7.666613578796387, -6.7808637619018555, -5.895114898681641, -5.009365558624268, -4.1236162185668945, -3.2378668785095215, -2.3521175384521484, -1.466368317604065, -0.5806190967559814, 0.3051302433013916, 1.1908793449401855, 2.0766286849975586, 2.9623780250549316, 3.8481273651123047, 4.733876705169678, 5.619626045227051, 6.505374908447266, 7.391124725341797, 8.276873588562012, 9.162622451782227, 10.048372268676758, 10.934122085571289, 11.819870948791504, 12.705620765686035, 13.59136962890625, 14.477119445800781, 15.362868309020996, 16.24861717224121, 17.134366989135742, 18.02011489868164, 18.905864715576172, 19.79161262512207, 20.6773624420166, 21.563112258911133, 22.44886016845703, 23.334609985351562, 24.220359802246094, 25.106109619140625, 25.991859436035156, 26.877607345581055, 27.763357162475586, 28.649106979370117, 29.534854888916016, 30.420604705810547, 31.306354522705078, 32.19210433959961]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 5.0, 7.0, 13.0, 12.0, 14.0, 17.0, 19.0, 25.0, 20.0, 24.0, 20.0, 27.0, 36.0, 26.0, 36.0, 36.0, 29.0, 45.0, 45.0, 41.0, 36.0, 42.0, 39.0, 42.0, 46.0, 30.0, 30.0, 22.0, 39.0, 25.0, 27.0, 17.0, 12.0, 18.0, 18.0, 9.0, 9.0, 5.0, 10.0, 7.0, 8.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 5.0, 0.0, 1.0], "bins": [-33.08607864379883, -32.11357498168945, -31.141069412231445, -30.16856575012207, -29.196060180664062, -28.223556518554688, -27.251052856445312, -26.278549194335938, -25.30604362487793, -24.333539962768555, -23.361034393310547, -22.388530731201172, -21.416027069091797, -20.44352149963379, -19.471017837524414, -18.498512268066406, -17.52600860595703, -16.553504943847656, -15.580999374389648, -14.608495712280273, -13.635991096496582, -12.66348648071289, -11.690982818603516, -10.718478202819824, -9.745973587036133, -8.773468971252441, -7.800964832305908, -6.828460693359375, -5.855956077575684, -4.883451461791992, -3.910947322845459, -2.938443183898926, -1.9659385681152344, -0.9934341907501221, -0.020929813385009766, 0.9515745639801025, 1.9240789413452148, 2.8965835571289062, 3.8690876960754395, 4.841591835021973, 5.814096450805664, 6.7866010665893555, 7.759105205535889, 8.731609344482422, 9.704113960266113, 10.676618576049805, 11.64912223815918, 12.621626853942871, 13.594131469726562, 14.566636085510254, 15.539140701293945, 16.51164436340332, 17.484149932861328, 18.456653594970703, 19.429157257080078, 20.401660919189453, 21.37416648864746, 22.346670150756836, 23.319175720214844, 24.29167938232422, 25.264183044433594, 26.2366886138916, 27.209192276000977, 28.181697845458984, 29.15420150756836]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 5.0, 3.0, 5.0, 13.0, 15.0, 36.0, 60.0, 70.0, 117.0, 217.0, 328.0, 552.0, 1101.0, 1847.0, 3214.0, 5610.0, 9628.0, 16717.0, 27584.0, 44538.0, 66618.0, 93802.0, 119877.0, 135920.0, 135679.0, 118341.0, 92601.0, 65435.0, 43051.0, 27012.0, 16189.0, 9449.0, 5575.0, 3138.0, 1742.0, 1009.0, 560.0, 338.0, 208.0, 122.0, 77.0, 52.0, 42.0, 21.0, 10.0, 10.0, 9.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.28125, -28.365478515625, -27.44970703125, -26.533935546875, -25.6181640625, -24.702392578125, -23.78662109375, -22.870849609375, -21.955078125, -21.039306640625, -20.12353515625, -19.207763671875, -18.2919921875, -17.376220703125, -16.46044921875, -15.544677734375, -14.62890625, -13.713134765625, -12.79736328125, -11.881591796875, -10.9658203125, -10.050048828125, -9.13427734375, -8.218505859375, -7.302734375, -6.386962890625, -5.47119140625, -4.555419921875, -3.6396484375, -2.723876953125, -1.80810546875, -0.892333984375, 0.0234375, 0.939208984375, 1.85498046875, 2.770751953125, 3.6865234375, 4.602294921875, 5.51806640625, 6.433837890625, 7.349609375, 8.265380859375, 9.18115234375, 10.096923828125, 11.0126953125, 11.928466796875, 12.84423828125, 13.760009765625, 14.67578125, 15.591552734375, 16.50732421875, 17.423095703125, 18.3388671875, 19.254638671875, 20.17041015625, 21.086181640625, 22.001953125, 22.917724609375, 23.83349609375, 24.749267578125, 25.6650390625, 26.580810546875, 27.49658203125, 28.412353515625, 29.328125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 5.0, 5.0, 16.0, 12.0, 11.0, 21.0, 20.0, 20.0, 23.0, 25.0, 22.0, 27.0, 31.0, 30.0, 39.0, 31.0, 32.0, 46.0, 40.0, 44.0, 37.0, 37.0, 43.0, 50.0, 31.0, 36.0, 26.0, 30.0, 35.0, 26.0, 29.0, 10.0, 17.0, 18.0, 14.0, 9.0, 9.0, 6.0, 9.0, 10.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0], "bins": [-31.0, -30.0859375, -29.171875, -28.2578125, -27.34375, -26.4296875, -25.515625, -24.6015625, -23.6875, -22.7734375, -21.859375, -20.9453125, -20.03125, -19.1171875, -18.203125, -17.2890625, -16.375, -15.4609375, -14.546875, -13.6328125, -12.71875, -11.8046875, -10.890625, -9.9765625, -9.0625, -8.1484375, -7.234375, -6.3203125, -5.40625, -4.4921875, -3.578125, -2.6640625, -1.75, -0.8359375, 0.078125, 0.9921875, 1.90625, 2.8203125, 3.734375, 4.6484375, 5.5625, 6.4765625, 7.390625, 8.3046875, 9.21875, 10.1328125, 11.046875, 11.9609375, 12.875, 13.7890625, 14.703125, 15.6171875, 16.53125, 17.4453125, 18.359375, 19.2734375, 20.1875, 21.1015625, 22.015625, 22.9296875, 23.84375, 24.7578125, 25.671875, 26.5859375, 27.5]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 7.0, 10.0, 19.0, 25.0, 28.0, 57.0, 71.0, 118.0, 176.0, 240.0, 390.0, 607.0, 946.0, 1409.0, 2170.0, 3246.0, 4885.0, 7582.0, 11302.0, 16631.0, 24413.0, 34329.0, 47216.0, 62497.0, 78910.0, 93914.0, 103638.0, 105581.0, 99967.0, 87410.0, 71824.0, 55959.0, 41121.0, 29203.0, 20741.0, 13961.0, 9566.0, 6294.0, 4147.0, 2763.0, 1785.0, 1160.0, 777.0, 489.0, 354.0, 239.0, 124.0, 78.0, 76.0, 41.0, 23.0, 17.0, 11.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.375, -21.65966796875, -20.9443359375, -20.22900390625, -19.513671875, -18.79833984375, -18.0830078125, -17.36767578125, -16.65234375, -15.93701171875, -15.2216796875, -14.50634765625, -13.791015625, -13.07568359375, -12.3603515625, -11.64501953125, -10.9296875, -10.21435546875, -9.4990234375, -8.78369140625, -8.068359375, -7.35302734375, -6.6376953125, -5.92236328125, -5.20703125, -4.49169921875, -3.7763671875, -3.06103515625, -2.345703125, -1.63037109375, -0.9150390625, -0.19970703125, 0.515625, 1.23095703125, 1.9462890625, 2.66162109375, 3.376953125, 4.09228515625, 4.8076171875, 5.52294921875, 6.23828125, 6.95361328125, 7.6689453125, 8.38427734375, 9.099609375, 9.81494140625, 10.5302734375, 11.24560546875, 11.9609375, 12.67626953125, 13.3916015625, 14.10693359375, 14.822265625, 15.53759765625, 16.2529296875, 16.96826171875, 17.68359375, 18.39892578125, 19.1142578125, 19.82958984375, 20.544921875, 21.26025390625, 21.9755859375, 22.69091796875, 23.40625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 2.0, 5.0, 7.0, 5.0, 10.0, 12.0, 13.0, 12.0, 21.0, 18.0, 23.0, 26.0, 32.0, 25.0, 32.0, 38.0, 38.0, 34.0, 46.0, 34.0, 36.0, 36.0, 40.0, 41.0, 36.0, 27.0, 36.0, 47.0, 32.0, 19.0, 27.0, 24.0, 18.0, 23.0, 22.0, 19.0, 12.0, 13.0, 12.0, 8.0, 9.0, 9.0, 5.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.875, -19.28564453125, -18.6962890625, -18.10693359375, -17.517578125, -16.92822265625, -16.3388671875, -15.74951171875, -15.16015625, -14.57080078125, -13.9814453125, -13.39208984375, -12.802734375, -12.21337890625, -11.6240234375, -11.03466796875, -10.4453125, -9.85595703125, -9.2666015625, -8.67724609375, -8.087890625, -7.49853515625, -6.9091796875, -6.31982421875, -5.73046875, -5.14111328125, -4.5517578125, -3.96240234375, -3.373046875, -2.78369140625, -2.1943359375, -1.60498046875, -1.015625, -0.42626953125, 0.1630859375, 0.75244140625, 1.341796875, 1.93115234375, 2.5205078125, 3.10986328125, 3.69921875, 4.28857421875, 4.8779296875, 5.46728515625, 6.056640625, 6.64599609375, 7.2353515625, 7.82470703125, 8.4140625, 9.00341796875, 9.5927734375, 10.18212890625, 10.771484375, 11.36083984375, 11.9501953125, 12.53955078125, 13.12890625, 13.71826171875, 14.3076171875, 14.89697265625, 15.486328125, 16.07568359375, 16.6650390625, 17.25439453125, 17.84375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 12.0, 13.0, 13.0, 25.0, 34.0, 51.0, 82.0, 112.0, 177.0, 272.0, 478.0, 744.0, 1377.0, 2535.0, 4704.0, 8721.0, 16041.0, 29430.0, 51882.0, 85827.0, 127815.0, 162759.0, 169157.0, 142548.0, 100425.0, 62787.0, 36462.0, 20119.0, 10902.0, 5793.0, 3028.0, 1728.0, 957.0, 580.0, 342.0, 210.0, 139.0, 85.0, 58.0, 44.0, 29.0, 17.0, 8.0, 12.0, 6.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.8359375, -11.4681396484375, -11.100341796875, -10.7325439453125, -10.36474609375, -9.9969482421875, -9.629150390625, -9.2613525390625, -8.8935546875, -8.5257568359375, -8.157958984375, -7.7901611328125, -7.42236328125, -7.0545654296875, -6.686767578125, -6.3189697265625, -5.951171875, -5.5833740234375, -5.215576171875, -4.8477783203125, -4.47998046875, -4.1121826171875, -3.744384765625, -3.3765869140625, -3.0087890625, -2.6409912109375, -2.273193359375, -1.9053955078125, -1.53759765625, -1.1697998046875, -0.802001953125, -0.4342041015625, -0.06640625, 0.3013916015625, 0.669189453125, 1.0369873046875, 1.40478515625, 1.7725830078125, 2.140380859375, 2.5081787109375, 2.8759765625, 3.2437744140625, 3.611572265625, 3.9793701171875, 4.34716796875, 4.7149658203125, 5.082763671875, 5.4505615234375, 5.818359375, 6.1861572265625, 6.553955078125, 6.9217529296875, 7.28955078125, 7.6573486328125, 8.025146484375, 8.3929443359375, 8.7607421875, 9.1285400390625, 9.496337890625, 9.8641357421875, 10.23193359375, 10.5997314453125, 10.967529296875, 11.3353271484375, 11.703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 10.0, 11.0, 12.0, 14.0, 9.0, 17.0, 19.0, 24.0, 38.0, 47.0, 34.0, 55.0, 49.0, 72.0, 59.0, 55.0, 70.0, 55.0, 40.0, 65.0, 46.0, 45.0, 26.0, 25.0, 16.0, 21.0, 18.0, 7.0, 9.0, 7.0, 3.0, 4.0, 6.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012149810791015625, -0.0011740028858184814, -0.0011330246925354004, -0.0010920464992523193, -0.0010510683059692383, -0.0010100901126861572, -0.0009691119194030762, -0.0009281337261199951, -0.0008871555328369141, -0.000846177339553833, -0.000805199146270752, -0.0007642209529876709, -0.0007232427597045898, -0.0006822645664215088, -0.0006412863731384277, -0.0006003081798553467, -0.0005593299865722656, -0.0005183517932891846, -0.0004773736000061035, -0.00043639540672302246, -0.0003954172134399414, -0.00035443902015686035, -0.0003134608268737793, -0.00027248263359069824, -0.0002315044403076172, -0.00019052624702453613, -0.00014954805374145508, -0.00010856986045837402, -6.759166717529297e-05, -2.6613473892211914e-05, 1.436471939086914e-05, 5.5342912673950195e-05, 9.632110595703125e-05, 0.0001372992992401123, 0.00017827749252319336, 0.00021925568580627441, 0.00026023387908935547, 0.0003012120723724365, 0.0003421902656555176, 0.00038316845893859863, 0.0004241466522216797, 0.00046512484550476074, 0.0005061030387878418, 0.0005470812320709229, 0.0005880594253540039, 0.000629037618637085, 0.000670015811920166, 0.0007109940052032471, 0.0007519721984863281, 0.0007929503917694092, 0.0008339285850524902, 0.0008749067783355713, 0.0009158849716186523, 0.0009568631649017334, 0.0009978413581848145, 0.0010388195514678955, 0.0010797977447509766, 0.0011207759380340576, 0.0011617541313171387, 0.0012027323246002197, 0.0012437105178833008, 0.0012846887111663818, 0.0013256669044494629, 0.001366645097732544, 0.001407623291015625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 12.0, 8.0, 11.0, 26.0, 29.0, 65.0, 77.0, 99.0, 155.0, 206.0, 338.0, 472.0, 710.0, 1113.0, 1888.0, 3052.0, 4895.0, 8224.0, 13859.0, 23284.0, 37976.0, 61103.0, 89485.0, 120689.0, 141677.0, 145579.0, 125825.0, 95790.0, 65330.0, 42039.0, 25839.0, 15357.0, 9120.0, 5336.0, 3340.0, 1997.0, 1194.0, 750.0, 537.0, 344.0, 232.0, 162.0, 93.0, 84.0, 59.0, 34.0, 25.0, 16.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-10.5859375, -10.256103515625, -9.92626953125, -9.596435546875, -9.2666015625, -8.936767578125, -8.60693359375, -8.277099609375, -7.947265625, -7.617431640625, -7.28759765625, -6.957763671875, -6.6279296875, -6.298095703125, -5.96826171875, -5.638427734375, -5.30859375, -4.978759765625, -4.64892578125, -4.319091796875, -3.9892578125, -3.659423828125, -3.32958984375, -2.999755859375, -2.669921875, -2.340087890625, -2.01025390625, -1.680419921875, -1.3505859375, -1.020751953125, -0.69091796875, -0.361083984375, -0.03125, 0.298583984375, 0.62841796875, 0.958251953125, 1.2880859375, 1.617919921875, 1.94775390625, 2.277587890625, 2.607421875, 2.937255859375, 3.26708984375, 3.596923828125, 3.9267578125, 4.256591796875, 4.58642578125, 4.916259765625, 5.24609375, 5.575927734375, 5.90576171875, 6.235595703125, 6.5654296875, 6.895263671875, 7.22509765625, 7.554931640625, 7.884765625, 8.214599609375, 8.54443359375, 8.874267578125, 9.2041015625, 9.533935546875, 9.86376953125, 10.193603515625, 10.5234375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 10.0, 14.0, 25.0, 18.0, 24.0, 26.0, 38.0, 41.0, 50.0, 63.0, 74.0, 79.0, 72.0, 70.0, 79.0, 56.0, 55.0, 45.0, 38.0, 31.0, 25.0, 13.0, 11.0, 11.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.94140625, -6.73858642578125, -6.5357666015625, -6.33294677734375, -6.130126953125, -5.92730712890625, -5.7244873046875, -5.52166748046875, -5.31884765625, -5.11602783203125, -4.9132080078125, -4.71038818359375, -4.507568359375, -4.30474853515625, -4.1019287109375, -3.89910888671875, -3.6962890625, -3.49346923828125, -3.2906494140625, -3.08782958984375, -2.885009765625, -2.68218994140625, -2.4793701171875, -2.27655029296875, -2.07373046875, -1.87091064453125, -1.6680908203125, -1.46527099609375, -1.262451171875, -1.05963134765625, -0.8568115234375, -0.65399169921875, -0.451171875, -0.24835205078125, -0.0455322265625, 0.15728759765625, 0.360107421875, 0.56292724609375, 0.7657470703125, 0.96856689453125, 1.17138671875, 1.37420654296875, 1.5770263671875, 1.77984619140625, 1.982666015625, 2.18548583984375, 2.3883056640625, 2.59112548828125, 2.7939453125, 2.99676513671875, 3.1995849609375, 3.40240478515625, 3.605224609375, 3.80804443359375, 4.0108642578125, 4.21368408203125, 4.41650390625, 4.61932373046875, 4.8221435546875, 5.02496337890625, 5.227783203125, 5.43060302734375, 5.6334228515625, 5.83624267578125, 6.0390625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 7.0, 9.0, 10.0, 12.0, 11.0, 11.0, 14.0, 16.0, 27.0, 22.0, 25.0, 29.0, 27.0, 31.0, 35.0, 40.0, 47.0, 40.0, 38.0, 31.0, 50.0, 47.0, 36.0, 36.0, 39.0, 41.0, 28.0, 34.0, 30.0, 23.0, 17.0, 22.0, 15.0, 25.0, 14.0, 13.0, 11.0, 8.0, 9.0, 6.0, 4.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.10675048828125, -24.247634887695312, -23.388521194458008, -22.52940559387207, -21.670291900634766, -20.811176300048828, -19.95206069946289, -19.092947006225586, -18.23383140563965, -17.37471580505371, -16.515602111816406, -15.656486511230469, -14.797371864318848, -13.938257217407227, -13.079142570495605, -12.220027923583984, -11.360913276672363, -10.501798629760742, -9.642683982849121, -8.7835693359375, -7.9244537353515625, -7.065339088439941, -6.20622444152832, -5.347109317779541, -4.48799467086792, -3.6288797855377197, -2.7697649002075195, -1.9106502532958984, -1.0515353679656982, -0.19242048263549805, 0.666694164276123, 1.5258092880249023, 2.3849239349365234, 3.2440388202667236, 4.103153705596924, 4.962268352508545, 5.821383476257324, 6.680498123168945, 7.539612770080566, 8.398727416992188, 9.257843017578125, 10.116957664489746, 10.976072311401367, 11.835187911987305, 12.694302558898926, 13.553417205810547, 14.412531852722168, 15.271646499633789, 16.130760192871094, 16.98987579345703, 17.848989486694336, 18.708105087280273, 19.567218780517578, 20.426334381103516, 21.285449981689453, 22.144563674926758, 23.003679275512695, 23.862794876098633, 24.721908569335938, 25.581024169921875, 26.44013786315918, 27.299253463745117, 28.158367156982422, 29.01748275756836, 29.876598358154297]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 1.0, 0.0, 2.0, 3.0, 4.0, 9.0, 8.0, 9.0, 13.0, 8.0, 16.0, 20.0, 19.0, 28.0, 19.0, 26.0, 26.0, 27.0, 30.0, 32.0, 32.0, 41.0, 36.0, 37.0, 34.0, 36.0, 46.0, 43.0, 43.0, 29.0, 37.0, 35.0, 34.0, 31.0, 25.0, 30.0, 19.0, 18.0, 19.0, 13.0, 20.0, 13.0, 7.0, 8.0, 13.0, 4.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.841938018798828, -25.89006805419922, -24.93819808959961, -23.986326217651367, -23.034456253051758, -22.08258628845215, -21.130714416503906, -20.178844451904297, -19.226974487304688, -18.275104522705078, -17.32323455810547, -16.371362686157227, -15.419492721557617, -14.467622756958008, -13.515751838684082, -12.563880920410156, -11.612010955810547, -10.660140991210938, -9.708270072937012, -8.756399154663086, -7.804529190063477, -6.852658748626709, -5.900788307189941, -4.948917865753174, -3.9970474243164062, -3.0451769828796387, -2.093306541442871, -1.1414361000061035, -0.18956565856933594, 0.7623047828674316, 1.7141752243041992, 2.666045665740967, 3.6179161071777344, 4.569786548614502, 5.5216569900512695, 6.473527431488037, 7.425397872924805, 8.377267837524414, 9.32913875579834, 10.281009674072266, 11.232879638671875, 12.184749603271484, 13.13662052154541, 14.088491439819336, 15.040361404418945, 15.992231369018555, 16.944103240966797, 17.895973205566406, 18.847843170166016, 19.799713134765625, 20.751583099365234, 21.703454971313477, 22.655324935913086, 23.607194900512695, 24.559066772460938, 25.510936737060547, 26.462806701660156, 27.414676666259766, 28.366546630859375, 29.318418502807617, 30.270288467407227, 31.222158432006836, 32.17403030395508, 33.12590026855469, 34.0777702331543]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 14.0, 41.0, 50.0, 99.0, 181.0, 258.0, 458.0, 708.0, 1263.0, 2124.0, 3454.0, 6047.0, 10052.0, 17102.0, 28946.0, 48003.0, 77611.0, 124342.0, 190400.0, 277349.0, 377387.0, 468581.0, 522389.0, 514131.0, 450282.0, 354589.0, 256136.0, 173516.0, 111813.0, 70187.0, 42586.0, 25914.0, 15561.0, 9095.0, 5625.0, 3249.0, 1934.0, 1111.0, 695.0, 391.0, 250.0, 151.0, 78.0, 54.0, 25.0, 21.0, 15.0, 7.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.125, -22.421875, -21.71875, -21.015625, -20.3125, -19.609375, -18.90625, -18.203125, -17.5, -16.796875, -16.09375, -15.390625, -14.6875, -13.984375, -13.28125, -12.578125, -11.875, -11.171875, -10.46875, -9.765625, -9.0625, -8.359375, -7.65625, -6.953125, -6.25, -5.546875, -4.84375, -4.140625, -3.4375, -2.734375, -2.03125, -1.328125, -0.625, 0.078125, 0.78125, 1.484375, 2.1875, 2.890625, 3.59375, 4.296875, 5.0, 5.703125, 6.40625, 7.109375, 7.8125, 8.515625, 9.21875, 9.921875, 10.625, 11.328125, 12.03125, 12.734375, 13.4375, 14.140625, 14.84375, 15.546875, 16.25, 16.953125, 17.65625, 18.359375, 19.0625, 19.765625, 20.46875, 21.171875, 21.875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [5.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 11.0, 8.0, 12.0, 5.0, 9.0, 19.0, 19.0, 19.0, 26.0, 13.0, 22.0, 31.0, 29.0, 25.0, 35.0, 28.0, 36.0, 36.0, 34.0, 38.0, 33.0, 40.0, 49.0, 39.0, 37.0, 30.0, 38.0, 27.0, 38.0, 22.0, 36.0, 19.0, 19.0, 21.0, 11.0, 21.0, 18.0, 8.0, 9.0, 8.0, 7.0, 5.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.3125, -21.51123046875, -20.7099609375, -19.90869140625, -19.107421875, -18.30615234375, -17.5048828125, -16.70361328125, -15.90234375, -15.10107421875, -14.2998046875, -13.49853515625, -12.697265625, -11.89599609375, -11.0947265625, -10.29345703125, -9.4921875, -8.69091796875, -7.8896484375, -7.08837890625, -6.287109375, -5.48583984375, -4.6845703125, -3.88330078125, -3.08203125, -2.28076171875, -1.4794921875, -0.67822265625, 0.123046875, 0.92431640625, 1.7255859375, 2.52685546875, 3.328125, 4.12939453125, 4.9306640625, 5.73193359375, 6.533203125, 7.33447265625, 8.1357421875, 8.93701171875, 9.73828125, 10.53955078125, 11.3408203125, 12.14208984375, 12.943359375, 13.74462890625, 14.5458984375, 15.34716796875, 16.1484375, 16.94970703125, 17.7509765625, 18.55224609375, 19.353515625, 20.15478515625, 20.9560546875, 21.75732421875, 22.55859375, 23.35986328125, 24.1611328125, 24.96240234375, 25.763671875, 26.56494140625, 27.3662109375, 28.16748046875, 28.96875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 4.0, 8.0, 16.0, 8.0, 26.0, 46.0, 82.0, 130.0, 238.0, 375.0, 643.0, 1025.0, 1838.0, 2946.0, 4932.0, 8180.0, 13271.0, 21419.0, 34253.0, 53480.0, 82495.0, 122386.0, 176020.0, 241281.0, 313753.0, 382555.0, 431427.0, 450527.0, 429431.0, 376445.0, 307043.0, 234932.0, 170246.0, 117269.0, 78809.0, 51558.0, 32753.0, 20308.0, 12716.0, 7623.0, 4660.0, 2899.0, 1640.0, 1048.0, 585.0, 381.0, 241.0, 151.0, 72.0, 48.0, 40.0, 8.0, 14.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-21.9375, -21.239990234375, -20.54248046875, -19.844970703125, -19.1474609375, -18.449951171875, -17.75244140625, -17.054931640625, -16.357421875, -15.659912109375, -14.96240234375, -14.264892578125, -13.5673828125, -12.869873046875, -12.17236328125, -11.474853515625, -10.77734375, -10.079833984375, -9.38232421875, -8.684814453125, -7.9873046875, -7.289794921875, -6.59228515625, -5.894775390625, -5.197265625, -4.499755859375, -3.80224609375, -3.104736328125, -2.4072265625, -1.709716796875, -1.01220703125, -0.314697265625, 0.3828125, 1.080322265625, 1.77783203125, 2.475341796875, 3.1728515625, 3.870361328125, 4.56787109375, 5.265380859375, 5.962890625, 6.660400390625, 7.35791015625, 8.055419921875, 8.7529296875, 9.450439453125, 10.14794921875, 10.845458984375, 11.54296875, 12.240478515625, 12.93798828125, 13.635498046875, 14.3330078125, 15.030517578125, 15.72802734375, 16.425537109375, 17.123046875, 17.820556640625, 18.51806640625, 19.215576171875, 19.9130859375, 20.610595703125, 21.30810546875, 22.005615234375, 22.703125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 4.0, 3.0, 12.0, 24.0, 25.0, 30.0, 31.0, 49.0, 59.0, 80.0, 98.0, 118.0, 121.0, 141.0, 177.0, 178.0, 224.0, 218.0, 237.0, 232.0, 223.0, 240.0, 236.0, 230.0, 201.0, 170.0, 140.0, 124.0, 107.0, 72.0, 64.0, 53.0, 41.0, 33.0, 24.0, 17.0, 13.0, 7.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.75, -13.317138671875, -12.88427734375, -12.451416015625, -12.0185546875, -11.585693359375, -11.15283203125, -10.719970703125, -10.287109375, -9.854248046875, -9.42138671875, -8.988525390625, -8.5556640625, -8.122802734375, -7.68994140625, -7.257080078125, -6.82421875, -6.391357421875, -5.95849609375, -5.525634765625, -5.0927734375, -4.659912109375, -4.22705078125, -3.794189453125, -3.361328125, -2.928466796875, -2.49560546875, -2.062744140625, -1.6298828125, -1.197021484375, -0.76416015625, -0.331298828125, 0.1015625, 0.534423828125, 0.96728515625, 1.400146484375, 1.8330078125, 2.265869140625, 2.69873046875, 3.131591796875, 3.564453125, 3.997314453125, 4.43017578125, 4.863037109375, 5.2958984375, 5.728759765625, 6.16162109375, 6.594482421875, 7.02734375, 7.460205078125, 7.89306640625, 8.325927734375, 8.7587890625, 9.191650390625, 9.62451171875, 10.057373046875, 10.490234375, 10.923095703125, 11.35595703125, 11.788818359375, 12.2216796875, 12.654541015625, 13.08740234375, 13.520263671875, 13.953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 6.0, 0.0, 3.0, 7.0, 6.0, 15.0, 10.0, 15.0, 12.0, 17.0, 18.0, 19.0, 15.0, 26.0, 33.0, 27.0, 41.0, 36.0, 34.0, 41.0, 42.0, 38.0, 41.0, 44.0, 48.0, 38.0, 29.0, 40.0, 29.0, 33.0, 23.0, 29.0, 30.0, 28.0, 17.0, 16.0, 20.0, 19.0, 10.0, 9.0, 7.0, 11.0, 5.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.271831512451172, -25.450593948364258, -24.629358291625977, -23.808120727539062, -22.98688316345215, -22.165645599365234, -21.344409942626953, -20.52317237854004, -19.701934814453125, -18.88069725036621, -18.05946159362793, -17.238224029541016, -16.4169864654541, -15.595749855041504, -14.774513244628906, -13.953275680541992, -13.132039070129395, -12.310802459716797, -11.489564895629883, -10.668328285217285, -9.847090721130371, -9.025854110717773, -8.20461654663086, -7.383379936218262, -6.562142848968506, -5.74090576171875, -4.919668674468994, -4.098431587219238, -3.2771947383880615, -2.4559578895568848, -1.634720802307129, -0.813483715057373, 0.0077533721923828125, 0.8289903998374939, 1.650227427482605, 2.4714643955230713, 3.292701482772827, 4.113938331604004, 4.93517541885376, 5.756412506103516, 6.5776495933532715, 7.398886680603027, 8.220123291015625, 9.041360855102539, 9.862597465515137, 10.683834075927734, 11.505071640014648, 12.326309204101562, 13.14754581451416, 13.968782424926758, 14.790019989013672, 15.61125659942627, 16.432493209838867, 17.25373077392578, 18.074968338012695, 18.89620590209961, 19.71744155883789, 20.538679122924805, 21.359914779663086, 22.18115234375, 23.002389907836914, 23.823627471923828, 24.64486312866211, 25.466100692749023, 26.287338256835938]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 9.0, 10.0, 8.0, 15.0, 18.0, 23.0, 26.0, 21.0, 21.0, 23.0, 27.0, 33.0, 41.0, 31.0, 35.0, 27.0, 35.0, 38.0, 43.0, 35.0, 43.0, 41.0, 36.0, 42.0, 41.0, 27.0, 37.0, 30.0, 24.0, 28.0, 21.0, 20.0, 20.0, 10.0, 13.0, 12.0, 9.0, 4.0, 11.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.024250030517578, -24.063556671142578, -23.102863311767578, -22.142169952392578, -21.181476593017578, -20.220783233642578, -19.260089874267578, -18.299396514892578, -17.338703155517578, -16.378009796142578, -15.417316436767578, -14.456623077392578, -13.495929718017578, -12.535236358642578, -11.574542045593262, -10.613848686218262, -9.653154373168945, -8.692461013793945, -7.731767654418945, -6.771073818206787, -5.810380458831787, -4.849687099456787, -3.888993263244629, -2.928299903869629, -1.967606544494629, -1.0069130659103394, -0.046219587326049805, 0.9144740104675293, 1.8751673698425293, 2.8358607292175293, 3.7965545654296875, 4.7572479248046875, 5.7179412841796875, 6.6786346435546875, 7.6393280029296875, 8.600021362304688, 9.560714721679688, 10.521408081054688, 11.482102394104004, 12.442795753479004, 13.403489112854004, 14.364182472229004, 15.324875831604004, 16.28557014465332, 17.24626350402832, 18.20695686340332, 19.16765022277832, 20.12834358215332, 21.08903694152832, 22.04973030090332, 23.01042366027832, 23.97111701965332, 24.93181037902832, 25.89250373840332, 26.853199005126953, 27.813892364501953, 28.774585723876953, 29.735279083251953, 30.695972442626953, 31.656665802001953, 32.61735916137695, 33.57805252075195, 34.53874588012695, 35.49943923950195, 36.46013259887695]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 2.0, 5.0, 11.0, 21.0, 29.0, 43.0, 53.0, 104.0, 178.0, 286.0, 386.0, 662.0, 928.0, 1513.0, 2376.0, 3531.0, 5274.0, 8198.0, 11993.0, 17554.0, 25352.0, 35644.0, 48321.0, 63151.0, 77870.0, 91875.0, 101140.0, 102985.0, 97348.0, 85665.0, 71177.0, 56525.0, 41933.0, 30549.0, 21433.0, 14760.0, 10150.0, 6706.0, 4499.0, 2951.0, 1913.0, 1243.0, 807.0, 497.0, 310.0, 239.0, 122.0, 81.0, 58.0, 45.0, 15.0, 12.0, 15.0, 8.0, 4.0, 3.0, 3.0, 2.0], "bins": [-9.921875, -9.6236572265625, -9.325439453125, -9.0272216796875, -8.72900390625, -8.4307861328125, -8.132568359375, -7.8343505859375, -7.5361328125, -7.2379150390625, -6.939697265625, -6.6414794921875, -6.34326171875, -6.0450439453125, -5.746826171875, -5.4486083984375, -5.150390625, -4.8521728515625, -4.553955078125, -4.2557373046875, -3.95751953125, -3.6593017578125, -3.361083984375, -3.0628662109375, -2.7646484375, -2.4664306640625, -2.168212890625, -1.8699951171875, -1.57177734375, -1.2735595703125, -0.975341796875, -0.6771240234375, -0.37890625, -0.0806884765625, 0.217529296875, 0.5157470703125, 0.81396484375, 1.1121826171875, 1.410400390625, 1.7086181640625, 2.0068359375, 2.3050537109375, 2.603271484375, 2.9014892578125, 3.19970703125, 3.4979248046875, 3.796142578125, 4.0943603515625, 4.392578125, 4.6907958984375, 4.989013671875, 5.2872314453125, 5.58544921875, 5.8836669921875, 6.181884765625, 6.4801025390625, 6.7783203125, 7.0765380859375, 7.374755859375, 7.6729736328125, 7.97119140625, 8.2694091796875, 8.567626953125, 8.8658447265625, 9.1640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 9.0, 9.0, 10.0, 13.0, 17.0, 23.0, 27.0, 22.0, 19.0, 25.0, 25.0, 37.0, 41.0, 28.0, 36.0, 24.0, 39.0, 37.0, 41.0, 36.0, 44.0, 38.0, 38.0, 40.0, 42.0, 26.0, 37.0, 30.0, 25.0, 30.0, 20.0, 19.0, 21.0, 10.0, 14.0, 10.0, 11.0, 4.0, 9.0, 7.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.359375, -24.387939453125, -23.41650390625, -22.445068359375, -21.4736328125, -20.502197265625, -19.53076171875, -18.559326171875, -17.587890625, -16.616455078125, -15.64501953125, -14.673583984375, -13.7021484375, -12.730712890625, -11.75927734375, -10.787841796875, -9.81640625, -8.844970703125, -7.87353515625, -6.902099609375, -5.9306640625, -4.959228515625, -3.98779296875, -3.016357421875, -2.044921875, -1.073486328125, -0.10205078125, 0.869384765625, 1.8408203125, 2.812255859375, 3.78369140625, 4.755126953125, 5.7265625, 6.697998046875, 7.66943359375, 8.640869140625, 9.6123046875, 10.583740234375, 11.55517578125, 12.526611328125, 13.498046875, 14.469482421875, 15.44091796875, 16.412353515625, 17.3837890625, 18.355224609375, 19.32666015625, 20.298095703125, 21.26953125, 22.240966796875, 23.21240234375, 24.183837890625, 25.1552734375, 26.126708984375, 27.09814453125, 28.069580078125, 29.041015625, 30.012451171875, 30.98388671875, 31.955322265625, 32.9267578125, 33.898193359375, 34.86962890625, 35.841064453125, 36.8125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 9.0, 12.0, 21.0, 29.0, 44.0, 60.0, 90.0, 150.0, 195.0, 351.0, 552.0, 800.0, 1242.0, 2001.0, 3132.0, 4882.0, 7403.0, 11819.0, 19232.0, 33873.0, 618931.0, 267039.0, 29918.0, 17109.0, 10698.0, 6664.0, 4378.0, 2823.0, 1859.0, 1157.0, 728.0, 475.0, 322.0, 194.0, 121.0, 73.0, 66.0, 35.0, 18.0, 15.0, 14.0, 9.0, 7.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.234375, -26.352783203125, -25.47119140625, -24.589599609375, -23.7080078125, -22.826416015625, -21.94482421875, -21.063232421875, -20.181640625, -19.300048828125, -18.41845703125, -17.536865234375, -16.6552734375, -15.773681640625, -14.89208984375, -14.010498046875, -13.12890625, -12.247314453125, -11.36572265625, -10.484130859375, -9.6025390625, -8.720947265625, -7.83935546875, -6.957763671875, -6.076171875, -5.194580078125, -4.31298828125, -3.431396484375, -2.5498046875, -1.668212890625, -0.78662109375, 0.094970703125, 0.9765625, 1.858154296875, 2.73974609375, 3.621337890625, 4.5029296875, 5.384521484375, 6.26611328125, 7.147705078125, 8.029296875, 8.910888671875, 9.79248046875, 10.674072265625, 11.5556640625, 12.437255859375, 13.31884765625, 14.200439453125, 15.08203125, 15.963623046875, 16.84521484375, 17.726806640625, 18.6083984375, 19.489990234375, 20.37158203125, 21.253173828125, 22.134765625, 23.016357421875, 23.89794921875, 24.779541015625, 25.6611328125, 26.542724609375, 27.42431640625, 28.305908203125, 29.1875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 12.0, 10.0, 16.0, 12.0, 17.0, 11.0, 32.0, 25.0, 26.0, 34.0, 34.0, 38.0, 40.0, 37.0, 36.0, 38.0, 47.0, 40.0, 52.0, 37.0, 34.0, 26.0, 36.0, 41.0, 38.0, 29.0, 25.0, 30.0, 25.0, 19.0, 21.0, 14.0, 13.0, 7.0, 13.0, 14.0, 5.0, 5.0, 6.0, 0.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.015625, -22.314208984375, -21.61279296875, -20.911376953125, -20.2099609375, -19.508544921875, -18.80712890625, -18.105712890625, -17.404296875, -16.702880859375, -16.00146484375, -15.300048828125, -14.5986328125, -13.897216796875, -13.19580078125, -12.494384765625, -11.79296875, -11.091552734375, -10.39013671875, -9.688720703125, -8.9873046875, -8.285888671875, -7.58447265625, -6.883056640625, -6.181640625, -5.480224609375, -4.77880859375, -4.077392578125, -3.3759765625, -2.674560546875, -1.97314453125, -1.271728515625, -0.5703125, 0.131103515625, 0.83251953125, 1.533935546875, 2.2353515625, 2.936767578125, 3.63818359375, 4.339599609375, 5.041015625, 5.742431640625, 6.44384765625, 7.145263671875, 7.8466796875, 8.548095703125, 9.24951171875, 9.950927734375, 10.65234375, 11.353759765625, 12.05517578125, 12.756591796875, 13.4580078125, 14.159423828125, 14.86083984375, 15.562255859375, 16.263671875, 16.965087890625, 17.66650390625, 18.367919921875, 19.0693359375, 19.770751953125, 20.47216796875, 21.173583984375, 21.875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 5.0, 5.0, 5.0, 5.0, 5.0, 11.0, 21.0, 19.0, 39.0, 37.0, 60.0, 70.0, 99.0, 137.0, 200.0, 273.0, 401.0, 560.0, 841.0, 1250.0, 1785.0, 2749.0, 4136.0, 6164.0, 9768.0, 15615.0, 27392.0, 143622.0, 727701.0, 48177.0, 21069.0, 12500.0, 8014.0, 5289.0, 3523.0, 2231.0, 1517.0, 924.0, 701.0, 482.0, 349.0, 216.0, 154.0, 125.0, 83.0, 58.0, 48.0, 36.0, 33.0, 17.0, 16.0, 10.0, 5.0, 1.0, 9.0, 0.0, 1.0, 2.0, 2.0, 2.0], "bins": [-2.044921875, -1.981597900390625, -1.91827392578125, -1.854949951171875, -1.7916259765625, -1.728302001953125, -1.66497802734375, -1.601654052734375, -1.538330078125, -1.475006103515625, -1.41168212890625, -1.348358154296875, -1.2850341796875, -1.221710205078125, -1.15838623046875, -1.095062255859375, -1.03173828125, -0.968414306640625, -0.90509033203125, -0.841766357421875, -0.7784423828125, -0.715118408203125, -0.65179443359375, -0.588470458984375, -0.525146484375, -0.461822509765625, -0.39849853515625, -0.335174560546875, -0.2718505859375, -0.208526611328125, -0.14520263671875, -0.081878662109375, -0.0185546875, 0.044769287109375, 0.10809326171875, 0.171417236328125, 0.2347412109375, 0.298065185546875, 0.36138916015625, 0.424713134765625, 0.488037109375, 0.551361083984375, 0.61468505859375, 0.678009033203125, 0.7413330078125, 0.804656982421875, 0.86798095703125, 0.931304931640625, 0.99462890625, 1.057952880859375, 1.12127685546875, 1.184600830078125, 1.2479248046875, 1.311248779296875, 1.37457275390625, 1.437896728515625, 1.501220703125, 1.564544677734375, 1.62786865234375, 1.691192626953125, 1.7545166015625, 1.817840576171875, 1.88116455078125, 1.944488525390625, 2.0078125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 5.0, 8.0, 5.0, 8.0, 12.0, 14.0, 20.0, 32.0, 40.0, 37.0, 46.0, 50.0, 65.0, 99.0, 76.0, 84.0, 84.0, 60.0, 58.0, 46.0, 28.0, 24.0, 20.0, 12.0, 10.0, 12.0, 10.0, 4.0, 6.0, 7.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0004992485046386719, -0.00048423558473587036, -0.00046922266483306885, -0.00045420974493026733, -0.0004391968250274658, -0.0004241839051246643, -0.0004091709852218628, -0.0003941580653190613, -0.00037914514541625977, -0.00036413222551345825, -0.00034911930561065674, -0.0003341063857078552, -0.0003190934658050537, -0.0003040805459022522, -0.0002890676259994507, -0.00027405470609664917, -0.00025904178619384766, -0.00024402886629104614, -0.00022901594638824463, -0.00021400302648544312, -0.0001989901065826416, -0.0001839771866798401, -0.00016896426677703857, -0.00015395134687423706, -0.00013893842697143555, -0.00012392550706863403, -0.00010891258716583252, -9.3899667263031e-05, -7.888674736022949e-05, -6.387382745742798e-05, -4.8860907554626465e-05, -3.384798765182495e-05, -1.8835067749023438e-05, -3.822147846221924e-06, 1.119077205657959e-05, 2.6203691959381104e-05, 4.121661186218262e-05, 5.622953176498413e-05, 7.124245166778564e-05, 8.625537157058716e-05, 0.00010126829147338867, 0.00011628121137619019, 0.0001312941312789917, 0.0001463070511817932, 0.00016131997108459473, 0.00017633289098739624, 0.00019134581089019775, 0.00020635873079299927, 0.00022137165069580078, 0.0002363845705986023, 0.0002513974905014038, 0.0002664104104042053, 0.00028142333030700684, 0.00029643625020980835, 0.00031144917011260986, 0.0003264620900154114, 0.0003414750099182129, 0.0003564879298210144, 0.0003715008497238159, 0.00038651376962661743, 0.00040152668952941895, 0.00041653960943222046, 0.00043155252933502197, 0.0004465654492378235, 0.000461578369140625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 9.0, 4.0, 12.0, 15.0, 26.0, 39.0, 45.0, 79.0, 101.0, 146.0, 250.0, 394.0, 668.0, 1076.0, 1859.0, 3205.0, 5735.0, 10454.0, 18946.0, 34130.0, 58885.0, 94553.0, 136058.0, 162919.0, 161939.0, 132529.0, 92603.0, 57568.0, 32875.0, 18218.0, 9983.0, 5541.0, 3161.0, 1763.0, 1030.0, 625.0, 345.0, 267.0, 161.0, 112.0, 64.0, 53.0, 37.0, 23.0, 17.0, 12.0, 8.0, 8.0, 7.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.345703125, -1.307220458984375, -1.26873779296875, -1.230255126953125, -1.1917724609375, -1.153289794921875, -1.11480712890625, -1.076324462890625, -1.037841796875, -0.999359130859375, -0.96087646484375, -0.922393798828125, -0.8839111328125, -0.845428466796875, -0.80694580078125, -0.768463134765625, -0.72998046875, -0.691497802734375, -0.65301513671875, -0.614532470703125, -0.5760498046875, -0.537567138671875, -0.49908447265625, -0.460601806640625, -0.422119140625, -0.383636474609375, -0.34515380859375, -0.306671142578125, -0.2681884765625, -0.229705810546875, -0.19122314453125, -0.152740478515625, -0.1142578125, -0.075775146484375, -0.03729248046875, 0.001190185546875, 0.0396728515625, 0.078155517578125, 0.11663818359375, 0.155120849609375, 0.193603515625, 0.232086181640625, 0.27056884765625, 0.309051513671875, 0.3475341796875, 0.386016845703125, 0.42449951171875, 0.462982177734375, 0.50146484375, 0.539947509765625, 0.57843017578125, 0.616912841796875, 0.6553955078125, 0.693878173828125, 0.73236083984375, 0.770843505859375, 0.809326171875, 0.847808837890625, 0.88629150390625, 0.924774169921875, 0.9632568359375, 1.001739501953125, 1.04022216796875, 1.078704833984375, 1.1171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 3.0, 2.0, 3.0, 5.0, 8.0, 6.0, 19.0, 22.0, 9.0, 16.0, 22.0, 25.0, 27.0, 24.0, 34.0, 43.0, 39.0, 43.0, 47.0, 49.0, 55.0, 46.0, 49.0, 42.0, 53.0, 39.0, 48.0, 31.0, 32.0, 29.0, 22.0, 9.0, 14.0, 15.0, 13.0, 9.0, 11.0, 10.0, 5.0, 7.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0], "bins": [-0.476806640625, -0.46414947509765625, -0.4514923095703125, -0.43883514404296875, -0.426177978515625, -0.41352081298828125, -0.4008636474609375, -0.38820648193359375, -0.37554931640625, -0.36289215087890625, -0.3502349853515625, -0.33757781982421875, -0.324920654296875, -0.31226348876953125, -0.2996063232421875, -0.28694915771484375, -0.2742919921875, -0.26163482666015625, -0.2489776611328125, -0.23632049560546875, -0.223663330078125, -0.21100616455078125, -0.1983489990234375, -0.18569183349609375, -0.17303466796875, -0.16037750244140625, -0.1477203369140625, -0.13506317138671875, -0.122406005859375, -0.10974884033203125, -0.0970916748046875, -0.08443450927734375, -0.07177734375, -0.05912017822265625, -0.0464630126953125, -0.03380584716796875, -0.021148681640625, -0.00849151611328125, 0.0041656494140625, 0.01682281494140625, 0.02947998046875, 0.04213714599609375, 0.0547943115234375, 0.06745147705078125, 0.080108642578125, 0.09276580810546875, 0.1054229736328125, 0.11808013916015625, 0.1307373046875, 0.14339447021484375, 0.1560516357421875, 0.16870880126953125, 0.181365966796875, 0.19402313232421875, 0.2066802978515625, 0.21933746337890625, 0.23199462890625, 0.24465179443359375, 0.2573089599609375, 0.26996612548828125, 0.282623291015625, 0.29528045654296875, 0.3079376220703125, 0.32059478759765625, 0.333251953125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 7.0, 10.0, 16.0, 12.0, 11.0, 19.0, 15.0, 13.0, 16.0, 23.0, 30.0, 32.0, 38.0, 35.0, 28.0, 48.0, 45.0, 41.0, 38.0, 43.0, 42.0, 46.0, 38.0, 36.0, 40.0, 29.0, 36.0, 24.0, 26.0, 29.0, 15.0, 12.0, 18.0, 13.0, 19.0, 17.0, 6.0, 7.0, 8.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.57131576538086, -26.71919059753418, -25.8670654296875, -25.01494026184082, -24.16281509399414, -23.31068992614746, -22.45856475830078, -21.60643768310547, -20.754314422607422, -19.902189254760742, -19.050064086914062, -18.197938919067383, -17.345813751220703, -16.493688583374023, -15.641562461853027, -14.789437294006348, -13.937311172485352, -13.085186004638672, -12.233060836791992, -11.380935668945312, -10.528810501098633, -9.676685333251953, -8.824559211730957, -7.972434043884277, -7.120308876037598, -6.268183708190918, -5.416058540344238, -4.5639328956604, -3.7118077278137207, -2.859682559967041, -2.007556915283203, -1.1554317474365234, -0.30330467224121094, 0.5488206148147583, 1.4009459018707275, 2.2530713081359863, 3.105196475982666, 3.9573216438293457, 4.809447288513184, 5.661572456359863, 6.513697624206543, 7.365822792053223, 8.217947959899902, 9.070074081420898, 9.922199249267578, 10.774324417114258, 11.626449584960938, 12.478574752807617, 13.330699920654297, 14.182825088500977, 15.034950256347656, 15.887075424194336, 16.739200592041016, 17.591325759887695, 18.443450927734375, 19.295578002929688, 20.147701263427734, 20.999826431274414, 21.851951599121094, 22.704076766967773, 23.556201934814453, 24.408327102661133, 25.260452270507812, 26.112579345703125, 26.964704513549805]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 9.0, 11.0, 8.0, 15.0, 18.0, 23.0, 24.0, 21.0, 22.0, 26.0, 25.0, 38.0, 38.0, 26.0, 30.0, 42.0, 32.0, 34.0, 33.0, 45.0, 42.0, 33.0, 43.0, 31.0, 50.0, 27.0, 34.0, 29.0, 27.0, 22.0, 24.0, 18.0, 23.0, 14.0, 10.0, 8.0, 11.0, 9.0, 7.0, 7.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.958290100097656, -24.000320434570312, -23.04235076904297, -22.084381103515625, -21.12641143798828, -20.168441772460938, -19.210472106933594, -18.25250244140625, -17.294532775878906, -16.336563110351562, -15.378593444824219, -14.420623779296875, -13.462654113769531, -12.504684448242188, -11.546713829040527, -10.588744163513184, -9.630773544311523, -8.67280387878418, -7.714834213256836, -6.756864070892334, -5.79889440536499, -4.8409247398376465, -3.8829545974731445, -2.924984931945801, -1.967015266418457, -1.0090454816818237, -0.05107569694519043, 0.9068942070007324, 1.8648638725280762, 2.82283353805542, 3.780803680419922, 4.738773345947266, 5.696743011474609, 6.654712677001953, 7.612682342529297, 8.57065200805664, 9.528621673583984, 10.486591339111328, 11.444561958312988, 12.402531623840332, 13.360501289367676, 14.31847095489502, 15.276440620422363, 16.234411239624023, 17.192380905151367, 18.15035057067871, 19.108320236206055, 20.0662899017334, 21.024259567260742, 21.982229232788086, 22.94019889831543, 23.898168563842773, 24.856138229370117, 25.81410789489746, 26.772079467773438, 27.73004913330078, 28.688018798828125, 29.64598846435547, 30.603958129882812, 31.561927795410156, 32.5198974609375, 33.477867126464844, 34.43583679199219, 35.39380645751953, 36.351776123046875]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 3.0, 7.0, 7.0, 9.0, 22.0, 21.0, 26.0, 32.0, 58.0, 80.0, 125.0, 165.0, 284.0, 453.0, 687.0, 1149.0, 1846.0, 2969.0, 4958.0, 7939.0, 13113.0, 21287.0, 32904.0, 49464.0, 70019.0, 92088.0, 112129.0, 123278.0, 122300.0, 109002.0, 88531.0, 66079.0, 46133.0, 30500.0, 19577.0, 12094.0, 7421.0, 4548.0, 2667.0, 1664.0, 1095.0, 626.0, 387.0, 267.0, 178.0, 113.0, 86.0, 54.0, 42.0, 28.0, 22.0, 7.0, 13.0, 3.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-25.71875, -24.912841796875, -24.10693359375, -23.301025390625, -22.4951171875, -21.689208984375, -20.88330078125, -20.077392578125, -19.271484375, -18.465576171875, -17.65966796875, -16.853759765625, -16.0478515625, -15.241943359375, -14.43603515625, -13.630126953125, -12.82421875, -12.018310546875, -11.21240234375, -10.406494140625, -9.6005859375, -8.794677734375, -7.98876953125, -7.182861328125, -6.376953125, -5.571044921875, -4.76513671875, -3.959228515625, -3.1533203125, -2.347412109375, -1.54150390625, -0.735595703125, 0.0703125, 0.876220703125, 1.68212890625, 2.488037109375, 3.2939453125, 4.099853515625, 4.90576171875, 5.711669921875, 6.517578125, 7.323486328125, 8.12939453125, 8.935302734375, 9.7412109375, 10.547119140625, 11.35302734375, 12.158935546875, 12.96484375, 13.770751953125, 14.57666015625, 15.382568359375, 16.1884765625, 16.994384765625, 17.80029296875, 18.606201171875, 19.412109375, 20.218017578125, 21.02392578125, 21.829833984375, 22.6357421875, 23.441650390625, 24.24755859375, 25.053466796875, 25.859375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 6.0, 3.0, 5.0, 8.0, 10.0, 7.0, 12.0, 23.0, 19.0, 22.0, 23.0, 26.0, 21.0, 27.0, 35.0, 38.0, 29.0, 27.0, 43.0, 36.0, 26.0, 40.0, 45.0, 36.0, 38.0, 41.0, 32.0, 44.0, 36.0, 27.0, 35.0, 23.0, 25.0, 21.0, 17.0, 28.0, 10.0, 15.0, 8.0, 13.0, 7.0, 5.0, 10.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.78125, -22.875, -21.96875, -21.0625, -20.15625, -19.25, -18.34375, -17.4375, -16.53125, -15.625, -14.71875, -13.8125, -12.90625, -12.0, -11.09375, -10.1875, -9.28125, -8.375, -7.46875, -6.5625, -5.65625, -4.75, -3.84375, -2.9375, -2.03125, -1.125, -0.21875, 0.6875, 1.59375, 2.5, 3.40625, 4.3125, 5.21875, 6.125, 7.03125, 7.9375, 8.84375, 9.75, 10.65625, 11.5625, 12.46875, 13.375, 14.28125, 15.1875, 16.09375, 17.0, 17.90625, 18.8125, 19.71875, 20.625, 21.53125, 22.4375, 23.34375, 24.25, 25.15625, 26.0625, 26.96875, 27.875, 28.78125, 29.6875, 30.59375, 31.5, 32.40625, 33.3125, 34.21875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 6.0, 7.0, 20.0, 22.0, 30.0, 53.0, 87.0, 136.0, 220.0, 361.0, 565.0, 1016.0, 1510.0, 2546.0, 4249.0, 6859.0, 11014.0, 17661.0, 26856.0, 39783.0, 57608.0, 77126.0, 96313.0, 110797.0, 116512.0, 112037.0, 99161.0, 80786.0, 61021.0, 43530.0, 29701.0, 19203.0, 12181.0, 7557.0, 4721.0, 2829.0, 1714.0, 1068.0, 662.0, 400.0, 240.0, 147.0, 106.0, 53.0, 34.0, 25.0, 13.0, 7.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.546875, -22.8017578125, -22.056640625, -21.3115234375, -20.56640625, -19.8212890625, -19.076171875, -18.3310546875, -17.5859375, -16.8408203125, -16.095703125, -15.3505859375, -14.60546875, -13.8603515625, -13.115234375, -12.3701171875, -11.625, -10.8798828125, -10.134765625, -9.3896484375, -8.64453125, -7.8994140625, -7.154296875, -6.4091796875, -5.6640625, -4.9189453125, -4.173828125, -3.4287109375, -2.68359375, -1.9384765625, -1.193359375, -0.4482421875, 0.296875, 1.0419921875, 1.787109375, 2.5322265625, 3.27734375, 4.0224609375, 4.767578125, 5.5126953125, 6.2578125, 7.0029296875, 7.748046875, 8.4931640625, 9.23828125, 9.9833984375, 10.728515625, 11.4736328125, 12.21875, 12.9638671875, 13.708984375, 14.4541015625, 15.19921875, 15.9443359375, 16.689453125, 17.4345703125, 18.1796875, 18.9248046875, 19.669921875, 20.4150390625, 21.16015625, 21.9052734375, 22.650390625, 23.3955078125, 24.140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 11.0, 6.0, 7.0, 17.0, 10.0, 15.0, 24.0, 29.0, 36.0, 35.0, 36.0, 30.0, 47.0, 56.0, 43.0, 52.0, 45.0, 42.0, 41.0, 38.0, 46.0, 42.0, 36.0, 50.0, 24.0, 24.0, 27.0, 36.0, 21.0, 15.0, 11.0, 7.0, 6.0, 4.0, 7.0, 3.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.125, -18.447265625, -17.76953125, -17.091796875, -16.4140625, -15.736328125, -15.05859375, -14.380859375, -13.703125, -13.025390625, -12.34765625, -11.669921875, -10.9921875, -10.314453125, -9.63671875, -8.958984375, -8.28125, -7.603515625, -6.92578125, -6.248046875, -5.5703125, -4.892578125, -4.21484375, -3.537109375, -2.859375, -2.181640625, -1.50390625, -0.826171875, -0.1484375, 0.529296875, 1.20703125, 1.884765625, 2.5625, 3.240234375, 3.91796875, 4.595703125, 5.2734375, 5.951171875, 6.62890625, 7.306640625, 7.984375, 8.662109375, 9.33984375, 10.017578125, 10.6953125, 11.373046875, 12.05078125, 12.728515625, 13.40625, 14.083984375, 14.76171875, 15.439453125, 16.1171875, 16.794921875, 17.47265625, 18.150390625, 18.828125, 19.505859375, 20.18359375, 20.861328125, 21.5390625, 22.216796875, 22.89453125, 23.572265625, 24.25]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 6.0, 8.0, 23.0, 40.0, 34.0, 54.0, 107.0, 128.0, 213.0, 349.0, 550.0, 1010.0, 2117.0, 4768.0, 13761.0, 45120.0, 143263.0, 308149.0, 311170.0, 147198.0, 46752.0, 14093.0, 4880.0, 2076.0, 982.0, 625.0, 357.0, 209.0, 132.0, 119.0, 81.0, 54.0, 35.0, 27.0, 17.0, 8.0, 13.0, 7.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-30.984375, -30.1240234375, -29.263671875, -28.4033203125, -27.54296875, -26.6826171875, -25.822265625, -24.9619140625, -24.1015625, -23.2412109375, -22.380859375, -21.5205078125, -20.66015625, -19.7998046875, -18.939453125, -18.0791015625, -17.21875, -16.3583984375, -15.498046875, -14.6376953125, -13.77734375, -12.9169921875, -12.056640625, -11.1962890625, -10.3359375, -9.4755859375, -8.615234375, -7.7548828125, -6.89453125, -6.0341796875, -5.173828125, -4.3134765625, -3.453125, -2.5927734375, -1.732421875, -0.8720703125, -0.01171875, 0.8486328125, 1.708984375, 2.5693359375, 3.4296875, 4.2900390625, 5.150390625, 6.0107421875, 6.87109375, 7.7314453125, 8.591796875, 9.4521484375, 10.3125, 11.1728515625, 12.033203125, 12.8935546875, 13.75390625, 14.6142578125, 15.474609375, 16.3349609375, 17.1953125, 18.0556640625, 18.916015625, 19.7763671875, 20.63671875, 21.4970703125, 22.357421875, 23.2177734375, 24.078125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 7.0, 9.0, 10.0, 9.0, 14.0, 11.0, 15.0, 21.0, 28.0, 40.0, 35.0, 50.0, 51.0, 48.0, 58.0, 45.0, 54.0, 65.0, 64.0, 64.0, 50.0, 41.0, 28.0, 32.0, 27.0, 25.0, 21.0, 12.0, 19.0, 9.0, 9.0, 5.0, 6.0, 2.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0016613006591796875, -0.0016154050827026367, -0.001569509506225586, -0.0015236139297485352, -0.0014777183532714844, -0.0014318227767944336, -0.0013859272003173828, -0.001340031623840332, -0.0012941360473632812, -0.0012482404708862305, -0.0012023448944091797, -0.001156449317932129, -0.0011105537414550781, -0.0010646581649780273, -0.0010187625885009766, -0.0009728670120239258, -0.000926971435546875, -0.0008810758590698242, -0.0008351802825927734, -0.0007892847061157227, -0.0007433891296386719, -0.0006974935531616211, -0.0006515979766845703, -0.0006057024002075195, -0.0005598068237304688, -0.000513911247253418, -0.0004680156707763672, -0.0004221200942993164, -0.0003762245178222656, -0.00033032894134521484, -0.00028443336486816406, -0.00023853778839111328, -0.0001926422119140625, -0.00014674663543701172, -0.00010085105895996094, -5.4955482482910156e-05, -9.059906005859375e-06, 3.6835670471191406e-05, 8.273124694824219e-05, 0.00012862682342529297, 0.00017452239990234375, 0.00022041797637939453, 0.0002663135528564453, 0.0003122091293334961, 0.0003581047058105469, 0.00040400028228759766, 0.00044989585876464844, 0.0004957914352416992, 0.00054168701171875, 0.0005875825881958008, 0.0006334781646728516, 0.0006793737411499023, 0.0007252693176269531, 0.0007711648941040039, 0.0008170604705810547, 0.0008629560470581055, 0.0009088516235351562, 0.000954747200012207, 0.0010006427764892578, 0.0010465383529663086, 0.0010924339294433594, 0.0011383295059204102, 0.001184225082397461, 0.0012301206588745117, 0.0012760162353515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 7.0, 11.0, 16.0, 18.0, 32.0, 37.0, 62.0, 78.0, 85.0, 178.0, 214.0, 370.0, 532.0, 1060.0, 2221.0, 5253.0, 15065.0, 45207.0, 126667.0, 257472.0, 296093.0, 183979.0, 74232.0, 24596.0, 8262.0, 3289.0, 1475.0, 737.0, 426.0, 253.0, 179.0, 132.0, 85.0, 63.0, 50.0, 23.0, 27.0, 18.0, 18.0, 6.0, 4.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.59375, -23.83056640625, -23.0673828125, -22.30419921875, -21.541015625, -20.77783203125, -20.0146484375, -19.25146484375, -18.48828125, -17.72509765625, -16.9619140625, -16.19873046875, -15.435546875, -14.67236328125, -13.9091796875, -13.14599609375, -12.3828125, -11.61962890625, -10.8564453125, -10.09326171875, -9.330078125, -8.56689453125, -7.8037109375, -7.04052734375, -6.27734375, -5.51416015625, -4.7509765625, -3.98779296875, -3.224609375, -2.46142578125, -1.6982421875, -0.93505859375, -0.171875, 0.59130859375, 1.3544921875, 2.11767578125, 2.880859375, 3.64404296875, 4.4072265625, 5.17041015625, 5.93359375, 6.69677734375, 7.4599609375, 8.22314453125, 8.986328125, 9.74951171875, 10.5126953125, 11.27587890625, 12.0390625, 12.80224609375, 13.5654296875, 14.32861328125, 15.091796875, 15.85498046875, 16.6181640625, 17.38134765625, 18.14453125, 18.90771484375, 19.6708984375, 20.43408203125, 21.197265625, 21.96044921875, 22.7236328125, 23.48681640625, 24.25]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 8.0, 18.0, 29.0, 35.0, 54.0, 59.0, 85.0, 85.0, 103.0, 78.0, 95.0, 73.0, 71.0, 65.0, 38.0, 30.0, 21.0, 17.0, 11.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.0625, -5.778564453125, -5.49462890625, -5.210693359375, -4.9267578125, -4.642822265625, -4.35888671875, -4.074951171875, -3.791015625, -3.507080078125, -3.22314453125, -2.939208984375, -2.6552734375, -2.371337890625, -2.08740234375, -1.803466796875, -1.51953125, -1.235595703125, -0.95166015625, -0.667724609375, -0.3837890625, -0.099853515625, 0.18408203125, 0.468017578125, 0.751953125, 1.035888671875, 1.31982421875, 1.603759765625, 1.8876953125, 2.171630859375, 2.45556640625, 2.739501953125, 3.0234375, 3.307373046875, 3.59130859375, 3.875244140625, 4.1591796875, 4.443115234375, 4.72705078125, 5.010986328125, 5.294921875, 5.578857421875, 5.86279296875, 6.146728515625, 6.4306640625, 6.714599609375, 6.99853515625, 7.282470703125, 7.56640625, 7.850341796875, 8.13427734375, 8.418212890625, 8.7021484375, 8.986083984375, 9.27001953125, 9.553955078125, 9.837890625, 10.121826171875, 10.40576171875, 10.689697265625, 10.9736328125, 11.257568359375, 11.54150390625, 11.825439453125, 12.109375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 5.0, 2.0, 4.0, 9.0, 12.0, 9.0, 27.0, 19.0, 15.0, 25.0, 29.0, 40.0, 28.0, 35.0, 44.0, 44.0, 48.0, 42.0, 48.0, 55.0, 67.0, 27.0, 54.0, 41.0, 39.0, 38.0, 33.0, 22.0, 22.0, 13.0, 22.0, 14.0, 13.0, 13.0, 13.0, 10.0, 7.0, 7.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.35939598083496, -23.42682456970215, -22.494253158569336, -21.561681747436523, -20.629112243652344, -19.69654083251953, -18.76396942138672, -17.831398010253906, -16.898826599121094, -15.966255187988281, -15.033683776855469, -14.101113319396973, -13.16854190826416, -12.235970497131348, -11.303400039672852, -10.370828628540039, -9.438257217407227, -8.505685806274414, -7.57311487197876, -6.6405439376831055, -5.707972526550293, -4.7754011154174805, -3.842830181121826, -2.910259246826172, -1.9776878356933594, -1.045116662979126, -0.11254549026489258, 0.8200256824493408, 1.7525968551635742, 2.6851682662963867, 3.617739200592041, 4.550310134887695, 5.482883453369141, 6.415454864501953, 7.348025798797607, 8.280596733093262, 9.213168144226074, 10.145739555358887, 11.078310012817383, 12.010881423950195, 12.943452835083008, 13.87602424621582, 14.808595657348633, 15.741166114807129, 16.673736572265625, 17.606307983398438, 18.53887939453125, 19.471450805664062, 20.404022216796875, 21.336593627929688, 22.2691650390625, 23.201736450195312, 24.134307861328125, 25.066879272460938, 25.999448776245117, 26.93202018737793, 27.864591598510742, 28.797163009643555, 29.729734420776367, 30.66230583190918, 31.59487533569336, 32.52744674682617, 33.460018157958984, 34.3925895690918, 35.32516098022461]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 6.0, 12.0, 14.0, 12.0, 10.0, 20.0, 20.0, 26.0, 28.0, 35.0, 32.0, 27.0, 32.0, 38.0, 37.0, 32.0, 43.0, 47.0, 42.0, 48.0, 35.0, 40.0, 34.0, 46.0, 32.0, 32.0, 33.0, 33.0, 16.0, 23.0, 24.0, 19.0, 17.0, 10.0, 10.0, 3.0, 7.0, 5.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.959009170532227, -25.94156265258789, -24.924118041992188, -23.90667152404785, -22.889225006103516, -21.87177848815918, -20.854331970214844, -19.83688735961914, -18.819440841674805, -17.80199432373047, -16.784549713134766, -15.76710319519043, -14.749656677246094, -13.732210159301758, -12.714764595031738, -11.697319030761719, -10.679872512817383, -9.662425994873047, -8.644980430603027, -7.62753438949585, -6.610088348388672, -5.592642307281494, -4.575196266174316, -3.5577502250671387, -2.540304183959961, -1.5228581428527832, -0.5054121017456055, 0.5120339393615723, 1.52947998046875, 2.5469260215759277, 3.5643720626831055, 4.581818103790283, 5.599262237548828, 6.616708278656006, 7.634154319763184, 8.651599884033203, 9.669046401977539, 10.686492919921875, 11.703938484191895, 12.721384048461914, 13.73883056640625, 14.756277084350586, 15.773722648620605, 16.791168212890625, 17.80861473083496, 18.826061248779297, 19.843505859375, 20.860952377319336, 21.878398895263672, 22.895845413208008, 23.913291931152344, 24.930736541748047, 25.948183059692383, 26.96562957763672, 27.983074188232422, 29.000520706176758, 30.017967224121094, 31.03541374206543, 32.052860260009766, 33.07030487060547, 34.08775329589844, 35.10519790649414, 36.122642517089844, 37.14009094238281, 38.157535552978516]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 14.0, 30.0, 28.0, 105.0, 160.0, 369.0, 619.0, 1328.0, 2467.0, 4666.0, 8951.0, 17189.0, 32310.0, 60135.0, 107740.0, 184072.0, 294970.0, 432022.0, 555511.0, 614662.0, 579756.0, 470220.0, 331251.0, 212252.0, 126489.0, 71944.0, 39580.0, 21530.0, 11372.0, 5869.0, 3079.0, 1688.0, 883.0, 484.0, 229.0, 123.0, 82.0, 44.0, 29.0, 20.0, 7.0, 5.0, 0.0, 4.0, 2.0], "bins": [-32.46875, -31.628662109375, -30.78857421875, -29.948486328125, -29.1083984375, -28.268310546875, -27.42822265625, -26.588134765625, -25.748046875, -24.907958984375, -24.06787109375, -23.227783203125, -22.3876953125, -21.547607421875, -20.70751953125, -19.867431640625, -19.02734375, -18.187255859375, -17.34716796875, -16.507080078125, -15.6669921875, -14.826904296875, -13.98681640625, -13.146728515625, -12.306640625, -11.466552734375, -10.62646484375, -9.786376953125, -8.9462890625, -8.106201171875, -7.26611328125, -6.426025390625, -5.5859375, -4.745849609375, -3.90576171875, -3.065673828125, -2.2255859375, -1.385498046875, -0.54541015625, 0.294677734375, 1.134765625, 1.974853515625, 2.81494140625, 3.655029296875, 4.4951171875, 5.335205078125, 6.17529296875, 7.015380859375, 7.85546875, 8.695556640625, 9.53564453125, 10.375732421875, 11.2158203125, 12.055908203125, 12.89599609375, 13.736083984375, 14.576171875, 15.416259765625, 16.25634765625, 17.096435546875, 17.9365234375, 18.776611328125, 19.61669921875, 20.456787109375, 21.296875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 6.0, 6.0, 5.0, 16.0, 7.0, 14.0, 18.0, 19.0, 17.0, 33.0, 35.0, 24.0, 34.0, 26.0, 39.0, 32.0, 38.0, 38.0, 37.0, 52.0, 39.0, 37.0, 41.0, 42.0, 38.0, 35.0, 40.0, 32.0, 31.0, 25.0, 22.0, 21.0, 23.0, 18.0, 17.0, 8.0, 10.0, 2.0, 6.0, 9.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.0625, -22.17919921875, -21.2958984375, -20.41259765625, -19.529296875, -18.64599609375, -17.7626953125, -16.87939453125, -15.99609375, -15.11279296875, -14.2294921875, -13.34619140625, -12.462890625, -11.57958984375, -10.6962890625, -9.81298828125, -8.9296875, -8.04638671875, -7.1630859375, -6.27978515625, -5.396484375, -4.51318359375, -3.6298828125, -2.74658203125, -1.86328125, -0.97998046875, -0.0966796875, 0.78662109375, 1.669921875, 2.55322265625, 3.4365234375, 4.31982421875, 5.203125, 6.08642578125, 6.9697265625, 7.85302734375, 8.736328125, 9.61962890625, 10.5029296875, 11.38623046875, 12.26953125, 13.15283203125, 14.0361328125, 14.91943359375, 15.802734375, 16.68603515625, 17.5693359375, 18.45263671875, 19.3359375, 20.21923828125, 21.1025390625, 21.98583984375, 22.869140625, 23.75244140625, 24.6357421875, 25.51904296875, 26.40234375, 27.28564453125, 28.1689453125, 29.05224609375, 29.935546875, 30.81884765625, 31.7021484375, 32.58544921875, 33.46875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 10.0, 14.0, 31.0, 49.0, 122.0, 179.0, 303.0, 506.0, 859.0, 1540.0, 2595.0, 4234.0, 7011.0, 11582.0, 18833.0, 30727.0, 48609.0, 75441.0, 112061.0, 163805.0, 226164.0, 297436.0, 367285.0, 422619.0, 446963.0, 433793.0, 389725.0, 324624.0, 251985.0, 185977.0, 129857.0, 87626.0, 57256.0, 36717.0, 22802.0, 13851.0, 8447.0, 5175.0, 3044.0, 1886.0, 1057.0, 608.0, 364.0, 213.0, 122.0, 75.0, 53.0, 24.0, 19.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.0625, -21.3662109375, -20.669921875, -19.9736328125, -19.27734375, -18.5810546875, -17.884765625, -17.1884765625, -16.4921875, -15.7958984375, -15.099609375, -14.4033203125, -13.70703125, -13.0107421875, -12.314453125, -11.6181640625, -10.921875, -10.2255859375, -9.529296875, -8.8330078125, -8.13671875, -7.4404296875, -6.744140625, -6.0478515625, -5.3515625, -4.6552734375, -3.958984375, -3.2626953125, -2.56640625, -1.8701171875, -1.173828125, -0.4775390625, 0.21875, 0.9150390625, 1.611328125, 2.3076171875, 3.00390625, 3.7001953125, 4.396484375, 5.0927734375, 5.7890625, 6.4853515625, 7.181640625, 7.8779296875, 8.57421875, 9.2705078125, 9.966796875, 10.6630859375, 11.359375, 12.0556640625, 12.751953125, 13.4482421875, 14.14453125, 14.8408203125, 15.537109375, 16.2333984375, 16.9296875, 17.6259765625, 18.322265625, 19.0185546875, 19.71484375, 20.4111328125, 21.107421875, 21.8037109375, 22.5]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 1.0, 2.0, 4.0, 9.0, 7.0, 6.0, 27.0, 20.0, 32.0, 31.0, 42.0, 36.0, 80.0, 68.0, 84.0, 105.0, 119.0, 148.0, 151.0, 176.0, 194.0, 195.0, 207.0, 223.0, 200.0, 213.0, 204.0, 202.0, 170.0, 161.0, 140.0, 131.0, 112.0, 101.0, 110.0, 84.0, 51.0, 56.0, 29.0, 34.0, 25.0, 22.0, 12.0, 20.0, 13.0, 8.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6171875, -12.2391357421875, -11.861083984375, -11.4830322265625, -11.10498046875, -10.7269287109375, -10.348876953125, -9.9708251953125, -9.5927734375, -9.2147216796875, -8.836669921875, -8.4586181640625, -8.08056640625, -7.7025146484375, -7.324462890625, -6.9464111328125, -6.568359375, -6.1903076171875, -5.812255859375, -5.4342041015625, -5.05615234375, -4.6781005859375, -4.300048828125, -3.9219970703125, -3.5439453125, -3.1658935546875, -2.787841796875, -2.4097900390625, -2.03173828125, -1.6536865234375, -1.275634765625, -0.8975830078125, -0.51953125, -0.1414794921875, 0.236572265625, 0.6146240234375, 0.99267578125, 1.3707275390625, 1.748779296875, 2.1268310546875, 2.5048828125, 2.8829345703125, 3.260986328125, 3.6390380859375, 4.01708984375, 4.3951416015625, 4.773193359375, 5.1512451171875, 5.529296875, 5.9073486328125, 6.285400390625, 6.6634521484375, 7.04150390625, 7.4195556640625, 7.797607421875, 8.1756591796875, 8.5537109375, 8.9317626953125, 9.309814453125, 9.6878662109375, 10.06591796875, 10.4439697265625, 10.822021484375, 11.2000732421875, 11.578125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0, 4.0, 6.0, 7.0, 8.0, 6.0, 6.0, 12.0, 9.0, 22.0, 21.0, 20.0, 21.0, 26.0, 34.0, 34.0, 37.0, 36.0, 32.0, 38.0, 44.0, 48.0, 43.0, 42.0, 33.0, 46.0, 46.0, 28.0, 30.0, 29.0, 30.0, 12.0, 22.0, 22.0, 27.0, 12.0, 19.0, 11.0, 14.0, 8.0, 10.0, 14.0, 5.0, 7.0, 4.0, 4.0, 9.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.50648307800293, -23.714515686035156, -22.92254638671875, -22.130578994750977, -21.338611602783203, -20.54664421081543, -19.754674911499023, -18.96270751953125, -18.170740127563477, -17.378772735595703, -16.586803436279297, -15.794836044311523, -15.00286865234375, -14.21090030670166, -13.41893196105957, -12.626964569091797, -11.834996223449707, -11.043027877807617, -10.251060485839844, -9.459092140197754, -8.66712474822998, -7.875156402587891, -7.083188533782959, -6.291220664978027, -5.499252796173096, -4.707284927368164, -3.9153170585632324, -3.1233489513397217, -2.33138108253479, -1.5394132137298584, -0.7474451065063477, 0.044522762298583984, 0.8364906311035156, 1.6284584999084473, 2.420426368713379, 3.2123944759368896, 4.004362106323242, 4.796330451965332, 5.588298320770264, 6.380266189575195, 7.172234058380127, 7.964201927185059, 8.756170272827148, 9.548137664794922, 10.340106010437012, 11.132073402404785, 11.924041748046875, 12.716009140014648, 13.507977485656738, 14.299945831298828, 15.091913223266602, 15.883881568908691, 16.67584991455078, 17.467817306518555, 18.259784698486328, 19.051753997802734, 19.843721389770508, 20.63568878173828, 21.427658081054688, 22.21962547302246, 23.011592864990234, 23.803560256958008, 24.595529556274414, 25.387496948242188, 26.17946434020996]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 7.0, 7.0, 7.0, 14.0, 16.0, 22.0, 10.0, 16.0, 20.0, 14.0, 27.0, 17.0, 34.0, 39.0, 34.0, 30.0, 39.0, 31.0, 28.0, 43.0, 50.0, 36.0, 38.0, 33.0, 38.0, 49.0, 29.0, 45.0, 29.0, 24.0, 24.0, 32.0, 15.0, 13.0, 15.0, 13.0, 16.0, 10.0, 7.0, 8.0, 4.0, 5.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-31.261606216430664, -30.33831024169922, -29.415016174316406, -28.49172019958496, -27.56842613220215, -26.645130157470703, -25.72183609008789, -24.798540115356445, -23.875246047973633, -22.951950073242188, -22.028656005859375, -21.10536003112793, -20.182065963745117, -19.258769989013672, -18.33547592163086, -17.412179946899414, -16.48888397216797, -15.56558895111084, -14.642293930053711, -13.718998908996582, -12.795703887939453, -11.872407913208008, -10.949113845825195, -10.02581787109375, -9.102523803710938, -8.179228782653809, -7.25593376159668, -6.332638740539551, -5.409343719482422, -4.486048221588135, -3.562753200531006, -2.639458179473877, -1.7161636352539062, -0.7928685545921326, 0.1304265260696411, 1.0537216663360596, 1.9770166873931885, 2.9003119468688965, 3.8236069679260254, 4.746901988983154, 5.670197010040283, 6.593492031097412, 7.516787052154541, 8.440082550048828, 9.363377571105957, 10.286672592163086, 11.209967613220215, 12.133262634277344, 13.056557655334473, 13.979852676391602, 14.90314769744873, 15.82644271850586, 16.749738693237305, 17.673032760620117, 18.596328735351562, 19.519622802734375, 20.44291877746582, 21.366214752197266, 22.289508819580078, 23.212804794311523, 24.136098861694336, 25.05939483642578, 25.982688903808594, 26.90598487854004, 27.82927894592285]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 4.0, 0.0, 5.0, 1.0, 6.0, 9.0, 21.0, 27.0, 47.0, 80.0, 129.0, 185.0, 350.0, 545.0, 916.0, 1428.0, 2236.0, 3707.0, 5798.0, 9111.0, 13752.0, 20406.0, 29354.0, 41098.0, 54730.0, 70183.0, 85122.0, 95155.0, 102479.0, 101093.0, 93717.0, 81521.0, 66587.0, 51478.0, 38009.0, 26742.0, 18498.0, 12173.0, 7993.0, 5204.0, 3289.0, 2046.0, 1325.0, 794.0, 454.0, 293.0, 166.0, 116.0, 77.0, 47.0, 29.0, 14.0, 6.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.125, -7.85302734375, -7.5810546875, -7.30908203125, -7.037109375, -6.76513671875, -6.4931640625, -6.22119140625, -5.94921875, -5.67724609375, -5.4052734375, -5.13330078125, -4.861328125, -4.58935546875, -4.3173828125, -4.04541015625, -3.7734375, -3.50146484375, -3.2294921875, -2.95751953125, -2.685546875, -2.41357421875, -2.1416015625, -1.86962890625, -1.59765625, -1.32568359375, -1.0537109375, -0.78173828125, -0.509765625, -0.23779296875, 0.0341796875, 0.30615234375, 0.578125, 0.85009765625, 1.1220703125, 1.39404296875, 1.666015625, 1.93798828125, 2.2099609375, 2.48193359375, 2.75390625, 3.02587890625, 3.2978515625, 3.56982421875, 3.841796875, 4.11376953125, 4.3857421875, 4.65771484375, 4.9296875, 5.20166015625, 5.4736328125, 5.74560546875, 6.017578125, 6.28955078125, 6.5615234375, 6.83349609375, 7.10546875, 7.37744140625, 7.6494140625, 7.92138671875, 8.193359375, 8.46533203125, 8.7373046875, 9.00927734375, 9.28125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 7.0, 7.0, 7.0, 14.0, 18.0, 20.0, 12.0, 13.0, 21.0, 14.0, 29.0, 16.0, 35.0, 36.0, 34.0, 31.0, 36.0, 34.0, 27.0, 41.0, 53.0, 40.0, 33.0, 35.0, 39.0, 48.0, 27.0, 45.0, 32.0, 23.0, 28.0, 28.0, 16.0, 13.0, 14.0, 12.0, 16.0, 11.0, 7.0, 8.0, 3.0, 5.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-31.21875, -30.29150390625, -29.3642578125, -28.43701171875, -27.509765625, -26.58251953125, -25.6552734375, -24.72802734375, -23.80078125, -22.87353515625, -21.9462890625, -21.01904296875, -20.091796875, -19.16455078125, -18.2373046875, -17.31005859375, -16.3828125, -15.45556640625, -14.5283203125, -13.60107421875, -12.673828125, -11.74658203125, -10.8193359375, -9.89208984375, -8.96484375, -8.03759765625, -7.1103515625, -6.18310546875, -5.255859375, -4.32861328125, -3.4013671875, -2.47412109375, -1.546875, -0.61962890625, 0.3076171875, 1.23486328125, 2.162109375, 3.08935546875, 4.0166015625, 4.94384765625, 5.87109375, 6.79833984375, 7.7255859375, 8.65283203125, 9.580078125, 10.50732421875, 11.4345703125, 12.36181640625, 13.2890625, 14.21630859375, 15.1435546875, 16.07080078125, 16.998046875, 17.92529296875, 18.8525390625, 19.77978515625, 20.70703125, 21.63427734375, 22.5615234375, 23.48876953125, 24.416015625, 25.34326171875, 26.2705078125, 27.19775390625, 28.125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 10.0, 15.0, 21.0, 33.0, 62.0, 89.0, 142.0, 189.0, 311.0, 523.0, 873.0, 1320.0, 2159.0, 3508.0, 5757.0, 8922.0, 14705.0, 25572.0, 75338.0, 814052.0, 40477.0, 21018.0, 12672.0, 7763.0, 4864.0, 3079.0, 1958.0, 1213.0, 747.0, 471.0, 261.0, 162.0, 105.0, 63.0, 29.0, 27.0, 15.0, 18.0, 4.0, 5.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.703125, -29.7822265625, -28.861328125, -27.9404296875, -27.01953125, -26.0986328125, -25.177734375, -24.2568359375, -23.3359375, -22.4150390625, -21.494140625, -20.5732421875, -19.65234375, -18.7314453125, -17.810546875, -16.8896484375, -15.96875, -15.0478515625, -14.126953125, -13.2060546875, -12.28515625, -11.3642578125, -10.443359375, -9.5224609375, -8.6015625, -7.6806640625, -6.759765625, -5.8388671875, -4.91796875, -3.9970703125, -3.076171875, -2.1552734375, -1.234375, -0.3134765625, 0.607421875, 1.5283203125, 2.44921875, 3.3701171875, 4.291015625, 5.2119140625, 6.1328125, 7.0537109375, 7.974609375, 8.8955078125, 9.81640625, 10.7373046875, 11.658203125, 12.5791015625, 13.5, 14.4208984375, 15.341796875, 16.2626953125, 17.18359375, 18.1044921875, 19.025390625, 19.9462890625, 20.8671875, 21.7880859375, 22.708984375, 23.6298828125, 24.55078125, 25.4716796875, 26.392578125, 27.3134765625, 28.234375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 4.0, 5.0, 9.0, 10.0, 14.0, 15.0, 18.0, 18.0, 21.0, 27.0, 23.0, 27.0, 35.0, 41.0, 41.0, 37.0, 42.0, 40.0, 46.0, 45.0, 50.0, 43.0, 45.0, 38.0, 39.0, 38.0, 38.0, 27.0, 28.0, 28.0, 16.0, 24.0, 13.0, 14.0, 13.0, 5.0, 6.0, 3.0, 5.0, 5.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.765625, -24.0263671875, -23.287109375, -22.5478515625, -21.80859375, -21.0693359375, -20.330078125, -19.5908203125, -18.8515625, -18.1123046875, -17.373046875, -16.6337890625, -15.89453125, -15.1552734375, -14.416015625, -13.6767578125, -12.9375, -12.1982421875, -11.458984375, -10.7197265625, -9.98046875, -9.2412109375, -8.501953125, -7.7626953125, -7.0234375, -6.2841796875, -5.544921875, -4.8056640625, -4.06640625, -3.3271484375, -2.587890625, -1.8486328125, -1.109375, -0.3701171875, 0.369140625, 1.1083984375, 1.84765625, 2.5869140625, 3.326171875, 4.0654296875, 4.8046875, 5.5439453125, 6.283203125, 7.0224609375, 7.76171875, 8.5009765625, 9.240234375, 9.9794921875, 10.71875, 11.4580078125, 12.197265625, 12.9365234375, 13.67578125, 14.4150390625, 15.154296875, 15.8935546875, 16.6328125, 17.3720703125, 18.111328125, 18.8505859375, 19.58984375, 20.3291015625, 21.068359375, 21.8076171875, 22.546875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 6.0, 8.0, 15.0, 28.0, 32.0, 74.0, 59.0, 110.0, 156.0, 259.0, 391.0, 678.0, 1100.0, 1723.0, 2762.0, 4738.0, 7915.0, 13512.0, 24379.0, 75956.0, 804961.0, 56194.0, 22403.0, 12406.0, 7333.0, 4377.0, 2617.0, 1618.0, 996.0, 616.0, 403.0, 239.0, 159.0, 95.0, 85.0, 47.0, 25.0, 23.0, 14.0, 14.0, 11.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.232421875, -2.1656494140625, -2.098876953125, -2.0321044921875, -1.96533203125, -1.8985595703125, -1.831787109375, -1.7650146484375, -1.6982421875, -1.6314697265625, -1.564697265625, -1.4979248046875, -1.43115234375, -1.3643798828125, -1.297607421875, -1.2308349609375, -1.1640625, -1.0972900390625, -1.030517578125, -0.9637451171875, -0.89697265625, -0.8302001953125, -0.763427734375, -0.6966552734375, -0.6298828125, -0.5631103515625, -0.496337890625, -0.4295654296875, -0.36279296875, -0.2960205078125, -0.229248046875, -0.1624755859375, -0.095703125, -0.0289306640625, 0.037841796875, 0.1046142578125, 0.17138671875, 0.2381591796875, 0.304931640625, 0.3717041015625, 0.4384765625, 0.5052490234375, 0.572021484375, 0.6387939453125, 0.70556640625, 0.7723388671875, 0.839111328125, 0.9058837890625, 0.97265625, 1.0394287109375, 1.106201171875, 1.1729736328125, 1.23974609375, 1.3065185546875, 1.373291015625, 1.4400634765625, 1.5068359375, 1.5736083984375, 1.640380859375, 1.7071533203125, 1.77392578125, 1.8406982421875, 1.907470703125, 1.9742431640625, 2.041015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 6.0, 6.0, 5.0, 7.0, 7.0, 14.0, 16.0, 21.0, 16.0, 22.0, 27.0, 27.0, 53.0, 49.0, 63.0, 59.0, 54.0, 53.0, 67.0, 43.0, 52.0, 56.0, 44.0, 35.0, 43.0, 29.0, 19.0, 26.0, 19.0, 16.0, 13.0, 8.0, 6.0, 2.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00029659271240234375, -0.00028759241104125977, -0.0002785921096801758, -0.0002695918083190918, -0.0002605915069580078, -0.00025159120559692383, -0.00024259090423583984, -0.00023359060287475586, -0.00022459030151367188, -0.0002155900001525879, -0.0002065896987915039, -0.00019758939743041992, -0.00018858909606933594, -0.00017958879470825195, -0.00017058849334716797, -0.00016158819198608398, -0.000152587890625, -0.00014358758926391602, -0.00013458728790283203, -0.00012558698654174805, -0.00011658668518066406, -0.00010758638381958008, -9.85860824584961e-05, -8.958578109741211e-05, -8.058547973632812e-05, -7.158517837524414e-05, -6.258487701416016e-05, -5.358457565307617e-05, -4.458427429199219e-05, -3.55839729309082e-05, -2.658367156982422e-05, -1.7583370208740234e-05, -8.58306884765625e-06, 4.172325134277344e-07, 9.417533874511719e-06, 1.8417835235595703e-05, 2.7418136596679688e-05, 3.641843795776367e-05, 4.5418739318847656e-05, 5.441904067993164e-05, 6.341934204101562e-05, 7.241964340209961e-05, 8.14199447631836e-05, 9.042024612426758e-05, 9.942054748535156e-05, 0.00010842084884643555, 0.00011742115020751953, 0.00012642145156860352, 0.0001354217529296875, 0.00014442205429077148, 0.00015342235565185547, 0.00016242265701293945, 0.00017142295837402344, 0.00018042325973510742, 0.0001894235610961914, 0.0001984238624572754, 0.00020742416381835938, 0.00021642446517944336, 0.00022542476654052734, 0.00023442506790161133, 0.0002434253692626953, 0.0002524256706237793, 0.0002614259719848633, 0.00027042627334594727, 0.00027942657470703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 0.0, 2.0, 15.0, 12.0, 19.0, 37.0, 68.0, 81.0, 127.0, 239.0, 326.0, 541.0, 842.0, 1297.0, 2161.0, 3351.0, 5727.0, 9316.0, 15786.0, 25619.0, 41143.0, 62719.0, 89589.0, 116459.0, 135683.0, 137695.0, 121176.0, 94915.0, 67181.0, 44691.0, 27947.0, 16998.0, 10488.0, 6352.0, 3790.0, 2258.0, 1412.0, 885.0, 589.0, 387.0, 228.0, 143.0, 86.0, 63.0, 47.0, 31.0, 12.0, 13.0, 9.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.1240234375, -1.090057373046875, -1.05609130859375, -1.022125244140625, -0.9881591796875, -0.954193115234375, -0.92022705078125, -0.886260986328125, -0.852294921875, -0.818328857421875, -0.78436279296875, -0.750396728515625, -0.7164306640625, -0.682464599609375, -0.64849853515625, -0.614532470703125, -0.58056640625, -0.546600341796875, -0.51263427734375, -0.478668212890625, -0.4447021484375, -0.410736083984375, -0.37677001953125, -0.342803955078125, -0.308837890625, -0.274871826171875, -0.24090576171875, -0.206939697265625, -0.1729736328125, -0.139007568359375, -0.10504150390625, -0.071075439453125, -0.037109375, -0.003143310546875, 0.03082275390625, 0.064788818359375, 0.0987548828125, 0.132720947265625, 0.16668701171875, 0.200653076171875, 0.234619140625, 0.268585205078125, 0.30255126953125, 0.336517333984375, 0.3704833984375, 0.404449462890625, 0.43841552734375, 0.472381591796875, 0.50634765625, 0.540313720703125, 0.57427978515625, 0.608245849609375, 0.6422119140625, 0.676177978515625, 0.71014404296875, 0.744110107421875, 0.778076171875, 0.812042236328125, 0.84600830078125, 0.879974365234375, 0.9139404296875, 0.947906494140625, 0.98187255859375, 1.015838623046875, 1.0498046875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 9.0, 7.0, 7.0, 13.0, 11.0, 8.0, 22.0, 16.0, 18.0, 30.0, 32.0, 28.0, 45.0, 30.0, 51.0, 40.0, 47.0, 41.0, 34.0, 48.0, 58.0, 49.0, 38.0, 45.0, 32.0, 33.0, 26.0, 26.0, 29.0, 20.0, 19.0, 12.0, 14.0, 10.0, 16.0, 9.0, 4.0, 12.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.40478515625, -0.3917884826660156, -0.37879180908203125, -0.3657951354980469, -0.3527984619140625, -0.3398017883300781, -0.32680511474609375, -0.3138084411621094, -0.300811767578125, -0.2878150939941406, -0.27481842041015625, -0.2618217468261719, -0.2488250732421875, -0.23582839965820312, -0.22283172607421875, -0.20983505249023438, -0.19683837890625, -0.18384170532226562, -0.17084503173828125, -0.15784835815429688, -0.1448516845703125, -0.13185501098632812, -0.11885833740234375, -0.10586166381835938, -0.092864990234375, -0.07986831665039062, -0.06687164306640625, -0.053874969482421875, -0.0408782958984375, -0.027881622314453125, -0.01488494873046875, -0.001888275146484375, 0.0111083984375, 0.024105072021484375, 0.03710174560546875, 0.050098419189453125, 0.0630950927734375, 0.07609176635742188, 0.08908843994140625, 0.10208511352539062, 0.115081787109375, 0.12807846069335938, 0.14107513427734375, 0.15407180786132812, 0.1670684814453125, 0.18006515502929688, 0.19306182861328125, 0.20605850219726562, 0.21905517578125, 0.23205184936523438, 0.24504852294921875, 0.2580451965332031, 0.2710418701171875, 0.2840385437011719, 0.29703521728515625, 0.3100318908691406, 0.323028564453125, 0.3360252380371094, 0.34902191162109375, 0.3620185852050781, 0.3750152587890625, 0.3880119323730469, 0.40100860595703125, 0.4140052795410156, 0.427001953125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 6.0, 7.0, 5.0, 15.0, 14.0, 15.0, 14.0, 27.0, 18.0, 25.0, 34.0, 33.0, 36.0, 37.0, 38.0, 30.0, 40.0, 53.0, 44.0, 41.0, 34.0, 42.0, 41.0, 36.0, 26.0, 28.0, 28.0, 26.0, 21.0, 18.0, 20.0, 20.0, 18.0, 16.0, 10.0, 12.0, 12.0, 10.0, 7.0, 8.0, 5.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.580408096313477, -23.788970947265625, -22.997535705566406, -22.206098556518555, -21.414661407470703, -20.623226165771484, -19.831789016723633, -19.04035186767578, -18.248916625976562, -17.45747947692871, -16.666044235229492, -15.87460708618164, -15.083169937133789, -14.291733741760254, -13.500297546386719, -12.708860397338867, -11.917423248291016, -11.12598705291748, -10.334549903869629, -9.543113708496094, -8.751676559448242, -7.960240364074707, -7.168804168701172, -6.3773674964904785, -5.585930824279785, -4.794494152069092, -4.003057479858398, -3.2116212844848633, -2.42018461227417, -1.6287479400634766, -0.8373117446899414, -0.04587507247924805, 0.7455615997314453, 1.5369981527328491, 2.328434705734253, 3.119871139526367, 3.9113078117370605, 4.702744483947754, 5.494180679321289, 6.285617351531982, 7.077054023742676, 7.868490695953369, 8.659927368164062, 9.451363563537598, 10.242799758911133, 11.034236907958984, 11.82567310333252, 12.617109298706055, 13.408546447753906, 14.199982643127441, 14.991419792175293, 15.782855987548828, 16.57429313659668, 17.36573028564453, 18.15716552734375, 18.9486026763916, 19.740039825439453, 20.531476974487305, 21.322912216186523, 22.114349365234375, 22.905786514282227, 23.697223663330078, 24.488658905029297, 25.28009605407715, 26.071531295776367]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 6.0, 6.0, 7.0, 6.0, 11.0, 18.0, 14.0, 19.0, 10.0, 16.0, 22.0, 21.0, 24.0, 20.0, 41.0, 33.0, 38.0, 32.0, 34.0, 28.0, 31.0, 50.0, 45.0, 42.0, 35.0, 34.0, 52.0, 31.0, 39.0, 35.0, 26.0, 25.0, 26.0, 25.0, 11.0, 18.0, 12.0, 18.0, 5.0, 10.0, 8.0, 6.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-30.796035766601562, -29.865793228149414, -28.935548782348633, -28.005306243896484, -27.075063705444336, -26.144821166992188, -25.214576721191406, -24.284334182739258, -23.35409164428711, -22.42384910583496, -21.49360466003418, -20.56336212158203, -19.633119583129883, -18.702877044677734, -17.772632598876953, -16.842390060424805, -15.91214656829834, -14.981903076171875, -14.051660537719727, -13.121417045593262, -12.191174507141113, -11.260931015014648, -10.3306884765625, -9.400444984436035, -8.47020149230957, -7.539958477020264, -6.609715461730957, -5.679471969604492, -4.749229431152344, -3.818985939025879, -2.8887429237365723, -1.9584999084472656, -1.0282573699951172, -0.09801429510116577, 0.8322287797927856, 1.7624719142913818, 2.6927149295806885, 3.622958183288574, 4.553201198577881, 5.4834442138671875, 6.413687229156494, 7.343930244445801, 8.274173736572266, 9.204416275024414, 10.134659767150879, 11.064903259277344, 11.995145797729492, 12.92538833618164, 13.855631828308105, 14.78587532043457, 15.716117858886719, 16.646360397338867, 17.57660484313965, 18.506847381591797, 19.437089920043945, 20.367332458496094, 21.297576904296875, 22.227819442749023, 23.158063888549805, 24.088306427001953, 25.0185489654541, 25.94879150390625, 26.87903594970703, 27.80927848815918, 28.739521026611328]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 8.0, 7.0, 13.0, 20.0, 22.0, 40.0, 63.0, 88.0, 144.0, 234.0, 443.0, 634.0, 1064.0, 1893.0, 3125.0, 5314.0, 8912.0, 14609.0, 23395.0, 35884.0, 52248.0, 71800.0, 92497.0, 108848.0, 118444.0, 116577.0, 105181.0, 87227.0, 66631.0, 48110.0, 32153.0, 20746.0, 12908.0, 7816.0, 4735.0, 2798.0, 1572.0, 871.0, 553.0, 311.0, 201.0, 159.0, 86.0, 55.0, 40.0, 33.0, 22.0, 12.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-23.734375, -22.965576171875, -22.19677734375, -21.427978515625, -20.6591796875, -19.890380859375, -19.12158203125, -18.352783203125, -17.583984375, -16.815185546875, -16.04638671875, -15.277587890625, -14.5087890625, -13.739990234375, -12.97119140625, -12.202392578125, -11.43359375, -10.664794921875, -9.89599609375, -9.127197265625, -8.3583984375, -7.589599609375, -6.82080078125, -6.052001953125, -5.283203125, -4.514404296875, -3.74560546875, -2.976806640625, -2.2080078125, -1.439208984375, -0.67041015625, 0.098388671875, 0.8671875, 1.635986328125, 2.40478515625, 3.173583984375, 3.9423828125, 4.711181640625, 5.47998046875, 6.248779296875, 7.017578125, 7.786376953125, 8.55517578125, 9.323974609375, 10.0927734375, 10.861572265625, 11.63037109375, 12.399169921875, 13.16796875, 13.936767578125, 14.70556640625, 15.474365234375, 16.2431640625, 17.011962890625, 17.78076171875, 18.549560546875, 19.318359375, 20.087158203125, 20.85595703125, 21.624755859375, 22.3935546875, 23.162353515625, 23.93115234375, 24.699951171875, 25.46875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 7.0, 4.0, 11.0, 3.0, 17.0, 11.0, 17.0, 21.0, 9.0, 19.0, 18.0, 26.0, 23.0, 22.0, 42.0, 30.0, 43.0, 29.0, 33.0, 26.0, 38.0, 51.0, 43.0, 37.0, 37.0, 34.0, 52.0, 30.0, 40.0, 32.0, 22.0, 27.0, 26.0, 22.0, 14.0, 15.0, 15.0, 15.0, 7.0, 8.0, 8.0, 4.0, 6.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-29.25, -28.359130859375, -27.46826171875, -26.577392578125, -25.6865234375, -24.795654296875, -23.90478515625, -23.013916015625, -22.123046875, -21.232177734375, -20.34130859375, -19.450439453125, -18.5595703125, -17.668701171875, -16.77783203125, -15.886962890625, -14.99609375, -14.105224609375, -13.21435546875, -12.323486328125, -11.4326171875, -10.541748046875, -9.65087890625, -8.760009765625, -7.869140625, -6.978271484375, -6.08740234375, -5.196533203125, -4.3056640625, -3.414794921875, -2.52392578125, -1.633056640625, -0.7421875, 0.148681640625, 1.03955078125, 1.930419921875, 2.8212890625, 3.712158203125, 4.60302734375, 5.493896484375, 6.384765625, 7.275634765625, 8.16650390625, 9.057373046875, 9.9482421875, 10.839111328125, 11.72998046875, 12.620849609375, 13.51171875, 14.402587890625, 15.29345703125, 16.184326171875, 17.0751953125, 17.966064453125, 18.85693359375, 19.747802734375, 20.638671875, 21.529541015625, 22.42041015625, 23.311279296875, 24.2021484375, 25.093017578125, 25.98388671875, 26.874755859375, 27.765625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 4.0, 6.0, 13.0, 17.0, 24.0, 37.0, 65.0, 118.0, 163.0, 235.0, 401.0, 643.0, 1021.0, 1649.0, 2351.0, 3621.0, 5174.0, 7801.0, 11203.0, 16176.0, 22714.0, 31339.0, 40942.0, 53423.0, 65640.0, 77534.0, 87013.0, 92383.0, 91937.0, 87146.0, 77870.0, 66616.0, 53888.0, 42030.0, 31734.0, 23291.0, 16577.0, 11878.0, 8043.0, 5466.0, 3577.0, 2395.0, 1556.0, 999.0, 665.0, 430.0, 274.0, 202.0, 101.0, 65.0, 44.0, 25.0, 18.0, 13.0, 11.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.0625, -18.4482421875, -17.833984375, -17.2197265625, -16.60546875, -15.9912109375, -15.376953125, -14.7626953125, -14.1484375, -13.5341796875, -12.919921875, -12.3056640625, -11.69140625, -11.0771484375, -10.462890625, -9.8486328125, -9.234375, -8.6201171875, -8.005859375, -7.3916015625, -6.77734375, -6.1630859375, -5.548828125, -4.9345703125, -4.3203125, -3.7060546875, -3.091796875, -2.4775390625, -1.86328125, -1.2490234375, -0.634765625, -0.0205078125, 0.59375, 1.2080078125, 1.822265625, 2.4365234375, 3.05078125, 3.6650390625, 4.279296875, 4.8935546875, 5.5078125, 6.1220703125, 6.736328125, 7.3505859375, 7.96484375, 8.5791015625, 9.193359375, 9.8076171875, 10.421875, 11.0361328125, 11.650390625, 12.2646484375, 12.87890625, 13.4931640625, 14.107421875, 14.7216796875, 15.3359375, 15.9501953125, 16.564453125, 17.1787109375, 17.79296875, 18.4072265625, 19.021484375, 19.6357421875, 20.25]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 5.0, 3.0, 5.0, 8.0, 8.0, 13.0, 11.0, 15.0, 22.0, 22.0, 14.0, 27.0, 27.0, 27.0, 37.0, 32.0, 41.0, 40.0, 37.0, 49.0, 54.0, 41.0, 51.0, 40.0, 43.0, 33.0, 36.0, 30.0, 25.0, 26.0, 29.0, 30.0, 16.0, 25.0, 24.0, 11.0, 11.0, 10.0, 7.0, 5.0, 4.0, 1.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-21.4375, -20.835205078125, -20.23291015625, -19.630615234375, -19.0283203125, -18.426025390625, -17.82373046875, -17.221435546875, -16.619140625, -16.016845703125, -15.41455078125, -14.812255859375, -14.2099609375, -13.607666015625, -13.00537109375, -12.403076171875, -11.80078125, -11.198486328125, -10.59619140625, -9.993896484375, -9.3916015625, -8.789306640625, -8.18701171875, -7.584716796875, -6.982421875, -6.380126953125, -5.77783203125, -5.175537109375, -4.5732421875, -3.970947265625, -3.36865234375, -2.766357421875, -2.1640625, -1.561767578125, -0.95947265625, -0.357177734375, 0.2451171875, 0.847412109375, 1.44970703125, 2.052001953125, 2.654296875, 3.256591796875, 3.85888671875, 4.461181640625, 5.0634765625, 5.665771484375, 6.26806640625, 6.870361328125, 7.47265625, 8.074951171875, 8.67724609375, 9.279541015625, 9.8818359375, 10.484130859375, 11.08642578125, 11.688720703125, 12.291015625, 12.893310546875, 13.49560546875, 14.097900390625, 14.7001953125, 15.302490234375, 15.90478515625, 16.507080078125, 17.109375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 1.0, 6.0, 10.0, 13.0, 12.0, 26.0, 27.0, 62.0, 64.0, 105.0, 164.0, 238.0, 340.0, 524.0, 836.0, 1196.0, 1815.0, 2724.0, 4223.0, 6355.0, 9736.0, 14742.0, 22239.0, 32447.0, 46475.0, 63540.0, 82739.0, 99778.0, 110978.0, 112938.0, 104862.0, 90385.0, 71569.0, 52575.0, 37600.0, 25996.0, 17302.0, 11508.0, 7660.0, 5028.0, 3276.0, 2202.0, 1429.0, 937.0, 629.0, 401.0, 255.0, 187.0, 130.0, 77.0, 73.0, 45.0, 29.0, 13.0, 13.0, 10.0, 9.0, 7.0, 4.0, 4.0], "bins": [-8.84375, -8.577392578125, -8.31103515625, -8.044677734375, -7.7783203125, -7.511962890625, -7.24560546875, -6.979248046875, -6.712890625, -6.446533203125, -6.18017578125, -5.913818359375, -5.6474609375, -5.381103515625, -5.11474609375, -4.848388671875, -4.58203125, -4.315673828125, -4.04931640625, -3.782958984375, -3.5166015625, -3.250244140625, -2.98388671875, -2.717529296875, -2.451171875, -2.184814453125, -1.91845703125, -1.652099609375, -1.3857421875, -1.119384765625, -0.85302734375, -0.586669921875, -0.3203125, -0.053955078125, 0.21240234375, 0.478759765625, 0.7451171875, 1.011474609375, 1.27783203125, 1.544189453125, 1.810546875, 2.076904296875, 2.34326171875, 2.609619140625, 2.8759765625, 3.142333984375, 3.40869140625, 3.675048828125, 3.94140625, 4.207763671875, 4.47412109375, 4.740478515625, 5.0068359375, 5.273193359375, 5.53955078125, 5.805908203125, 6.072265625, 6.338623046875, 6.60498046875, 6.871337890625, 7.1376953125, 7.404052734375, 7.67041015625, 7.936767578125, 8.203125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 9.0, 7.0, 3.0, 8.0, 17.0, 10.0, 22.0, 25.0, 18.0, 29.0, 36.0, 40.0, 43.0, 43.0, 49.0, 54.0, 51.0, 40.0, 52.0, 38.0, 47.0, 41.0, 47.0, 38.0, 35.0, 29.0, 21.0, 30.0, 19.0, 11.0, 25.0, 11.0, 6.0, 11.0, 4.0, 4.0, 3.0, 8.0, 1.0, 6.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00122833251953125, -0.0011920034885406494, -0.0011556744575500488, -0.0011193454265594482, -0.0010830163955688477, -0.001046687364578247, -0.0010103583335876465, -0.0009740293025970459, -0.0009377002716064453, -0.0009013712406158447, -0.0008650422096252441, -0.0008287131786346436, -0.000792384147644043, -0.0007560551166534424, -0.0007197260856628418, -0.0006833970546722412, -0.0006470680236816406, -0.00061073899269104, -0.0005744099617004395, -0.0005380809307098389, -0.0005017518997192383, -0.0004654228687286377, -0.0004290938377380371, -0.0003927648067474365, -0.00035643577575683594, -0.00032010674476623535, -0.00028377771377563477, -0.0002474486827850342, -0.0002111196517944336, -0.000174790620803833, -0.00013846158981323242, -0.00010213255882263184, -6.580352783203125e-05, -2.9474496841430664e-05, 6.854534149169922e-06, 4.318356513977051e-05, 7.95125961303711e-05, 0.00011584162712097168, 0.00015217065811157227, 0.00018849968910217285, 0.00022482872009277344, 0.000261157751083374, 0.0002974867820739746, 0.0003338158130645752, 0.0003701448440551758, 0.00040647387504577637, 0.00044280290603637695, 0.00047913193702697754, 0.0005154609680175781, 0.0005517899990081787, 0.0005881190299987793, 0.0006244480609893799, 0.0006607770919799805, 0.0006971061229705811, 0.0007334351539611816, 0.0007697641849517822, 0.0008060932159423828, 0.0008424222469329834, 0.000878751277923584, 0.0009150803089141846, 0.0009514093399047852, 0.0009877383708953857, 0.0010240674018859863, 0.001060396432876587, 0.0010967254638671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 6.0, 10.0, 20.0, 35.0, 57.0, 97.0, 134.0, 245.0, 399.0, 623.0, 1070.0, 1654.0, 2775.0, 4563.0, 7291.0, 11522.0, 18153.0, 27809.0, 40453.0, 56843.0, 76262.0, 94356.0, 109052.0, 115398.0, 111028.0, 98355.0, 80353.0, 61291.0, 43898.0, 30367.0, 20155.0, 12867.0, 8276.0, 5130.0, 3157.0, 1897.0, 1168.0, 700.0, 428.0, 253.0, 169.0, 93.0, 53.0, 35.0, 24.0, 16.0, 8.0, 2.0, 7.0, 0.0, 1.0, 2.0], "bins": [-9.7890625, -9.51422119140625, -9.2393798828125, -8.96453857421875, -8.689697265625, -8.41485595703125, -8.1400146484375, -7.86517333984375, -7.59033203125, -7.31549072265625, -7.0406494140625, -6.76580810546875, -6.490966796875, -6.21612548828125, -5.9412841796875, -5.66644287109375, -5.3916015625, -5.11676025390625, -4.8419189453125, -4.56707763671875, -4.292236328125, -4.01739501953125, -3.7425537109375, -3.46771240234375, -3.19287109375, -2.91802978515625, -2.6431884765625, -2.36834716796875, -2.093505859375, -1.81866455078125, -1.5438232421875, -1.26898193359375, -0.994140625, -0.71929931640625, -0.4444580078125, -0.16961669921875, 0.105224609375, 0.38006591796875, 0.6549072265625, 0.92974853515625, 1.20458984375, 1.47943115234375, 1.7542724609375, 2.02911376953125, 2.303955078125, 2.57879638671875, 2.8536376953125, 3.12847900390625, 3.4033203125, 3.67816162109375, 3.9530029296875, 4.22784423828125, 4.502685546875, 4.77752685546875, 5.0523681640625, 5.32720947265625, 5.60205078125, 5.87689208984375, 6.1517333984375, 6.42657470703125, 6.701416015625, 6.97625732421875, 7.2510986328125, 7.52593994140625, 7.80078125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 7.0, 2.0, 7.0, 6.0, 8.0, 9.0, 14.0, 21.0, 15.0, 21.0, 19.0, 32.0, 32.0, 36.0, 38.0, 42.0, 43.0, 48.0, 43.0, 54.0, 52.0, 55.0, 45.0, 53.0, 55.0, 29.0, 45.0, 23.0, 26.0, 15.0, 17.0, 22.0, 12.0, 12.0, 9.0, 6.0, 3.0, 3.0, 2.0, 5.0, 2.0, 9.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.19140625, -4.05523681640625, -3.9190673828125, -3.78289794921875, -3.646728515625, -3.51055908203125, -3.3743896484375, -3.23822021484375, -3.10205078125, -2.96588134765625, -2.8297119140625, -2.69354248046875, -2.557373046875, -2.42120361328125, -2.2850341796875, -2.14886474609375, -2.0126953125, -1.87652587890625, -1.7403564453125, -1.60418701171875, -1.468017578125, -1.33184814453125, -1.1956787109375, -1.05950927734375, -0.92333984375, -0.78717041015625, -0.6510009765625, -0.51483154296875, -0.378662109375, -0.24249267578125, -0.1063232421875, 0.02984619140625, 0.166015625, 0.30218505859375, 0.4383544921875, 0.57452392578125, 0.710693359375, 0.84686279296875, 0.9830322265625, 1.11920166015625, 1.25537109375, 1.39154052734375, 1.5277099609375, 1.66387939453125, 1.800048828125, 1.93621826171875, 2.0723876953125, 2.20855712890625, 2.3447265625, 2.48089599609375, 2.6170654296875, 2.75323486328125, 2.889404296875, 3.02557373046875, 3.1617431640625, 3.29791259765625, 3.43408203125, 3.57025146484375, 3.7064208984375, 3.84259033203125, 3.978759765625, 4.11492919921875, 4.2510986328125, 4.38726806640625, 4.5234375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 4.0, 5.0, 11.0, 7.0, 3.0, 20.0, 16.0, 17.0, 19.0, 17.0, 26.0, 31.0, 30.0, 35.0, 35.0, 37.0, 38.0, 31.0, 42.0, 43.0, 45.0, 51.0, 50.0, 41.0, 45.0, 27.0, 40.0, 24.0, 23.0, 36.0, 28.0, 10.0, 16.0, 15.0, 12.0, 11.0, 14.0, 11.0, 11.0, 6.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.628761291503906, -26.781553268432617, -25.934343338012695, -25.087135314941406, -24.239925384521484, -23.392717361450195, -22.545509338378906, -21.698299407958984, -20.851089477539062, -20.003881454467773, -19.15667152404785, -18.309463500976562, -17.46225357055664, -16.61504554748535, -15.767836570739746, -14.92062759399414, -14.073419570922852, -13.226210594177246, -12.37900161743164, -11.531793594360352, -10.68458366394043, -9.83737564086914, -8.990166664123535, -8.14295768737793, -7.295748710632324, -6.448539733886719, -5.601330757141113, -4.754122257232666, -3.9069132804870605, -3.059704303741455, -2.212495803833008, -1.3652868270874023, -0.5180759429931641, 0.32913291454315186, 1.1763417720794678, 2.023550510406494, 2.8707594871520996, 3.717968463897705, 4.565176963806152, 5.412385940551758, 6.259594917297363, 7.106803894042969, 7.954012870788574, 8.80122184753418, 9.648429870605469, 10.49563980102539, 11.34284782409668, 12.190056800842285, 13.03726577758789, 13.884474754333496, 14.731683731079102, 15.57889175415039, 16.426101684570312, 17.2733097076416, 18.12051773071289, 18.967727661132812, 19.814937591552734, 20.662145614624023, 21.509355545043945, 22.356563568115234, 23.203773498535156, 24.050981521606445, 24.898189544677734, 25.745399475097656, 26.592607498168945]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 7.0, 8.0, 5.0, 10.0, 11.0, 13.0, 18.0, 19.0, 22.0, 21.0, 16.0, 29.0, 30.0, 33.0, 23.0, 37.0, 39.0, 43.0, 43.0, 33.0, 40.0, 31.0, 41.0, 41.0, 40.0, 31.0, 36.0, 38.0, 30.0, 26.0, 28.0, 34.0, 14.0, 14.0, 16.0, 11.0, 14.0, 12.0, 11.0, 7.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-29.764745712280273, -28.830656051635742, -27.89656639099121, -26.96247673034668, -26.02838897705078, -25.09429931640625, -24.16020965576172, -23.226119995117188, -22.292030334472656, -21.357940673828125, -20.423851013183594, -19.489761352539062, -18.55567169189453, -17.62158203125, -16.6874942779541, -15.75340461730957, -14.819314956665039, -13.885225296020508, -12.951135635375977, -12.017046928405762, -11.08295726776123, -10.1488676071167, -9.214778900146484, -8.280689239501953, -7.346599578857422, -6.412509918212891, -5.478420734405518, -4.5443315505981445, -3.6102418899536133, -2.676152229309082, -1.742063045501709, -0.8079738616943359, 0.12611770629882812, 1.0602071285247803, 1.9942965507507324, 2.9283859729766846, 3.8624753952026367, 4.796565055847168, 5.730654239654541, 6.664743423461914, 7.598833084106445, 8.532922744750977, 9.467012405395508, 10.401101112365723, 11.335190773010254, 12.269280433654785, 13.203369140625, 14.137458801269531, 15.071548461914062, 16.005638122558594, 16.939727783203125, 17.873817443847656, 18.807907104492188, 19.74199676513672, 20.676084518432617, 21.61017417907715, 22.54426383972168, 23.47835350036621, 24.412443161010742, 25.346532821655273, 26.280620574951172, 27.214710235595703, 28.148799896240234, 29.082889556884766, 30.016979217529297]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 8.0, 13.0, 30.0, 44.0, 84.0, 130.0, 210.0, 397.0, 632.0, 1080.0, 1737.0, 2916.0, 4900.0, 8017.0, 13355.0, 21775.0, 34928.0, 56198.0, 87434.0, 133166.0, 193867.0, 271529.0, 353335.0, 427493.0, 472617.0, 472669.0, 430510.0, 357569.0, 274745.0, 197425.0, 135854.0, 89588.0, 57210.0, 36232.0, 22308.0, 13651.0, 8264.0, 4988.0, 3003.0, 1808.0, 1030.0, 650.0, 383.0, 207.0, 114.0, 67.0, 44.0, 24.0, 15.0, 16.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.0625, -20.40478515625, -19.7470703125, -19.08935546875, -18.431640625, -17.77392578125, -17.1162109375, -16.45849609375, -15.80078125, -15.14306640625, -14.4853515625, -13.82763671875, -13.169921875, -12.51220703125, -11.8544921875, -11.19677734375, -10.5390625, -9.88134765625, -9.2236328125, -8.56591796875, -7.908203125, -7.25048828125, -6.5927734375, -5.93505859375, -5.27734375, -4.61962890625, -3.9619140625, -3.30419921875, -2.646484375, -1.98876953125, -1.3310546875, -0.67333984375, -0.015625, 0.64208984375, 1.2998046875, 1.95751953125, 2.615234375, 3.27294921875, 3.9306640625, 4.58837890625, 5.24609375, 5.90380859375, 6.5615234375, 7.21923828125, 7.876953125, 8.53466796875, 9.1923828125, 9.85009765625, 10.5078125, 11.16552734375, 11.8232421875, 12.48095703125, 13.138671875, 13.79638671875, 14.4541015625, 15.11181640625, 15.76953125, 16.42724609375, 17.0849609375, 17.74267578125, 18.400390625, 19.05810546875, 19.7158203125, 20.37353515625, 21.03125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 6.0, 7.0, 10.0, 5.0, 11.0, 10.0, 12.0, 19.0, 19.0, 21.0, 19.0, 19.0, 22.0, 34.0, 31.0, 23.0, 34.0, 44.0, 36.0, 44.0, 35.0, 45.0, 35.0, 31.0, 35.0, 51.0, 28.0, 29.0, 44.0, 31.0, 30.0, 31.0, 23.0, 23.0, 11.0, 14.0, 14.0, 10.0, 19.0, 7.0, 11.0, 3.0, 6.0, 2.0, 6.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-26.015625, -25.201416015625, -24.38720703125, -23.572998046875, -22.7587890625, -21.944580078125, -21.13037109375, -20.316162109375, -19.501953125, -18.687744140625, -17.87353515625, -17.059326171875, -16.2451171875, -15.430908203125, -14.61669921875, -13.802490234375, -12.98828125, -12.174072265625, -11.35986328125, -10.545654296875, -9.7314453125, -8.917236328125, -8.10302734375, -7.288818359375, -6.474609375, -5.660400390625, -4.84619140625, -4.031982421875, -3.2177734375, -2.403564453125, -1.58935546875, -0.775146484375, 0.0390625, 0.853271484375, 1.66748046875, 2.481689453125, 3.2958984375, 4.110107421875, 4.92431640625, 5.738525390625, 6.552734375, 7.366943359375, 8.18115234375, 8.995361328125, 9.8095703125, 10.623779296875, 11.43798828125, 12.252197265625, 13.06640625, 13.880615234375, 14.69482421875, 15.509033203125, 16.3232421875, 17.137451171875, 17.95166015625, 18.765869140625, 19.580078125, 20.394287109375, 21.20849609375, 22.022705078125, 22.8369140625, 23.651123046875, 24.46533203125, 25.279541015625, 26.09375]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 8.0, 20.0, 25.0, 54.0, 76.0, 143.0, 231.0, 402.0, 655.0, 1154.0, 1975.0, 3346.0, 5519.0, 9072.0, 15003.0, 23880.0, 37452.0, 58011.0, 87649.0, 128097.0, 179854.0, 242047.0, 310599.0, 371804.0, 415509.0, 431050.0, 412445.0, 369045.0, 306511.0, 238996.0, 177742.0, 125792.0, 85945.0, 56954.0, 36751.0, 23614.0, 14559.0, 8925.0, 5368.0, 3342.0, 1908.0, 1114.0, 667.0, 435.0, 216.0, 130.0, 91.0, 45.0, 29.0, 12.0, 11.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-21.8125, -21.140869140625, -20.46923828125, -19.797607421875, -19.1259765625, -18.454345703125, -17.78271484375, -17.111083984375, -16.439453125, -15.767822265625, -15.09619140625, -14.424560546875, -13.7529296875, -13.081298828125, -12.40966796875, -11.738037109375, -11.06640625, -10.394775390625, -9.72314453125, -9.051513671875, -8.3798828125, -7.708251953125, -7.03662109375, -6.364990234375, -5.693359375, -5.021728515625, -4.35009765625, -3.678466796875, -3.0068359375, -2.335205078125, -1.66357421875, -0.991943359375, -0.3203125, 0.351318359375, 1.02294921875, 1.694580078125, 2.3662109375, 3.037841796875, 3.70947265625, 4.381103515625, 5.052734375, 5.724365234375, 6.39599609375, 7.067626953125, 7.7392578125, 8.410888671875, 9.08251953125, 9.754150390625, 10.42578125, 11.097412109375, 11.76904296875, 12.440673828125, 13.1123046875, 13.783935546875, 14.45556640625, 15.127197265625, 15.798828125, 16.470458984375, 17.14208984375, 17.813720703125, 18.4853515625, 19.156982421875, 19.82861328125, 20.500244140625, 21.171875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 10.0, 4.0, 7.0, 10.0, 20.0, 21.0, 30.0, 30.0, 43.0, 54.0, 77.0, 69.0, 89.0, 103.0, 126.0, 117.0, 131.0, 159.0, 170.0, 170.0, 183.0, 183.0, 194.0, 188.0, 201.0, 210.0, 165.0, 204.0, 164.0, 143.0, 110.0, 126.0, 85.0, 80.0, 74.0, 80.0, 53.0, 43.0, 38.0, 21.0, 22.0, 18.0, 12.0, 13.0, 12.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.8203125, -11.4708251953125, -11.121337890625, -10.7718505859375, -10.42236328125, -10.0728759765625, -9.723388671875, -9.3739013671875, -9.0244140625, -8.6749267578125, -8.325439453125, -7.9759521484375, -7.62646484375, -7.2769775390625, -6.927490234375, -6.5780029296875, -6.228515625, -5.8790283203125, -5.529541015625, -5.1800537109375, -4.83056640625, -4.4810791015625, -4.131591796875, -3.7821044921875, -3.4326171875, -3.0831298828125, -2.733642578125, -2.3841552734375, -2.03466796875, -1.6851806640625, -1.335693359375, -0.9862060546875, -0.63671875, -0.2872314453125, 0.062255859375, 0.4117431640625, 0.76123046875, 1.1107177734375, 1.460205078125, 1.8096923828125, 2.1591796875, 2.5086669921875, 2.858154296875, 3.2076416015625, 3.55712890625, 3.9066162109375, 4.256103515625, 4.6055908203125, 4.955078125, 5.3045654296875, 5.654052734375, 6.0035400390625, 6.35302734375, 6.7025146484375, 7.052001953125, 7.4014892578125, 7.7509765625, 8.1004638671875, 8.449951171875, 8.7994384765625, 9.14892578125, 9.4984130859375, 9.847900390625, 10.1973876953125, 10.546875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 3.0, 4.0, 5.0, 7.0, 8.0, 13.0, 14.0, 12.0, 17.0, 23.0, 23.0, 37.0, 25.0, 34.0, 28.0, 41.0, 39.0, 33.0, 45.0, 41.0, 46.0, 42.0, 40.0, 56.0, 31.0, 31.0, 36.0, 35.0, 28.0, 19.0, 35.0, 24.0, 26.0, 18.0, 12.0, 13.0, 18.0, 8.0, 4.0, 8.0, 12.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.142011642456055, -27.26846694946289, -26.394922256469727, -25.521377563476562, -24.6478328704834, -23.774288177490234, -22.900741577148438, -22.027196884155273, -21.15365219116211, -20.280107498168945, -19.40656280517578, -18.533018112182617, -17.659473419189453, -16.785926818847656, -15.912383079528809, -15.038837432861328, -14.16529369354248, -13.291749000549316, -12.418204307556152, -11.544658660888672, -10.671113967895508, -9.797569274902344, -8.92402458190918, -8.050479888916016, -7.176934719085693, -6.303390026092529, -5.429844856262207, -4.556300163269043, -3.6827552318573, -2.8092103004455566, -1.9356656074523926, -1.0621204376220703, -0.18857574462890625, 0.6849691271781921, 1.5585139989852905, 2.432058811187744, 3.3056037425994873, 4.1791486740112305, 5.0526933670043945, 5.926238536834717, 6.799783229827881, 7.673327922821045, 8.546873092651367, 9.420417785644531, 10.293962478637695, 11.16750717163086, 12.041051864624023, 12.914597511291504, 13.788142204284668, 14.661686897277832, 15.535231590270996, 16.408777236938477, 17.28232192993164, 18.155866622924805, 19.02941131591797, 19.902956008911133, 20.776500701904297, 21.65004539489746, 22.523590087890625, 23.39713478088379, 24.270679473876953, 25.14422607421875, 26.01776885986328, 26.891315460205078, 27.764860153198242]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 8.0, 7.0, 13.0, 12.0, 10.0, 12.0, 13.0, 18.0, 15.0, 24.0, 20.0, 22.0, 18.0, 24.0, 43.0, 30.0, 34.0, 34.0, 29.0, 32.0, 34.0, 31.0, 27.0, 45.0, 38.0, 39.0, 25.0, 27.0, 29.0, 35.0, 22.0, 25.0, 30.0, 27.0, 15.0, 25.0, 16.0, 13.0, 11.0, 14.0, 9.0, 9.0, 7.0, 4.0, 3.0, 3.0, 6.0, 1.0, 2.0, 6.0, 1.0, 2.0], "bins": [-27.159069061279297, -26.358509063720703, -25.557947158813477, -24.75738525390625, -23.956825256347656, -23.156265258789062, -22.355703353881836, -21.55514144897461, -20.754581451416016, -19.954021453857422, -19.153459548950195, -18.35289764404297, -17.552337646484375, -16.75177764892578, -15.951215744018555, -15.150654792785645, -14.350093841552734, -13.549532890319824, -12.748971939086914, -11.948410987854004, -11.147850036621094, -10.347289085388184, -9.546728134155273, -8.746167182922363, -7.945606231689453, -7.145045280456543, -6.344484329223633, -5.543923377990723, -4.7433624267578125, -3.9428014755249023, -3.142240524291992, -2.341679573059082, -1.5411205291748047, -0.7405595779418945, 0.060001373291015625, 0.8605623245239258, 1.661123275756836, 2.461684226989746, 3.2622451782226562, 4.062806129455566, 4.863367080688477, 5.663928031921387, 6.464488983154297, 7.265049934387207, 8.065610885620117, 8.866171836853027, 9.666732788085938, 10.467293739318848, 11.267854690551758, 12.068415641784668, 12.868976593017578, 13.669537544250488, 14.470098495483398, 15.270659446716309, 16.07122039794922, 16.871780395507812, 17.67234230041504, 18.472904205322266, 19.27346420288086, 20.074024200439453, 20.87458610534668, 21.675148010253906, 22.4757080078125, 23.276268005371094, 24.07682991027832]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 12.0, 7.0, 30.0, 28.0, 62.0, 77.0, 138.0, 249.0, 348.0, 595.0, 950.0, 1542.0, 2341.0, 3793.0, 6017.0, 8948.0, 13370.0, 19573.0, 28378.0, 38789.0, 51911.0, 66210.0, 80646.0, 91755.0, 98769.0, 99144.0, 93527.0, 82463.0, 68998.0, 54692.0, 41303.0, 30405.0, 21327.0, 14701.0, 9834.0, 6373.0, 4199.0, 2634.0, 1650.0, 1053.0, 645.0, 408.0, 251.0, 152.0, 91.0, 61.0, 48.0, 26.0, 9.0, 12.0, 10.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.90234375, -6.680419921875, -6.45849609375, -6.236572265625, -6.0146484375, -5.792724609375, -5.57080078125, -5.348876953125, -5.126953125, -4.905029296875, -4.68310546875, -4.461181640625, -4.2392578125, -4.017333984375, -3.79541015625, -3.573486328125, -3.3515625, -3.129638671875, -2.90771484375, -2.685791015625, -2.4638671875, -2.241943359375, -2.02001953125, -1.798095703125, -1.576171875, -1.354248046875, -1.13232421875, -0.910400390625, -0.6884765625, -0.466552734375, -0.24462890625, -0.022705078125, 0.19921875, 0.421142578125, 0.64306640625, 0.864990234375, 1.0869140625, 1.308837890625, 1.53076171875, 1.752685546875, 1.974609375, 2.196533203125, 2.41845703125, 2.640380859375, 2.8623046875, 3.084228515625, 3.30615234375, 3.528076171875, 3.75, 3.971923828125, 4.19384765625, 4.415771484375, 4.6376953125, 4.859619140625, 5.08154296875, 5.303466796875, 5.525390625, 5.747314453125, 5.96923828125, 6.191162109375, 6.4130859375, 6.635009765625, 6.85693359375, 7.078857421875, 7.30078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 10.0, 8.0, 6.0, 12.0, 16.0, 10.0, 10.0, 13.0, 18.0, 16.0, 23.0, 22.0, 22.0, 17.0, 24.0, 42.0, 34.0, 31.0, 33.0, 34.0, 29.0, 35.0, 30.0, 29.0, 45.0, 38.0, 35.0, 28.0, 26.0, 29.0, 35.0, 22.0, 27.0, 27.0, 25.0, 22.0, 20.0, 16.0, 13.0, 13.0, 10.0, 10.0, 8.0, 7.0, 3.0, 4.0, 3.0, 6.0, 1.0, 2.0, 6.0, 1.0, 2.0], "bins": [-27.15625, -26.353759765625, -25.55126953125, -24.748779296875, -23.9462890625, -23.143798828125, -22.34130859375, -21.538818359375, -20.736328125, -19.933837890625, -19.13134765625, -18.328857421875, -17.5263671875, -16.723876953125, -15.92138671875, -15.118896484375, -14.31640625, -13.513916015625, -12.71142578125, -11.908935546875, -11.1064453125, -10.303955078125, -9.50146484375, -8.698974609375, -7.896484375, -7.093994140625, -6.29150390625, -5.489013671875, -4.6865234375, -3.884033203125, -3.08154296875, -2.279052734375, -1.4765625, -0.674072265625, 0.12841796875, 0.930908203125, 1.7333984375, 2.535888671875, 3.33837890625, 4.140869140625, 4.943359375, 5.745849609375, 6.54833984375, 7.350830078125, 8.1533203125, 8.955810546875, 9.75830078125, 10.560791015625, 11.36328125, 12.165771484375, 12.96826171875, 13.770751953125, 14.5732421875, 15.375732421875, 16.17822265625, 16.980712890625, 17.783203125, 18.585693359375, 19.38818359375, 20.190673828125, 20.9931640625, 21.795654296875, 22.59814453125, 23.400634765625, 24.203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 8.0, 11.0, 28.0, 32.0, 46.0, 69.0, 136.0, 169.0, 292.0, 427.0, 732.0, 1111.0, 1718.0, 2583.0, 4042.0, 6141.0, 9645.0, 15375.0, 26537.0, 118180.0, 770764.0, 36438.0, 20252.0, 12329.0, 7640.0, 4859.0, 3191.0, 2038.0, 1353.0, 845.0, 574.0, 355.0, 252.0, 143.0, 82.0, 51.0, 36.0, 27.0, 19.0, 22.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.3125, -24.551025390625, -23.78955078125, -23.028076171875, -22.2666015625, -21.505126953125, -20.74365234375, -19.982177734375, -19.220703125, -18.459228515625, -17.69775390625, -16.936279296875, -16.1748046875, -15.413330078125, -14.65185546875, -13.890380859375, -13.12890625, -12.367431640625, -11.60595703125, -10.844482421875, -10.0830078125, -9.321533203125, -8.56005859375, -7.798583984375, -7.037109375, -6.275634765625, -5.51416015625, -4.752685546875, -3.9912109375, -3.229736328125, -2.46826171875, -1.706787109375, -0.9453125, -0.183837890625, 0.57763671875, 1.339111328125, 2.1005859375, 2.862060546875, 3.62353515625, 4.385009765625, 5.146484375, 5.907958984375, 6.66943359375, 7.430908203125, 8.1923828125, 8.953857421875, 9.71533203125, 10.476806640625, 11.23828125, 11.999755859375, 12.76123046875, 13.522705078125, 14.2841796875, 15.045654296875, 15.80712890625, 16.568603515625, 17.330078125, 18.091552734375, 18.85302734375, 19.614501953125, 20.3759765625, 21.137451171875, 21.89892578125, 22.660400390625, 23.421875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 10.0, 4.0, 4.0, 5.0, 8.0, 9.0, 13.0, 15.0, 20.0, 19.0, 16.0, 27.0, 36.0, 37.0, 33.0, 36.0, 28.0, 39.0, 31.0, 37.0, 37.0, 37.0, 43.0, 38.0, 40.0, 32.0, 43.0, 35.0, 50.0, 27.0, 31.0, 21.0, 24.0, 16.0, 25.0, 12.0, 10.0, 11.0, 8.0, 5.0, 11.0, 5.0, 2.0, 8.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.15625, -16.550048828125, -15.94384765625, -15.337646484375, -14.7314453125, -14.125244140625, -13.51904296875, -12.912841796875, -12.306640625, -11.700439453125, -11.09423828125, -10.488037109375, -9.8818359375, -9.275634765625, -8.66943359375, -8.063232421875, -7.45703125, -6.850830078125, -6.24462890625, -5.638427734375, -5.0322265625, -4.426025390625, -3.81982421875, -3.213623046875, -2.607421875, -2.001220703125, -1.39501953125, -0.788818359375, -0.1826171875, 0.423583984375, 1.02978515625, 1.635986328125, 2.2421875, 2.848388671875, 3.45458984375, 4.060791015625, 4.6669921875, 5.273193359375, 5.87939453125, 6.485595703125, 7.091796875, 7.697998046875, 8.30419921875, 8.910400390625, 9.5166015625, 10.122802734375, 10.72900390625, 11.335205078125, 11.94140625, 12.547607421875, 13.15380859375, 13.760009765625, 14.3662109375, 14.972412109375, 15.57861328125, 16.184814453125, 16.791015625, 17.397216796875, 18.00341796875, 18.609619140625, 19.2158203125, 19.822021484375, 20.42822265625, 21.034423828125, 21.640625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 10.0, 11.0, 12.0, 19.0, 16.0, 34.0, 40.0, 65.0, 97.0, 150.0, 231.0, 370.0, 631.0, 1036.0, 1631.0, 2620.0, 4606.0, 7728.0, 13949.0, 26168.0, 113989.0, 789849.0, 40477.0, 19088.0, 10433.0, 5995.0, 3615.0, 2204.0, 1283.0, 806.0, 530.0, 315.0, 175.0, 119.0, 84.0, 58.0, 38.0, 20.0, 19.0, 12.0, 9.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9345703125, -1.8726959228515625, -1.810821533203125, -1.7489471435546875, -1.68707275390625, -1.6251983642578125, -1.563323974609375, -1.5014495849609375, -1.4395751953125, -1.3777008056640625, -1.315826416015625, -1.2539520263671875, -1.19207763671875, -1.1302032470703125, -1.068328857421875, -1.0064544677734375, -0.944580078125, -0.8827056884765625, -0.820831298828125, -0.7589569091796875, -0.69708251953125, -0.6352081298828125, -0.573333740234375, -0.5114593505859375, -0.4495849609375, -0.3877105712890625, -0.325836181640625, -0.2639617919921875, -0.20208740234375, -0.1402130126953125, -0.078338623046875, -0.0164642333984375, 0.04541015625, 0.1072845458984375, 0.169158935546875, 0.2310333251953125, 0.29290771484375, 0.3547821044921875, 0.416656494140625, 0.4785308837890625, 0.5404052734375, 0.6022796630859375, 0.664154052734375, 0.7260284423828125, 0.78790283203125, 0.8497772216796875, 0.911651611328125, 0.9735260009765625, 1.035400390625, 1.0972747802734375, 1.159149169921875, 1.2210235595703125, 1.28289794921875, 1.3447723388671875, 1.406646728515625, 1.4685211181640625, 1.5303955078125, 1.5922698974609375, 1.654144287109375, 1.7160186767578125, 1.77789306640625, 1.8397674560546875, 1.901641845703125, 1.9635162353515625, 2.025390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 6.0, 1.0, 5.0, 2.0, 5.0, 10.0, 8.0, 14.0, 13.0, 26.0, 20.0, 33.0, 41.0, 38.0, 40.0, 34.0, 44.0, 51.0, 63.0, 53.0, 60.0, 56.0, 43.0, 53.0, 42.0, 47.0, 25.0, 32.0, 30.0, 23.0, 16.0, 11.0, 14.0, 8.0, 6.0, 2.0, 5.0, 6.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.00015807151794433594, -0.00015353411436080933, -0.00014899671077728271, -0.0001444593071937561, -0.0001399219036102295, -0.00013538450002670288, -0.00013084709644317627, -0.00012630969285964966, -0.00012177228927612305, -0.00011723488569259644, -0.00011269748210906982, -0.00010816007852554321, -0.0001036226749420166, -9.908527135848999e-05, -9.454786777496338e-05, -9.001046419143677e-05, -8.547306060791016e-05, -8.093565702438354e-05, -7.639825344085693e-05, -7.186084985733032e-05, -6.732344627380371e-05, -6.27860426902771e-05, -5.824863910675049e-05, -5.371123552322388e-05, -4.9173831939697266e-05, -4.4636428356170654e-05, -4.009902477264404e-05, -3.556162118911743e-05, -3.102421760559082e-05, -2.648681402206421e-05, -2.1949410438537598e-05, -1.7412006855010986e-05, -1.2874603271484375e-05, -8.337199687957764e-06, -3.7997961044311523e-06, 7.37607479095459e-07, 5.27501106262207e-06, 9.812414646148682e-06, 1.4349818229675293e-05, 1.8887221813201904e-05, 2.3424625396728516e-05, 2.7962028980255127e-05, 3.249943256378174e-05, 3.703683614730835e-05, 4.157423973083496e-05, 4.611164331436157e-05, 5.0649046897888184e-05, 5.5186450481414795e-05, 5.9723854064941406e-05, 6.426125764846802e-05, 6.879866123199463e-05, 7.333606481552124e-05, 7.787346839904785e-05, 8.241087198257446e-05, 8.694827556610107e-05, 9.148567914962769e-05, 9.60230827331543e-05, 0.00010056048631668091, 0.00010509788990020752, 0.00010963529348373413, 0.00011417269706726074, 0.00011871010065078735, 0.00012324750423431396, 0.00012778490781784058, 0.0001323223114013672]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 8.0, 17.0, 37.0, 36.0, 73.0, 92.0, 170.0, 240.0, 424.0, 702.0, 1221.0, 1987.0, 3232.0, 5323.0, 8185.0, 13349.0, 20669.0, 30856.0, 44845.0, 62202.0, 81472.0, 99056.0, 110863.0, 114385.0, 108292.0, 93645.0, 75338.0, 56321.0, 40173.0, 27181.0, 17731.0, 11574.0, 7353.0, 4459.0, 2806.0, 1641.0, 1016.0, 620.0, 373.0, 222.0, 134.0, 75.0, 56.0, 36.0, 25.0, 12.0, 9.0, 11.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.95068359375, -0.92034912109375, -0.8900146484375, -0.85968017578125, -0.829345703125, -0.79901123046875, -0.7686767578125, -0.73834228515625, -0.7080078125, -0.67767333984375, -0.6473388671875, -0.61700439453125, -0.586669921875, -0.55633544921875, -0.5260009765625, -0.49566650390625, -0.46533203125, -0.43499755859375, -0.4046630859375, -0.37432861328125, -0.343994140625, -0.31365966796875, -0.2833251953125, -0.25299072265625, -0.22265625, -0.19232177734375, -0.1619873046875, -0.13165283203125, -0.101318359375, -0.07098388671875, -0.0406494140625, -0.01031494140625, 0.02001953125, 0.05035400390625, 0.0806884765625, 0.11102294921875, 0.141357421875, 0.17169189453125, 0.2020263671875, 0.23236083984375, 0.2626953125, 0.29302978515625, 0.3233642578125, 0.35369873046875, 0.384033203125, 0.41436767578125, 0.4447021484375, 0.47503662109375, 0.50537109375, 0.53570556640625, 0.5660400390625, 0.59637451171875, 0.626708984375, 0.65704345703125, 0.6873779296875, 0.71771240234375, 0.748046875, 0.77838134765625, 0.8087158203125, 0.83905029296875, 0.869384765625, 0.89971923828125, 0.9300537109375, 0.96038818359375, 0.99072265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 6.0, 3.0, 3.0, 5.0, 4.0, 8.0, 4.0, 4.0, 10.0, 16.0, 10.0, 11.0, 14.0, 18.0, 16.0, 22.0, 19.0, 20.0, 28.0, 28.0, 26.0, 29.0, 22.0, 42.0, 30.0, 29.0, 42.0, 32.0, 34.0, 24.0, 30.0, 31.0, 34.0, 34.0, 28.0, 24.0, 27.0, 27.0, 17.0, 25.0, 20.0, 18.0, 19.0, 18.0, 18.0, 18.0, 10.0, 16.0, 9.0, 12.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.385009765625, -0.3726806640625, -0.3603515625, -0.3480224609375, -0.335693359375, -0.3233642578125, -0.31103515625, -0.2987060546875, -0.286376953125, -0.2740478515625, -0.26171875, -0.2493896484375, -0.237060546875, -0.2247314453125, -0.21240234375, -0.2000732421875, -0.187744140625, -0.1754150390625, -0.1630859375, -0.1507568359375, -0.138427734375, -0.1260986328125, -0.11376953125, -0.1014404296875, -0.089111328125, -0.0767822265625, -0.064453125, -0.0521240234375, -0.039794921875, -0.0274658203125, -0.01513671875, -0.0028076171875, 0.009521484375, 0.0218505859375, 0.0341796875, 0.0465087890625, 0.058837890625, 0.0711669921875, 0.08349609375, 0.0958251953125, 0.108154296875, 0.1204833984375, 0.1328125, 0.1451416015625, 0.157470703125, 0.1697998046875, 0.18212890625, 0.1944580078125, 0.206787109375, 0.2191162109375, 0.2314453125, 0.2437744140625, 0.256103515625, 0.2684326171875, 0.28076171875, 0.2930908203125, 0.305419921875, 0.3177490234375, 0.330078125, 0.3424072265625, 0.354736328125, 0.3670654296875, 0.37939453125, 0.3917236328125, 0.404052734375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 8.0, 9.0, 3.0, 6.0, 20.0, 11.0, 20.0, 16.0, 17.0, 38.0, 27.0, 26.0, 37.0, 41.0, 32.0, 36.0, 43.0, 34.0, 44.0, 47.0, 38.0, 54.0, 33.0, 45.0, 39.0, 26.0, 34.0, 23.0, 32.0, 24.0, 24.0, 21.0, 21.0, 14.0, 15.0, 9.0, 8.0, 7.0, 7.0, 8.0, 6.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.845993041992188, -27.963638305664062, -27.081281661987305, -26.19892692565918, -25.316570281982422, -24.434215545654297, -23.551860809326172, -22.669506072998047, -21.78714942932129, -20.904794692993164, -20.022438049316406, -19.14008331298828, -18.257728576660156, -17.3753719329834, -16.493017196655273, -15.610661506652832, -14.72830581665039, -13.84595012664795, -12.963594436645508, -12.081239700317383, -11.198884010314941, -10.3165283203125, -9.434173583984375, -8.551817893981934, -7.669462203979492, -6.787106513977051, -5.904751300811768, -5.022396087646484, -4.140040397644043, -3.2576847076416016, -2.3753294944763184, -1.4929742813110352, -0.6106185913085938, 0.27173686027526855, 1.1540923118591309, 2.036447763442993, 2.9188032150268555, 3.801158905029297, 4.68351411819458, 5.565869331359863, 6.448225021362305, 7.330580711364746, 8.212936401367188, 9.095291137695312, 9.977646827697754, 10.860002517700195, 11.74235725402832, 12.624712944030762, 13.507068634033203, 14.389424324035645, 15.271780014038086, 16.15413475036621, 17.03649139404297, 17.918846130371094, 18.80120086669922, 19.683555603027344, 20.5659122467041, 21.448266983032227, 22.330623626708984, 23.21297836303711, 24.095333099365234, 24.977689743041992, 25.860044479370117, 26.742401123046875, 27.624755859375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 9.0, 7.0, 10.0, 8.0, 11.0, 15.0, 14.0, 8.0, 19.0, 18.0, 19.0, 25.0, 19.0, 17.0, 16.0, 42.0, 31.0, 43.0, 26.0, 34.0, 23.0, 37.0, 35.0, 30.0, 34.0, 38.0, 40.0, 30.0, 33.0, 24.0, 26.0, 28.0, 24.0, 32.0, 27.0, 20.0, 26.0, 17.0, 11.0, 11.0, 16.0, 10.0, 6.0, 11.0, 4.0, 5.0, 2.0, 2.0, 6.0, 1.0, 4.0, 3.0, 1.0, 2.0], "bins": [-26.567829132080078, -25.769271850585938, -24.97071647644043, -24.172161102294922, -23.37360382080078, -22.57504653930664, -21.776491165161133, -20.977935791015625, -20.179378509521484, -19.380821228027344, -18.582265853881836, -17.783710479736328, -16.985153198242188, -16.186595916748047, -15.388040542602539, -14.589484214782715, -13.79092788696289, -12.992371559143066, -12.193815231323242, -11.395258903503418, -10.596702575683594, -9.79814624786377, -8.999589920043945, -8.201033592224121, -7.402477264404297, -6.603920936584473, -5.805364608764648, -5.006808280944824, -4.208251953125, -3.409695625305176, -2.6111392974853516, -1.8125829696655273, -1.014028549194336, -0.21547222137451172, 0.5830841064453125, 1.3816404342651367, 2.180196762084961, 2.978753089904785, 3.7773094177246094, 4.575865745544434, 5.374422073364258, 6.172978401184082, 6.971534729003906, 7.7700910568237305, 8.568647384643555, 9.367203712463379, 10.165760040283203, 10.964316368103027, 11.762872695922852, 12.561429023742676, 13.3599853515625, 14.158541679382324, 14.957098007202148, 15.755654335021973, 16.554210662841797, 17.352767944335938, 18.151323318481445, 18.949878692626953, 19.748435974121094, 20.546993255615234, 21.345548629760742, 22.14410400390625, 22.94266128540039, 23.74121856689453, 24.53977394104004]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 10.0, 14.0, 19.0, 40.0, 41.0, 67.0, 114.0, 176.0, 269.0, 437.0, 678.0, 1152.0, 1838.0, 2782.0, 4254.0, 6588.0, 10001.0, 15081.0, 22082.0, 31114.0, 42849.0, 56675.0, 71160.0, 84292.0, 94513.0, 99378.0, 98697.0, 90607.0, 78943.0, 64494.0, 50533.0, 37827.0, 26950.0, 18455.0, 12776.0, 8445.0, 5569.0, 3447.0, 2228.0, 1459.0, 960.0, 541.0, 368.0, 233.0, 145.0, 97.0, 55.0, 45.0, 16.0, 19.0, 3.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-20.53125, -19.88525390625, -19.2392578125, -18.59326171875, -17.947265625, -17.30126953125, -16.6552734375, -16.00927734375, -15.36328125, -14.71728515625, -14.0712890625, -13.42529296875, -12.779296875, -12.13330078125, -11.4873046875, -10.84130859375, -10.1953125, -9.54931640625, -8.9033203125, -8.25732421875, -7.611328125, -6.96533203125, -6.3193359375, -5.67333984375, -5.02734375, -4.38134765625, -3.7353515625, -3.08935546875, -2.443359375, -1.79736328125, -1.1513671875, -0.50537109375, 0.140625, 0.78662109375, 1.4326171875, 2.07861328125, 2.724609375, 3.37060546875, 4.0166015625, 4.66259765625, 5.30859375, 5.95458984375, 6.6005859375, 7.24658203125, 7.892578125, 8.53857421875, 9.1845703125, 9.83056640625, 10.4765625, 11.12255859375, 11.7685546875, 12.41455078125, 13.060546875, 13.70654296875, 14.3525390625, 14.99853515625, 15.64453125, 16.29052734375, 16.9365234375, 17.58251953125, 18.228515625, 18.87451171875, 19.5205078125, 20.16650390625, 20.8125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 10.0, 9.0, 8.0, 6.0, 15.0, 16.0, 8.0, 11.0, 18.0, 24.0, 19.0, 25.0, 17.0, 15.0, 29.0, 35.0, 41.0, 28.0, 28.0, 36.0, 26.0, 35.0, 33.0, 30.0, 38.0, 37.0, 34.0, 34.0, 31.0, 26.0, 27.0, 24.0, 27.0, 28.0, 25.0, 23.0, 25.0, 15.0, 11.0, 10.0, 13.0, 12.0, 7.0, 9.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0], "bins": [-25.21875, -24.453125, -23.6875, -22.921875, -22.15625, -21.390625, -20.625, -19.859375, -19.09375, -18.328125, -17.5625, -16.796875, -16.03125, -15.265625, -14.5, -13.734375, -12.96875, -12.203125, -11.4375, -10.671875, -9.90625, -9.140625, -8.375, -7.609375, -6.84375, -6.078125, -5.3125, -4.546875, -3.78125, -3.015625, -2.25, -1.484375, -0.71875, 0.046875, 0.8125, 1.578125, 2.34375, 3.109375, 3.875, 4.640625, 5.40625, 6.171875, 6.9375, 7.703125, 8.46875, 9.234375, 10.0, 10.765625, 11.53125, 12.296875, 13.0625, 13.828125, 14.59375, 15.359375, 16.125, 16.890625, 17.65625, 18.421875, 19.1875, 19.953125, 20.71875, 21.484375, 22.25, 23.015625, 23.78125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 10.0, 12.0, 25.0, 40.0, 69.0, 110.0, 167.0, 263.0, 437.0, 759.0, 1176.0, 1845.0, 2963.0, 4608.0, 7236.0, 11014.0, 16475.0, 23701.0, 33259.0, 45043.0, 58390.0, 71929.0, 84857.0, 93847.0, 97504.0, 95731.0, 88349.0, 76717.0, 63801.0, 49198.0, 36962.0, 26798.0, 18879.0, 12930.0, 8515.0, 5480.0, 3497.0, 2295.0, 1428.0, 881.0, 504.0, 309.0, 229.0, 117.0, 83.0, 50.0, 20.0, 18.0, 11.0, 9.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.078125, -18.456298828125, -17.83447265625, -17.212646484375, -16.5908203125, -15.968994140625, -15.34716796875, -14.725341796875, -14.103515625, -13.481689453125, -12.85986328125, -12.238037109375, -11.6162109375, -10.994384765625, -10.37255859375, -9.750732421875, -9.12890625, -8.507080078125, -7.88525390625, -7.263427734375, -6.6416015625, -6.019775390625, -5.39794921875, -4.776123046875, -4.154296875, -3.532470703125, -2.91064453125, -2.288818359375, -1.6669921875, -1.045166015625, -0.42333984375, 0.198486328125, 0.8203125, 1.442138671875, 2.06396484375, 2.685791015625, 3.3076171875, 3.929443359375, 4.55126953125, 5.173095703125, 5.794921875, 6.416748046875, 7.03857421875, 7.660400390625, 8.2822265625, 8.904052734375, 9.52587890625, 10.147705078125, 10.76953125, 11.391357421875, 12.01318359375, 12.635009765625, 13.2568359375, 13.878662109375, 14.50048828125, 15.122314453125, 15.744140625, 16.365966796875, 16.98779296875, 17.609619140625, 18.2314453125, 18.853271484375, 19.47509765625, 20.096923828125, 20.71875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 8.0, 4.0, 5.0, 12.0, 11.0, 10.0, 23.0, 23.0, 19.0, 26.0, 19.0, 21.0, 25.0, 27.0, 29.0, 45.0, 34.0, 30.0, 28.0, 39.0, 31.0, 36.0, 40.0, 38.0, 45.0, 23.0, 34.0, 29.0, 29.0, 32.0, 26.0, 30.0, 18.0, 22.0, 19.0, 16.0, 11.0, 15.0, 9.0, 11.0, 6.0, 14.0, 10.0, 6.0, 3.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-17.78125, -17.25927734375, -16.7373046875, -16.21533203125, -15.693359375, -15.17138671875, -14.6494140625, -14.12744140625, -13.60546875, -13.08349609375, -12.5615234375, -12.03955078125, -11.517578125, -10.99560546875, -10.4736328125, -9.95166015625, -9.4296875, -8.90771484375, -8.3857421875, -7.86376953125, -7.341796875, -6.81982421875, -6.2978515625, -5.77587890625, -5.25390625, -4.73193359375, -4.2099609375, -3.68798828125, -3.166015625, -2.64404296875, -2.1220703125, -1.60009765625, -1.078125, -0.55615234375, -0.0341796875, 0.48779296875, 1.009765625, 1.53173828125, 2.0537109375, 2.57568359375, 3.09765625, 3.61962890625, 4.1416015625, 4.66357421875, 5.185546875, 5.70751953125, 6.2294921875, 6.75146484375, 7.2734375, 7.79541015625, 8.3173828125, 8.83935546875, 9.361328125, 9.88330078125, 10.4052734375, 10.92724609375, 11.44921875, 11.97119140625, 12.4931640625, 13.01513671875, 13.537109375, 14.05908203125, 14.5810546875, 15.10302734375, 15.625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 11.0, 21.0, 12.0, 37.0, 35.0, 66.0, 127.0, 162.0, 318.0, 514.0, 861.0, 1461.0, 2435.0, 4116.0, 7102.0, 12282.0, 20902.0, 35131.0, 57254.0, 86589.0, 119133.0, 142941.0, 149114.0, 131367.0, 100333.0, 69018.0, 43798.0, 26669.0, 15152.0, 9027.0, 5132.0, 3005.0, 1797.0, 1047.0, 602.0, 356.0, 236.0, 150.0, 103.0, 55.0, 35.0, 22.0, 8.0, 10.0, 8.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9375, -10.5631103515625, -10.188720703125, -9.8143310546875, -9.43994140625, -9.0655517578125, -8.691162109375, -8.3167724609375, -7.9423828125, -7.5679931640625, -7.193603515625, -6.8192138671875, -6.44482421875, -6.0704345703125, -5.696044921875, -5.3216552734375, -4.947265625, -4.5728759765625, -4.198486328125, -3.8240966796875, -3.44970703125, -3.0753173828125, -2.700927734375, -2.3265380859375, -1.9521484375, -1.5777587890625, -1.203369140625, -0.8289794921875, -0.45458984375, -0.0802001953125, 0.294189453125, 0.6685791015625, 1.04296875, 1.4173583984375, 1.791748046875, 2.1661376953125, 2.54052734375, 2.9149169921875, 3.289306640625, 3.6636962890625, 4.0380859375, 4.4124755859375, 4.786865234375, 5.1612548828125, 5.53564453125, 5.9100341796875, 6.284423828125, 6.6588134765625, 7.033203125, 7.4075927734375, 7.781982421875, 8.1563720703125, 8.53076171875, 8.9051513671875, 9.279541015625, 9.6539306640625, 10.0283203125, 10.4027099609375, 10.777099609375, 11.1514892578125, 11.52587890625, 11.9002685546875, 12.274658203125, 12.6490478515625, 13.0234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 6.0, 4.0, 5.0, 7.0, 5.0, 8.0, 12.0, 11.0, 14.0, 25.0, 27.0, 20.0, 41.0, 35.0, 50.0, 46.0, 67.0, 55.0, 62.0, 63.0, 62.0, 51.0, 49.0, 38.0, 39.0, 38.0, 27.0, 26.0, 20.0, 17.0, 17.0, 18.0, 8.0, 7.0, 5.0, 8.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0014162063598632812, -0.001373589038848877, -0.0013309717178344727, -0.0012883543968200684, -0.001245737075805664, -0.0012031197547912598, -0.0011605024337768555, -0.0011178851127624512, -0.0010752677917480469, -0.0010326504707336426, -0.0009900331497192383, -0.000947415828704834, -0.0009047985076904297, -0.0008621811866760254, -0.0008195638656616211, -0.0007769465446472168, -0.0007343292236328125, -0.0006917119026184082, -0.0006490945816040039, -0.0006064772605895996, -0.0005638599395751953, -0.000521242618560791, -0.0004786252975463867, -0.0004360079765319824, -0.0003933906555175781, -0.00035077333450317383, -0.00030815601348876953, -0.00026553869247436523, -0.00022292137145996094, -0.00018030405044555664, -0.00013768672943115234, -9.506940841674805e-05, -5.245208740234375e-05, -9.834766387939453e-06, 3.2782554626464844e-05, 7.539987564086914e-05, 0.00011801719665527344, 0.00016063451766967773, 0.00020325183868408203, 0.00024586915969848633, 0.0002884864807128906, 0.0003311038017272949, 0.0003737211227416992, 0.0004163384437561035, 0.0004589557647705078, 0.0005015730857849121, 0.0005441904067993164, 0.0005868077278137207, 0.000629425048828125, 0.0006720423698425293, 0.0007146596908569336, 0.0007572770118713379, 0.0007998943328857422, 0.0008425116539001465, 0.0008851289749145508, 0.0009277462959289551, 0.0009703636169433594, 0.0010129809379577637, 0.001055598258972168, 0.0010982155799865723, 0.0011408329010009766, 0.0011834502220153809, 0.0012260675430297852, 0.0012686848640441895, 0.0013113021850585938]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 10.0, 22.0, 26.0, 44.0, 67.0, 118.0, 179.0, 346.0, 627.0, 1119.0, 1975.0, 3736.0, 6687.0, 12393.0, 22413.0, 39004.0, 64550.0, 97771.0, 131214.0, 153161.0, 151326.0, 126892.0, 92674.0, 60132.0, 36238.0, 20682.0, 11352.0, 6226.0, 3330.0, 1864.0, 1077.0, 542.0, 306.0, 195.0, 97.0, 65.0, 43.0, 20.0, 9.0, 10.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.1484375, -13.754638671875, -13.36083984375, -12.967041015625, -12.5732421875, -12.179443359375, -11.78564453125, -11.391845703125, -10.998046875, -10.604248046875, -10.21044921875, -9.816650390625, -9.4228515625, -9.029052734375, -8.63525390625, -8.241455078125, -7.84765625, -7.453857421875, -7.06005859375, -6.666259765625, -6.2724609375, -5.878662109375, -5.48486328125, -5.091064453125, -4.697265625, -4.303466796875, -3.90966796875, -3.515869140625, -3.1220703125, -2.728271484375, -2.33447265625, -1.940673828125, -1.546875, -1.153076171875, -0.75927734375, -0.365478515625, 0.0283203125, 0.422119140625, 0.81591796875, 1.209716796875, 1.603515625, 1.997314453125, 2.39111328125, 2.784912109375, 3.1787109375, 3.572509765625, 3.96630859375, 4.360107421875, 4.75390625, 5.147705078125, 5.54150390625, 5.935302734375, 6.3291015625, 6.722900390625, 7.11669921875, 7.510498046875, 7.904296875, 8.298095703125, 8.69189453125, 9.085693359375, 9.4794921875, 9.873291015625, 10.26708984375, 10.660888671875, 11.0546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 7.0, 3.0, 4.0, 15.0, 14.0, 8.0, 16.0, 12.0, 16.0, 27.0, 28.0, 24.0, 27.0, 36.0, 40.0, 37.0, 43.0, 31.0, 49.0, 42.0, 41.0, 47.0, 40.0, 31.0, 36.0, 32.0, 31.0, 38.0, 30.0, 25.0, 32.0, 23.0, 26.0, 14.0, 16.0, 11.0, 10.0, 6.0, 9.0, 6.0, 4.0, 2.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-4.1875, -4.065826416015625, -3.94415283203125, -3.822479248046875, -3.7008056640625, -3.579132080078125, -3.45745849609375, -3.335784912109375, -3.214111328125, -3.092437744140625, -2.97076416015625, -2.849090576171875, -2.7274169921875, -2.605743408203125, -2.48406982421875, -2.362396240234375, -2.24072265625, -2.119049072265625, -1.99737548828125, -1.875701904296875, -1.7540283203125, -1.632354736328125, -1.51068115234375, -1.389007568359375, -1.267333984375, -1.145660400390625, -1.02398681640625, -0.902313232421875, -0.7806396484375, -0.658966064453125, -0.53729248046875, -0.415618896484375, -0.2939453125, -0.172271728515625, -0.05059814453125, 0.071075439453125, 0.1927490234375, 0.314422607421875, 0.43609619140625, 0.557769775390625, 0.679443359375, 0.801116943359375, 0.92279052734375, 1.044464111328125, 1.1661376953125, 1.287811279296875, 1.40948486328125, 1.531158447265625, 1.65283203125, 1.774505615234375, 1.89617919921875, 2.017852783203125, 2.1395263671875, 2.261199951171875, 2.38287353515625, 2.504547119140625, 2.626220703125, 2.747894287109375, 2.86956787109375, 2.991241455078125, 3.1129150390625, 3.234588623046875, 3.35626220703125, 3.477935791015625, 3.599609375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 7.0, 6.0, 8.0, 8.0, 9.0, 16.0, 8.0, 16.0, 12.0, 28.0, 18.0, 37.0, 21.0, 20.0, 25.0, 37.0, 39.0, 34.0, 41.0, 27.0, 35.0, 32.0, 43.0, 49.0, 36.0, 39.0, 38.0, 22.0, 31.0, 36.0, 28.0, 28.0, 15.0, 27.0, 20.0, 15.0, 15.0, 12.0, 16.0, 14.0, 11.0, 5.0, 5.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0], "bins": [-25.63030433654785, -24.85382652282715, -24.077346801757812, -23.30086898803711, -22.524391174316406, -21.74791145324707, -20.971433639526367, -20.19495391845703, -19.418476104736328, -18.641998291015625, -17.86551856994629, -17.089040756225586, -16.31256103515625, -15.536083221435547, -14.759605407714844, -13.983126640319824, -13.206647872924805, -12.430169105529785, -11.653690338134766, -10.877212524414062, -10.100733757019043, -9.324254989624023, -8.54777717590332, -7.771298408508301, -6.994819641113281, -6.218340873718262, -5.4418625831604, -4.665384292602539, -3.8889055252075195, -3.112426996231079, -2.3359484672546387, -1.5594701766967773, -0.782989501953125, -0.00651097297668457, 0.7699675559997559, 1.5464460849761963, 2.3229246139526367, 3.099403142929077, 3.8758816719055176, 4.652359962463379, 5.428838729858398, 6.205317497253418, 6.981795787811279, 7.758274078369141, 8.53475284576416, 9.31123161315918, 10.087709426879883, 10.864188194274902, 11.640666961669922, 12.417145729064941, 13.193624496459961, 13.970102310180664, 14.746581077575684, 15.523059844970703, 16.299537658691406, 17.07601547241211, 17.852495193481445, 18.62897300720215, 19.405452728271484, 20.181930541992188, 20.95840835571289, 21.734888076782227, 22.51136589050293, 23.287845611572266, 24.06432342529297]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 8.0, 6.0, 6.0, 8.0, 12.0, 8.0, 16.0, 17.0, 16.0, 21.0, 32.0, 24.0, 17.0, 30.0, 26.0, 28.0, 18.0, 41.0, 32.0, 53.0, 35.0, 37.0, 33.0, 31.0, 50.0, 35.0, 25.0, 30.0, 19.0, 32.0, 31.0, 24.0, 28.0, 24.0, 21.0, 24.0, 13.0, 10.0, 18.0, 13.0, 9.0, 8.0, 9.0, 4.0, 8.0, 3.0, 2.0, 5.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-28.252376556396484, -27.406330108642578, -26.56028175354004, -25.7142333984375, -24.868186950683594, -24.022140502929688, -23.17609214782715, -22.33004379272461, -21.483997344970703, -20.637950897216797, -19.791902542114258, -18.94585418701172, -18.099807739257812, -17.253761291503906, -16.407712936401367, -15.561665534973145, -14.715618133544922, -13.8695707321167, -13.023523330688477, -12.177475929260254, -11.331428527832031, -10.485381126403809, -9.639333724975586, -8.793286323547363, -7.947238922119141, -7.101191520690918, -6.255144119262695, -5.409096717834473, -4.56304931640625, -3.7170019149780273, -2.8709545135498047, -2.024907112121582, -1.1788578033447266, -0.3328104019165039, 0.5132369995117188, 1.3592844009399414, 2.205331802368164, 3.0513792037963867, 3.8974266052246094, 4.743474006652832, 5.589521408081055, 6.435568809509277, 7.2816162109375, 8.127663612365723, 8.973711013793945, 9.819758415222168, 10.66580581665039, 11.511853218078613, 12.357900619506836, 13.203948020935059, 14.049995422363281, 14.896042823791504, 15.742090225219727, 16.588138580322266, 17.434185028076172, 18.280231475830078, 19.126279830932617, 19.972328186035156, 20.818374633789062, 21.66442108154297, 22.510469436645508, 23.356517791748047, 24.202564239501953, 25.04861068725586, 25.8946590423584]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [2.0, 5.0, 4.0, 2.0, 7.0, 7.0, 17.0, 35.0, 61.0, 90.0, 107.0, 209.0, 327.0, 570.0, 866.0, 1374.0, 2194.0, 3622.0, 5643.0, 8646.0, 13609.0, 21393.0, 32668.0, 49037.0, 73227.0, 105770.0, 149478.0, 203951.0, 267203.0, 327205.0, 382307.0, 414181.0, 416653.0, 388898.0, 338046.0, 275118.0, 213227.0, 157396.0, 111875.0, 77417.0, 52769.0, 35101.0, 22857.0, 14866.0, 9580.0, 6236.0, 3894.0, 2480.0, 1549.0, 969.0, 605.0, 403.0, 193.0, 141.0, 92.0, 48.0, 39.0, 14.0, 7.0, 7.0, 3.0, 0.0, 1.0, 3.0], "bins": [-18.59375, -18.01416015625, -17.4345703125, -16.85498046875, -16.275390625, -15.69580078125, -15.1162109375, -14.53662109375, -13.95703125, -13.37744140625, -12.7978515625, -12.21826171875, -11.638671875, -11.05908203125, -10.4794921875, -9.89990234375, -9.3203125, -8.74072265625, -8.1611328125, -7.58154296875, -7.001953125, -6.42236328125, -5.8427734375, -5.26318359375, -4.68359375, -4.10400390625, -3.5244140625, -2.94482421875, -2.365234375, -1.78564453125, -1.2060546875, -0.62646484375, -0.046875, 0.53271484375, 1.1123046875, 1.69189453125, 2.271484375, 2.85107421875, 3.4306640625, 4.01025390625, 4.58984375, 5.16943359375, 5.7490234375, 6.32861328125, 6.908203125, 7.48779296875, 8.0673828125, 8.64697265625, 9.2265625, 9.80615234375, 10.3857421875, 10.96533203125, 11.544921875, 12.12451171875, 12.7041015625, 13.28369140625, 13.86328125, 14.44287109375, 15.0224609375, 15.60205078125, 16.181640625, 16.76123046875, 17.3408203125, 17.92041015625, 18.5]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 7.0, 6.0, 6.0, 14.0, 11.0, 5.0, 18.0, 17.0, 17.0, 13.0, 31.0, 29.0, 19.0, 24.0, 32.0, 23.0, 19.0, 34.0, 27.0, 50.0, 45.0, 32.0, 33.0, 33.0, 50.0, 40.0, 23.0, 28.0, 23.0, 34.0, 26.0, 22.0, 31.0, 24.0, 17.0, 22.0, 22.0, 8.0, 13.0, 20.0, 11.0, 7.0, 8.0, 8.0, 6.0, 2.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-24.53125, -23.798828125, -23.06640625, -22.333984375, -21.6015625, -20.869140625, -20.13671875, -19.404296875, -18.671875, -17.939453125, -17.20703125, -16.474609375, -15.7421875, -15.009765625, -14.27734375, -13.544921875, -12.8125, -12.080078125, -11.34765625, -10.615234375, -9.8828125, -9.150390625, -8.41796875, -7.685546875, -6.953125, -6.220703125, -5.48828125, -4.755859375, -4.0234375, -3.291015625, -2.55859375, -1.826171875, -1.09375, -0.361328125, 0.37109375, 1.103515625, 1.8359375, 2.568359375, 3.30078125, 4.033203125, 4.765625, 5.498046875, 6.23046875, 6.962890625, 7.6953125, 8.427734375, 9.16015625, 9.892578125, 10.625, 11.357421875, 12.08984375, 12.822265625, 13.5546875, 14.287109375, 15.01953125, 15.751953125, 16.484375, 17.216796875, 17.94921875, 18.681640625, 19.4140625, 20.146484375, 20.87890625, 21.611328125, 22.34375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 19.0, 33.0, 48.0, 85.0, 152.0, 281.0, 420.0, 845.0, 1508.0, 2615.0, 4726.0, 8326.0, 14122.0, 24548.0, 40085.0, 66157.0, 103215.0, 157544.0, 225166.0, 305926.0, 384404.0, 447468.0, 475367.0, 460431.0, 405994.0, 330219.0, 249778.0, 176178.0, 118702.0, 75509.0, 46848.0, 28188.0, 16849.0, 9761.0, 5532.0, 3195.0, 1735.0, 1028.0, 536.0, 334.0, 167.0, 100.0, 67.0, 31.0, 23.0, 12.0, 5.0, 2.0, 4.0, 1.0, 2.0], "bins": [-26.46875, -25.726318359375, -24.98388671875, -24.241455078125, -23.4990234375, -22.756591796875, -22.01416015625, -21.271728515625, -20.529296875, -19.786865234375, -19.04443359375, -18.302001953125, -17.5595703125, -16.817138671875, -16.07470703125, -15.332275390625, -14.58984375, -13.847412109375, -13.10498046875, -12.362548828125, -11.6201171875, -10.877685546875, -10.13525390625, -9.392822265625, -8.650390625, -7.907958984375, -7.16552734375, -6.423095703125, -5.6806640625, -4.938232421875, -4.19580078125, -3.453369140625, -2.7109375, -1.968505859375, -1.22607421875, -0.483642578125, 0.2587890625, 1.001220703125, 1.74365234375, 2.486083984375, 3.228515625, 3.970947265625, 4.71337890625, 5.455810546875, 6.1982421875, 6.940673828125, 7.68310546875, 8.425537109375, 9.16796875, 9.910400390625, 10.65283203125, 11.395263671875, 12.1376953125, 12.880126953125, 13.62255859375, 14.364990234375, 15.107421875, 15.849853515625, 16.59228515625, 17.334716796875, 18.0771484375, 18.819580078125, 19.56201171875, 20.304443359375, 21.046875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 5.0, 13.0, 14.0, 23.0, 24.0, 30.0, 42.0, 55.0, 74.0, 72.0, 87.0, 112.0, 124.0, 151.0, 170.0, 179.0, 198.0, 216.0, 207.0, 225.0, 203.0, 223.0, 199.0, 194.0, 191.0, 161.0, 167.0, 118.0, 123.0, 105.0, 83.0, 61.0, 58.0, 44.0, 41.0, 27.0, 19.0, 12.0, 5.0, 7.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5859375, -11.19873046875, -10.8115234375, -10.42431640625, -10.037109375, -9.64990234375, -9.2626953125, -8.87548828125, -8.48828125, -8.10107421875, -7.7138671875, -7.32666015625, -6.939453125, -6.55224609375, -6.1650390625, -5.77783203125, -5.390625, -5.00341796875, -4.6162109375, -4.22900390625, -3.841796875, -3.45458984375, -3.0673828125, -2.68017578125, -2.29296875, -1.90576171875, -1.5185546875, -1.13134765625, -0.744140625, -0.35693359375, 0.0302734375, 0.41748046875, 0.8046875, 1.19189453125, 1.5791015625, 1.96630859375, 2.353515625, 2.74072265625, 3.1279296875, 3.51513671875, 3.90234375, 4.28955078125, 4.6767578125, 5.06396484375, 5.451171875, 5.83837890625, 6.2255859375, 6.61279296875, 7.0, 7.38720703125, 7.7744140625, 8.16162109375, 8.548828125, 8.93603515625, 9.3232421875, 9.71044921875, 10.09765625, 10.48486328125, 10.8720703125, 11.25927734375, 11.646484375, 12.03369140625, 12.4208984375, 12.80810546875, 13.1953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 6.0, 10.0, 16.0, 20.0, 17.0, 21.0, 25.0, 22.0, 39.0, 31.0, 31.0, 28.0, 45.0, 37.0, 37.0, 42.0, 48.0, 34.0, 55.0, 36.0, 45.0, 33.0, 41.0, 36.0, 30.0, 28.0, 34.0, 26.0, 18.0, 14.0, 13.0, 13.0, 9.0, 9.0, 5.0, 7.0, 6.0, 2.0, 8.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-30.24650001525879, -29.386260986328125, -28.526020050048828, -27.665781021118164, -26.8055419921875, -25.945301055908203, -25.08506202697754, -24.224822998046875, -23.364582061767578, -22.504343032836914, -21.644102096557617, -20.783863067626953, -19.923622131347656, -19.063383102416992, -18.203144073486328, -17.34290313720703, -16.482664108276367, -15.622424125671387, -14.762184143066406, -13.901945114135742, -13.041705131530762, -12.181465148925781, -11.321226119995117, -10.460986137390137, -9.600746154785156, -8.740506172180176, -7.8802666664123535, -7.020027160644531, -6.159787178039551, -5.29954719543457, -4.439307689666748, -3.579068183898926, -2.7188262939453125, -1.8585865497589111, -0.9983468055725098, -0.1381070613861084, 0.722132682800293, 1.5823726654052734, 2.4426121711730957, 3.302851676940918, 4.163091659545898, 5.023331642150879, 5.883571147918701, 6.743810653686523, 7.604050636291504, 8.464290618896484, 9.324529647827148, 10.184769630432129, 11.04500961303711, 11.90524959564209, 12.76548957824707, 13.625728607177734, 14.485968589782715, 15.346208572387695, 16.20644760131836, 17.066688537597656, 17.92692756652832, 18.787166595458984, 19.64740753173828, 20.507646560668945, 21.36788558959961, 22.228126525878906, 23.08836555480957, 23.948604583740234, 24.80884552001953]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 0.0, 6.0, 4.0, 9.0, 9.0, 6.0, 10.0, 11.0, 14.0, 13.0, 10.0, 17.0, 16.0, 18.0, 33.0, 31.0, 28.0, 28.0, 31.0, 31.0, 28.0, 31.0, 25.0, 32.0, 34.0, 39.0, 34.0, 31.0, 36.0, 27.0, 32.0, 30.0, 26.0, 31.0, 30.0, 18.0, 20.0, 12.0, 28.0, 26.0, 21.0, 16.0, 15.0, 11.0, 8.0, 3.0, 5.0, 11.0, 6.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.26994514465332, -23.497737884521484, -22.72553062438965, -21.953323364257812, -21.18111801147461, -20.408910751342773, -19.636703491210938, -18.8644962310791, -18.092288970947266, -17.32008171081543, -16.547874450683594, -15.775668144226074, -15.003461837768555, -14.231254577636719, -13.459047317504883, -12.686840057373047, -11.914634704589844, -11.142427444458008, -10.370221138000488, -9.598013877868652, -8.825807571411133, -8.053600311279297, -7.281393051147461, -6.509186267852783, -5.7369794845581055, -4.964772701263428, -4.19256591796875, -3.420358657836914, -2.6481518745422363, -1.8759450912475586, -1.1037378311157227, -0.3315310478210449, 0.440673828125, 1.2128807306289673, 1.9850876331329346, 2.7572946548461914, 3.529501438140869, 4.301708221435547, 5.073915481567383, 5.8461222648620605, 6.618329048156738, 7.390535831451416, 8.162742614746094, 8.93494987487793, 9.707157135009766, 10.479363441467285, 11.251570701599121, 12.02377700805664, 12.795984268188477, 13.568191528320312, 14.340397834777832, 15.112605094909668, 15.884811401367188, 16.657018661499023, 17.42922592163086, 18.201433181762695, 18.97364044189453, 19.745847702026367, 20.518054962158203, 21.290260314941406, 22.062467575073242, 22.834674835205078, 23.606882095336914, 24.37908935546875, 25.151294708251953]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 16.0, 24.0, 50.0, 66.0, 103.0, 150.0, 232.0, 398.0, 594.0, 1012.0, 1464.0, 2241.0, 3687.0, 5697.0, 8344.0, 12604.0, 18435.0, 27045.0, 37558.0, 51217.0, 67443.0, 83648.0, 97554.0, 105544.0, 105869.0, 97464.0, 83526.0, 67205.0, 50842.0, 37261.0, 26433.0, 18156.0, 12785.0, 8298.0, 5432.0, 3572.0, 2378.0, 1492.0, 1003.0, 638.0, 418.0, 259.0, 172.0, 91.0, 57.0, 34.0, 19.0, 11.0, 3.0, 7.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-6.1875, -5.99407958984375, -5.8006591796875, -5.60723876953125, -5.413818359375, -5.22039794921875, -5.0269775390625, -4.83355712890625, -4.64013671875, -4.44671630859375, -4.2532958984375, -4.05987548828125, -3.866455078125, -3.67303466796875, -3.4796142578125, -3.28619384765625, -3.0927734375, -2.89935302734375, -2.7059326171875, -2.51251220703125, -2.319091796875, -2.12567138671875, -1.9322509765625, -1.73883056640625, -1.54541015625, -1.35198974609375, -1.1585693359375, -0.96514892578125, -0.771728515625, -0.57830810546875, -0.3848876953125, -0.19146728515625, 0.001953125, 0.19537353515625, 0.3887939453125, 0.58221435546875, 0.775634765625, 0.96905517578125, 1.1624755859375, 1.35589599609375, 1.54931640625, 1.74273681640625, 1.9361572265625, 2.12957763671875, 2.322998046875, 2.51641845703125, 2.7098388671875, 2.90325927734375, 3.0966796875, 3.29010009765625, 3.4835205078125, 3.67694091796875, 3.870361328125, 4.06378173828125, 4.2572021484375, 4.45062255859375, 4.64404296875, 4.83746337890625, 5.0308837890625, 5.22430419921875, 5.417724609375, 5.61114501953125, 5.8045654296875, 5.99798583984375, 6.19140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 5.0, 4.0, 10.0, 9.0, 7.0, 10.0, 11.0, 13.0, 13.0, 11.0, 16.0, 17.0, 19.0, 34.0, 30.0, 26.0, 29.0, 37.0, 25.0, 30.0, 29.0, 27.0, 33.0, 31.0, 39.0, 33.0, 32.0, 35.0, 26.0, 33.0, 29.0, 30.0, 30.0, 31.0, 15.0, 20.0, 15.0, 24.0, 28.0, 20.0, 16.0, 16.0, 8.0, 8.0, 4.0, 5.0, 13.0, 5.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.296875, -23.52587890625, -22.7548828125, -21.98388671875, -21.212890625, -20.44189453125, -19.6708984375, -18.89990234375, -18.12890625, -17.35791015625, -16.5869140625, -15.81591796875, -15.044921875, -14.27392578125, -13.5029296875, -12.73193359375, -11.9609375, -11.18994140625, -10.4189453125, -9.64794921875, -8.876953125, -8.10595703125, -7.3349609375, -6.56396484375, -5.79296875, -5.02197265625, -4.2509765625, -3.47998046875, -2.708984375, -1.93798828125, -1.1669921875, -0.39599609375, 0.375, 1.14599609375, 1.9169921875, 2.68798828125, 3.458984375, 4.22998046875, 5.0009765625, 5.77197265625, 6.54296875, 7.31396484375, 8.0849609375, 8.85595703125, 9.626953125, 10.39794921875, 11.1689453125, 11.93994140625, 12.7109375, 13.48193359375, 14.2529296875, 15.02392578125, 15.794921875, 16.56591796875, 17.3369140625, 18.10791015625, 18.87890625, 19.64990234375, 20.4208984375, 21.19189453125, 21.962890625, 22.73388671875, 23.5048828125, 24.27587890625, 25.046875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 6.0, 10.0, 18.0, 22.0, 16.0, 42.0, 46.0, 71.0, 89.0, 112.0, 174.0, 282.0, 420.0, 558.0, 878.0, 1330.0, 1962.0, 2908.0, 4381.0, 6319.0, 9854.0, 15762.0, 26979.0, 167602.0, 721185.0, 33995.0, 19055.0, 11743.0, 7508.0, 5051.0, 3297.0, 2258.0, 1465.0, 1002.0, 636.0, 440.0, 328.0, 225.0, 140.0, 92.0, 85.0, 57.0, 53.0, 19.0, 32.0, 17.0, 5.0, 8.0, 5.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-20.65625, -20.014404296875, -19.37255859375, -18.730712890625, -18.0888671875, -17.447021484375, -16.80517578125, -16.163330078125, -15.521484375, -14.879638671875, -14.23779296875, -13.595947265625, -12.9541015625, -12.312255859375, -11.67041015625, -11.028564453125, -10.38671875, -9.744873046875, -9.10302734375, -8.461181640625, -7.8193359375, -7.177490234375, -6.53564453125, -5.893798828125, -5.251953125, -4.610107421875, -3.96826171875, -3.326416015625, -2.6845703125, -2.042724609375, -1.40087890625, -0.759033203125, -0.1171875, 0.524658203125, 1.16650390625, 1.808349609375, 2.4501953125, 3.092041015625, 3.73388671875, 4.375732421875, 5.017578125, 5.659423828125, 6.30126953125, 6.943115234375, 7.5849609375, 8.226806640625, 8.86865234375, 9.510498046875, 10.15234375, 10.794189453125, 11.43603515625, 12.077880859375, 12.7197265625, 13.361572265625, 14.00341796875, 14.645263671875, 15.287109375, 15.928955078125, 16.57080078125, 17.212646484375, 17.8544921875, 18.496337890625, 19.13818359375, 19.780029296875, 20.421875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 4.0, 5.0, 9.0, 8.0, 11.0, 8.0, 9.0, 18.0, 18.0, 24.0, 23.0, 26.0, 30.0, 30.0, 36.0, 35.0, 40.0, 45.0, 37.0, 41.0, 45.0, 41.0, 43.0, 35.0, 36.0, 32.0, 46.0, 31.0, 23.0, 25.0, 24.0, 32.0, 24.0, 28.0, 13.0, 22.0, 6.0, 10.0, 10.0, 9.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.96875, -20.3505859375, -19.732421875, -19.1142578125, -18.49609375, -17.8779296875, -17.259765625, -16.6416015625, -16.0234375, -15.4052734375, -14.787109375, -14.1689453125, -13.55078125, -12.9326171875, -12.314453125, -11.6962890625, -11.078125, -10.4599609375, -9.841796875, -9.2236328125, -8.60546875, -7.9873046875, -7.369140625, -6.7509765625, -6.1328125, -5.5146484375, -4.896484375, -4.2783203125, -3.66015625, -3.0419921875, -2.423828125, -1.8056640625, -1.1875, -0.5693359375, 0.048828125, 0.6669921875, 1.28515625, 1.9033203125, 2.521484375, 3.1396484375, 3.7578125, 4.3759765625, 4.994140625, 5.6123046875, 6.23046875, 6.8486328125, 7.466796875, 8.0849609375, 8.703125, 9.3212890625, 9.939453125, 10.5576171875, 11.17578125, 11.7939453125, 12.412109375, 13.0302734375, 13.6484375, 14.2666015625, 14.884765625, 15.5029296875, 16.12109375, 16.7392578125, 17.357421875, 17.9755859375, 18.59375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 0.0, 4.0, 5.0, 9.0, 11.0, 17.0, 9.0, 34.0, 42.0, 54.0, 60.0, 97.0, 118.0, 200.0, 255.0, 370.0, 533.0, 758.0, 1281.0, 1867.0, 2964.0, 4609.0, 7808.0, 12922.0, 22803.0, 57387.0, 828973.0, 50563.0, 21950.0, 12529.0, 7415.0, 4596.0, 2909.0, 1817.0, 1072.0, 768.0, 513.0, 335.0, 238.0, 175.0, 125.0, 86.0, 81.0, 56.0, 44.0, 30.0, 19.0, 15.0, 10.0, 7.0, 7.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.3740234375, -1.327392578125, -1.28076171875, -1.234130859375, -1.1875, -1.140869140625, -1.09423828125, -1.047607421875, -1.0009765625, -0.954345703125, -0.90771484375, -0.861083984375, -0.814453125, -0.767822265625, -0.72119140625, -0.674560546875, -0.6279296875, -0.581298828125, -0.53466796875, -0.488037109375, -0.44140625, -0.394775390625, -0.34814453125, -0.301513671875, -0.2548828125, -0.208251953125, -0.16162109375, -0.114990234375, -0.068359375, -0.021728515625, 0.02490234375, 0.071533203125, 0.1181640625, 0.164794921875, 0.21142578125, 0.258056640625, 0.3046875, 0.351318359375, 0.39794921875, 0.444580078125, 0.4912109375, 0.537841796875, 0.58447265625, 0.631103515625, 0.677734375, 0.724365234375, 0.77099609375, 0.817626953125, 0.8642578125, 0.910888671875, 0.95751953125, 1.004150390625, 1.05078125, 1.097412109375, 1.14404296875, 1.190673828125, 1.2373046875, 1.283935546875, 1.33056640625, 1.377197265625, 1.423828125, 1.470458984375, 1.51708984375, 1.563720703125, 1.6103515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 0.0, 4.0, 3.0, 7.0, 6.0, 4.0, 10.0, 21.0, 8.0, 21.0, 38.0, 26.0, 35.0, 37.0, 56.0, 54.0, 91.0, 72.0, 76.0, 62.0, 68.0, 47.0, 51.0, 44.0, 29.0, 35.0, 19.0, 21.0, 13.0, 14.0, 16.0, 5.0, 4.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.822845458984375e-05, -9.500514715909958e-05, -9.178183972835541e-05, -8.855853229761124e-05, -8.533522486686707e-05, -8.21119174361229e-05, -7.888861000537872e-05, -7.566530257463455e-05, -7.244199514389038e-05, -6.921868771314621e-05, -6.599538028240204e-05, -6.277207285165787e-05, -5.9548765420913696e-05, -5.6325457990169525e-05, -5.3102150559425354e-05, -4.987884312868118e-05, -4.665553569793701e-05, -4.343222826719284e-05, -4.020892083644867e-05, -3.69856134057045e-05, -3.376230597496033e-05, -3.0538998544216156e-05, -2.7315691113471985e-05, -2.4092383682727814e-05, -2.0869076251983643e-05, -1.764576882123947e-05, -1.44224613904953e-05, -1.1199153959751129e-05, -7.975846529006958e-06, -4.752539098262787e-06, -1.5292316675186157e-06, 1.6940757632255554e-06, 4.9173831939697266e-06, 8.140690624713898e-06, 1.1363998055458069e-05, 1.458730548620224e-05, 1.781061291694641e-05, 2.1033920347690582e-05, 2.4257227778434753e-05, 2.7480535209178925e-05, 3.0703842639923096e-05, 3.392715007066727e-05, 3.715045750141144e-05, 4.037376493215561e-05, 4.359707236289978e-05, 4.682037979364395e-05, 5.004368722438812e-05, 5.3266994655132294e-05, 5.6490302085876465e-05, 5.9713609516620636e-05, 6.293691694736481e-05, 6.616022437810898e-05, 6.938353180885315e-05, 7.260683923959732e-05, 7.583014667034149e-05, 7.905345410108566e-05, 8.227676153182983e-05, 8.5500068962574e-05, 8.872337639331818e-05, 9.194668382406235e-05, 9.516999125480652e-05, 9.839329868555069e-05, 0.00010161660611629486, 0.00010483991354703903, 0.0001080632209777832]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 4.0, 9.0, 8.0, 18.0, 27.0, 46.0, 88.0, 111.0, 198.0, 314.0, 458.0, 764.0, 1076.0, 1878.0, 2880.0, 4525.0, 7211.0, 11202.0, 17471.0, 26389.0, 39716.0, 57121.0, 78431.0, 102181.0, 121126.0, 128143.0, 117852.0, 97705.0, 74093.0, 53271.0, 35926.0, 24409.0, 15785.0, 10193.0, 6663.0, 4044.0, 2686.0, 1653.0, 1079.0, 650.0, 433.0, 271.0, 167.0, 96.0, 72.0, 56.0, 25.0, 15.0, 7.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-1.1708984375, -1.1368560791015625, -1.102813720703125, -1.0687713623046875, -1.03472900390625, -1.0006866455078125, -0.966644287109375, -0.9326019287109375, -0.8985595703125, -0.8645172119140625, -0.830474853515625, -0.7964324951171875, -0.76239013671875, -0.7283477783203125, -0.694305419921875, -0.6602630615234375, -0.626220703125, -0.5921783447265625, -0.558135986328125, -0.5240936279296875, -0.49005126953125, -0.4560089111328125, -0.421966552734375, -0.3879241943359375, -0.3538818359375, -0.3198394775390625, -0.285797119140625, -0.2517547607421875, -0.21771240234375, -0.1836700439453125, -0.149627685546875, -0.1155853271484375, -0.08154296875, -0.0475006103515625, -0.013458251953125, 0.0205841064453125, 0.05462646484375, 0.0886688232421875, 0.122711181640625, 0.1567535400390625, 0.1907958984375, 0.2248382568359375, 0.258880615234375, 0.2929229736328125, 0.32696533203125, 0.3610076904296875, 0.395050048828125, 0.4290924072265625, 0.463134765625, 0.4971771240234375, 0.531219482421875, 0.5652618408203125, 0.59930419921875, 0.6333465576171875, 0.667388916015625, 0.7014312744140625, 0.7354736328125, 0.7695159912109375, 0.803558349609375, 0.8376007080078125, 0.87164306640625, 0.9056854248046875, 0.939727783203125, 0.9737701416015625, 1.0078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 5.0, 7.0, 6.0, 7.0, 7.0, 4.0, 7.0, 19.0, 18.0, 14.0, 18.0, 20.0, 20.0, 28.0, 33.0, 29.0, 37.0, 47.0, 40.0, 40.0, 43.0, 53.0, 31.0, 33.0, 34.0, 41.0, 38.0, 27.0, 39.0, 35.0, 24.0, 24.0, 19.0, 22.0, 27.0, 16.0, 16.0, 13.0, 11.0, 11.0, 3.0, 10.0, 6.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.52978515625, -0.5149192810058594, -0.5000534057617188, -0.4851875305175781, -0.4703216552734375, -0.4554557800292969, -0.44058990478515625, -0.4257240295410156, -0.410858154296875, -0.3959922790527344, -0.38112640380859375, -0.3662605285644531, -0.3513946533203125, -0.3365287780761719, -0.32166290283203125, -0.3067970275878906, -0.29193115234375, -0.2770652770996094, -0.26219940185546875, -0.24733352661132812, -0.2324676513671875, -0.21760177612304688, -0.20273590087890625, -0.18787002563476562, -0.173004150390625, -0.15813827514648438, -0.14327239990234375, -0.12840652465820312, -0.1135406494140625, -0.09867477416992188, -0.08380889892578125, -0.06894302368164062, -0.0540771484375, -0.039211273193359375, -0.02434539794921875, -0.009479522705078125, 0.0053863525390625, 0.020252227783203125, 0.03511810302734375, 0.049983978271484375, 0.064849853515625, 0.07971572875976562, 0.09458160400390625, 0.10944747924804688, 0.1243133544921875, 0.13917922973632812, 0.15404510498046875, 0.16891098022460938, 0.18377685546875, 0.19864273071289062, 0.21350860595703125, 0.22837448120117188, 0.2432403564453125, 0.2581062316894531, 0.27297210693359375, 0.2878379821777344, 0.302703857421875, 0.3175697326660156, 0.33243560791015625, 0.3473014831542969, 0.3621673583984375, 0.3770332336425781, 0.39189910888671875, 0.4067649841308594, 0.421630859375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 6.0, 13.0, 6.0, 16.0, 19.0, 18.0, 25.0, 16.0, 28.0, 42.0, 35.0, 28.0, 39.0, 40.0, 39.0, 43.0, 32.0, 52.0, 46.0, 44.0, 48.0, 35.0, 33.0, 40.0, 37.0, 27.0, 35.0, 32.0, 20.0, 17.0, 13.0, 21.0, 9.0, 4.0, 5.0, 8.0, 4.0, 7.0, 5.0, 2.0, 5.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.643497467041016, -30.758874893188477, -29.874250411987305, -28.989627838134766, -28.105003356933594, -27.220380783081055, -26.335758209228516, -25.451133728027344, -24.566509246826172, -23.681886672973633, -22.79726219177246, -21.912639617919922, -21.02801513671875, -20.14339256286621, -19.258769989013672, -18.3741455078125, -17.48952293395996, -16.604900360107422, -15.72027587890625, -14.835653305053711, -13.951028823852539, -13.06640625, -12.181782722473145, -11.297159194946289, -10.412535667419434, -9.527912139892578, -8.643288612365723, -7.758665561676025, -6.87404203414917, -5.9894185066223145, -5.104795455932617, -4.220171928405762, -3.3355484008789062, -2.450924873352051, -1.5663015842437744, -0.681678295135498, 0.20294523239135742, 1.087568759918213, 1.9721918106079102, 2.8568153381347656, 3.741438865661621, 4.626062393188477, 5.510685920715332, 6.395308971405029, 7.279932498931885, 8.164556503295898, 9.049179077148438, 9.933802604675293, 10.818426132202148, 11.703049659729004, 12.58767318725586, 13.472295761108398, 14.35692024230957, 15.24154281616211, 16.12616729736328, 17.01078987121582, 17.89541244506836, 18.7800350189209, 19.66465950012207, 20.54928207397461, 21.43390655517578, 22.31852912902832, 23.20315170288086, 24.08777618408203, 24.972400665283203]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 1.0, 3.0, 5.0, 7.0, 11.0, 5.0, 11.0, 10.0, 13.0, 12.0, 13.0, 18.0, 13.0, 16.0, 30.0, 32.0, 29.0, 24.0, 40.0, 22.0, 35.0, 28.0, 31.0, 29.0, 29.0, 43.0, 28.0, 35.0, 33.0, 36.0, 28.0, 36.0, 24.0, 29.0, 31.0, 23.0, 15.0, 16.0, 24.0, 22.0, 25.0, 14.0, 20.0, 11.0, 5.0, 4.0, 7.0, 13.0, 3.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.720094680786133, -23.941967010498047, -23.16383934020996, -22.385711669921875, -21.607582092285156, -20.82945442199707, -20.051326751708984, -19.2731990814209, -18.495071411132812, -17.716943740844727, -16.93881607055664, -16.160686492919922, -15.382559776306152, -14.60443115234375, -13.826303482055664, -13.048175811767578, -12.270047187805176, -11.49191951751709, -10.713790893554688, -9.935663223266602, -9.157535552978516, -8.37940788269043, -7.601279258728027, -6.823151588439941, -6.045023441314697, -5.266895294189453, -4.488767623901367, -3.710639476776123, -2.932511568069458, -2.154383659362793, -1.3762555122375488, -0.5981278419494629, 0.18000030517578125, 0.9581282734870911, 1.7362562417984009, 2.5143842697143555, 3.2925121784210205, 4.0706400871276855, 4.84876823425293, 5.626895904541016, 6.40502405166626, 7.183152198791504, 7.96127986907959, 8.739408493041992, 9.517536163330078, 10.295663833618164, 11.07379150390625, 11.851919174194336, 12.630047798156738, 13.408175468444824, 14.186304092407227, 14.964431762695312, 15.742559432983398, 16.520687103271484, 17.298816680908203, 18.076942443847656, 18.855072021484375, 19.63319969177246, 20.411327362060547, 21.189456939697266, 21.96758460998535, 22.745712280273438, 23.523839950561523, 24.30196762084961, 25.080095291137695]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 5.0, 12.0, 26.0, 39.0, 53.0, 91.0, 168.0, 239.0, 382.0, 572.0, 862.0, 1418.0, 2101.0, 3125.0, 4697.0, 7187.0, 10206.0, 14584.0, 20008.0, 27101.0, 36231.0, 46361.0, 57024.0, 67317.0, 76638.0, 83795.0, 85711.0, 84820.0, 80603.0, 72113.0, 62484.0, 51322.0, 41158.0, 31350.0, 23571.0, 17177.0, 12538.0, 8578.0, 5726.0, 3885.0, 2552.0, 1734.0, 1104.0, 692.0, 443.0, 289.0, 175.0, 95.0, 75.0, 51.0, 35.0, 14.0, 9.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-15.578125, -15.071533203125, -14.56494140625, -14.058349609375, -13.5517578125, -13.045166015625, -12.53857421875, -12.031982421875, -11.525390625, -11.018798828125, -10.51220703125, -10.005615234375, -9.4990234375, -8.992431640625, -8.48583984375, -7.979248046875, -7.47265625, -6.966064453125, -6.45947265625, -5.952880859375, -5.4462890625, -4.939697265625, -4.43310546875, -3.926513671875, -3.419921875, -2.913330078125, -2.40673828125, -1.900146484375, -1.3935546875, -0.886962890625, -0.38037109375, 0.126220703125, 0.6328125, 1.139404296875, 1.64599609375, 2.152587890625, 2.6591796875, 3.165771484375, 3.67236328125, 4.178955078125, 4.685546875, 5.192138671875, 5.69873046875, 6.205322265625, 6.7119140625, 7.218505859375, 7.72509765625, 8.231689453125, 8.73828125, 9.244873046875, 9.75146484375, 10.258056640625, 10.7646484375, 11.271240234375, 11.77783203125, 12.284423828125, 12.791015625, 13.297607421875, 13.80419921875, 14.310791015625, 14.8173828125, 15.323974609375, 15.83056640625, 16.337158203125, 16.84375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 1.0, 3.0, 5.0, 7.0, 10.0, 7.0, 9.0, 13.0, 11.0, 13.0, 15.0, 17.0, 13.0, 22.0, 28.0, 29.0, 32.0, 20.0, 40.0, 23.0, 35.0, 26.0, 36.0, 26.0, 34.0, 42.0, 25.0, 38.0, 33.0, 31.0, 29.0, 36.0, 23.0, 30.0, 30.0, 22.0, 18.0, 16.0, 21.0, 25.0, 20.0, 16.0, 19.0, 11.0, 5.0, 5.0, 9.0, 10.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.90625, -23.151611328125, -22.39697265625, -21.642333984375, -20.8876953125, -20.133056640625, -19.37841796875, -18.623779296875, -17.869140625, -17.114501953125, -16.35986328125, -15.605224609375, -14.8505859375, -14.095947265625, -13.34130859375, -12.586669921875, -11.83203125, -11.077392578125, -10.32275390625, -9.568115234375, -8.8134765625, -8.058837890625, -7.30419921875, -6.549560546875, -5.794921875, -5.040283203125, -4.28564453125, -3.531005859375, -2.7763671875, -2.021728515625, -1.26708984375, -0.512451171875, 0.2421875, 0.996826171875, 1.75146484375, 2.506103515625, 3.2607421875, 4.015380859375, 4.77001953125, 5.524658203125, 6.279296875, 7.033935546875, 7.78857421875, 8.543212890625, 9.2978515625, 10.052490234375, 10.80712890625, 11.561767578125, 12.31640625, 13.071044921875, 13.82568359375, 14.580322265625, 15.3349609375, 16.089599609375, 16.84423828125, 17.598876953125, 18.353515625, 19.108154296875, 19.86279296875, 20.617431640625, 21.3720703125, 22.126708984375, 22.88134765625, 23.635986328125, 24.390625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 11.0, 8.0, 22.0, 46.0, 65.0, 107.0, 171.0, 275.0, 468.0, 794.0, 1160.0, 1801.0, 2720.0, 4272.0, 6435.0, 9451.0, 13614.0, 19451.0, 26840.0, 35967.0, 46534.0, 58979.0, 70041.0, 80267.0, 87229.0, 89786.0, 88658.0, 82629.0, 73086.0, 61715.0, 50199.0, 39046.0, 29614.0, 21299.0, 15044.0, 10459.0, 7114.0, 4693.0, 2994.0, 1989.0, 1310.0, 823.0, 513.0, 315.0, 209.0, 120.0, 87.0, 49.0, 31.0, 15.0, 12.0, 10.0, 5.0, 2.0, 3.0, 3.0], "bins": [-17.078125, -16.5704345703125, -16.062744140625, -15.5550537109375, -15.04736328125, -14.5396728515625, -14.031982421875, -13.5242919921875, -13.0166015625, -12.5089111328125, -12.001220703125, -11.4935302734375, -10.98583984375, -10.4781494140625, -9.970458984375, -9.4627685546875, -8.955078125, -8.4473876953125, -7.939697265625, -7.4320068359375, -6.92431640625, -6.4166259765625, -5.908935546875, -5.4012451171875, -4.8935546875, -4.3858642578125, -3.878173828125, -3.3704833984375, -2.86279296875, -2.3551025390625, -1.847412109375, -1.3397216796875, -0.83203125, -0.3243408203125, 0.183349609375, 0.6910400390625, 1.19873046875, 1.7064208984375, 2.214111328125, 2.7218017578125, 3.2294921875, 3.7371826171875, 4.244873046875, 4.7525634765625, 5.26025390625, 5.7679443359375, 6.275634765625, 6.7833251953125, 7.291015625, 7.7987060546875, 8.306396484375, 8.8140869140625, 9.32177734375, 9.8294677734375, 10.337158203125, 10.8448486328125, 11.3525390625, 11.8602294921875, 12.367919921875, 12.8756103515625, 13.38330078125, 13.8909912109375, 14.398681640625, 14.9063720703125, 15.4140625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 3.0, 8.0, 11.0, 9.0, 16.0, 17.0, 15.0, 17.0, 28.0, 32.0, 41.0, 34.0, 29.0, 28.0, 36.0, 59.0, 38.0, 45.0, 39.0, 45.0, 39.0, 51.0, 42.0, 36.0, 28.0, 41.0, 29.0, 37.0, 24.0, 27.0, 19.0, 11.0, 10.0, 13.0, 8.0, 5.0, 10.0, 6.0, 6.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.109375, -17.49658203125, -16.8837890625, -16.27099609375, -15.658203125, -15.04541015625, -14.4326171875, -13.81982421875, -13.20703125, -12.59423828125, -11.9814453125, -11.36865234375, -10.755859375, -10.14306640625, -9.5302734375, -8.91748046875, -8.3046875, -7.69189453125, -7.0791015625, -6.46630859375, -5.853515625, -5.24072265625, -4.6279296875, -4.01513671875, -3.40234375, -2.78955078125, -2.1767578125, -1.56396484375, -0.951171875, -0.33837890625, 0.2744140625, 0.88720703125, 1.5, 2.11279296875, 2.7255859375, 3.33837890625, 3.951171875, 4.56396484375, 5.1767578125, 5.78955078125, 6.40234375, 7.01513671875, 7.6279296875, 8.24072265625, 8.853515625, 9.46630859375, 10.0791015625, 10.69189453125, 11.3046875, 11.91748046875, 12.5302734375, 13.14306640625, 13.755859375, 14.36865234375, 14.9814453125, 15.59423828125, 16.20703125, 16.81982421875, 17.4326171875, 18.04541015625, 18.658203125, 19.27099609375, 19.8837890625, 20.49658203125, 21.109375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 8.0, 8.0, 10.0, 19.0, 9.0, 43.0, 58.0, 84.0, 122.0, 221.0, 316.0, 536.0, 853.0, 1383.0, 2371.0, 3968.0, 6597.0, 10802.0, 17719.0, 28864.0, 45558.0, 68140.0, 93097.0, 117779.0, 131816.0, 131266.0, 115462.0, 91177.0, 65316.0, 44234.0, 27668.0, 17175.0, 10257.0, 6094.0, 3674.0, 2259.0, 1342.0, 860.0, 492.0, 312.0, 227.0, 121.0, 76.0, 53.0, 36.0, 19.0, 24.0, 14.0, 11.0, 5.0, 2.0, 5.0, 1.0, 0.0, 2.0], "bins": [-10.7265625, -10.41064453125, -10.0947265625, -9.77880859375, -9.462890625, -9.14697265625, -8.8310546875, -8.51513671875, -8.19921875, -7.88330078125, -7.5673828125, -7.25146484375, -6.935546875, -6.61962890625, -6.3037109375, -5.98779296875, -5.671875, -5.35595703125, -5.0400390625, -4.72412109375, -4.408203125, -4.09228515625, -3.7763671875, -3.46044921875, -3.14453125, -2.82861328125, -2.5126953125, -2.19677734375, -1.880859375, -1.56494140625, -1.2490234375, -0.93310546875, -0.6171875, -0.30126953125, 0.0146484375, 0.33056640625, 0.646484375, 0.96240234375, 1.2783203125, 1.59423828125, 1.91015625, 2.22607421875, 2.5419921875, 2.85791015625, 3.173828125, 3.48974609375, 3.8056640625, 4.12158203125, 4.4375, 4.75341796875, 5.0693359375, 5.38525390625, 5.701171875, 6.01708984375, 6.3330078125, 6.64892578125, 6.96484375, 7.28076171875, 7.5966796875, 7.91259765625, 8.228515625, 8.54443359375, 8.8603515625, 9.17626953125, 9.4921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 4.0, 4.0, 11.0, 16.0, 15.0, 20.0, 33.0, 24.0, 39.0, 46.0, 55.0, 46.0, 53.0, 70.0, 68.0, 62.0, 62.0, 64.0, 38.0, 43.0, 43.0, 35.0, 36.0, 20.0, 26.0, 12.0, 13.0, 11.0, 10.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010528564453125, -0.0010097026824951172, -0.0009665489196777344, -0.0009233951568603516, -0.0008802413940429688, -0.0008370876312255859, -0.0007939338684082031, -0.0007507801055908203, -0.0007076263427734375, -0.0006644725799560547, -0.0006213188171386719, -0.0005781650543212891, -0.0005350112915039062, -0.0004918575286865234, -0.0004487037658691406, -0.0004055500030517578, -0.000362396240234375, -0.0003192424774169922, -0.0002760887145996094, -0.00023293495178222656, -0.00018978118896484375, -0.00014662742614746094, -0.00010347366333007812, -6.031990051269531e-05, -1.71661376953125e-05, 2.5987625122070312e-05, 6.914138793945312e-05, 0.00011229515075683594, 0.00015544891357421875, 0.00019860267639160156, 0.00024175643920898438, 0.0002849102020263672, 0.00032806396484375, 0.0003712177276611328, 0.0004143714904785156, 0.00045752525329589844, 0.0005006790161132812, 0.0005438327789306641, 0.0005869865417480469, 0.0006301403045654297, 0.0006732940673828125, 0.0007164478302001953, 0.0007596015930175781, 0.0008027553558349609, 0.0008459091186523438, 0.0008890628814697266, 0.0009322166442871094, 0.0009753704071044922, 0.001018524169921875, 0.0010616779327392578, 0.0011048316955566406, 0.0011479854583740234, 0.0011911392211914062, 0.001234292984008789, 0.0012774467468261719, 0.0013206005096435547, 0.0013637542724609375, 0.0014069080352783203, 0.0014500617980957031, 0.001493215560913086, 0.0015363693237304688, 0.0015795230865478516, 0.0016226768493652344, 0.0016658306121826172, 0.001708984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 6.0, 14.0, 19.0, 24.0, 29.0, 49.0, 64.0, 106.0, 135.0, 251.0, 384.0, 635.0, 1024.0, 1689.0, 2907.0, 4940.0, 8529.0, 14682.0, 25346.0, 41699.0, 65526.0, 95189.0, 124760.0, 143681.0, 142316.0, 122331.0, 92349.0, 62897.0, 39536.0, 24008.0, 14025.0, 7928.0, 4599.0, 2700.0, 1614.0, 963.0, 547.0, 364.0, 228.0, 151.0, 105.0, 73.0, 45.0, 38.0, 20.0, 17.0, 5.0, 5.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0546875, -11.6773681640625, -11.300048828125, -10.9227294921875, -10.54541015625, -10.1680908203125, -9.790771484375, -9.4134521484375, -9.0361328125, -8.6588134765625, -8.281494140625, -7.9041748046875, -7.52685546875, -7.1495361328125, -6.772216796875, -6.3948974609375, -6.017578125, -5.6402587890625, -5.262939453125, -4.8856201171875, -4.50830078125, -4.1309814453125, -3.753662109375, -3.3763427734375, -2.9990234375, -2.6217041015625, -2.244384765625, -1.8670654296875, -1.48974609375, -1.1124267578125, -0.735107421875, -0.3577880859375, 0.01953125, 0.3968505859375, 0.774169921875, 1.1514892578125, 1.52880859375, 1.9061279296875, 2.283447265625, 2.6607666015625, 3.0380859375, 3.4154052734375, 3.792724609375, 4.1700439453125, 4.54736328125, 4.9246826171875, 5.302001953125, 5.6793212890625, 6.056640625, 6.4339599609375, 6.811279296875, 7.1885986328125, 7.56591796875, 7.9432373046875, 8.320556640625, 8.6978759765625, 9.0751953125, 9.4525146484375, 9.829833984375, 10.2071533203125, 10.58447265625, 10.9617919921875, 11.339111328125, 11.7164306640625, 12.09375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 8.0, 6.0, 14.0, 12.0, 12.0, 15.0, 16.0, 24.0, 28.0, 34.0, 33.0, 44.0, 47.0, 50.0, 57.0, 72.0, 58.0, 54.0, 60.0, 49.0, 45.0, 40.0, 37.0, 34.0, 35.0, 29.0, 20.0, 15.0, 14.0, 9.0, 6.0, 6.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0625, -4.88653564453125, -4.7105712890625, -4.53460693359375, -4.358642578125, -4.18267822265625, -4.0067138671875, -3.83074951171875, -3.65478515625, -3.47882080078125, -3.3028564453125, -3.12689208984375, -2.950927734375, -2.77496337890625, -2.5989990234375, -2.42303466796875, -2.2470703125, -2.07110595703125, -1.8951416015625, -1.71917724609375, -1.543212890625, -1.36724853515625, -1.1912841796875, -1.01531982421875, -0.83935546875, -0.66339111328125, -0.4874267578125, -0.31146240234375, -0.135498046875, 0.04046630859375, 0.2164306640625, 0.39239501953125, 0.568359375, 0.74432373046875, 0.9202880859375, 1.09625244140625, 1.272216796875, 1.44818115234375, 1.6241455078125, 1.80010986328125, 1.97607421875, 2.15203857421875, 2.3280029296875, 2.50396728515625, 2.679931640625, 2.85589599609375, 3.0318603515625, 3.20782470703125, 3.3837890625, 3.55975341796875, 3.7357177734375, 3.91168212890625, 4.087646484375, 4.26361083984375, 4.4395751953125, 4.61553955078125, 4.79150390625, 4.96746826171875, 5.1434326171875, 5.31939697265625, 5.495361328125, 5.67132568359375, 5.8472900390625, 6.02325439453125, 6.19921875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 7.0, 11.0, 9.0, 12.0, 25.0, 26.0, 22.0, 15.0, 23.0, 26.0, 32.0, 46.0, 35.0, 41.0, 44.0, 52.0, 50.0, 38.0, 43.0, 46.0, 41.0, 37.0, 41.0, 39.0, 38.0, 37.0, 27.0, 19.0, 22.0, 15.0, 18.0, 11.0, 8.0, 2.0, 9.0, 10.0, 4.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-30.67168426513672, -29.784299850463867, -28.896913528442383, -28.00952911376953, -27.12214469909668, -26.234758377075195, -25.347373962402344, -24.45998764038086, -23.572603225708008, -22.685218811035156, -21.797832489013672, -20.91044807434082, -20.02306365966797, -19.135677337646484, -18.248292922973633, -17.36090850830078, -16.473522186279297, -15.586136817932129, -14.698752403259277, -13.81136703491211, -12.923981666564941, -12.036596298217773, -11.149211883544922, -10.261826515197754, -9.374443054199219, -8.48705768585205, -7.599672794342041, -6.712287902832031, -5.824902534484863, -4.9375176429748535, -4.050132751464844, -3.162747383117676, -2.275362014770508, -1.387976884841919, -0.5005918741226196, 0.3867931365966797, 1.2741782665252686, 2.1615633964538574, 3.048948287963867, 3.936333656311035, 4.823718547821045, 5.711103439331055, 6.598488807678223, 7.485873699188232, 8.373258590698242, 9.26064395904541, 10.148029327392578, 11.03541374206543, 11.922799110412598, 12.810184478759766, 13.697568893432617, 14.584954261779785, 15.472339630126953, 16.359724044799805, 17.247108459472656, 18.13449478149414, 19.021879196166992, 19.909263610839844, 20.796649932861328, 21.68403434753418, 22.57141876220703, 23.458805084228516, 24.346189498901367, 25.23357391357422, 26.120960235595703]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 10.0, 6.0, 5.0, 3.0, 10.0, 13.0, 11.0, 16.0, 12.0, 16.0, 20.0, 16.0, 14.0, 38.0, 31.0, 27.0, 35.0, 32.0, 34.0, 29.0, 25.0, 30.0, 33.0, 38.0, 44.0, 40.0, 35.0, 40.0, 33.0, 28.0, 35.0, 33.0, 27.0, 27.0, 21.0, 21.0, 19.0, 15.0, 12.0, 14.0, 12.0, 14.0, 10.0, 9.0, 3.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.14889907836914, -25.28321647644043, -24.41753387451172, -23.551849365234375, -22.686166763305664, -21.820484161376953, -20.954801559448242, -20.08911895751953, -19.223434448242188, -18.357751846313477, -17.492069244384766, -16.626384735107422, -15.760702133178711, -14.89501953125, -14.029336929321289, -13.163654327392578, -12.297971725463867, -11.432289123535156, -10.566605567932129, -9.700922966003418, -8.83523941040039, -7.96955680847168, -7.103874206542969, -6.2381911277771, -5.3725080490112305, -4.506824970245361, -3.6411421298980713, -2.7754592895507812, -1.909776210784912, -1.044093132019043, -0.17841053009033203, 0.6872725486755371, 1.5529556274414062, 2.4186387062072754, 3.2843215465545654, 4.1500043869018555, 5.015687465667725, 5.881370544433594, 6.747053146362305, 7.612736225128174, 8.478419303894043, 9.344101905822754, 10.209785461425781, 11.075468063354492, 11.941150665283203, 12.80683422088623, 13.672516822814941, 14.538200378417969, 15.40388298034668, 16.26956558227539, 17.1352481842041, 18.000930786132812, 18.866615295410156, 19.732297897338867, 20.597980499267578, 21.46366310119629, 22.329345703125, 23.19502830505371, 24.060710906982422, 24.926395416259766, 25.792078018188477, 26.657760620117188, 27.5234432220459, 28.38912582397461, 29.254810333251953]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 4.0, 9.0, 4.0, 9.0, 20.0, 45.0, 78.0, 132.0, 228.0, 386.0, 610.0, 990.0, 1664.0, 2737.0, 4537.0, 7396.0, 12185.0, 19708.0, 31434.0, 49506.0, 76303.0, 114807.0, 166750.0, 230963.0, 303806.0, 374717.0, 424980.0, 448868.0, 434378.0, 387794.0, 319232.0, 246137.0, 179279.0, 124580.0, 84231.0, 54454.0, 34896.0, 21599.0, 13606.0, 8378.0, 5067.0, 3136.0, 1783.0, 1135.0, 681.0, 407.0, 259.0, 133.0, 103.0, 53.0, 35.0, 23.0, 21.0, 9.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-19.765625, -19.119873046875, -18.47412109375, -17.828369140625, -17.1826171875, -16.536865234375, -15.89111328125, -15.245361328125, -14.599609375, -13.953857421875, -13.30810546875, -12.662353515625, -12.0166015625, -11.370849609375, -10.72509765625, -10.079345703125, -9.43359375, -8.787841796875, -8.14208984375, -7.496337890625, -6.8505859375, -6.204833984375, -5.55908203125, -4.913330078125, -4.267578125, -3.621826171875, -2.97607421875, -2.330322265625, -1.6845703125, -1.038818359375, -0.39306640625, 0.252685546875, 0.8984375, 1.544189453125, 2.18994140625, 2.835693359375, 3.4814453125, 4.127197265625, 4.77294921875, 5.418701171875, 6.064453125, 6.710205078125, 7.35595703125, 8.001708984375, 8.6474609375, 9.293212890625, 9.93896484375, 10.584716796875, 11.23046875, 11.876220703125, 12.52197265625, 13.167724609375, 13.8134765625, 14.459228515625, 15.10498046875, 15.750732421875, 16.396484375, 17.042236328125, 17.68798828125, 18.333740234375, 18.9794921875, 19.625244140625, 20.27099609375, 20.916748046875, 21.5625]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 10.0, 7.0, 3.0, 7.0, 7.0, 14.0, 11.0, 14.0, 14.0, 16.0, 18.0, 18.0, 15.0, 33.0, 30.0, 35.0, 39.0, 25.0, 38.0, 28.0, 28.0, 20.0, 42.0, 37.0, 41.0, 37.0, 40.0, 39.0, 30.0, 26.0, 34.0, 40.0, 29.0, 20.0, 23.0, 25.0, 23.0, 17.0, 6.0, 10.0, 12.0, 17.0, 11.0, 8.0, 1.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.296875, -22.5283203125, -21.759765625, -20.9912109375, -20.22265625, -19.4541015625, -18.685546875, -17.9169921875, -17.1484375, -16.3798828125, -15.611328125, -14.8427734375, -14.07421875, -13.3056640625, -12.537109375, -11.7685546875, -11.0, -10.2314453125, -9.462890625, -8.6943359375, -7.92578125, -7.1572265625, -6.388671875, -5.6201171875, -4.8515625, -4.0830078125, -3.314453125, -2.5458984375, -1.77734375, -1.0087890625, -0.240234375, 0.5283203125, 1.296875, 2.0654296875, 2.833984375, 3.6025390625, 4.37109375, 5.1396484375, 5.908203125, 6.6767578125, 7.4453125, 8.2138671875, 8.982421875, 9.7509765625, 10.51953125, 11.2880859375, 12.056640625, 12.8251953125, 13.59375, 14.3623046875, 15.130859375, 15.8994140625, 16.66796875, 17.4365234375, 18.205078125, 18.9736328125, 19.7421875, 20.5107421875, 21.279296875, 22.0478515625, 22.81640625, 23.5849609375, 24.353515625, 25.1220703125, 25.890625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 12.0, 6.0, 25.0, 27.0, 47.0, 62.0, 131.0, 206.0, 373.0, 559.0, 897.0, 1505.0, 2432.0, 3811.0, 6219.0, 9800.0, 15367.0, 23716.0, 36637.0, 54675.0, 80153.0, 114323.0, 156314.0, 207545.0, 263693.0, 316918.0, 361214.0, 386821.0, 390399.0, 369271.0, 329439.0, 279303.0, 222557.0, 169974.0, 125484.0, 88487.0, 60963.0, 41200.0, 26743.0, 17261.0, 11140.0, 6912.0, 4451.0, 2769.0, 1757.0, 1035.0, 623.0, 413.0, 243.0, 152.0, 79.0, 51.0, 46.0, 23.0, 20.0, 2.0, 5.0, 5.0, 0.0, 1.0], "bins": [-20.0, -19.377685546875, -18.75537109375, -18.133056640625, -17.5107421875, -16.888427734375, -16.26611328125, -15.643798828125, -15.021484375, -14.399169921875, -13.77685546875, -13.154541015625, -12.5322265625, -11.909912109375, -11.28759765625, -10.665283203125, -10.04296875, -9.420654296875, -8.79833984375, -8.176025390625, -7.5537109375, -6.931396484375, -6.30908203125, -5.686767578125, -5.064453125, -4.442138671875, -3.81982421875, -3.197509765625, -2.5751953125, -1.952880859375, -1.33056640625, -0.708251953125, -0.0859375, 0.536376953125, 1.15869140625, 1.781005859375, 2.4033203125, 3.025634765625, 3.64794921875, 4.270263671875, 4.892578125, 5.514892578125, 6.13720703125, 6.759521484375, 7.3818359375, 8.004150390625, 8.62646484375, 9.248779296875, 9.87109375, 10.493408203125, 11.11572265625, 11.738037109375, 12.3603515625, 12.982666015625, 13.60498046875, 14.227294921875, 14.849609375, 15.471923828125, 16.09423828125, 16.716552734375, 17.3388671875, 17.961181640625, 18.58349609375, 19.205810546875, 19.828125]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 8.0, 7.0, 11.0, 9.0, 19.0, 32.0, 29.0, 33.0, 47.0, 59.0, 64.0, 106.0, 122.0, 119.0, 138.0, 152.0, 146.0, 214.0, 206.0, 205.0, 198.0, 253.0, 226.0, 208.0, 186.0, 191.0, 176.0, 145.0, 142.0, 118.0, 91.0, 74.0, 79.0, 68.0, 54.0, 34.0, 22.0, 25.0, 17.0, 18.0, 13.0, 6.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.3046875, -12.9056396484375, -12.506591796875, -12.1075439453125, -11.70849609375, -11.3094482421875, -10.910400390625, -10.5113525390625, -10.1123046875, -9.7132568359375, -9.314208984375, -8.9151611328125, -8.51611328125, -8.1170654296875, -7.718017578125, -7.3189697265625, -6.919921875, -6.5208740234375, -6.121826171875, -5.7227783203125, -5.32373046875, -4.9246826171875, -4.525634765625, -4.1265869140625, -3.7275390625, -3.3284912109375, -2.929443359375, -2.5303955078125, -2.13134765625, -1.7322998046875, -1.333251953125, -0.9342041015625, -0.53515625, -0.1361083984375, 0.262939453125, 0.6619873046875, 1.06103515625, 1.4600830078125, 1.859130859375, 2.2581787109375, 2.6572265625, 3.0562744140625, 3.455322265625, 3.8543701171875, 4.25341796875, 4.6524658203125, 5.051513671875, 5.4505615234375, 5.849609375, 6.2486572265625, 6.647705078125, 7.0467529296875, 7.44580078125, 7.8448486328125, 8.243896484375, 8.6429443359375, 9.0419921875, 9.4410400390625, 9.840087890625, 10.2391357421875, 10.63818359375, 11.0372314453125, 11.436279296875, 11.8353271484375, 12.234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 3.0, 4.0, 13.0, 12.0, 7.0, 15.0, 11.0, 20.0, 18.0, 18.0, 31.0, 23.0, 30.0, 19.0, 27.0, 37.0, 33.0, 33.0, 27.0, 48.0, 40.0, 51.0, 53.0, 26.0, 43.0, 26.0, 25.0, 35.0, 42.0, 24.0, 18.0, 21.0, 27.0, 20.0, 10.0, 16.0, 15.0, 10.0, 12.0, 7.0, 10.0, 7.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 5.0, 1.0], "bins": [-26.77130889892578, -26.007795333862305, -25.244281768798828, -24.48076629638672, -23.717252731323242, -22.953739166259766, -22.19022560119629, -21.426712036132812, -20.663196563720703, -19.899682998657227, -19.13616943359375, -18.37265396118164, -17.609140396118164, -16.845626831054688, -16.08211326599121, -15.318599700927734, -14.555086135864258, -13.791572570800781, -13.028058052062988, -12.264544486999512, -11.501029968261719, -10.737516403198242, -9.974002838134766, -9.210489273071289, -8.446974754333496, -7.683460712432861, -6.919946670532227, -6.15643310546875, -5.392919063568115, -4.6294050216674805, -3.865891456604004, -3.102377414703369, -2.3388614654541016, -1.5753475427627563, -0.8118336200714111, -0.04831981658935547, 0.7151942253112793, 1.478708267211914, 2.2422218322753906, 3.0057358741760254, 3.76924991607666, 4.532763957977295, 5.29627799987793, 6.059791564941406, 6.823305606842041, 7.586819648742676, 8.350333213806152, 9.113847732543945, 9.877361297607422, 10.640874862670898, 11.404389381408691, 12.167902946472168, 12.931417465209961, 13.694931030273438, 14.458444595336914, 15.22195816040039, 15.985472679138184, 16.748987197875977, 17.512500762939453, 18.27601432800293, 19.039527893066406, 19.803043365478516, 20.56655502319336, 21.33007049560547, 22.093584060668945]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 4.0, 7.0, 7.0, 8.0, 7.0, 8.0, 12.0, 19.0, 19.0, 17.0, 27.0, 18.0, 26.0, 23.0, 32.0, 33.0, 24.0, 34.0, 36.0, 41.0, 41.0, 34.0, 50.0, 55.0, 38.0, 43.0, 33.0, 30.0, 35.0, 26.0, 36.0, 20.0, 28.0, 28.0, 25.0, 17.0, 5.0, 11.0, 7.0, 13.0, 11.0, 9.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.928504943847656, -26.996150970458984, -26.063796997070312, -25.131441116333008, -24.199087142944336, -23.266733169555664, -22.33437728881836, -21.402023315429688, -20.469669342041016, -19.537315368652344, -18.604961395263672, -17.672605514526367, -16.740251541137695, -15.807897567749023, -14.875542640686035, -13.943187713623047, -13.010833740234375, -12.078479766845703, -11.146124839782715, -10.213769912719727, -9.281415939331055, -8.349061965942383, -7.4167070388793945, -6.4843525886535645, -5.551998138427734, -4.619643688201904, -3.687289237976074, -2.754934787750244, -1.822580337524414, -0.890225887298584, 0.042128562927246094, 0.9744830131530762, 1.906839370727539, 2.839193820953369, 3.771548271179199, 4.703902721405029, 5.636257171630859, 6.5686116218566895, 7.5009660720825195, 8.433320999145508, 9.36567497253418, 10.298028945922852, 11.23038387298584, 12.162738800048828, 13.0950927734375, 14.027446746826172, 14.95980167388916, 15.892156600952148, 16.82451057434082, 17.756864547729492, 18.689220428466797, 19.62157440185547, 20.55392837524414, 21.486282348632812, 22.418636322021484, 23.35099220275879, 24.28334617614746, 25.215700149536133, 26.148056030273438, 27.08041000366211, 28.01276397705078, 28.945117950439453, 29.877471923828125, 30.80982780456543, 31.7421817779541]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 9.0, 6.0, 11.0, 22.0, 31.0, 50.0, 85.0, 138.0, 183.0, 317.0, 466.0, 685.0, 1076.0, 1726.0, 2535.0, 4087.0, 6243.0, 9229.0, 13838.0, 20438.0, 29338.0, 41030.0, 55222.0, 71862.0, 87981.0, 101186.0, 107353.0, 104368.0, 94102.0, 78984.0, 62254.0, 46460.0, 34243.0, 23979.0, 16470.0, 11115.0, 7428.0, 4854.0, 3251.0, 2045.0, 1321.0, 885.0, 610.0, 390.0, 237.0, 159.0, 105.0, 66.0, 33.0, 30.0, 11.0, 7.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.984375, -4.83203125, -4.6796875, -4.52734375, -4.375, -4.22265625, -4.0703125, -3.91796875, -3.765625, -3.61328125, -3.4609375, -3.30859375, -3.15625, -3.00390625, -2.8515625, -2.69921875, -2.546875, -2.39453125, -2.2421875, -2.08984375, -1.9375, -1.78515625, -1.6328125, -1.48046875, -1.328125, -1.17578125, -1.0234375, -0.87109375, -0.71875, -0.56640625, -0.4140625, -0.26171875, -0.109375, 0.04296875, 0.1953125, 0.34765625, 0.5, 0.65234375, 0.8046875, 0.95703125, 1.109375, 1.26171875, 1.4140625, 1.56640625, 1.71875, 1.87109375, 2.0234375, 2.17578125, 2.328125, 2.48046875, 2.6328125, 2.78515625, 2.9375, 3.08984375, 3.2421875, 3.39453125, 3.546875, 3.69921875, 3.8515625, 4.00390625, 4.15625, 4.30859375, 4.4609375, 4.61328125, 4.765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 7.0, 7.0, 8.0, 6.0, 8.0, 11.0, 19.0, 21.0, 17.0, 27.0, 18.0, 26.0, 23.0, 31.0, 32.0, 26.0, 34.0, 36.0, 44.0, 37.0, 35.0, 52.0, 56.0, 36.0, 42.0, 33.0, 32.0, 34.0, 25.0, 35.0, 20.0, 30.0, 27.0, 25.0, 16.0, 6.0, 9.0, 9.0, 13.0, 13.0, 7.0, 5.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.203125, -27.26806640625, -26.3330078125, -25.39794921875, -24.462890625, -23.52783203125, -22.5927734375, -21.65771484375, -20.72265625, -19.78759765625, -18.8525390625, -17.91748046875, -16.982421875, -16.04736328125, -15.1123046875, -14.17724609375, -13.2421875, -12.30712890625, -11.3720703125, -10.43701171875, -9.501953125, -8.56689453125, -7.6318359375, -6.69677734375, -5.76171875, -4.82666015625, -3.8916015625, -2.95654296875, -2.021484375, -1.08642578125, -0.1513671875, 0.78369140625, 1.71875, 2.65380859375, 3.5888671875, 4.52392578125, 5.458984375, 6.39404296875, 7.3291015625, 8.26416015625, 9.19921875, 10.13427734375, 11.0693359375, 12.00439453125, 12.939453125, 13.87451171875, 14.8095703125, 15.74462890625, 16.6796875, 17.61474609375, 18.5498046875, 19.48486328125, 20.419921875, 21.35498046875, 22.2900390625, 23.22509765625, 24.16015625, 25.09521484375, 26.0302734375, 26.96533203125, 27.900390625, 28.83544921875, 29.7705078125, 30.70556640625, 31.640625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 7.0, 18.0, 16.0, 18.0, 42.0, 65.0, 82.0, 130.0, 172.0, 302.0, 433.0, 680.0, 1051.0, 1642.0, 2588.0, 4007.0, 6557.0, 10663.0, 18179.0, 33939.0, 661836.0, 236326.0, 28594.0, 15656.0, 9435.0, 5836.0, 3742.0, 2378.0, 1481.0, 944.0, 613.0, 379.0, 247.0, 187.0, 105.0, 65.0, 38.0, 29.0, 28.0, 16.0, 9.0, 9.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.21875, -16.695068359375, -16.17138671875, -15.647705078125, -15.1240234375, -14.600341796875, -14.07666015625, -13.552978515625, -13.029296875, -12.505615234375, -11.98193359375, -11.458251953125, -10.9345703125, -10.410888671875, -9.88720703125, -9.363525390625, -8.83984375, -8.316162109375, -7.79248046875, -7.268798828125, -6.7451171875, -6.221435546875, -5.69775390625, -5.174072265625, -4.650390625, -4.126708984375, -3.60302734375, -3.079345703125, -2.5556640625, -2.031982421875, -1.50830078125, -0.984619140625, -0.4609375, 0.062744140625, 0.58642578125, 1.110107421875, 1.6337890625, 2.157470703125, 2.68115234375, 3.204833984375, 3.728515625, 4.252197265625, 4.77587890625, 5.299560546875, 5.8232421875, 6.346923828125, 6.87060546875, 7.394287109375, 7.91796875, 8.441650390625, 8.96533203125, 9.489013671875, 10.0126953125, 10.536376953125, 11.06005859375, 11.583740234375, 12.107421875, 12.631103515625, 13.15478515625, 13.678466796875, 14.2021484375, 14.725830078125, 15.24951171875, 15.773193359375, 16.296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 4.0, 3.0, 9.0, 11.0, 12.0, 17.0, 10.0, 27.0, 21.0, 23.0, 35.0, 23.0, 39.0, 34.0, 48.0, 48.0, 41.0, 43.0, 45.0, 48.0, 43.0, 44.0, 43.0, 45.0, 31.0, 33.0, 33.0, 29.0, 29.0, 20.0, 25.0, 19.0, 13.0, 9.0, 7.0, 7.0, 7.0, 5.0, 3.0, 5.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.859375, -23.171875, -22.484375, -21.796875, -21.109375, -20.421875, -19.734375, -19.046875, -18.359375, -17.671875, -16.984375, -16.296875, -15.609375, -14.921875, -14.234375, -13.546875, -12.859375, -12.171875, -11.484375, -10.796875, -10.109375, -9.421875, -8.734375, -8.046875, -7.359375, -6.671875, -5.984375, -5.296875, -4.609375, -3.921875, -3.234375, -2.546875, -1.859375, -1.171875, -0.484375, 0.203125, 0.890625, 1.578125, 2.265625, 2.953125, 3.640625, 4.328125, 5.015625, 5.703125, 6.390625, 7.078125, 7.765625, 8.453125, 9.140625, 9.828125, 10.515625, 11.203125, 11.890625, 12.578125, 13.265625, 13.953125, 14.640625, 15.328125, 16.015625, 16.703125, 17.390625, 18.078125, 18.765625, 19.453125, 20.140625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 1.0, 7.0, 10.0, 10.0, 12.0, 18.0, 42.0, 53.0, 67.0, 107.0, 133.0, 218.0, 328.0, 519.0, 797.0, 1179.0, 1821.0, 2943.0, 4759.0, 7615.0, 12694.0, 21945.0, 46710.0, 829595.0, 58432.0, 23450.0, 13467.0, 8062.0, 4846.0, 3115.0, 1946.0, 1224.0, 784.0, 543.0, 365.0, 230.0, 155.0, 100.0, 68.0, 57.0, 37.0, 29.0, 17.0, 15.0, 9.0, 8.0, 6.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.123046875, -1.085052490234375, -1.04705810546875, -1.009063720703125, -0.9710693359375, -0.933074951171875, -0.89508056640625, -0.857086181640625, -0.819091796875, -0.781097412109375, -0.74310302734375, -0.705108642578125, -0.6671142578125, -0.629119873046875, -0.59112548828125, -0.553131103515625, -0.51513671875, -0.477142333984375, -0.43914794921875, -0.401153564453125, -0.3631591796875, -0.325164794921875, -0.28717041015625, -0.249176025390625, -0.211181640625, -0.173187255859375, -0.13519287109375, -0.097198486328125, -0.0592041015625, -0.021209716796875, 0.01678466796875, 0.054779052734375, 0.0927734375, 0.130767822265625, 0.16876220703125, 0.206756591796875, 0.2447509765625, 0.282745361328125, 0.32073974609375, 0.358734130859375, 0.396728515625, 0.434722900390625, 0.47271728515625, 0.510711669921875, 0.5487060546875, 0.586700439453125, 0.62469482421875, 0.662689208984375, 0.70068359375, 0.738677978515625, 0.77667236328125, 0.814666748046875, 0.8526611328125, 0.890655517578125, 0.92864990234375, 0.966644287109375, 1.004638671875, 1.042633056640625, 1.08062744140625, 1.118621826171875, 1.1566162109375, 1.194610595703125, 1.23260498046875, 1.270599365234375, 1.30859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 8.0, 1.0, 1.0, 4.0, 5.0, 12.0, 13.0, 10.0, 11.0, 10.0, 22.0, 40.0, 28.0, 34.0, 45.0, 46.0, 55.0, 70.0, 56.0, 70.0, 67.0, 43.0, 65.0, 46.0, 49.0, 35.0, 28.0, 30.0, 26.0, 17.0, 14.0, 13.0, 9.0, 5.0, 7.0, 4.0, 8.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.698204040527344e-05, -5.5312179028987885e-05, -5.364231765270233e-05, -5.197245627641678e-05, -5.0302594900131226e-05, -4.863273352384567e-05, -4.696287214756012e-05, -4.529301077127457e-05, -4.3623149394989014e-05, -4.195328801870346e-05, -4.028342664241791e-05, -3.8613565266132355e-05, -3.69437038898468e-05, -3.527384251356125e-05, -3.3603981137275696e-05, -3.193411976099014e-05, -3.026425838470459e-05, -2.8594397008419037e-05, -2.6924535632133484e-05, -2.525467425584793e-05, -2.3584812879562378e-05, -2.1914951503276825e-05, -2.0245090126991272e-05, -1.857522875070572e-05, -1.6905367374420166e-05, -1.5235505998134613e-05, -1.356564462184906e-05, -1.1895783245563507e-05, -1.0225921869277954e-05, -8.556060492992401e-06, -6.886199116706848e-06, -5.216337740421295e-06, -3.546476364135742e-06, -1.8766149878501892e-06, -2.0675361156463623e-07, 1.4631077647209167e-06, 3.1329691410064697e-06, 4.802830517292023e-06, 6.472691893577576e-06, 8.142553269863129e-06, 9.812414646148682e-06, 1.1482276022434235e-05, 1.3152137398719788e-05, 1.482199877500534e-05, 1.6491860151290894e-05, 1.8161721527576447e-05, 1.9831582903862e-05, 2.1501444280147552e-05, 2.3171305656433105e-05, 2.484116703271866e-05, 2.651102840900421e-05, 2.8180889785289764e-05, 2.9850751161575317e-05, 3.152061253786087e-05, 3.319047391414642e-05, 3.4860335290431976e-05, 3.653019666671753e-05, 3.820005804300308e-05, 3.9869919419288635e-05, 4.153978079557419e-05, 4.320964217185974e-05, 4.4879503548145294e-05, 4.654936492443085e-05, 4.82192263007164e-05, 4.988908767700195e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 10.0, 11.0, 23.0, 25.0, 20.0, 46.0, 81.0, 142.0, 237.0, 353.0, 547.0, 909.0, 1408.0, 2378.0, 3603.0, 5627.0, 8901.0, 13512.0, 20398.0, 30041.0, 42633.0, 59928.0, 79906.0, 101401.0, 118076.0, 122311.0, 111662.0, 91838.0, 70666.0, 52078.0, 36897.0, 24928.0, 17062.0, 11143.0, 7026.0, 4762.0, 2941.0, 1899.0, 1145.0, 781.0, 422.0, 268.0, 180.0, 117.0, 81.0, 53.0, 35.0, 23.0, 17.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.896484375, -0.8678207397460938, -0.8391571044921875, -0.8104934692382812, -0.781829833984375, -0.7531661987304688, -0.7245025634765625, -0.6958389282226562, -0.66717529296875, -0.6385116577148438, -0.6098480224609375, -0.5811843872070312, -0.552520751953125, -0.5238571166992188, -0.4951934814453125, -0.46652984619140625, -0.4378662109375, -0.40920257568359375, -0.3805389404296875, -0.35187530517578125, -0.323211669921875, -0.29454803466796875, -0.2658843994140625, -0.23722076416015625, -0.20855712890625, -0.17989349365234375, -0.1512298583984375, -0.12256622314453125, -0.093902587890625, -0.06523895263671875, -0.0365753173828125, -0.00791168212890625, 0.020751953125, 0.04941558837890625, 0.0780792236328125, 0.10674285888671875, 0.135406494140625, 0.16407012939453125, 0.1927337646484375, 0.22139739990234375, 0.25006103515625, 0.27872467041015625, 0.3073883056640625, 0.33605194091796875, 0.364715576171875, 0.39337921142578125, 0.4220428466796875, 0.45070648193359375, 0.4793701171875, 0.5080337524414062, 0.5366973876953125, 0.5653610229492188, 0.594024658203125, 0.6226882934570312, 0.6513519287109375, 0.6800155639648438, 0.70867919921875, 0.7373428344726562, 0.7660064697265625, 0.7946701049804688, 0.823333740234375, 0.8519973754882812, 0.8806610107421875, 0.9093246459960938, 0.93798828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 5.0, 7.0, 12.0, 17.0, 15.0, 16.0, 28.0, 30.0, 40.0, 33.0, 41.0, 36.0, 52.0, 64.0, 59.0, 65.0, 54.0, 64.0, 44.0, 43.0, 57.0, 42.0, 30.0, 33.0, 37.0, 10.0, 12.0, 10.0, 5.0, 5.0, 7.0, 10.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58935546875, -0.5706710815429688, -0.5519866943359375, -0.5333023071289062, -0.514617919921875, -0.49593353271484375, -0.4772491455078125, -0.45856475830078125, -0.43988037109375, -0.42119598388671875, -0.4025115966796875, -0.38382720947265625, -0.365142822265625, -0.34645843505859375, -0.3277740478515625, -0.30908966064453125, -0.2904052734375, -0.27172088623046875, -0.2530364990234375, -0.23435211181640625, -0.215667724609375, -0.19698333740234375, -0.1782989501953125, -0.15961456298828125, -0.14093017578125, -0.12224578857421875, -0.1035614013671875, -0.08487701416015625, -0.066192626953125, -0.04750823974609375, -0.0288238525390625, -0.01013946533203125, 0.008544921875, 0.02722930908203125, 0.0459136962890625, 0.06459808349609375, 0.083282470703125, 0.10196685791015625, 0.1206512451171875, 0.13933563232421875, 0.15802001953125, 0.17670440673828125, 0.1953887939453125, 0.21407318115234375, 0.232757568359375, 0.25144195556640625, 0.2701263427734375, 0.28881072998046875, 0.3074951171875, 0.32617950439453125, 0.3448638916015625, 0.36354827880859375, 0.382232666015625, 0.40091705322265625, 0.4196014404296875, 0.43828582763671875, 0.45697021484375, 0.47565460205078125, 0.4943389892578125, 0.5130233764648438, 0.531707763671875, 0.5503921508789062, 0.5690765380859375, 0.5877609252929688, 0.6064453125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 2.0, 7.0, 13.0, 7.0, 11.0, 13.0, 12.0, 16.0, 16.0, 20.0, 20.0, 22.0, 31.0, 21.0, 21.0, 41.0, 30.0, 27.0, 38.0, 34.0, 42.0, 49.0, 47.0, 46.0, 27.0, 35.0, 33.0, 23.0, 30.0, 36.0, 26.0, 27.0, 21.0, 16.0, 21.0, 12.0, 15.0, 12.0, 12.0, 10.0, 11.0, 11.0, 8.0, 3.0, 6.0, 3.0, 4.0, 1.0, 1.0, 5.0], "bins": [-26.746143341064453, -25.995161056518555, -25.24418067932129, -24.49319839477539, -23.742218017578125, -22.991235733032227, -22.240253448486328, -21.489273071289062, -20.738290786743164, -19.987308502197266, -19.236328125, -18.4853458404541, -17.734365463256836, -16.983383178710938, -16.232402801513672, -15.481420516967773, -14.730439186096191, -13.97945785522461, -13.228476524353027, -12.477495193481445, -11.726512908935547, -10.975531578063965, -10.224550247192383, -9.473567962646484, -8.722587585449219, -7.971606254577637, -7.2206244468688965, -6.4696431159973145, -5.718661308288574, -4.967679977416992, -4.21669864654541, -3.46571683883667, -2.7147350311279297, -1.9637534618377686, -1.212772011756897, -0.4617905616760254, 0.28919100761413574, 1.0401725769042969, 1.791153907775879, 2.542135715484619, 3.293117046356201, 4.044098377227783, 4.795080184936523, 5.5460615158081055, 6.2970428466796875, 7.048024654388428, 7.79900598526001, 8.54998779296875, 9.300969123840332, 10.051950454711914, 10.802931785583496, 11.553913116455078, 12.304895401000977, 13.055876731872559, 13.80685806274414, 14.557840347290039, 15.308820724487305, 16.059803009033203, 16.81078338623047, 17.561765670776367, 18.312746047973633, 19.06372833251953, 19.814708709716797, 20.565690994262695, 21.316673278808594]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 7.0, 5.0, 8.0, 8.0, 5.0, 10.0, 17.0, 19.0, 20.0, 25.0, 17.0, 24.0, 30.0, 26.0, 30.0, 27.0, 34.0, 37.0, 38.0, 38.0, 39.0, 48.0, 49.0, 50.0, 34.0, 44.0, 26.0, 34.0, 29.0, 32.0, 22.0, 30.0, 34.0, 18.0, 20.0, 9.0, 4.0, 14.0, 12.0, 10.0, 10.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.60406494140625, -27.664897918701172, -26.72572898864746, -25.786561965942383, -24.847393035888672, -23.908226013183594, -22.969058990478516, -22.029890060424805, -21.090721130371094, -20.151554107666016, -19.212385177612305, -18.273218154907227, -17.334049224853516, -16.394882202148438, -15.455714225769043, -14.516546249389648, -13.57737922668457, -12.638211250305176, -11.699043273925781, -10.759876251220703, -9.820707321166992, -8.881540298461914, -7.9423723220825195, -7.003204345703125, -6.0640363693237305, -5.124868392944336, -4.185700416564941, -3.246532917022705, -2.3073649406433105, -1.368196964263916, -0.4290294647216797, 0.5101385116577148, 1.4493083953857422, 2.3884763717651367, 3.327644109725952, 4.266811847686768, 5.205979824066162, 6.145147800445557, 7.084315299987793, 8.023483276367188, 8.962651252746582, 9.901819229125977, 10.840987205505371, 11.780155181884766, 12.719322204589844, 13.658491134643555, 14.597658157348633, 15.536826133728027, 16.475994110107422, 17.4151611328125, 18.35433006286621, 19.29349708557129, 20.232666015625, 21.171833038330078, 22.111000061035156, 23.050168991088867, 23.989337921142578, 24.928504943847656, 25.867673873901367, 26.806840896606445, 27.746009826660156, 28.685176849365234, 29.624343872070312, 30.563512802124023, 31.5026798248291]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 8.0, 9.0, 14.0, 32.0, 35.0, 61.0, 98.0, 172.0, 262.0, 397.0, 672.0, 1033.0, 1526.0, 2416.0, 3672.0, 5204.0, 7708.0, 10959.0, 14953.0, 20152.0, 26877.0, 34895.0, 43534.0, 53045.0, 61903.0, 70332.0, 76421.0, 80295.0, 80272.0, 77105.0, 72336.0, 63568.0, 54694.0, 45383.0, 36570.0, 28235.0, 21513.0, 15822.0, 11502.0, 8152.0, 5639.0, 3811.0, 2498.0, 1712.0, 1145.0, 723.0, 461.0, 278.0, 167.0, 127.0, 72.0, 43.0, 20.0, 12.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-13.5234375, -13.0885009765625, -12.653564453125, -12.2186279296875, -11.78369140625, -11.3487548828125, -10.913818359375, -10.4788818359375, -10.0439453125, -9.6090087890625, -9.174072265625, -8.7391357421875, -8.30419921875, -7.8692626953125, -7.434326171875, -6.9993896484375, -6.564453125, -6.1295166015625, -5.694580078125, -5.2596435546875, -4.82470703125, -4.3897705078125, -3.954833984375, -3.5198974609375, -3.0849609375, -2.6500244140625, -2.215087890625, -1.7801513671875, -1.34521484375, -0.9102783203125, -0.475341796875, -0.0404052734375, 0.39453125, 0.8294677734375, 1.264404296875, 1.6993408203125, 2.13427734375, 2.5692138671875, 3.004150390625, 3.4390869140625, 3.8740234375, 4.3089599609375, 4.743896484375, 5.1788330078125, 5.61376953125, 6.0487060546875, 6.483642578125, 6.9185791015625, 7.353515625, 7.7884521484375, 8.223388671875, 8.6583251953125, 9.09326171875, 9.5281982421875, 9.963134765625, 10.3980712890625, 10.8330078125, 11.2679443359375, 11.702880859375, 12.1378173828125, 12.57275390625, 13.0076904296875, 13.442626953125, 13.8775634765625, 14.3125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 7.0, 6.0, 8.0, 7.0, 7.0, 10.0, 22.0, 17.0, 17.0, 23.0, 24.0, 21.0, 28.0, 29.0, 31.0, 27.0, 33.0, 35.0, 43.0, 34.0, 41.0, 50.0, 48.0, 49.0, 35.0, 38.0, 30.0, 34.0, 27.0, 31.0, 25.0, 29.0, 32.0, 18.0, 18.0, 9.0, 6.0, 12.0, 13.0, 7.0, 13.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.71875, -26.804931640625, -25.89111328125, -24.977294921875, -24.0634765625, -23.149658203125, -22.23583984375, -21.322021484375, -20.408203125, -19.494384765625, -18.58056640625, -17.666748046875, -16.7529296875, -15.839111328125, -14.92529296875, -14.011474609375, -13.09765625, -12.183837890625, -11.27001953125, -10.356201171875, -9.4423828125, -8.528564453125, -7.61474609375, -6.700927734375, -5.787109375, -4.873291015625, -3.95947265625, -3.045654296875, -2.1318359375, -1.218017578125, -0.30419921875, 0.609619140625, 1.5234375, 2.437255859375, 3.35107421875, 4.264892578125, 5.1787109375, 6.092529296875, 7.00634765625, 7.920166015625, 8.833984375, 9.747802734375, 10.66162109375, 11.575439453125, 12.4892578125, 13.403076171875, 14.31689453125, 15.230712890625, 16.14453125, 17.058349609375, 17.97216796875, 18.885986328125, 19.7998046875, 20.713623046875, 21.62744140625, 22.541259765625, 23.455078125, 24.368896484375, 25.28271484375, 26.196533203125, 27.1103515625, 28.024169921875, 28.93798828125, 29.851806640625, 30.765625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 16.0, 16.0, 30.0, 54.0, 117.0, 151.0, 296.0, 415.0, 708.0, 1206.0, 1855.0, 2838.0, 4422.0, 6948.0, 10094.0, 14873.0, 20856.0, 28414.0, 37978.0, 48550.0, 60632.0, 71775.0, 81223.0, 87487.0, 89480.0, 87255.0, 81430.0, 71425.0, 60091.0, 48061.0, 37783.0, 28459.0, 20608.0, 14538.0, 9867.0, 6574.0, 4312.0, 2836.0, 1845.0, 1189.0, 739.0, 433.0, 249.0, 159.0, 103.0, 71.0, 37.0, 22.0, 12.0, 10.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-15.5234375, -15.0455322265625, -14.567626953125, -14.0897216796875, -13.61181640625, -13.1339111328125, -12.656005859375, -12.1781005859375, -11.7001953125, -11.2222900390625, -10.744384765625, -10.2664794921875, -9.78857421875, -9.3106689453125, -8.832763671875, -8.3548583984375, -7.876953125, -7.3990478515625, -6.921142578125, -6.4432373046875, -5.96533203125, -5.4874267578125, -5.009521484375, -4.5316162109375, -4.0537109375, -3.5758056640625, -3.097900390625, -2.6199951171875, -2.14208984375, -1.6641845703125, -1.186279296875, -0.7083740234375, -0.23046875, 0.2474365234375, 0.725341796875, 1.2032470703125, 1.68115234375, 2.1590576171875, 2.636962890625, 3.1148681640625, 3.5927734375, 4.0706787109375, 4.548583984375, 5.0264892578125, 5.50439453125, 5.9822998046875, 6.460205078125, 6.9381103515625, 7.416015625, 7.8939208984375, 8.371826171875, 8.8497314453125, 9.32763671875, 9.8055419921875, 10.283447265625, 10.7613525390625, 11.2392578125, 11.7171630859375, 12.195068359375, 12.6729736328125, 13.15087890625, 13.6287841796875, 14.106689453125, 14.5845947265625, 15.0625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 8.0, 5.0, 8.0, 10.0, 8.0, 13.0, 9.0, 10.0, 22.0, 20.0, 28.0, 22.0, 29.0, 30.0, 33.0, 33.0, 35.0, 30.0, 47.0, 33.0, 29.0, 43.0, 40.0, 38.0, 34.0, 34.0, 25.0, 31.0, 38.0, 39.0, 34.0, 18.0, 33.0, 20.0, 17.0, 19.0, 18.0, 10.0, 9.0, 9.0, 9.0, 6.0, 6.0, 3.0, 1.0, 5.0, 0.0, 0.0, 4.0, 2.0, 1.0], "bins": [-19.75, -19.173583984375, -18.59716796875, -18.020751953125, -17.4443359375, -16.867919921875, -16.29150390625, -15.715087890625, -15.138671875, -14.562255859375, -13.98583984375, -13.409423828125, -12.8330078125, -12.256591796875, -11.68017578125, -11.103759765625, -10.52734375, -9.950927734375, -9.37451171875, -8.798095703125, -8.2216796875, -7.645263671875, -7.06884765625, -6.492431640625, -5.916015625, -5.339599609375, -4.76318359375, -4.186767578125, -3.6103515625, -3.033935546875, -2.45751953125, -1.881103515625, -1.3046875, -0.728271484375, -0.15185546875, 0.424560546875, 1.0009765625, 1.577392578125, 2.15380859375, 2.730224609375, 3.306640625, 3.883056640625, 4.45947265625, 5.035888671875, 5.6123046875, 6.188720703125, 6.76513671875, 7.341552734375, 7.91796875, 8.494384765625, 9.07080078125, 9.647216796875, 10.2236328125, 10.800048828125, 11.37646484375, 11.952880859375, 12.529296875, 13.105712890625, 13.68212890625, 14.258544921875, 14.8349609375, 15.411376953125, 15.98779296875, 16.564208984375, 17.140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 11.0, 23.0, 20.0, 47.0, 61.0, 85.0, 189.0, 284.0, 469.0, 802.0, 1394.0, 2311.0, 3877.0, 6388.0, 10580.0, 16854.0, 26730.0, 40275.0, 57635.0, 77668.0, 97853.0, 113391.0, 118680.0, 114934.0, 99766.0, 80926.0, 60427.0, 42653.0, 28113.0, 18141.0, 11159.0, 6824.0, 3916.0, 2392.0, 1461.0, 860.0, 509.0, 297.0, 211.0, 117.0, 84.0, 51.0, 31.0, 17.0, 16.0, 7.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.828125, -7.572021484375, -7.31591796875, -7.059814453125, -6.8037109375, -6.547607421875, -6.29150390625, -6.035400390625, -5.779296875, -5.523193359375, -5.26708984375, -5.010986328125, -4.7548828125, -4.498779296875, -4.24267578125, -3.986572265625, -3.73046875, -3.474365234375, -3.21826171875, -2.962158203125, -2.7060546875, -2.449951171875, -2.19384765625, -1.937744140625, -1.681640625, -1.425537109375, -1.16943359375, -0.913330078125, -0.6572265625, -0.401123046875, -0.14501953125, 0.111083984375, 0.3671875, 0.623291015625, 0.87939453125, 1.135498046875, 1.3916015625, 1.647705078125, 1.90380859375, 2.159912109375, 2.416015625, 2.672119140625, 2.92822265625, 3.184326171875, 3.4404296875, 3.696533203125, 3.95263671875, 4.208740234375, 4.46484375, 4.720947265625, 4.97705078125, 5.233154296875, 5.4892578125, 5.745361328125, 6.00146484375, 6.257568359375, 6.513671875, 6.769775390625, 7.02587890625, 7.281982421875, 7.5380859375, 7.794189453125, 8.05029296875, 8.306396484375, 8.5625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 7.0, 12.0, 3.0, 8.0, 9.0, 15.0, 10.0, 21.0, 16.0, 20.0, 21.0, 28.0, 34.0, 30.0, 41.0, 46.0, 52.0, 46.0, 51.0, 41.0, 40.0, 40.0, 42.0, 58.0, 34.0, 40.0, 39.0, 32.0, 24.0, 16.0, 28.0, 19.0, 12.0, 8.0, 9.0, 9.0, 14.0, 7.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00087738037109375, -0.0008480101823806763, -0.0008186399936676025, -0.0007892698049545288, -0.0007598996162414551, -0.0007305294275283813, -0.0007011592388153076, -0.0006717890501022339, -0.0006424188613891602, -0.0006130486726760864, -0.0005836784839630127, -0.000554308295249939, -0.0005249381065368652, -0.0004955679178237915, -0.0004661977291107178, -0.00043682754039764404, -0.0004074573516845703, -0.0003780871629714966, -0.00034871697425842285, -0.0003193467855453491, -0.0002899765968322754, -0.00026060640811920166, -0.00023123621940612793, -0.0002018660306930542, -0.00017249584197998047, -0.00014312565326690674, -0.00011375546455383301, -8.438527584075928e-05, -5.501508712768555e-05, -2.5644898414611816e-05, 3.725290298461914e-06, 3.3095479011535645e-05, 6.246566772460938e-05, 9.18358564376831e-05, 0.00012120604515075684, 0.00015057623386383057, 0.0001799464225769043, 0.00020931661128997803, 0.00023868680000305176, 0.0002680569887161255, 0.0002974271774291992, 0.00032679736614227295, 0.0003561675548553467, 0.0003855377435684204, 0.00041490793228149414, 0.00044427812099456787, 0.0004736483097076416, 0.0005030184984207153, 0.0005323886871337891, 0.0005617588758468628, 0.0005911290645599365, 0.0006204992532730103, 0.000649869441986084, 0.0006792396306991577, 0.0007086098194122314, 0.0007379800081253052, 0.0007673501968383789, 0.0007967203855514526, 0.0008260905742645264, 0.0008554607629776001, 0.0008848309516906738, 0.0009142011404037476, 0.0009435713291168213, 0.000972941517829895, 0.0010023117065429688]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 5.0, 13.0, 20.0, 27.0, 44.0, 78.0, 116.0, 219.0, 335.0, 503.0, 901.0, 1447.0, 2582.0, 4234.0, 6934.0, 11665.0, 18033.0, 28071.0, 41756.0, 58047.0, 77093.0, 94629.0, 108629.0, 114192.0, 110253.0, 98149.0, 81153.0, 61829.0, 44766.0, 30509.0, 20023.0, 12854.0, 7655.0, 4740.0, 2771.0, 1708.0, 1025.0, 616.0, 358.0, 247.0, 129.0, 82.0, 51.0, 28.0, 10.0, 14.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-9.1640625, -8.891357421875, -8.61865234375, -8.345947265625, -8.0732421875, -7.800537109375, -7.52783203125, -7.255126953125, -6.982421875, -6.709716796875, -6.43701171875, -6.164306640625, -5.8916015625, -5.618896484375, -5.34619140625, -5.073486328125, -4.80078125, -4.528076171875, -4.25537109375, -3.982666015625, -3.7099609375, -3.437255859375, -3.16455078125, -2.891845703125, -2.619140625, -2.346435546875, -2.07373046875, -1.801025390625, -1.5283203125, -1.255615234375, -0.98291015625, -0.710205078125, -0.4375, -0.164794921875, 0.10791015625, 0.380615234375, 0.6533203125, 0.926025390625, 1.19873046875, 1.471435546875, 1.744140625, 2.016845703125, 2.28955078125, 2.562255859375, 2.8349609375, 3.107666015625, 3.38037109375, 3.653076171875, 3.92578125, 4.198486328125, 4.47119140625, 4.743896484375, 5.0166015625, 5.289306640625, 5.56201171875, 5.834716796875, 6.107421875, 6.380126953125, 6.65283203125, 6.925537109375, 7.1982421875, 7.470947265625, 7.74365234375, 8.016357421875, 8.2890625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 1.0, 4.0, 3.0, 5.0, 9.0, 21.0, 15.0, 22.0, 16.0, 29.0, 19.0, 30.0, 31.0, 31.0, 39.0, 30.0, 46.0, 42.0, 37.0, 51.0, 35.0, 34.0, 39.0, 49.0, 55.0, 44.0, 46.0, 35.0, 38.0, 20.0, 24.0, 15.0, 15.0, 15.0, 17.0, 10.0, 6.0, 2.0, 6.0, 5.0, 4.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.08984375, -3.968109130859375, -3.84637451171875, -3.724639892578125, -3.6029052734375, -3.481170654296875, -3.35943603515625, -3.237701416015625, -3.115966796875, -2.994232177734375, -2.87249755859375, -2.750762939453125, -2.6290283203125, -2.507293701171875, -2.38555908203125, -2.263824462890625, -2.14208984375, -2.020355224609375, -1.89862060546875, -1.776885986328125, -1.6551513671875, -1.533416748046875, -1.41168212890625, -1.289947509765625, -1.168212890625, -1.046478271484375, -0.92474365234375, -0.803009033203125, -0.6812744140625, -0.559539794921875, -0.43780517578125, -0.316070556640625, -0.1943359375, -0.072601318359375, 0.04913330078125, 0.170867919921875, 0.2926025390625, 0.414337158203125, 0.53607177734375, 0.657806396484375, 0.779541015625, 0.901275634765625, 1.02301025390625, 1.144744873046875, 1.2664794921875, 1.388214111328125, 1.50994873046875, 1.631683349609375, 1.75341796875, 1.875152587890625, 1.99688720703125, 2.118621826171875, 2.2403564453125, 2.362091064453125, 2.48382568359375, 2.605560302734375, 2.727294921875, 2.849029541015625, 2.97076416015625, 3.092498779296875, 3.2142333984375, 3.335968017578125, 3.45770263671875, 3.579437255859375, 3.701171875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 7.0, 2.0, 6.0, 6.0, 8.0, 5.0, 11.0, 15.0, 9.0, 18.0, 15.0, 23.0, 17.0, 15.0, 23.0, 26.0, 35.0, 38.0, 42.0, 32.0, 26.0, 38.0, 45.0, 44.0, 43.0, 49.0, 33.0, 37.0, 39.0, 32.0, 32.0, 31.0, 31.0, 17.0, 20.0, 23.0, 16.0, 16.0, 11.0, 19.0, 10.0, 7.0, 9.0, 4.0, 5.0, 8.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.271846771240234, -25.466659545898438, -24.661470413208008, -23.85628318786621, -23.051095962524414, -22.245906829833984, -21.440719604492188, -20.63553237915039, -19.830345153808594, -19.025157928466797, -18.219968795776367, -17.41478157043457, -16.609594345092773, -15.80440616607666, -14.999217987060547, -14.19403076171875, -13.38884162902832, -12.583653450012207, -11.77846622467041, -10.973278045654297, -10.1680908203125, -9.362902641296387, -8.557714462280273, -7.752526760101318, -6.947339057922363, -6.142151355743408, -5.336963653564453, -4.53177547454834, -3.7265877723693848, -2.9214000701904297, -2.1162118911743164, -1.3110241889953613, -0.5058345794677734, 0.2993532419204712, 1.1045410633087158, 1.90972900390625, 2.714916706085205, 3.52010440826416, 4.325292587280273, 5.1304802894592285, 5.935667991638184, 6.740855693817139, 7.546043395996094, 8.351231575012207, 9.15641975402832, 9.961606979370117, 10.76679515838623, 11.571983337402344, 12.37717056274414, 13.182358741760254, 13.98754596710205, 14.792734146118164, 15.597921371459961, 16.40311050415039, 17.208297729492188, 18.013484954833984, 18.81867218017578, 19.623859405517578, 20.429048538208008, 21.234235763549805, 22.0394229888916, 22.84461212158203, 23.649799346923828, 24.454986572265625, 25.260175704956055]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 6.0, 8.0, 13.0, 10.0, 13.0, 16.0, 27.0, 22.0, 22.0, 21.0, 30.0, 28.0, 26.0, 37.0, 37.0, 44.0, 25.0, 47.0, 48.0, 38.0, 44.0, 42.0, 35.0, 35.0, 33.0, 38.0, 39.0, 22.0, 26.0, 27.0, 18.0, 20.0, 20.0, 13.0, 15.0, 12.0, 6.0, 8.0, 6.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.278982162475586, -30.311729431152344, -29.344478607177734, -28.377225875854492, -27.40997314453125, -26.44272232055664, -25.4754695892334, -24.508216857910156, -23.540964126586914, -22.573711395263672, -21.606460571289062, -20.63920783996582, -19.671955108642578, -18.70470428466797, -17.737451553344727, -16.770198822021484, -15.802947044372559, -14.835695266723633, -13.86844253540039, -12.901190757751465, -11.933938026428223, -10.966686248779297, -9.999433517456055, -9.032181739807129, -8.064929962158203, -7.097677707672119, -6.130425453186035, -5.163173675537109, -4.195920944213867, -3.2286691665649414, -2.2614169120788574, -1.2941646575927734, -0.32691192626953125, 0.640340268611908, 1.6075924634933472, 2.5748445987701416, 3.5420968532562256, 4.5093488693237305, 5.4766011238098145, 6.443853378295898, 7.411105632781982, 8.378357887268066, 9.345609664916992, 10.312862396240234, 11.28011417388916, 12.247365951538086, 13.214618682861328, 14.18187141418457, 15.149123191833496, 16.116374969482422, 17.083627700805664, 18.050880432128906, 19.018131256103516, 19.985383987426758, 20.95263671875, 21.91988754272461, 22.88714027404785, 23.854393005371094, 24.821643829345703, 25.788896560668945, 26.756149291992188, 27.723400115966797, 28.69065284729004, 29.65790557861328, 30.625158309936523]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 11.0, 15.0, 32.0, 51.0, 86.0, 124.0, 205.0, 338.0, 586.0, 974.0, 1656.0, 2650.0, 4404.0, 7057.0, 11255.0, 18067.0, 28108.0, 43381.0, 66569.0, 98038.0, 140713.0, 193727.0, 256838.0, 321573.0, 377770.0, 413952.0, 421657.0, 399168.0, 351278.0, 290094.0, 226009.0, 166355.0, 118129.0, 81540.0, 54500.0, 35539.0, 23047.0, 14471.0, 9275.0, 5729.0, 3617.0, 2215.0, 1338.0, 821.0, 537.0, 278.0, 206.0, 114.0, 72.0, 51.0, 26.0, 16.0, 13.0, 7.0, 8.0, 2.0, 2.0, 1.0, 1.0], "bins": [-19.515625, -18.891357421875, -18.26708984375, -17.642822265625, -17.0185546875, -16.394287109375, -15.77001953125, -15.145751953125, -14.521484375, -13.897216796875, -13.27294921875, -12.648681640625, -12.0244140625, -11.400146484375, -10.77587890625, -10.151611328125, -9.52734375, -8.903076171875, -8.27880859375, -7.654541015625, -7.0302734375, -6.406005859375, -5.78173828125, -5.157470703125, -4.533203125, -3.908935546875, -3.28466796875, -2.660400390625, -2.0361328125, -1.411865234375, -0.78759765625, -0.163330078125, 0.4609375, 1.085205078125, 1.70947265625, 2.333740234375, 2.9580078125, 3.582275390625, 4.20654296875, 4.830810546875, 5.455078125, 6.079345703125, 6.70361328125, 7.327880859375, 7.9521484375, 8.576416015625, 9.20068359375, 9.824951171875, 10.44921875, 11.073486328125, 11.69775390625, 12.322021484375, 12.9462890625, 13.570556640625, 14.19482421875, 14.819091796875, 15.443359375, 16.067626953125, 16.69189453125, 17.316162109375, 17.9404296875, 18.564697265625, 19.18896484375, 19.813232421875, 20.4375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 6.0, 6.0, 6.0, 12.0, 11.0, 10.0, 14.0, 21.0, 25.0, 27.0, 21.0, 24.0, 27.0, 28.0, 33.0, 41.0, 36.0, 33.0, 37.0, 49.0, 47.0, 36.0, 41.0, 42.0, 37.0, 27.0, 40.0, 40.0, 25.0, 25.0, 24.0, 27.0, 17.0, 19.0, 18.0, 14.0, 12.0, 8.0, 8.0, 7.0, 5.0, 5.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.390625, -26.528564453125, -25.66650390625, -24.804443359375, -23.9423828125, -23.080322265625, -22.21826171875, -21.356201171875, -20.494140625, -19.632080078125, -18.77001953125, -17.907958984375, -17.0458984375, -16.183837890625, -15.32177734375, -14.459716796875, -13.59765625, -12.735595703125, -11.87353515625, -11.011474609375, -10.1494140625, -9.287353515625, -8.42529296875, -7.563232421875, -6.701171875, -5.839111328125, -4.97705078125, -4.114990234375, -3.2529296875, -2.390869140625, -1.52880859375, -0.666748046875, 0.1953125, 1.057373046875, 1.91943359375, 2.781494140625, 3.6435546875, 4.505615234375, 5.36767578125, 6.229736328125, 7.091796875, 7.953857421875, 8.81591796875, 9.677978515625, 10.5400390625, 11.402099609375, 12.26416015625, 13.126220703125, 13.98828125, 14.850341796875, 15.71240234375, 16.574462890625, 17.4365234375, 18.298583984375, 19.16064453125, 20.022705078125, 20.884765625, 21.746826171875, 22.60888671875, 23.470947265625, 24.3330078125, 25.195068359375, 26.05712890625, 26.919189453125, 27.78125]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 4.0, 7.0, 14.0, 19.0, 31.0, 67.0, 124.0, 179.0, 326.0, 564.0, 1008.0, 1725.0, 3022.0, 5020.0, 8653.0, 14556.0, 23973.0, 39100.0, 61375.0, 94067.0, 138067.0, 194767.0, 259916.0, 326951.0, 386933.0, 426045.0, 434008.0, 408876.0, 359430.0, 294975.0, 226964.0, 165389.0, 114485.0, 77278.0, 49247.0, 30853.0, 18814.0, 11395.0, 6702.0, 4004.0, 2238.0, 1389.0, 763.0, 439.0, 233.0, 136.0, 76.0, 47.0, 19.0, 11.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.265625, -20.562744140625, -19.85986328125, -19.156982421875, -18.4541015625, -17.751220703125, -17.04833984375, -16.345458984375, -15.642578125, -14.939697265625, -14.23681640625, -13.533935546875, -12.8310546875, -12.128173828125, -11.42529296875, -10.722412109375, -10.01953125, -9.316650390625, -8.61376953125, -7.910888671875, -7.2080078125, -6.505126953125, -5.80224609375, -5.099365234375, -4.396484375, -3.693603515625, -2.99072265625, -2.287841796875, -1.5849609375, -0.882080078125, -0.17919921875, 0.523681640625, 1.2265625, 1.929443359375, 2.63232421875, 3.335205078125, 4.0380859375, 4.740966796875, 5.44384765625, 6.146728515625, 6.849609375, 7.552490234375, 8.25537109375, 8.958251953125, 9.6611328125, 10.364013671875, 11.06689453125, 11.769775390625, 12.47265625, 13.175537109375, 13.87841796875, 14.581298828125, 15.2841796875, 15.987060546875, 16.68994140625, 17.392822265625, 18.095703125, 18.798583984375, 19.50146484375, 20.204345703125, 20.9072265625, 21.610107421875, 22.31298828125, 23.015869140625, 23.71875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 8.0, 14.0, 10.0, 19.0, 31.0, 29.0, 41.0, 53.0, 75.0, 71.0, 84.0, 103.0, 123.0, 152.0, 138.0, 185.0, 191.0, 185.0, 194.0, 212.0, 203.0, 189.0, 194.0, 194.0, 171.0, 168.0, 156.0, 149.0, 117.0, 114.0, 110.0, 69.0, 65.0, 62.0, 54.0, 25.0, 24.0, 19.0, 18.0, 17.0, 9.0, 5.0, 11.0, 3.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.4140625, -10.0238037109375, -9.633544921875, -9.2432861328125, -8.85302734375, -8.4627685546875, -8.072509765625, -7.6822509765625, -7.2919921875, -6.9017333984375, -6.511474609375, -6.1212158203125, -5.73095703125, -5.3406982421875, -4.950439453125, -4.5601806640625, -4.169921875, -3.7796630859375, -3.389404296875, -2.9991455078125, -2.60888671875, -2.2186279296875, -1.828369140625, -1.4381103515625, -1.0478515625, -0.6575927734375, -0.267333984375, 0.1229248046875, 0.51318359375, 0.9034423828125, 1.293701171875, 1.6839599609375, 2.07421875, 2.4644775390625, 2.854736328125, 3.2449951171875, 3.63525390625, 4.0255126953125, 4.415771484375, 4.8060302734375, 5.1962890625, 5.5865478515625, 5.976806640625, 6.3670654296875, 6.75732421875, 7.1475830078125, 7.537841796875, 7.9281005859375, 8.318359375, 8.7086181640625, 9.098876953125, 9.4891357421875, 9.87939453125, 10.2696533203125, 10.659912109375, 11.0501708984375, 11.4404296875, 11.8306884765625, 12.220947265625, 12.6112060546875, 13.00146484375, 13.3917236328125, 13.781982421875, 14.1722412109375, 14.5625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 8.0, 17.0, 9.0, 10.0, 13.0, 23.0, 15.0, 30.0, 25.0, 23.0, 35.0, 37.0, 29.0, 32.0, 27.0, 28.0, 27.0, 49.0, 44.0, 39.0, 28.0, 26.0, 48.0, 38.0, 49.0, 41.0, 42.0, 33.0, 25.0, 18.0, 13.0, 29.0, 19.0, 14.0, 8.0, 15.0, 4.0, 7.0, 6.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.76230812072754, -25.899370193481445, -25.03643226623535, -24.173492431640625, -23.31055450439453, -22.447616577148438, -21.584678649902344, -20.72174072265625, -19.858802795410156, -18.995864868164062, -18.13292694091797, -17.269989013671875, -16.40704917907715, -15.544111251831055, -14.681173324584961, -13.818235397338867, -12.95529556274414, -12.092357635498047, -11.229418754577637, -10.366480827331543, -9.503541946411133, -8.640604019165039, -7.777666091918945, -6.914727687835693, -6.051789283752441, -5.1888508796691895, -4.3259124755859375, -3.4629745483398438, -2.600036144256592, -1.7370977401733398, -0.8741598129272461, -0.01122140884399414, 0.851715087890625, 1.7146533727645874, 2.57759165763855, 3.4405298233032227, 4.303468227386475, 5.166406631469727, 6.02934455871582, 6.892282962799072, 7.755221366882324, 8.618159294128418, 9.481098175048828, 10.344036102294922, 11.206974029541016, 12.069912910461426, 12.93285083770752, 13.79578971862793, 14.658727645874023, 15.521665573120117, 16.38460350036621, 17.247543334960938, 18.11048126220703, 18.973419189453125, 19.83635711669922, 20.699295043945312, 21.562232971191406, 22.4251708984375, 23.288108825683594, 24.151046752929688, 25.013986587524414, 25.876924514770508, 26.7398624420166, 27.602800369262695, 28.465740203857422]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 7.0, 8.0, 4.0, 7.0, 14.0, 13.0, 8.0, 9.0, 14.0, 16.0, 16.0, 18.0, 15.0, 31.0, 28.0, 29.0, 38.0, 29.0, 26.0, 35.0, 34.0, 29.0, 35.0, 36.0, 31.0, 31.0, 35.0, 35.0, 39.0, 34.0, 27.0, 27.0, 24.0, 21.0, 20.0, 27.0, 14.0, 17.0, 20.0, 19.0, 16.0, 13.0, 10.0, 4.0, 4.0, 3.0, 4.0, 4.0, 4.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-25.637876510620117, -24.81793785095215, -23.998001098632812, -23.178062438964844, -22.358123779296875, -21.53818702697754, -20.71824836730957, -19.898311614990234, -19.078372955322266, -18.258434295654297, -17.43849754333496, -16.618558883666992, -15.79862117767334, -14.978683471679688, -14.158744812011719, -13.338807106018066, -12.518869400024414, -11.698931694030762, -10.87899398803711, -10.05905532836914, -9.239117622375488, -8.419179916381836, -7.599241733551025, -6.779303550720215, -5.9593658447265625, -5.13942813873291, -4.3194899559021, -3.499552011489868, -2.6796140670776367, -1.8596763610839844, -1.0397381782531738, -0.21979999542236328, 0.6001396179199219, 1.4200775623321533, 2.2400155067443848, 3.059953451156616, 3.8798913955688477, 4.6998291015625, 5.5197672843933105, 6.339705467224121, 7.159643173217773, 7.979580879211426, 8.799518585205078, 9.619457244873047, 10.4393949508667, 11.259332656860352, 12.07927131652832, 12.899209022521973, 13.719146728515625, 14.539084434509277, 15.35902214050293, 16.1789608001709, 16.998897552490234, 17.818836212158203, 18.638774871826172, 19.45871353149414, 20.278650283813477, 21.098588943481445, 21.91852569580078, 22.73846435546875, 23.55840301513672, 24.378339767456055, 25.198278427124023, 26.01821517944336, 26.838153839111328]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 7.0, 4.0, 15.0, 16.0, 34.0, 45.0, 88.0, 123.0, 221.0, 317.0, 482.0, 731.0, 1097.0, 1789.0, 2768.0, 4307.0, 6603.0, 9877.0, 14647.0, 21173.0, 30888.0, 42686.0, 57454.0, 73343.0, 88219.0, 100575.0, 105272.0, 102516.0, 92112.0, 77484.0, 61462.0, 46599.0, 33548.0, 23965.0, 16306.0, 11042.0, 7199.0, 4783.0, 3154.0, 2010.0, 1278.0, 810.0, 515.0, 346.0, 248.0, 143.0, 96.0, 58.0, 47.0, 18.0, 14.0, 14.0, 4.0, 4.0, 4.0, 2.0, 0.0, 3.0], "bins": [-4.21484375, -4.085693359375, -3.95654296875, -3.827392578125, -3.6982421875, -3.569091796875, -3.43994140625, -3.310791015625, -3.181640625, -3.052490234375, -2.92333984375, -2.794189453125, -2.6650390625, -2.535888671875, -2.40673828125, -2.277587890625, -2.1484375, -2.019287109375, -1.89013671875, -1.760986328125, -1.6318359375, -1.502685546875, -1.37353515625, -1.244384765625, -1.115234375, -0.986083984375, -0.85693359375, -0.727783203125, -0.5986328125, -0.469482421875, -0.34033203125, -0.211181640625, -0.08203125, 0.047119140625, 0.17626953125, 0.305419921875, 0.4345703125, 0.563720703125, 0.69287109375, 0.822021484375, 0.951171875, 1.080322265625, 1.20947265625, 1.338623046875, 1.4677734375, 1.596923828125, 1.72607421875, 1.855224609375, 1.984375, 2.113525390625, 2.24267578125, 2.371826171875, 2.5009765625, 2.630126953125, 2.75927734375, 2.888427734375, 3.017578125, 3.146728515625, 3.27587890625, 3.405029296875, 3.5341796875, 3.663330078125, 3.79248046875, 3.921630859375, 4.05078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 6.0, 9.0, 4.0, 6.0, 14.0, 12.0, 10.0, 9.0, 13.0, 15.0, 16.0, 19.0, 15.0, 32.0, 23.0, 31.0, 36.0, 31.0, 26.0, 31.0, 39.0, 29.0, 34.0, 34.0, 34.0, 31.0, 33.0, 39.0, 35.0, 34.0, 29.0, 25.0, 27.0, 21.0, 16.0, 30.0, 14.0, 19.0, 20.0, 17.0, 18.0, 13.0, 10.0, 5.0, 3.0, 4.0, 4.0, 4.0, 3.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-25.640625, -24.81689453125, -23.9931640625, -23.16943359375, -22.345703125, -21.52197265625, -20.6982421875, -19.87451171875, -19.05078125, -18.22705078125, -17.4033203125, -16.57958984375, -15.755859375, -14.93212890625, -14.1083984375, -13.28466796875, -12.4609375, -11.63720703125, -10.8134765625, -9.98974609375, -9.166015625, -8.34228515625, -7.5185546875, -6.69482421875, -5.87109375, -5.04736328125, -4.2236328125, -3.39990234375, -2.576171875, -1.75244140625, -0.9287109375, -0.10498046875, 0.71875, 1.54248046875, 2.3662109375, 3.18994140625, 4.013671875, 4.83740234375, 5.6611328125, 6.48486328125, 7.30859375, 8.13232421875, 8.9560546875, 9.77978515625, 10.603515625, 11.42724609375, 12.2509765625, 13.07470703125, 13.8984375, 14.72216796875, 15.5458984375, 16.36962890625, 17.193359375, 18.01708984375, 18.8408203125, 19.66455078125, 20.48828125, 21.31201171875, 22.1357421875, 22.95947265625, 23.783203125, 24.60693359375, 25.4306640625, 26.25439453125, 27.078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 10.0, 16.0, 17.0, 32.0, 34.0, 46.0, 81.0, 123.0, 163.0, 287.0, 421.0, 631.0, 928.0, 1429.0, 2180.0, 3225.0, 4888.0, 7515.0, 11999.0, 19782.0, 39064.0, 718082.0, 166016.0, 27747.0, 15841.0, 9640.0, 6323.0, 4144.0, 2623.0, 1816.0, 1132.0, 790.0, 503.0, 362.0, 222.0, 170.0, 100.0, 44.0, 42.0, 34.0, 24.0, 9.0, 7.0, 8.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6484375, -10.2784423828125, -9.908447265625, -9.5384521484375, -9.16845703125, -8.7984619140625, -8.428466796875, -8.0584716796875, -7.6884765625, -7.3184814453125, -6.948486328125, -6.5784912109375, -6.20849609375, -5.8385009765625, -5.468505859375, -5.0985107421875, -4.728515625, -4.3585205078125, -3.988525390625, -3.6185302734375, -3.24853515625, -2.8785400390625, -2.508544921875, -2.1385498046875, -1.7685546875, -1.3985595703125, -1.028564453125, -0.6585693359375, -0.28857421875, 0.0814208984375, 0.451416015625, 0.8214111328125, 1.19140625, 1.5614013671875, 1.931396484375, 2.3013916015625, 2.67138671875, 3.0413818359375, 3.411376953125, 3.7813720703125, 4.1513671875, 4.5213623046875, 4.891357421875, 5.2613525390625, 5.63134765625, 6.0013427734375, 6.371337890625, 6.7413330078125, 7.111328125, 7.4813232421875, 7.851318359375, 8.2213134765625, 8.59130859375, 8.9613037109375, 9.331298828125, 9.7012939453125, 10.0712890625, 10.4412841796875, 10.811279296875, 11.1812744140625, 11.55126953125, 11.9212646484375, 12.291259765625, 12.6612548828125, 13.03125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 2.0, 4.0, 6.0, 8.0, 12.0, 14.0, 8.0, 13.0, 20.0, 15.0, 19.0, 15.0, 29.0, 29.0, 33.0, 31.0, 40.0, 42.0, 33.0, 42.0, 28.0, 36.0, 44.0, 30.0, 48.0, 35.0, 31.0, 37.0, 26.0, 31.0, 39.0, 31.0, 30.0, 24.0, 19.0, 14.0, 14.0, 8.0, 8.0, 7.0, 18.0, 11.0, 10.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.203125, -18.55859375, -17.9140625, -17.26953125, -16.625, -15.98046875, -15.3359375, -14.69140625, -14.046875, -13.40234375, -12.7578125, -12.11328125, -11.46875, -10.82421875, -10.1796875, -9.53515625, -8.890625, -8.24609375, -7.6015625, -6.95703125, -6.3125, -5.66796875, -5.0234375, -4.37890625, -3.734375, -3.08984375, -2.4453125, -1.80078125, -1.15625, -0.51171875, 0.1328125, 0.77734375, 1.421875, 2.06640625, 2.7109375, 3.35546875, 4.0, 4.64453125, 5.2890625, 5.93359375, 6.578125, 7.22265625, 7.8671875, 8.51171875, 9.15625, 9.80078125, 10.4453125, 11.08984375, 11.734375, 12.37890625, 13.0234375, 13.66796875, 14.3125, 14.95703125, 15.6015625, 16.24609375, 16.890625, 17.53515625, 18.1796875, 18.82421875, 19.46875, 20.11328125, 20.7578125, 21.40234375, 22.046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 9.0, 6.0, 23.0, 27.0, 46.0, 46.0, 81.0, 108.0, 152.0, 223.0, 354.0, 626.0, 879.0, 1479.0, 2462.0, 4324.0, 7273.0, 13116.0, 24083.0, 65679.0, 839444.0, 41144.0, 20114.0, 10991.0, 6502.0, 3616.0, 2081.0, 1328.0, 818.0, 547.0, 312.0, 210.0, 141.0, 103.0, 59.0, 44.0, 19.0, 29.0, 22.0, 12.0, 10.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2685546875, -1.2267608642578125, -1.184967041015625, -1.1431732177734375, -1.10137939453125, -1.0595855712890625, -1.017791748046875, -0.9759979248046875, -0.9342041015625, -0.8924102783203125, -0.850616455078125, -0.8088226318359375, -0.76702880859375, -0.7252349853515625, -0.683441162109375, -0.6416473388671875, -0.599853515625, -0.5580596923828125, -0.516265869140625, -0.4744720458984375, -0.43267822265625, -0.3908843994140625, -0.349090576171875, -0.3072967529296875, -0.2655029296875, -0.2237091064453125, -0.181915283203125, -0.1401214599609375, -0.09832763671875, -0.0565338134765625, -0.014739990234375, 0.0270538330078125, 0.06884765625, 0.1106414794921875, 0.152435302734375, 0.1942291259765625, 0.23602294921875, 0.2778167724609375, 0.319610595703125, 0.3614044189453125, 0.4031982421875, 0.4449920654296875, 0.486785888671875, 0.5285797119140625, 0.57037353515625, 0.6121673583984375, 0.653961181640625, 0.6957550048828125, 0.737548828125, 0.7793426513671875, 0.821136474609375, 0.8629302978515625, 0.90472412109375, 0.9465179443359375, 0.988311767578125, 1.0301055908203125, 1.0718994140625, 1.1136932373046875, 1.155487060546875, 1.1972808837890625, 1.23907470703125, 1.2808685302734375, 1.322662353515625, 1.3644561767578125, 1.40625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 16.0, 12.0, 14.0, 7.0, 9.0, 26.0, 34.0, 40.0, 49.0, 62.0, 55.0, 65.0, 61.0, 75.0, 62.0, 62.0, 69.0, 60.0, 43.0, 43.0, 37.0, 29.0, 18.0, 11.0, 12.0, 10.0, 2.0, 7.0, 2.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-6.109476089477539e-05, -5.9548765420913696e-05, -5.8002769947052e-05, -5.645677447319031e-05, -5.491077899932861e-05, -5.336478352546692e-05, -5.1818788051605225e-05, -5.027279257774353e-05, -4.8726797103881836e-05, -4.718080163002014e-05, -4.563480615615845e-05, -4.408881068229675e-05, -4.254281520843506e-05, -4.0996819734573364e-05, -3.945082426071167e-05, -3.7904828786849976e-05, -3.635883331298828e-05, -3.481283783912659e-05, -3.326684236526489e-05, -3.17208468914032e-05, -3.0174851417541504e-05, -2.862885594367981e-05, -2.7082860469818115e-05, -2.553686499595642e-05, -2.3990869522094727e-05, -2.2444874048233032e-05, -2.0898878574371338e-05, -1.9352883100509644e-05, -1.780688762664795e-05, -1.6260892152786255e-05, -1.471489667892456e-05, -1.3168901205062866e-05, -1.1622905731201172e-05, -1.0076910257339478e-05, -8.530914783477783e-06, -6.984919309616089e-06, -5.4389238357543945e-06, -3.8929283618927e-06, -2.346932888031006e-06, -8.009374141693115e-07, 7.450580596923828e-07, 2.291053533554077e-06, 3.8370490074157715e-06, 5.383044481277466e-06, 6.92903995513916e-06, 8.475035429000854e-06, 1.0021030902862549e-05, 1.1567026376724243e-05, 1.3113021850585938e-05, 1.4659017324447632e-05, 1.6205012798309326e-05, 1.775100827217102e-05, 1.9297003746032715e-05, 2.084299921989441e-05, 2.2388994693756104e-05, 2.3934990167617798e-05, 2.5480985641479492e-05, 2.7026981115341187e-05, 2.857297658920288e-05, 3.0118972063064575e-05, 3.166496753692627e-05, 3.3210963010787964e-05, 3.475695848464966e-05, 3.630295395851135e-05, 3.784894943237305e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 6.0, 6.0, 12.0, 10.0, 13.0, 26.0, 51.0, 71.0, 86.0, 152.0, 229.0, 338.0, 537.0, 823.0, 1322.0, 2031.0, 3076.0, 4658.0, 7192.0, 11359.0, 16839.0, 25211.0, 37084.0, 53596.0, 75131.0, 100936.0, 124855.0, 135214.0, 121992.0, 97143.0, 71711.0, 51455.0, 35241.0, 23777.0, 15908.0, 10491.0, 6974.0, 4673.0, 2896.0, 1961.0, 1155.0, 829.0, 515.0, 330.0, 211.0, 165.0, 106.0, 53.0, 36.0, 25.0, 14.0, 18.0, 6.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.90966796875, -0.8807296752929688, -0.8517913818359375, -0.8228530883789062, -0.793914794921875, -0.7649765014648438, -0.7360382080078125, -0.7070999145507812, -0.67816162109375, -0.6492233276367188, -0.6202850341796875, -0.5913467407226562, -0.562408447265625, -0.5334701538085938, -0.5045318603515625, -0.47559356689453125, -0.4466552734375, -0.41771697998046875, -0.3887786865234375, -0.35984039306640625, -0.330902099609375, -0.30196380615234375, -0.2730255126953125, -0.24408721923828125, -0.21514892578125, -0.18621063232421875, -0.1572723388671875, -0.12833404541015625, -0.099395751953125, -0.07045745849609375, -0.0415191650390625, -0.01258087158203125, 0.016357421875, 0.04529571533203125, 0.0742340087890625, 0.10317230224609375, 0.132110595703125, 0.16104888916015625, 0.1899871826171875, 0.21892547607421875, 0.24786376953125, 0.27680206298828125, 0.3057403564453125, 0.33467864990234375, 0.363616943359375, 0.39255523681640625, 0.4214935302734375, 0.45043182373046875, 0.4793701171875, 0.5083084106445312, 0.5372467041015625, 0.5661849975585938, 0.595123291015625, 0.6240615844726562, 0.6529998779296875, 0.6819381713867188, 0.71087646484375, 0.7398147583007812, 0.7687530517578125, 0.7976913452148438, 0.826629638671875, 0.8555679321289062, 0.8845062255859375, 0.9134445190429688, 0.9423828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 1.0, 5.0, 0.0, 2.0, 5.0, 4.0, 4.0, 6.0, 7.0, 7.0, 8.0, 9.0, 19.0, 17.0, 13.0, 23.0, 20.0, 19.0, 23.0, 23.0, 34.0, 35.0, 38.0, 45.0, 44.0, 53.0, 48.0, 50.0, 46.0, 47.0, 43.0, 38.0, 24.0, 32.0, 24.0, 20.0, 21.0, 9.0, 20.0, 24.0, 10.0, 11.0, 9.0, 14.0, 12.0, 5.0, 6.0, 8.0, 8.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3662109375, -0.35453033447265625, -0.3428497314453125, -0.33116912841796875, -0.319488525390625, -0.30780792236328125, -0.2961273193359375, -0.28444671630859375, -0.27276611328125, -0.26108551025390625, -0.2494049072265625, -0.23772430419921875, -0.226043701171875, -0.21436309814453125, -0.2026824951171875, -0.19100189208984375, -0.1793212890625, -0.16764068603515625, -0.1559600830078125, -0.14427947998046875, -0.132598876953125, -0.12091827392578125, -0.1092376708984375, -0.09755706787109375, -0.08587646484375, -0.07419586181640625, -0.0625152587890625, -0.05083465576171875, -0.039154052734375, -0.02747344970703125, -0.0157928466796875, -0.00411224365234375, 0.007568359375, 0.01924896240234375, 0.0309295654296875, 0.04261016845703125, 0.054290771484375, 0.06597137451171875, 0.0776519775390625, 0.08933258056640625, 0.10101318359375, 0.11269378662109375, 0.1243743896484375, 0.13605499267578125, 0.147735595703125, 0.15941619873046875, 0.1710968017578125, 0.18277740478515625, 0.1944580078125, 0.20613861083984375, 0.2178192138671875, 0.22949981689453125, 0.241180419921875, 0.25286102294921875, 0.2645416259765625, 0.27622222900390625, 0.28790283203125, 0.29958343505859375, 0.3112640380859375, 0.32294464111328125, 0.334625244140625, 0.34630584716796875, 0.3579864501953125, 0.36966705322265625, 0.38134765625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 7.0, 7.0, 8.0, 15.0, 10.0, 8.0, 22.0, 17.0, 23.0, 28.0, 23.0, 22.0, 32.0, 42.0, 33.0, 30.0, 24.0, 36.0, 27.0, 49.0, 46.0, 32.0, 28.0, 33.0, 40.0, 44.0, 45.0, 47.0, 37.0, 28.0, 18.0, 20.0, 15.0, 34.0, 12.0, 16.0, 14.0, 3.0, 9.0, 9.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.501680374145508, -25.635757446289062, -24.769834518432617, -23.903911590576172, -23.037986755371094, -22.17206573486328, -21.306140899658203, -20.440217971801758, -19.574295043945312, -18.708372116088867, -17.842449188232422, -16.976526260375977, -16.11060333251953, -15.24467945098877, -14.378755569458008, -13.512832641601562, -12.646909713745117, -11.780986785888672, -10.915063858032227, -10.049139976501465, -9.18321704864502, -8.317294120788574, -7.451370716094971, -6.585447311401367, -5.719524383544922, -4.853601455688477, -3.987678050994873, -3.1217548847198486, -2.255831718444824, -1.389908790588379, -0.5239853858947754, 0.3419380187988281, 1.2078609466552734, 2.073784112930298, 2.9397072792053223, 3.8056304454803467, 4.671553611755371, 5.537476539611816, 6.40339994430542, 7.269323348999023, 8.135246276855469, 9.001169204711914, 9.86709213256836, 10.733016014099121, 11.598938941955566, 12.464861869812012, 13.330785751342773, 14.196708679199219, 15.062631607055664, 15.92855453491211, 16.794477462768555, 17.660400390625, 18.526325225830078, 19.39224624633789, 20.25817108154297, 21.124094009399414, 21.99001693725586, 22.855939865112305, 23.72186279296875, 24.587785720825195, 25.45370864868164, 26.31963348388672, 27.185556411743164, 28.05147933959961, 28.917402267456055]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 5.0, 9.0, 4.0, 6.0, 14.0, 12.0, 11.0, 8.0, 14.0, 13.0, 17.0, 20.0, 13.0, 29.0, 26.0, 27.0, 37.0, 32.0, 29.0, 29.0, 35.0, 34.0, 36.0, 31.0, 35.0, 28.0, 31.0, 42.0, 38.0, 36.0, 25.0, 25.0, 30.0, 20.0, 17.0, 24.0, 19.0, 18.0, 17.0, 18.0, 19.0, 14.0, 11.0, 4.0, 4.0, 4.0, 3.0, 4.0, 4.0, 6.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0], "bins": [-25.635940551757812, -24.813968658447266, -23.99199676513672, -23.170024871826172, -22.348052978515625, -21.526081085205078, -20.70410919189453, -19.882137298583984, -19.060165405273438, -18.23819351196289, -17.416221618652344, -16.594249725341797, -15.77227783203125, -14.950305938720703, -14.12833309173584, -13.306361198425293, -12.48438835144043, -11.662416458129883, -10.840444564819336, -10.018472671508789, -9.196500778198242, -8.374528884887695, -7.552556037902832, -6.730584144592285, -5.908612251281738, -5.086640357971191, -4.2646684646606445, -3.4426960945129395, -2.6207242012023926, -1.7987523078918457, -0.9767799377441406, -0.15480804443359375, 0.6671638488769531, 1.4891358613967896, 2.311107873916626, 3.133080005645752, 3.955051898956299, 4.777023792266846, 5.598996162414551, 6.420968055725098, 7.2429399490356445, 8.064911842346191, 8.886883735656738, 9.708856582641602, 10.530828475952148, 11.352800369262695, 12.174772262573242, 12.996744155883789, 13.818716049194336, 14.640687942504883, 15.46265983581543, 16.284631729125977, 17.106603622436523, 17.92857551574707, 18.75054931640625, 19.572521209716797, 20.394493103027344, 21.21646499633789, 22.038436889648438, 22.860408782958984, 23.68238067626953, 24.504352569580078, 25.326324462890625, 26.148296356201172, 26.97026824951172]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 5.0, 17.0, 29.0, 43.0, 87.0, 130.0, 193.0, 344.0, 572.0, 906.0, 1442.0, 2210.0, 3319.0, 5134.0, 7567.0, 11031.0, 15485.0, 21500.0, 28888.0, 38038.0, 48850.0, 59517.0, 69055.0, 78258.0, 83752.0, 86155.0, 84673.0, 78913.0, 69911.0, 60473.0, 49631.0, 39438.0, 30166.0, 22501.0, 16242.0, 11342.0, 7754.0, 5313.0, 3530.0, 2215.0, 1485.0, 942.0, 576.0, 358.0, 235.0, 147.0, 70.0, 50.0, 24.0, 23.0, 11.0, 2.0, 3.0, 4.0, 2.0], "bins": [-15.90625, -15.4459228515625, -14.985595703125, -14.5252685546875, -14.06494140625, -13.6046142578125, -13.144287109375, -12.6839599609375, -12.2236328125, -11.7633056640625, -11.302978515625, -10.8426513671875, -10.38232421875, -9.9219970703125, -9.461669921875, -9.0013427734375, -8.541015625, -8.0806884765625, -7.620361328125, -7.1600341796875, -6.69970703125, -6.2393798828125, -5.779052734375, -5.3187255859375, -4.8583984375, -4.3980712890625, -3.937744140625, -3.4774169921875, -3.01708984375, -2.5567626953125, -2.096435546875, -1.6361083984375, -1.17578125, -0.7154541015625, -0.255126953125, 0.2052001953125, 0.66552734375, 1.1258544921875, 1.586181640625, 2.0465087890625, 2.5068359375, 2.9671630859375, 3.427490234375, 3.8878173828125, 4.34814453125, 4.8084716796875, 5.268798828125, 5.7291259765625, 6.189453125, 6.6497802734375, 7.110107421875, 7.5704345703125, 8.03076171875, 8.4910888671875, 8.951416015625, 9.4117431640625, 9.8720703125, 10.3323974609375, 10.792724609375, 11.2530517578125, 11.71337890625, 12.1737060546875, 12.634033203125, 13.0943603515625, 13.5546875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 5.0, 11.0, 2.0, 6.0, 13.0, 16.0, 9.0, 6.0, 14.0, 14.0, 18.0, 18.0, 15.0, 28.0, 24.0, 30.0, 38.0, 31.0, 29.0, 30.0, 29.0, 38.0, 32.0, 35.0, 32.0, 29.0, 34.0, 38.0, 36.0, 39.0, 25.0, 29.0, 22.0, 22.0, 20.0, 21.0, 24.0, 14.0, 20.0, 13.0, 24.0, 11.0, 14.0, 3.0, 6.0, 3.0, 1.0, 6.0, 5.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 3.0], "bins": [-24.9375, -24.14013671875, -23.3427734375, -22.54541015625, -21.748046875, -20.95068359375, -20.1533203125, -19.35595703125, -18.55859375, -17.76123046875, -16.9638671875, -16.16650390625, -15.369140625, -14.57177734375, -13.7744140625, -12.97705078125, -12.1796875, -11.38232421875, -10.5849609375, -9.78759765625, -8.990234375, -8.19287109375, -7.3955078125, -6.59814453125, -5.80078125, -5.00341796875, -4.2060546875, -3.40869140625, -2.611328125, -1.81396484375, -1.0166015625, -0.21923828125, 0.578125, 1.37548828125, 2.1728515625, 2.97021484375, 3.767578125, 4.56494140625, 5.3623046875, 6.15966796875, 6.95703125, 7.75439453125, 8.5517578125, 9.34912109375, 10.146484375, 10.94384765625, 11.7412109375, 12.53857421875, 13.3359375, 14.13330078125, 14.9306640625, 15.72802734375, 16.525390625, 17.32275390625, 18.1201171875, 18.91748046875, 19.71484375, 20.51220703125, 21.3095703125, 22.10693359375, 22.904296875, 23.70166015625, 24.4990234375, 25.29638671875, 26.09375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 11.0, 14.0, 27.0, 34.0, 55.0, 98.0, 145.0, 245.0, 342.0, 662.0, 1036.0, 1689.0, 2598.0, 3894.0, 5772.0, 8796.0, 12778.0, 17930.0, 25001.0, 33749.0, 43704.0, 55106.0, 65558.0, 76326.0, 83754.0, 87760.0, 88021.0, 82991.0, 75755.0, 65311.0, 53818.0, 43464.0, 32894.0, 24586.0, 17423.0, 12440.0, 8575.0, 5707.0, 3729.0, 2444.0, 1529.0, 1048.0, 688.0, 403.0, 253.0, 159.0, 95.0, 58.0, 39.0, 20.0, 11.0, 9.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-14.484375, -14.03125, -13.578125, -13.125, -12.671875, -12.21875, -11.765625, -11.3125, -10.859375, -10.40625, -9.953125, -9.5, -9.046875, -8.59375, -8.140625, -7.6875, -7.234375, -6.78125, -6.328125, -5.875, -5.421875, -4.96875, -4.515625, -4.0625, -3.609375, -3.15625, -2.703125, -2.25, -1.796875, -1.34375, -0.890625, -0.4375, 0.015625, 0.46875, 0.921875, 1.375, 1.828125, 2.28125, 2.734375, 3.1875, 3.640625, 4.09375, 4.546875, 5.0, 5.453125, 5.90625, 6.359375, 6.8125, 7.265625, 7.71875, 8.171875, 8.625, 9.078125, 9.53125, 9.984375, 10.4375, 10.890625, 11.34375, 11.796875, 12.25, 12.703125, 13.15625, 13.609375, 14.0625, 14.515625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 4.0, 8.0, 8.0, 7.0, 7.0, 8.0, 17.0, 15.0, 11.0, 24.0, 23.0, 27.0, 22.0, 31.0, 37.0, 33.0, 38.0, 24.0, 41.0, 44.0, 46.0, 47.0, 31.0, 46.0, 35.0, 33.0, 44.0, 27.0, 29.0, 31.0, 22.0, 31.0, 14.0, 19.0, 25.0, 20.0, 7.0, 10.0, 6.0, 14.0, 4.0, 5.0, 4.0, 4.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.1875, -18.5791015625, -17.970703125, -17.3623046875, -16.75390625, -16.1455078125, -15.537109375, -14.9287109375, -14.3203125, -13.7119140625, -13.103515625, -12.4951171875, -11.88671875, -11.2783203125, -10.669921875, -10.0615234375, -9.453125, -8.8447265625, -8.236328125, -7.6279296875, -7.01953125, -6.4111328125, -5.802734375, -5.1943359375, -4.5859375, -3.9775390625, -3.369140625, -2.7607421875, -2.15234375, -1.5439453125, -0.935546875, -0.3271484375, 0.28125, 0.8896484375, 1.498046875, 2.1064453125, 2.71484375, 3.3232421875, 3.931640625, 4.5400390625, 5.1484375, 5.7568359375, 6.365234375, 6.9736328125, 7.58203125, 8.1904296875, 8.798828125, 9.4072265625, 10.015625, 10.6240234375, 11.232421875, 11.8408203125, 12.44921875, 13.0576171875, 13.666015625, 14.2744140625, 14.8828125, 15.4912109375, 16.099609375, 16.7080078125, 17.31640625, 17.9248046875, 18.533203125, 19.1416015625, 19.75]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 7.0, 0.0, 6.0, 8.0, 6.0, 13.0, 14.0, 27.0, 47.0, 56.0, 79.0, 164.0, 244.0, 409.0, 709.0, 1226.0, 1960.0, 3440.0, 6121.0, 10144.0, 17177.0, 27282.0, 41218.0, 60208.0, 80591.0, 101127.0, 114787.0, 120698.0, 114869.0, 100015.0, 78834.0, 58996.0, 40670.0, 26423.0, 16771.0, 9979.0, 5915.0, 3465.0, 1978.0, 1152.0, 689.0, 412.0, 235.0, 140.0, 85.0, 54.0, 41.0, 21.0, 18.0, 14.0, 9.0, 6.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.3046875, -8.0489501953125, -7.793212890625, -7.5374755859375, -7.28173828125, -7.0260009765625, -6.770263671875, -6.5145263671875, -6.2587890625, -6.0030517578125, -5.747314453125, -5.4915771484375, -5.23583984375, -4.9801025390625, -4.724365234375, -4.4686279296875, -4.212890625, -3.9571533203125, -3.701416015625, -3.4456787109375, -3.18994140625, -2.9342041015625, -2.678466796875, -2.4227294921875, -2.1669921875, -1.9112548828125, -1.655517578125, -1.3997802734375, -1.14404296875, -0.8883056640625, -0.632568359375, -0.3768310546875, -0.12109375, 0.1346435546875, 0.390380859375, 0.6461181640625, 0.90185546875, 1.1575927734375, 1.413330078125, 1.6690673828125, 1.9248046875, 2.1805419921875, 2.436279296875, 2.6920166015625, 2.94775390625, 3.2034912109375, 3.459228515625, 3.7149658203125, 3.970703125, 4.2264404296875, 4.482177734375, 4.7379150390625, 4.99365234375, 5.2493896484375, 5.505126953125, 5.7608642578125, 6.0166015625, 6.2723388671875, 6.528076171875, 6.7838134765625, 7.03955078125, 7.2952880859375, 7.551025390625, 7.8067626953125, 8.0625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 8.0, 3.0, 3.0, 7.0, 6.0, 8.0, 14.0, 17.0, 18.0, 17.0, 27.0, 21.0, 42.0, 47.0, 32.0, 47.0, 60.0, 52.0, 50.0, 55.0, 53.0, 60.0, 45.0, 49.0, 47.0, 35.0, 39.0, 24.0, 18.0, 15.0, 22.0, 10.0, 14.0, 10.0, 7.0, 3.0, 6.0, 7.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0012569427490234375, -0.0012216418981552124, -0.0011863410472869873, -0.0011510401964187622, -0.0011157393455505371, -0.001080438494682312, -0.001045137643814087, -0.0010098367929458618, -0.0009745359420776367, -0.0009392350912094116, -0.0009039342403411865, -0.0008686333894729614, -0.0008333325386047363, -0.0007980316877365112, -0.0007627308368682861, -0.000727429986000061, -0.0006921291351318359, -0.0006568282842636108, -0.0006215274333953857, -0.0005862265825271606, -0.0005509257316589355, -0.0005156248807907104, -0.00048032402992248535, -0.00044502317905426025, -0.00040972232818603516, -0.00037442147731781006, -0.00033912062644958496, -0.00030381977558135986, -0.00026851892471313477, -0.00023321807384490967, -0.00019791722297668457, -0.00016261637210845947, -0.00012731552124023438, -9.201467037200928e-05, -5.671381950378418e-05, -2.1412968635559082e-05, 1.3887882232666016e-05, 4.918873310089111e-05, 8.448958396911621e-05, 0.00011979043483734131, 0.0001550912857055664, 0.0001903921365737915, 0.0002256929874420166, 0.0002609938383102417, 0.0002962946891784668, 0.0003315955400466919, 0.000366896390914917, 0.0004021972417831421, 0.0004374980926513672, 0.0004727989435195923, 0.0005080997943878174, 0.0005434006452560425, 0.0005787014961242676, 0.0006140023469924927, 0.0006493031978607178, 0.0006846040487289429, 0.000719904899597168, 0.0007552057504653931, 0.0007905066013336182, 0.0008258074522018433, 0.0008611083030700684, 0.0008964091539382935, 0.0009317100048065186, 0.0009670108556747437, 0.0010023117065429688]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 10.0, 12.0, 18.0, 32.0, 46.0, 69.0, 117.0, 145.0, 262.0, 446.0, 762.0, 1369.0, 2410.0, 4343.0, 7936.0, 13776.0, 24698.0, 40185.0, 62458.0, 89809.0, 116271.0, 134072.0, 137145.0, 124200.0, 100007.0, 71648.0, 47663.0, 29335.0, 17126.0, 9835.0, 5299.0, 3002.0, 1714.0, 928.0, 534.0, 327.0, 205.0, 118.0, 69.0, 44.0, 29.0, 17.0, 19.0, 10.0, 8.0, 9.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.25, -9.9212646484375, -9.592529296875, -9.2637939453125, -8.93505859375, -8.6063232421875, -8.277587890625, -7.9488525390625, -7.6201171875, -7.2913818359375, -6.962646484375, -6.6339111328125, -6.30517578125, -5.9764404296875, -5.647705078125, -5.3189697265625, -4.990234375, -4.6614990234375, -4.332763671875, -4.0040283203125, -3.67529296875, -3.3465576171875, -3.017822265625, -2.6890869140625, -2.3603515625, -2.0316162109375, -1.702880859375, -1.3741455078125, -1.04541015625, -0.7166748046875, -0.387939453125, -0.0592041015625, 0.26953125, 0.5982666015625, 0.927001953125, 1.2557373046875, 1.58447265625, 1.9132080078125, 2.241943359375, 2.5706787109375, 2.8994140625, 3.2281494140625, 3.556884765625, 3.8856201171875, 4.21435546875, 4.5430908203125, 4.871826171875, 5.2005615234375, 5.529296875, 5.8580322265625, 6.186767578125, 6.5155029296875, 6.84423828125, 7.1729736328125, 7.501708984375, 7.8304443359375, 8.1591796875, 8.4879150390625, 8.816650390625, 9.1453857421875, 9.47412109375, 9.8028564453125, 10.131591796875, 10.4603271484375, 10.7890625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 9.0, 3.0, 12.0, 6.0, 12.0, 15.0, 15.0, 18.0, 20.0, 19.0, 22.0, 36.0, 35.0, 32.0, 43.0, 46.0, 57.0, 56.0, 52.0, 62.0, 51.0, 49.0, 55.0, 46.0, 30.0, 41.0, 26.0, 23.0, 17.0, 14.0, 14.0, 12.0, 12.0, 9.0, 5.0, 9.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.95703125, -3.81304931640625, -3.6690673828125, -3.52508544921875, -3.381103515625, -3.23712158203125, -3.0931396484375, -2.94915771484375, -2.80517578125, -2.66119384765625, -2.5172119140625, -2.37322998046875, -2.229248046875, -2.08526611328125, -1.9412841796875, -1.79730224609375, -1.6533203125, -1.50933837890625, -1.3653564453125, -1.22137451171875, -1.077392578125, -0.93341064453125, -0.7894287109375, -0.64544677734375, -0.50146484375, -0.35748291015625, -0.2135009765625, -0.06951904296875, 0.074462890625, 0.21844482421875, 0.3624267578125, 0.50640869140625, 0.650390625, 0.79437255859375, 0.9383544921875, 1.08233642578125, 1.226318359375, 1.37030029296875, 1.5142822265625, 1.65826416015625, 1.80224609375, 1.94622802734375, 2.0902099609375, 2.23419189453125, 2.378173828125, 2.52215576171875, 2.6661376953125, 2.81011962890625, 2.9541015625, 3.09808349609375, 3.2420654296875, 3.38604736328125, 3.530029296875, 3.67401123046875, 3.8179931640625, 3.96197509765625, 4.10595703125, 4.24993896484375, 4.3939208984375, 4.53790283203125, 4.681884765625, 4.82586669921875, 4.9698486328125, 5.11383056640625, 5.2578125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 4.0, 4.0, 8.0, 3.0, 8.0, 8.0, 11.0, 6.0, 16.0, 13.0, 12.0, 24.0, 26.0, 17.0, 25.0, 27.0, 31.0, 44.0, 39.0, 29.0, 41.0, 33.0, 31.0, 33.0, 40.0, 34.0, 40.0, 36.0, 34.0, 41.0, 33.0, 35.0, 39.0, 29.0, 20.0, 26.0, 17.0, 19.0, 9.0, 18.0, 8.0, 12.0, 8.0, 2.0, 5.0, 5.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-25.911949157714844, -25.077377319335938, -24.2428035736084, -23.408231735229492, -22.573657989501953, -21.739086151123047, -20.904512405395508, -20.0699405670166, -19.235366821289062, -18.400794982910156, -17.566221237182617, -16.73164939880371, -15.897075653076172, -15.062503814697266, -14.227930068969727, -13.39335823059082, -12.558785438537598, -11.724212646484375, -10.889639854431152, -10.05506706237793, -9.220494270324707, -8.385921478271484, -7.55134916305542, -6.716776371002197, -5.882203578948975, -5.047630786895752, -4.213057994842529, -3.3784854412078857, -2.543912649154663, -1.7093400955200195, -0.8747673034667969, -0.04019451141357422, 0.7943782806396484, 1.628951072692871, 2.4635238647460938, 3.2980964183807373, 4.132669448852539, 4.9672417640686035, 5.801814556121826, 6.636387348175049, 7.4709601402282715, 8.305532455444336, 9.140105247497559, 9.974678039550781, 10.809250831604004, 11.643823623657227, 12.47839641571045, 13.312969207763672, 14.147541999816895, 14.982114791870117, 15.81668758392334, 16.651260375976562, 17.48583221435547, 18.320405960083008, 19.154977798461914, 19.989551544189453, 20.82412338256836, 21.658695220947266, 22.493268966674805, 23.32784080505371, 24.16241455078125, 24.996986389160156, 25.831560134887695, 26.6661319732666, 27.50070571899414]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 8.0, 6.0, 4.0, 6.0, 8.0, 13.0, 17.0, 6.0, 17.0, 18.0, 16.0, 22.0, 21.0, 27.0, 29.0, 35.0, 27.0, 32.0, 51.0, 41.0, 37.0, 37.0, 34.0, 38.0, 25.0, 38.0, 28.0, 29.0, 35.0, 36.0, 28.0, 28.0, 34.0, 25.0, 21.0, 21.0, 21.0, 14.0, 8.0, 12.0, 6.0, 13.0, 4.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.85369110107422, -26.894153594970703, -25.934616088867188, -24.975078582763672, -24.015541076660156, -23.05600357055664, -22.096466064453125, -21.13692855834961, -20.177391052246094, -19.217853546142578, -18.258316040039062, -17.298778533935547, -16.33924102783203, -15.379703521728516, -14.420166969299316, -13.4606294631958, -12.501092910766602, -11.541555404663086, -10.58201789855957, -9.622480392456055, -8.662942886352539, -7.703405857086182, -6.743868827819824, -5.784331321716309, -4.824793815612793, -3.8652563095092773, -2.905719041824341, -1.9461817741394043, -0.9866442680358887, -0.027106761932373047, 0.9324302673339844, 1.8919677734375, 2.8515052795410156, 3.8110427856445312, 4.770580291748047, 5.730117321014404, 6.68965482711792, 7.6491923332214355, 8.608729362487793, 9.568266868591309, 10.527804374694824, 11.48734188079834, 12.446879386901855, 13.406415939331055, 14.36595344543457, 15.325490951538086, 16.2850284576416, 17.244565963745117, 18.204103469848633, 19.16364097595215, 20.123178482055664, 21.08271598815918, 22.042253494262695, 23.00179100036621, 23.961326599121094, 24.92086410522461, 25.880401611328125, 26.83993911743164, 27.799476623535156, 28.759014129638672, 29.718551635742188, 30.678089141845703, 31.63762664794922, 32.597164154052734, 33.55670166015625]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 6.0, 6.0, 17.0, 26.0, 48.0, 65.0, 152.0, 192.0, 389.0, 638.0, 1035.0, 1739.0, 2819.0, 4554.0, 7661.0, 12053.0, 19075.0, 29705.0, 44840.0, 66813.0, 97806.0, 137939.0, 187777.0, 242877.0, 301460.0, 353704.0, 388907.0, 401987.0, 389910.0, 352409.0, 299327.0, 241442.0, 184776.0, 135796.0, 95457.0, 66050.0, 44629.0, 29171.0, 18794.0, 11884.0, 7657.0, 4759.0, 2988.0, 1882.0, 1211.0, 730.0, 427.0, 261.0, 188.0, 107.0, 66.0, 30.0, 18.0, 20.0, 7.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0], "bins": [-19.03125, -18.406982421875, -17.78271484375, -17.158447265625, -16.5341796875, -15.909912109375, -15.28564453125, -14.661376953125, -14.037109375, -13.412841796875, -12.78857421875, -12.164306640625, -11.5400390625, -10.915771484375, -10.29150390625, -9.667236328125, -9.04296875, -8.418701171875, -7.79443359375, -7.170166015625, -6.5458984375, -5.921630859375, -5.29736328125, -4.673095703125, -4.048828125, -3.424560546875, -2.80029296875, -2.176025390625, -1.5517578125, -0.927490234375, -0.30322265625, 0.321044921875, 0.9453125, 1.569580078125, 2.19384765625, 2.818115234375, 3.4423828125, 4.066650390625, 4.69091796875, 5.315185546875, 5.939453125, 6.563720703125, 7.18798828125, 7.812255859375, 8.4365234375, 9.060791015625, 9.68505859375, 10.309326171875, 10.93359375, 11.557861328125, 12.18212890625, 12.806396484375, 13.4306640625, 14.054931640625, 14.67919921875, 15.303466796875, 15.927734375, 16.552001953125, 17.17626953125, 17.800537109375, 18.4248046875, 19.049072265625, 19.67333984375, 20.297607421875, 20.921875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 7.0, 4.0, 6.0, 10.0, 15.0, 12.0, 8.0, 19.0, 15.0, 15.0, 25.0, 18.0, 26.0, 36.0, 32.0, 26.0, 34.0, 50.0, 43.0, 33.0, 40.0, 35.0, 32.0, 26.0, 37.0, 32.0, 27.0, 30.0, 39.0, 26.0, 32.0, 27.0, 28.0, 24.0, 21.0, 19.0, 15.0, 9.0, 11.0, 9.0, 9.0, 4.0, 7.0, 9.0, 7.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-25.0625, -24.199951171875, -23.33740234375, -22.474853515625, -21.6123046875, -20.749755859375, -19.88720703125, -19.024658203125, -18.162109375, -17.299560546875, -16.43701171875, -15.574462890625, -14.7119140625, -13.849365234375, -12.98681640625, -12.124267578125, -11.26171875, -10.399169921875, -9.53662109375, -8.674072265625, -7.8115234375, -6.948974609375, -6.08642578125, -5.223876953125, -4.361328125, -3.498779296875, -2.63623046875, -1.773681640625, -0.9111328125, -0.048583984375, 0.81396484375, 1.676513671875, 2.5390625, 3.401611328125, 4.26416015625, 5.126708984375, 5.9892578125, 6.851806640625, 7.71435546875, 8.576904296875, 9.439453125, 10.302001953125, 11.16455078125, 12.027099609375, 12.8896484375, 13.752197265625, 14.61474609375, 15.477294921875, 16.33984375, 17.202392578125, 18.06494140625, 18.927490234375, 19.7900390625, 20.652587890625, 21.51513671875, 22.377685546875, 23.240234375, 24.102783203125, 24.96533203125, 25.827880859375, 26.6904296875, 27.552978515625, 28.41552734375, 29.278076171875, 30.140625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 7.0, 16.0, 41.0, 57.0, 97.0, 180.0, 278.0, 490.0, 833.0, 1297.0, 2189.0, 3690.0, 5940.0, 9439.0, 15027.0, 23497.0, 35960.0, 53630.0, 77549.0, 110396.0, 149884.0, 196326.0, 246677.0, 297622.0, 339310.0, 366745.0, 375410.0, 363799.0, 333264.0, 290457.0, 240090.0, 188820.0, 143323.0, 104294.0, 74053.0, 50528.0, 33590.0, 22296.0, 14192.0, 8863.0, 5552.0, 3435.0, 2075.0, 1264.0, 707.0, 453.0, 275.0, 167.0, 85.0, 52.0, 36.0, 19.0, 10.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.6875, -19.06103515625, -18.4345703125, -17.80810546875, -17.181640625, -16.55517578125, -15.9287109375, -15.30224609375, -14.67578125, -14.04931640625, -13.4228515625, -12.79638671875, -12.169921875, -11.54345703125, -10.9169921875, -10.29052734375, -9.6640625, -9.03759765625, -8.4111328125, -7.78466796875, -7.158203125, -6.53173828125, -5.9052734375, -5.27880859375, -4.65234375, -4.02587890625, -3.3994140625, -2.77294921875, -2.146484375, -1.52001953125, -0.8935546875, -0.26708984375, 0.359375, 0.98583984375, 1.6123046875, 2.23876953125, 2.865234375, 3.49169921875, 4.1181640625, 4.74462890625, 5.37109375, 5.99755859375, 6.6240234375, 7.25048828125, 7.876953125, 8.50341796875, 9.1298828125, 9.75634765625, 10.3828125, 11.00927734375, 11.6357421875, 12.26220703125, 12.888671875, 13.51513671875, 14.1416015625, 14.76806640625, 15.39453125, 16.02099609375, 16.6474609375, 17.27392578125, 17.900390625, 18.52685546875, 19.1533203125, 19.77978515625, 20.40625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 3.0, 7.0, 6.0, 14.0, 19.0, 19.0, 21.0, 25.0, 32.0, 60.0, 60.0, 75.0, 99.0, 90.0, 119.0, 127.0, 143.0, 185.0, 149.0, 181.0, 208.0, 189.0, 231.0, 202.0, 196.0, 180.0, 180.0, 162.0, 169.0, 144.0, 134.0, 134.0, 118.0, 72.0, 63.0, 56.0, 40.0, 40.0, 26.0, 27.0, 20.0, 13.0, 17.0, 9.0, 5.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2265625, -12.8109130859375, -12.395263671875, -11.9796142578125, -11.56396484375, -11.1483154296875, -10.732666015625, -10.3170166015625, -9.9013671875, -9.4857177734375, -9.070068359375, -8.6544189453125, -8.23876953125, -7.8231201171875, -7.407470703125, -6.9918212890625, -6.576171875, -6.1605224609375, -5.744873046875, -5.3292236328125, -4.91357421875, -4.4979248046875, -4.082275390625, -3.6666259765625, -3.2509765625, -2.8353271484375, -2.419677734375, -2.0040283203125, -1.58837890625, -1.1727294921875, -0.757080078125, -0.3414306640625, 0.07421875, 0.4898681640625, 0.905517578125, 1.3211669921875, 1.73681640625, 2.1524658203125, 2.568115234375, 2.9837646484375, 3.3994140625, 3.8150634765625, 4.230712890625, 4.6463623046875, 5.06201171875, 5.4776611328125, 5.893310546875, 6.3089599609375, 6.724609375, 7.1402587890625, 7.555908203125, 7.9715576171875, 8.38720703125, 8.8028564453125, 9.218505859375, 9.6341552734375, 10.0498046875, 10.4654541015625, 10.881103515625, 11.2967529296875, 11.71240234375, 12.1280517578125, 12.543701171875, 12.9593505859375, 13.375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 3.0, 8.0, 3.0, 11.0, 21.0, 20.0, 17.0, 25.0, 28.0, 31.0, 31.0, 24.0, 34.0, 41.0, 33.0, 37.0, 47.0, 48.0, 41.0, 46.0, 40.0, 48.0, 38.0, 43.0, 39.0, 24.0, 41.0, 34.0, 25.0, 11.0, 23.0, 15.0, 13.0, 12.0, 12.0, 4.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.273366928100586, -30.314577102661133, -29.355789184570312, -28.39699935913086, -27.43821144104004, -26.479421615600586, -25.520633697509766, -24.561843872070312, -23.60305404663086, -22.644264221191406, -21.685476303100586, -20.726686477661133, -19.767898559570312, -18.80910873413086, -17.850318908691406, -16.891530990600586, -15.932743072509766, -14.973954200744629, -14.015165328979492, -13.056375503540039, -12.097587585449219, -11.138797760009766, -10.180008888244629, -9.221220016479492, -8.262431144714355, -7.303642272949219, -6.344853401184082, -5.386064052581787, -4.42727518081665, -3.4684863090515137, -2.5096969604492188, -1.550908088684082, -0.5921192169189453, 0.36666977405548096, 1.3254587650299072, 2.284247875213623, 3.2430367469787598, 4.2018256187438965, 5.160614967346191, 6.119403839111328, 7.078192710876465, 8.036981582641602, 8.995770454406738, 9.954559326171875, 10.913349151611328, 11.872137069702148, 12.830926895141602, 13.789715766906738, 14.748504638671875, 15.707293510437012, 16.66608238220215, 17.6248722076416, 18.583660125732422, 19.542449951171875, 20.501239776611328, 21.46002769470215, 22.41881561279297, 23.377605438232422, 24.336393356323242, 25.295183181762695, 26.253971099853516, 27.21276092529297, 28.171550750732422, 29.130338668823242, 30.089128494262695]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 3.0, 4.0, 8.0, 5.0, 5.0, 15.0, 17.0, 17.0, 19.0, 15.0, 25.0, 23.0, 17.0, 24.0, 29.0, 28.0, 30.0, 41.0, 31.0, 45.0, 40.0, 40.0, 44.0, 53.0, 51.0, 38.0, 34.0, 29.0, 31.0, 24.0, 24.0, 31.0, 26.0, 19.0, 30.0, 16.0, 11.0, 10.0, 11.0, 9.0, 5.0, 8.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.164623260498047, -28.139732360839844, -27.114843368530273, -26.089954376220703, -25.0650634765625, -24.040172576904297, -23.015283584594727, -21.990394592285156, -20.965503692626953, -19.94061279296875, -18.91572380065918, -17.89083480834961, -16.865943908691406, -15.84105396270752, -14.816164016723633, -13.791274070739746, -12.76638412475586, -11.741494178771973, -10.716604232788086, -9.6917142868042, -8.666824340820312, -7.641934394836426, -6.617044448852539, -5.592154502868652, -4.567264556884766, -3.542374610900879, -2.517484664916992, -1.4925947189331055, -0.46770477294921875, 0.557185173034668, 1.5820751190185547, 2.6069650650024414, 3.631855010986328, 4.656744956970215, 5.681634902954102, 6.706524848937988, 7.731414794921875, 8.756304740905762, 9.781194686889648, 10.806084632873535, 11.830974578857422, 12.855864524841309, 13.880754470825195, 14.905644416809082, 15.930534362792969, 16.955425262451172, 17.980314254760742, 19.005203247070312, 20.030094146728516, 21.05498504638672, 22.07987403869629, 23.10476303100586, 24.129653930664062, 25.154544830322266, 26.179433822631836, 27.204322814941406, 28.22921371459961, 29.254104614257812, 30.278993606567383, 31.303882598876953, 32.328773498535156, 33.35366439819336, 34.37855529785156, 35.4034423828125, 36.4283332824707]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 11.0, 17.0, 23.0, 48.0, 71.0, 78.0, 140.0, 227.0, 379.0, 523.0, 842.0, 1405.0, 2080.0, 3377.0, 5309.0, 8279.0, 12716.0, 19372.0, 28495.0, 41227.0, 56595.0, 74345.0, 92573.0, 106586.0, 112012.0, 109481.0, 96285.0, 79170.0, 60553.0, 44285.0, 31302.0, 21429.0, 14229.0, 9050.0, 5868.0, 3753.0, 2376.0, 1500.0, 906.0, 626.0, 392.0, 228.0, 134.0, 101.0, 62.0, 35.0, 24.0, 8.0, 9.0, 7.0, 6.0, 6.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-4.03515625, -3.90753173828125, -3.7799072265625, -3.65228271484375, -3.524658203125, -3.39703369140625, -3.2694091796875, -3.14178466796875, -3.01416015625, -2.88653564453125, -2.7589111328125, -2.63128662109375, -2.503662109375, -2.37603759765625, -2.2484130859375, -2.12078857421875, -1.9931640625, -1.86553955078125, -1.7379150390625, -1.61029052734375, -1.482666015625, -1.35504150390625, -1.2274169921875, -1.09979248046875, -0.97216796875, -0.84454345703125, -0.7169189453125, -0.58929443359375, -0.461669921875, -0.33404541015625, -0.2064208984375, -0.07879638671875, 0.048828125, 0.17645263671875, 0.3040771484375, 0.43170166015625, 0.559326171875, 0.68695068359375, 0.8145751953125, 0.94219970703125, 1.06982421875, 1.19744873046875, 1.3250732421875, 1.45269775390625, 1.580322265625, 1.70794677734375, 1.8355712890625, 1.96319580078125, 2.0908203125, 2.21844482421875, 2.3460693359375, 2.47369384765625, 2.601318359375, 2.72894287109375, 2.8565673828125, 2.98419189453125, 3.11181640625, 3.23944091796875, 3.3670654296875, 3.49468994140625, 3.622314453125, 3.74993896484375, 3.8775634765625, 4.00518798828125, 4.1328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 3.0, 5.0, 7.0, 5.0, 6.0, 14.0, 18.0, 15.0, 21.0, 14.0, 27.0, 22.0, 16.0, 24.0, 27.0, 28.0, 31.0, 39.0, 33.0, 44.0, 41.0, 40.0, 43.0, 54.0, 51.0, 39.0, 33.0, 30.0, 28.0, 27.0, 23.0, 30.0, 29.0, 17.0, 29.0, 18.0, 10.0, 11.0, 10.0, 10.0, 5.0, 8.0, 6.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.15625, -28.13037109375, -27.1044921875, -26.07861328125, -25.052734375, -24.02685546875, -23.0009765625, -21.97509765625, -20.94921875, -19.92333984375, -18.8974609375, -17.87158203125, -16.845703125, -15.81982421875, -14.7939453125, -13.76806640625, -12.7421875, -11.71630859375, -10.6904296875, -9.66455078125, -8.638671875, -7.61279296875, -6.5869140625, -5.56103515625, -4.53515625, -3.50927734375, -2.4833984375, -1.45751953125, -0.431640625, 0.59423828125, 1.6201171875, 2.64599609375, 3.671875, 4.69775390625, 5.7236328125, 6.74951171875, 7.775390625, 8.80126953125, 9.8271484375, 10.85302734375, 11.87890625, 12.90478515625, 13.9306640625, 14.95654296875, 15.982421875, 17.00830078125, 18.0341796875, 19.06005859375, 20.0859375, 21.11181640625, 22.1376953125, 23.16357421875, 24.189453125, 25.21533203125, 26.2412109375, 27.26708984375, 28.29296875, 29.31884765625, 30.3447265625, 31.37060546875, 32.396484375, 33.42236328125, 34.4482421875, 35.47412109375, 36.5]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 14.0, 11.0, 19.0, 26.0, 56.0, 59.0, 105.0, 162.0, 241.0, 381.0, 531.0, 798.0, 1080.0, 1683.0, 2337.0, 3325.0, 4958.0, 7206.0, 10599.0, 16337.0, 27789.0, 153345.0, 702867.0, 50568.0, 21850.0, 13548.0, 8919.0, 6143.0, 4172.0, 2982.0, 2045.0, 1376.0, 973.0, 640.0, 452.0, 328.0, 216.0, 140.0, 96.0, 69.0, 38.0, 16.0, 22.0, 14.0, 13.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.9296875, -8.6614990234375, -8.393310546875, -8.1251220703125, -7.85693359375, -7.5887451171875, -7.320556640625, -7.0523681640625, -6.7841796875, -6.5159912109375, -6.247802734375, -5.9796142578125, -5.71142578125, -5.4432373046875, -5.175048828125, -4.9068603515625, -4.638671875, -4.3704833984375, -4.102294921875, -3.8341064453125, -3.56591796875, -3.2977294921875, -3.029541015625, -2.7613525390625, -2.4931640625, -2.2249755859375, -1.956787109375, -1.6885986328125, -1.42041015625, -1.1522216796875, -0.884033203125, -0.6158447265625, -0.34765625, -0.0794677734375, 0.188720703125, 0.4569091796875, 0.72509765625, 0.9932861328125, 1.261474609375, 1.5296630859375, 1.7978515625, 2.0660400390625, 2.334228515625, 2.6024169921875, 2.87060546875, 3.1387939453125, 3.406982421875, 3.6751708984375, 3.943359375, 4.2115478515625, 4.479736328125, 4.7479248046875, 5.01611328125, 5.2843017578125, 5.552490234375, 5.8206787109375, 6.0888671875, 6.3570556640625, 6.625244140625, 6.8934326171875, 7.16162109375, 7.4298095703125, 7.697998046875, 7.9661865234375, 8.234375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 8.0, 3.0, 11.0, 10.0, 11.0, 13.0, 21.0, 21.0, 20.0, 18.0, 36.0, 29.0, 27.0, 31.0, 25.0, 33.0, 41.0, 40.0, 45.0, 30.0, 34.0, 43.0, 33.0, 43.0, 47.0, 39.0, 37.0, 31.0, 17.0, 23.0, 33.0, 20.0, 29.0, 18.0, 12.0, 14.0, 12.0, 8.0, 7.0, 7.0, 10.0, 4.0, 2.0, 4.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.53125, -21.847900390625, -21.16455078125, -20.481201171875, -19.7978515625, -19.114501953125, -18.43115234375, -17.747802734375, -17.064453125, -16.381103515625, -15.69775390625, -15.014404296875, -14.3310546875, -13.647705078125, -12.96435546875, -12.281005859375, -11.59765625, -10.914306640625, -10.23095703125, -9.547607421875, -8.8642578125, -8.180908203125, -7.49755859375, -6.814208984375, -6.130859375, -5.447509765625, -4.76416015625, -4.080810546875, -3.3974609375, -2.714111328125, -2.03076171875, -1.347412109375, -0.6640625, 0.019287109375, 0.70263671875, 1.385986328125, 2.0693359375, 2.752685546875, 3.43603515625, 4.119384765625, 4.802734375, 5.486083984375, 6.16943359375, 6.852783203125, 7.5361328125, 8.219482421875, 8.90283203125, 9.586181640625, 10.26953125, 10.952880859375, 11.63623046875, 12.319580078125, 13.0029296875, 13.686279296875, 14.36962890625, 15.052978515625, 15.736328125, 16.419677734375, 17.10302734375, 17.786376953125, 18.4697265625, 19.153076171875, 19.83642578125, 20.519775390625, 21.203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 8.0, 1.0, 4.0, 2.0, 4.0, 5.0, 10.0, 16.0, 17.0, 23.0, 33.0, 44.0, 46.0, 82.0, 117.0, 143.0, 252.0, 323.0, 451.0, 687.0, 968.0, 1304.0, 1939.0, 2735.0, 3938.0, 5960.0, 8724.0, 13102.0, 20535.0, 36309.0, 753660.0, 121359.0, 25940.0, 16174.0, 10599.0, 7095.0, 4772.0, 3383.0, 2400.0, 1620.0, 1096.0, 767.0, 566.0, 383.0, 266.0, 187.0, 151.0, 82.0, 73.0, 54.0, 43.0, 38.0, 27.0, 16.0, 7.0, 6.0, 10.0, 4.0, 3.0, 4.0, 3.0, 1.0], "bins": [-1.0185546875, -0.9874420166015625, -0.956329345703125, -0.9252166748046875, -0.89410400390625, -0.8629913330078125, -0.831878662109375, -0.8007659912109375, -0.7696533203125, -0.7385406494140625, -0.707427978515625, -0.6763153076171875, -0.64520263671875, -0.6140899658203125, -0.582977294921875, -0.5518646240234375, -0.520751953125, -0.4896392822265625, -0.458526611328125, -0.4274139404296875, -0.39630126953125, -0.3651885986328125, -0.334075927734375, -0.3029632568359375, -0.2718505859375, -0.2407379150390625, -0.209625244140625, -0.1785125732421875, -0.14739990234375, -0.1162872314453125, -0.085174560546875, -0.0540618896484375, -0.02294921875, 0.0081634521484375, 0.039276123046875, 0.0703887939453125, 0.10150146484375, 0.1326141357421875, 0.163726806640625, 0.1948394775390625, 0.2259521484375, 0.2570648193359375, 0.288177490234375, 0.3192901611328125, 0.35040283203125, 0.3815155029296875, 0.412628173828125, 0.4437408447265625, 0.474853515625, 0.5059661865234375, 0.537078857421875, 0.5681915283203125, 0.59930419921875, 0.6304168701171875, 0.661529541015625, 0.6926422119140625, 0.7237548828125, 0.7548675537109375, 0.785980224609375, 0.8170928955078125, 0.84820556640625, 0.8793182373046875, 0.910430908203125, 0.9415435791015625, 0.97265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 8.0, 14.0, 18.0, 20.0, 17.0, 22.0, 30.0, 36.0, 37.0, 43.0, 50.0, 55.0, 62.0, 47.0, 46.0, 49.0, 58.0, 57.0, 51.0, 39.0, 32.0, 26.0, 28.0, 22.0, 15.0, 30.0, 16.0, 12.0, 5.0, 13.0, 10.0, 4.0, 7.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.314018249511719e-05, -3.213062882423401e-05, -3.112107515335083e-05, -3.011152148246765e-05, -2.9101967811584473e-05, -2.8092414140701294e-05, -2.7082860469818115e-05, -2.6073306798934937e-05, -2.5063753128051758e-05, -2.405419945716858e-05, -2.30446457862854e-05, -2.203509211540222e-05, -2.1025538444519043e-05, -2.0015984773635864e-05, -1.9006431102752686e-05, -1.7996877431869507e-05, -1.6987323760986328e-05, -1.597777009010315e-05, -1.496821641921997e-05, -1.3958662748336792e-05, -1.2949109077453613e-05, -1.1939555406570435e-05, -1.0930001735687256e-05, -9.920448064804077e-06, -8.910894393920898e-06, -7.90134072303772e-06, -6.891787052154541e-06, -5.882233381271362e-06, -4.872679710388184e-06, -3.863126039505005e-06, -2.853572368621826e-06, -1.8440186977386475e-06, -8.344650268554688e-07, 1.7508864402770996e-07, 1.1846423149108887e-06, 2.1941959857940674e-06, 3.203749656677246e-06, 4.213303327560425e-06, 5.2228569984436035e-06, 6.232410669326782e-06, 7.241964340209961e-06, 8.25151801109314e-06, 9.261071681976318e-06, 1.0270625352859497e-05, 1.1280179023742676e-05, 1.2289732694625854e-05, 1.3299286365509033e-05, 1.4308840036392212e-05, 1.531839370727539e-05, 1.632794737815857e-05, 1.7337501049041748e-05, 1.8347054719924927e-05, 1.9356608390808105e-05, 2.0366162061691284e-05, 2.1375715732574463e-05, 2.238526940345764e-05, 2.339482307434082e-05, 2.4404376745224e-05, 2.5413930416107178e-05, 2.6423484086990356e-05, 2.7433037757873535e-05, 2.8442591428756714e-05, 2.9452145099639893e-05, 3.046169877052307e-05, 3.147125244140625e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 8.0, 16.0, 31.0, 47.0, 66.0, 103.0, 146.0, 226.0, 381.0, 539.0, 862.0, 1327.0, 2147.0, 3293.0, 4826.0, 7381.0, 11009.0, 16835.0, 24967.0, 36315.0, 53595.0, 77299.0, 106062.0, 131355.0, 141280.0, 123869.0, 94554.0, 67314.0, 46987.0, 31917.0, 21516.0, 14391.0, 9571.0, 6462.0, 4149.0, 2773.0, 1731.0, 1161.0, 708.0, 480.0, 283.0, 204.0, 137.0, 93.0, 53.0, 26.0, 23.0, 17.0, 5.0, 9.0, 4.0, 4.0, 3.0, 1.0], "bins": [-0.9873046875, -0.9585342407226562, -0.9297637939453125, -0.9009933471679688, -0.872222900390625, -0.8434524536132812, -0.8146820068359375, -0.7859115600585938, -0.75714111328125, -0.7283706665039062, -0.6996002197265625, -0.6708297729492188, -0.642059326171875, -0.6132888793945312, -0.5845184326171875, -0.5557479858398438, -0.5269775390625, -0.49820709228515625, -0.4694366455078125, -0.44066619873046875, -0.411895751953125, -0.38312530517578125, -0.3543548583984375, -0.32558441162109375, -0.29681396484375, -0.26804351806640625, -0.2392730712890625, -0.21050262451171875, -0.181732177734375, -0.15296173095703125, -0.1241912841796875, -0.09542083740234375, -0.066650390625, -0.03787994384765625, -0.0091094970703125, 0.01966094970703125, 0.048431396484375, 0.07720184326171875, 0.1059722900390625, 0.13474273681640625, 0.16351318359375, 0.19228363037109375, 0.2210540771484375, 0.24982452392578125, 0.278594970703125, 0.30736541748046875, 0.3361358642578125, 0.36490631103515625, 0.3936767578125, 0.42244720458984375, 0.4512176513671875, 0.47998809814453125, 0.508758544921875, 0.5375289916992188, 0.5662994384765625, 0.5950698852539062, 0.62384033203125, 0.6526107788085938, 0.6813812255859375, 0.7101516723632812, 0.738922119140625, 0.7676925659179688, 0.7964630126953125, 0.8252334594726562, 0.85400390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 4.0, 8.0, 6.0, 12.0, 6.0, 9.0, 13.0, 14.0, 14.0, 17.0, 22.0, 25.0, 27.0, 30.0, 33.0, 39.0, 53.0, 48.0, 58.0, 62.0, 76.0, 47.0, 55.0, 39.0, 51.0, 39.0, 25.0, 18.0, 16.0, 11.0, 14.0, 16.0, 18.0, 10.0, 12.0, 10.0, 9.0, 7.0, 3.0, 1.0, 5.0, 3.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.50927734375, -0.49341583251953125, -0.4775543212890625, -0.46169281005859375, -0.445831298828125, -0.42996978759765625, -0.4141082763671875, -0.39824676513671875, -0.38238525390625, -0.36652374267578125, -0.3506622314453125, -0.33480072021484375, -0.318939208984375, -0.30307769775390625, -0.2872161865234375, -0.27135467529296875, -0.2554931640625, -0.23963165283203125, -0.2237701416015625, -0.20790863037109375, -0.192047119140625, -0.17618560791015625, -0.1603240966796875, -0.14446258544921875, -0.12860107421875, -0.11273956298828125, -0.0968780517578125, -0.08101654052734375, -0.065155029296875, -0.04929351806640625, -0.0334320068359375, -0.01757049560546875, -0.001708984375, 0.01415252685546875, 0.0300140380859375, 0.04587554931640625, 0.061737060546875, 0.07759857177734375, 0.0934600830078125, 0.10932159423828125, 0.12518310546875, 0.14104461669921875, 0.1569061279296875, 0.17276763916015625, 0.188629150390625, 0.20449066162109375, 0.2203521728515625, 0.23621368408203125, 0.2520751953125, 0.26793670654296875, 0.2837982177734375, 0.29965972900390625, 0.315521240234375, 0.33138275146484375, 0.3472442626953125, 0.36310577392578125, 0.37896728515625, 0.39482879638671875, 0.4106903076171875, 0.42655181884765625, 0.442413330078125, 0.45827484130859375, 0.4741363525390625, 0.48999786376953125, 0.505859375]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 3.0, 4.0, 5.0, 6.0, 8.0, 8.0, 16.0, 21.0, 24.0, 31.0, 21.0, 35.0, 29.0, 31.0, 35.0, 35.0, 36.0, 44.0, 41.0, 50.0, 42.0, 40.0, 44.0, 50.0, 42.0, 36.0, 37.0, 26.0, 42.0, 27.0, 25.0, 17.0, 18.0, 15.0, 8.0, 15.0, 6.0, 7.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.252750396728516, -30.284765243530273, -29.31678009033203, -28.34879493713379, -27.380809783935547, -26.412822723388672, -25.44483757019043, -24.476852416992188, -23.508867263793945, -22.540882110595703, -21.57289695739746, -20.60491180419922, -19.636924743652344, -18.668941497802734, -17.70095443725586, -16.732969284057617, -15.764984130859375, -14.796998977661133, -13.82901382446289, -12.861027717590332, -11.89304256439209, -10.925057411193848, -9.957071304321289, -8.989086151123047, -8.021100997924805, -7.0531158447265625, -6.085130214691162, -5.117144584655762, -4.1491594314575195, -3.1811742782592773, -2.213188648223877, -1.2452030181884766, -0.2772197723388672, 0.6907656192779541, 1.6587510108947754, 2.6267364025115967, 3.594721794128418, 4.56270694732666, 5.5306925773620605, 6.498678207397461, 7.466663360595703, 8.434648513793945, 9.402633666992188, 10.370619773864746, 11.338604927062988, 12.30659008026123, 13.274576187133789, 14.242561340332031, 15.210546493530273, 16.178531646728516, 17.146516799926758, 18.114501953125, 19.082489013671875, 20.050472259521484, 21.01845932006836, 21.9864444732666, 22.954429626464844, 23.922414779663086, 24.890399932861328, 25.85838508605957, 26.826370239257812, 27.794357299804688, 28.76234245300293, 29.730327606201172, 30.698312759399414]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 5.0, 8.0, 13.0, 16.0, 17.0, 18.0, 17.0, 21.0, 27.0, 16.0, 17.0, 31.0, 30.0, 28.0, 39.0, 34.0, 39.0, 41.0, 43.0, 44.0, 56.0, 49.0, 38.0, 38.0, 27.0, 29.0, 30.0, 22.0, 31.0, 27.0, 20.0, 28.0, 19.0, 10.0, 15.0, 8.0, 11.0, 4.0, 6.0, 8.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.467607498168945, -28.4381046295166, -27.408601760864258, -26.379098892211914, -25.34959602355957, -24.320093154907227, -23.290592193603516, -22.261089324951172, -21.231586456298828, -20.202083587646484, -19.17258071899414, -18.143077850341797, -17.113574981689453, -16.08407211303711, -15.054570198059082, -14.025067329406738, -12.995563507080078, -11.966060638427734, -10.93655776977539, -9.907054901123047, -8.877552032470703, -7.848049640655518, -6.818547248840332, -5.789044380187988, -4.7595415115356445, -3.730038642883301, -2.700536012649536, -1.6710333824157715, -0.6415305137634277, 0.387972354888916, 1.4174747467041016, 2.4469776153564453, 3.476482391357422, 4.505985260009766, 5.535488128662109, 6.564990520477295, 7.594493389129639, 8.62399673461914, 9.653498649597168, 10.683001518249512, 11.712504386901855, 12.7420072555542, 13.771510124206543, 14.80101203918457, 15.830514907836914, 16.860017776489258, 17.8895206451416, 18.919023513793945, 19.94852638244629, 20.978029251098633, 22.007532119750977, 23.03703498840332, 24.066537857055664, 25.096040725708008, 26.12554168701172, 27.155044555664062, 28.184547424316406, 29.21405029296875, 30.243553161621094, 31.273056030273438, 32.30255889892578, 33.332061767578125, 34.36156463623047, 35.39106750488281, 36.420570373535156]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 7.0, 18.0, 18.0, 31.0, 61.0, 91.0, 126.0, 185.0, 304.0, 489.0, 772.0, 1213.0, 1738.0, 2556.0, 3819.0, 5673.0, 8008.0, 11178.0, 15381.0, 21221.0, 27580.0, 34915.0, 43988.0, 52118.0, 61226.0, 69252.0, 75115.0, 78171.0, 78784.0, 75963.0, 70931.0, 63082.0, 54761.0, 45802.0, 36723.0, 28936.0, 22091.0, 16805.0, 12107.0, 8557.0, 6233.0, 4245.0, 2717.0, 1988.0, 1246.0, 806.0, 577.0, 372.0, 229.0, 131.0, 79.0, 57.0, 36.0, 25.0, 11.0, 7.0, 3.0, 5.0, 1.0, 3.0, 1.0], "bins": [-13.265625, -12.8392333984375, -12.412841796875, -11.9864501953125, -11.56005859375, -11.1336669921875, -10.707275390625, -10.2808837890625, -9.8544921875, -9.4281005859375, -9.001708984375, -8.5753173828125, -8.14892578125, -7.7225341796875, -7.296142578125, -6.8697509765625, -6.443359375, -6.0169677734375, -5.590576171875, -5.1641845703125, -4.73779296875, -4.3114013671875, -3.885009765625, -3.4586181640625, -3.0322265625, -2.6058349609375, -2.179443359375, -1.7530517578125, -1.32666015625, -0.9002685546875, -0.473876953125, -0.0474853515625, 0.37890625, 0.8052978515625, 1.231689453125, 1.6580810546875, 2.08447265625, 2.5108642578125, 2.937255859375, 3.3636474609375, 3.7900390625, 4.2164306640625, 4.642822265625, 5.0692138671875, 5.49560546875, 5.9219970703125, 6.348388671875, 6.7747802734375, 7.201171875, 7.6275634765625, 8.053955078125, 8.4803466796875, 8.90673828125, 9.3331298828125, 9.759521484375, 10.1859130859375, 10.6123046875, 11.0386962890625, 11.465087890625, 11.8914794921875, 12.31787109375, 12.7442626953125, 13.170654296875, 13.5970458984375, 14.0234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 7.0, 11.0, 16.0, 16.0, 19.0, 19.0, 17.0, 27.0, 18.0, 17.0, 28.0, 30.0, 31.0, 35.0, 37.0, 37.0, 42.0, 45.0, 36.0, 65.0, 41.0, 44.0, 38.0, 27.0, 35.0, 29.0, 20.0, 30.0, 29.0, 19.0, 30.0, 20.0, 10.0, 13.0, 8.0, 12.0, 5.0, 6.0, 8.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.0, -27.9921875, -26.984375, -25.9765625, -24.96875, -23.9609375, -22.953125, -21.9453125, -20.9375, -19.9296875, -18.921875, -17.9140625, -16.90625, -15.8984375, -14.890625, -13.8828125, -12.875, -11.8671875, -10.859375, -9.8515625, -8.84375, -7.8359375, -6.828125, -5.8203125, -4.8125, -3.8046875, -2.796875, -1.7890625, -0.78125, 0.2265625, 1.234375, 2.2421875, 3.25, 4.2578125, 5.265625, 6.2734375, 7.28125, 8.2890625, 9.296875, 10.3046875, 11.3125, 12.3203125, 13.328125, 14.3359375, 15.34375, 16.3515625, 17.359375, 18.3671875, 19.375, 20.3828125, 21.390625, 22.3984375, 23.40625, 24.4140625, 25.421875, 26.4296875, 27.4375, 28.4453125, 29.453125, 30.4609375, 31.46875, 32.4765625, 33.484375, 34.4921875, 35.5]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 5.0, 7.0, 10.0, 13.0, 33.0, 46.0, 71.0, 129.0, 217.0, 346.0, 547.0, 817.0, 1324.0, 2123.0, 3238.0, 5088.0, 7508.0, 11011.0, 15864.0, 22176.0, 29870.0, 39317.0, 50295.0, 61151.0, 71063.0, 80059.0, 85549.0, 87526.0, 84743.0, 78554.0, 70192.0, 59557.0, 48064.0, 37718.0, 28675.0, 20590.0, 14575.0, 10411.0, 7059.0, 4683.0, 3082.0, 1952.0, 1251.0, 800.0, 515.0, 295.0, 193.0, 91.0, 76.0, 39.0, 25.0, 12.0, 12.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.6015625, -14.13671875, -13.671875, -13.20703125, -12.7421875, -12.27734375, -11.8125, -11.34765625, -10.8828125, -10.41796875, -9.953125, -9.48828125, -9.0234375, -8.55859375, -8.09375, -7.62890625, -7.1640625, -6.69921875, -6.234375, -5.76953125, -5.3046875, -4.83984375, -4.375, -3.91015625, -3.4453125, -2.98046875, -2.515625, -2.05078125, -1.5859375, -1.12109375, -0.65625, -0.19140625, 0.2734375, 0.73828125, 1.203125, 1.66796875, 2.1328125, 2.59765625, 3.0625, 3.52734375, 3.9921875, 4.45703125, 4.921875, 5.38671875, 5.8515625, 6.31640625, 6.78125, 7.24609375, 7.7109375, 8.17578125, 8.640625, 9.10546875, 9.5703125, 10.03515625, 10.5, 10.96484375, 11.4296875, 11.89453125, 12.359375, 12.82421875, 13.2890625, 13.75390625, 14.21875, 14.68359375, 15.1484375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 8.0, 1.0, 4.0, 6.0, 3.0, 8.0, 9.0, 16.0, 16.0, 9.0, 24.0, 22.0, 14.0, 26.0, 26.0, 32.0, 34.0, 37.0, 37.0, 48.0, 39.0, 36.0, 44.0, 33.0, 43.0, 46.0, 32.0, 45.0, 36.0, 32.0, 37.0, 25.0, 27.0, 23.0, 20.0, 25.0, 17.0, 11.0, 6.0, 9.0, 7.0, 7.0, 9.0, 3.0, 3.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.84375, -19.150390625, -18.45703125, -17.763671875, -17.0703125, -16.376953125, -15.68359375, -14.990234375, -14.296875, -13.603515625, -12.91015625, -12.216796875, -11.5234375, -10.830078125, -10.13671875, -9.443359375, -8.75, -8.056640625, -7.36328125, -6.669921875, -5.9765625, -5.283203125, -4.58984375, -3.896484375, -3.203125, -2.509765625, -1.81640625, -1.123046875, -0.4296875, 0.263671875, 0.95703125, 1.650390625, 2.34375, 3.037109375, 3.73046875, 4.423828125, 5.1171875, 5.810546875, 6.50390625, 7.197265625, 7.890625, 8.583984375, 9.27734375, 9.970703125, 10.6640625, 11.357421875, 12.05078125, 12.744140625, 13.4375, 14.130859375, 14.82421875, 15.517578125, 16.2109375, 16.904296875, 17.59765625, 18.291015625, 18.984375, 19.677734375, 20.37109375, 21.064453125, 21.7578125, 22.451171875, 23.14453125, 23.837890625, 24.53125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 3.0, 13.0, 23.0, 51.0, 62.0, 108.0, 168.0, 261.0, 438.0, 677.0, 1120.0, 1820.0, 2877.0, 4600.0, 7022.0, 10785.0, 16128.0, 23429.0, 33271.0, 45359.0, 59183.0, 72651.0, 85820.0, 94886.0, 98597.0, 96456.0, 88686.0, 77044.0, 62990.0, 49193.0, 36326.0, 26099.0, 18069.0, 12363.0, 7934.0, 5198.0, 3253.0, 2095.0, 1307.0, 841.0, 533.0, 316.0, 181.0, 128.0, 71.0, 43.0, 28.0, 22.0, 11.0, 8.0, 3.0, 3.0, 1.0, 3.0], "bins": [-8.2578125, -8.01947021484375, -7.7811279296875, -7.54278564453125, -7.304443359375, -7.06610107421875, -6.8277587890625, -6.58941650390625, -6.35107421875, -6.11273193359375, -5.8743896484375, -5.63604736328125, -5.397705078125, -5.15936279296875, -4.9210205078125, -4.68267822265625, -4.4443359375, -4.20599365234375, -3.9676513671875, -3.72930908203125, -3.490966796875, -3.25262451171875, -3.0142822265625, -2.77593994140625, -2.53759765625, -2.29925537109375, -2.0609130859375, -1.82257080078125, -1.584228515625, -1.34588623046875, -1.1075439453125, -0.86920166015625, -0.630859375, -0.39251708984375, -0.1541748046875, 0.08416748046875, 0.322509765625, 0.56085205078125, 0.7991943359375, 1.03753662109375, 1.27587890625, 1.51422119140625, 1.7525634765625, 1.99090576171875, 2.229248046875, 2.46759033203125, 2.7059326171875, 2.94427490234375, 3.1826171875, 3.42095947265625, 3.6593017578125, 3.89764404296875, 4.135986328125, 4.37432861328125, 4.6126708984375, 4.85101318359375, 5.08935546875, 5.32769775390625, 5.5660400390625, 5.80438232421875, 6.042724609375, 6.28106689453125, 6.5194091796875, 6.75775146484375, 6.99609375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 10.0, 16.0, 14.0, 17.0, 17.0, 27.0, 42.0, 41.0, 50.0, 41.0, 46.0, 48.0, 55.0, 65.0, 53.0, 70.0, 62.0, 52.0, 49.0, 49.0, 35.0, 25.0, 29.0, 23.0, 9.0, 10.0, 11.0, 10.0, 6.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001735687255859375, -0.0016918033361434937, -0.0016479194164276123, -0.001604035496711731, -0.0015601515769958496, -0.0015162676572799683, -0.001472383737564087, -0.0014284998178482056, -0.0013846158981323242, -0.0013407319784164429, -0.0012968480587005615, -0.0012529641389846802, -0.0012090802192687988, -0.0011651962995529175, -0.0011213123798370361, -0.0010774284601211548, -0.0010335445404052734, -0.000989660620689392, -0.0009457767009735107, -0.0009018927812576294, -0.000858008861541748, -0.0008141249418258667, -0.0007702410221099854, -0.000726357102394104, -0.0006824731826782227, -0.0006385892629623413, -0.00059470534324646, -0.0005508214235305786, -0.0005069375038146973, -0.0004630535840988159, -0.00041916966438293457, -0.0003752857446670532, -0.0003314018249511719, -0.00028751790523529053, -0.00024363398551940918, -0.00019975006580352783, -0.00015586614608764648, -0.00011198222637176514, -6.809830665588379e-05, -2.421438694000244e-05, 1.9669532775878906e-05, 6.355345249176025e-05, 0.0001074373722076416, 0.00015132129192352295, 0.0001952052116394043, 0.00023908913135528564, 0.000282973051071167, 0.00032685697078704834, 0.0003707408905029297, 0.00041462481021881104, 0.0004585087299346924, 0.0005023926496505737, 0.0005462765693664551, 0.0005901604890823364, 0.0006340444087982178, 0.0006779283285140991, 0.0007218122482299805, 0.0007656961679458618, 0.0008095800876617432, 0.0008534640073776245, 0.0008973479270935059, 0.0009412318468093872, 0.0009851157665252686, 0.00102899968624115, 0.0010728836059570312]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 9.0, 16.0, 24.0, 18.0, 32.0, 78.0, 115.0, 204.0, 287.0, 489.0, 842.0, 1435.0, 2378.0, 4032.0, 6629.0, 10667.0, 16940.0, 26498.0, 38864.0, 54822.0, 72862.0, 91347.0, 105606.0, 111836.0, 110944.0, 100362.0, 84217.0, 66166.0, 48407.0, 33604.0, 22387.0, 14366.0, 8737.0, 5409.0, 3112.0, 1985.0, 1097.0, 693.0, 395.0, 251.0, 155.0, 87.0, 55.0, 32.0, 20.0, 16.0, 12.0, 4.0, 6.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.25, -8.94970703125, -8.6494140625, -8.34912109375, -8.048828125, -7.74853515625, -7.4482421875, -7.14794921875, -6.84765625, -6.54736328125, -6.2470703125, -5.94677734375, -5.646484375, -5.34619140625, -5.0458984375, -4.74560546875, -4.4453125, -4.14501953125, -3.8447265625, -3.54443359375, -3.244140625, -2.94384765625, -2.6435546875, -2.34326171875, -2.04296875, -1.74267578125, -1.4423828125, -1.14208984375, -0.841796875, -0.54150390625, -0.2412109375, 0.05908203125, 0.359375, 0.65966796875, 0.9599609375, 1.26025390625, 1.560546875, 1.86083984375, 2.1611328125, 2.46142578125, 2.76171875, 3.06201171875, 3.3623046875, 3.66259765625, 3.962890625, 4.26318359375, 4.5634765625, 4.86376953125, 5.1640625, 5.46435546875, 5.7646484375, 6.06494140625, 6.365234375, 6.66552734375, 6.9658203125, 7.26611328125, 7.56640625, 7.86669921875, 8.1669921875, 8.46728515625, 8.767578125, 9.06787109375, 9.3681640625, 9.66845703125, 9.96875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 7.0, 6.0, 7.0, 14.0, 11.0, 21.0, 13.0, 13.0, 27.0, 23.0, 28.0, 24.0, 24.0, 37.0, 36.0, 35.0, 43.0, 46.0, 31.0, 43.0, 65.0, 42.0, 43.0, 31.0, 38.0, 35.0, 31.0, 27.0, 28.0, 19.0, 28.0, 12.0, 21.0, 18.0, 8.0, 8.0, 13.0, 4.0, 9.0, 2.0, 4.0, 5.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0], "bins": [-3.818359375, -3.70050048828125, -3.5826416015625, -3.46478271484375, -3.346923828125, -3.22906494140625, -3.1112060546875, -2.99334716796875, -2.87548828125, -2.75762939453125, -2.6397705078125, -2.52191162109375, -2.404052734375, -2.28619384765625, -2.1683349609375, -2.05047607421875, -1.9326171875, -1.81475830078125, -1.6968994140625, -1.57904052734375, -1.461181640625, -1.34332275390625, -1.2254638671875, -1.10760498046875, -0.98974609375, -0.87188720703125, -0.7540283203125, -0.63616943359375, -0.518310546875, -0.40045166015625, -0.2825927734375, -0.16473388671875, -0.046875, 0.07098388671875, 0.1888427734375, 0.30670166015625, 0.424560546875, 0.54241943359375, 0.6602783203125, 0.77813720703125, 0.89599609375, 1.01385498046875, 1.1317138671875, 1.24957275390625, 1.367431640625, 1.48529052734375, 1.6031494140625, 1.72100830078125, 1.8388671875, 1.95672607421875, 2.0745849609375, 2.19244384765625, 2.310302734375, 2.42816162109375, 2.5460205078125, 2.66387939453125, 2.78173828125, 2.89959716796875, 3.0174560546875, 3.13531494140625, 3.253173828125, 3.37103271484375, 3.4888916015625, 3.60675048828125, 3.724609375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 8.0, 3.0, 9.0, 10.0, 10.0, 12.0, 24.0, 18.0, 16.0, 26.0, 35.0, 25.0, 32.0, 30.0, 49.0, 33.0, 34.0, 34.0, 48.0, 48.0, 41.0, 50.0, 39.0, 49.0, 42.0, 41.0, 37.0, 25.0, 35.0, 19.0, 24.0, 20.0, 12.0, 12.0, 9.0, 14.0, 13.0, 8.0, 3.0, 2.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.63239860534668, -29.672460556030273, -28.712522506713867, -27.75258445739746, -26.792648315429688, -25.83271026611328, -24.872772216796875, -23.91283416748047, -22.952896118164062, -21.992958068847656, -21.03302001953125, -20.073081970214844, -19.113143920898438, -18.15320587158203, -17.193269729614258, -16.23333168029785, -15.273393630981445, -14.313455581665039, -13.353517532348633, -12.393580436706543, -11.433642387390137, -10.47370433807373, -9.51376724243164, -8.553829193115234, -7.593891143798828, -6.633953094482422, -5.674015522003174, -4.714077949523926, -3.7541399002075195, -2.7942018508911133, -1.8342642784118652, -0.8743267059326172, 0.08561134338378906, 1.0455491542816162, 2.0054869651794434, 2.9654247760772705, 3.9253625869750977, 4.885300636291504, 5.845238208770752, 6.80517578125, 7.765113830566406, 8.725051879882812, 9.684989929199219, 10.644927024841309, 11.604865074157715, 12.564803123474121, 13.524740219116211, 14.484678268432617, 15.444616317749023, 16.40455436706543, 17.364492416381836, 18.324430465698242, 19.284366607666016, 20.244304656982422, 21.204242706298828, 22.164180755615234, 23.12411880493164, 24.084056854248047, 25.043994903564453, 26.00393295288086, 26.963871002197266, 27.923809051513672, 28.883745193481445, 29.84368324279785, 30.803621292114258]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 7.0, 7.0, 7.0, 12.0, 10.0, 19.0, 16.0, 17.0, 31.0, 18.0, 26.0, 25.0, 27.0, 35.0, 31.0, 34.0, 34.0, 47.0, 34.0, 32.0, 44.0, 39.0, 39.0, 47.0, 44.0, 26.0, 41.0, 36.0, 22.0, 23.0, 27.0, 25.0, 18.0, 18.0, 9.0, 10.0, 10.0, 10.0, 9.0, 11.0, 1.0, 5.0, 7.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-33.79273223876953, -32.674896240234375, -31.55706024169922, -30.439224243164062, -29.321388244628906, -28.20355224609375, -27.08571434020996, -25.967878341674805, -24.85004234313965, -23.732206344604492, -22.614370346069336, -21.49653434753418, -20.37869644165039, -19.260860443115234, -18.143024444580078, -17.025188446044922, -15.907352447509766, -14.78951644897461, -13.671680450439453, -12.55384349822998, -11.436007499694824, -10.318171501159668, -9.200334548950195, -8.082498550415039, -6.964662551879883, -5.846826553344727, -4.728990077972412, -3.6111538410186768, -2.4933176040649414, -1.3754816055297852, -0.2576451301574707, 0.8601913452148438, 1.9780235290527344, 3.0958597660064697, 4.213696002960205, 5.3315324783325195, 6.449368476867676, 7.567204475402832, 8.685041427612305, 9.802877426147461, 10.920713424682617, 12.038549423217773, 13.15638542175293, 14.274222373962402, 15.392058372497559, 16.50989532470703, 17.627731323242188, 18.745567321777344, 19.8634033203125, 20.981239318847656, 22.099075317382812, 23.21691131591797, 24.334747314453125, 25.45258331298828, 26.57042121887207, 27.688257217407227, 28.806093215942383, 29.92392921447754, 31.041765213012695, 32.159603118896484, 33.27743911743164, 34.3952751159668, 35.51311111450195, 36.63094711303711, 37.748783111572266]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 9.0, 10.0, 31.0, 37.0, 69.0, 137.0, 199.0, 364.0, 606.0, 1040.0, 1804.0, 3122.0, 5314.0, 8825.0, 14667.0, 23818.0, 37827.0, 59367.0, 90597.0, 132809.0, 189355.0, 254453.0, 325252.0, 387667.0, 429624.0, 439385.0, 415462.0, 364408.0, 295840.0, 227598.0, 164561.0, 113473.0, 76269.0, 49437.0, 31511.0, 19637.0, 12032.0, 7134.0, 4331.0, 2601.0, 1479.0, 931.0, 496.0, 286.0, 156.0, 114.0, 68.0, 38.0, 18.0, 13.0, 9.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.875, -21.176025390625, -20.47705078125, -19.778076171875, -19.0791015625, -18.380126953125, -17.68115234375, -16.982177734375, -16.283203125, -15.584228515625, -14.88525390625, -14.186279296875, -13.4873046875, -12.788330078125, -12.08935546875, -11.390380859375, -10.69140625, -9.992431640625, -9.29345703125, -8.594482421875, -7.8955078125, -7.196533203125, -6.49755859375, -5.798583984375, -5.099609375, -4.400634765625, -3.70166015625, -3.002685546875, -2.3037109375, -1.604736328125, -0.90576171875, -0.206787109375, 0.4921875, 1.191162109375, 1.89013671875, 2.589111328125, 3.2880859375, 3.987060546875, 4.68603515625, 5.385009765625, 6.083984375, 6.782958984375, 7.48193359375, 8.180908203125, 8.8798828125, 9.578857421875, 10.27783203125, 10.976806640625, 11.67578125, 12.374755859375, 13.07373046875, 13.772705078125, 14.4716796875, 15.170654296875, 15.86962890625, 16.568603515625, 17.267578125, 17.966552734375, 18.66552734375, 19.364501953125, 20.0634765625, 20.762451171875, 21.46142578125, 22.160400390625, 22.859375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 7.0, 7.0, 12.0, 12.0, 19.0, 18.0, 20.0, 23.0, 20.0, 26.0, 22.0, 28.0, 39.0, 30.0, 35.0, 34.0, 48.0, 29.0, 36.0, 41.0, 38.0, 43.0, 48.0, 38.0, 30.0, 43.0, 32.0, 20.0, 29.0, 25.0, 27.0, 12.0, 22.0, 8.0, 9.0, 10.0, 9.0, 11.0, 10.0, 2.0, 4.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-32.34375, -31.28173828125, -30.2197265625, -29.15771484375, -28.095703125, -27.03369140625, -25.9716796875, -24.90966796875, -23.84765625, -22.78564453125, -21.7236328125, -20.66162109375, -19.599609375, -18.53759765625, -17.4755859375, -16.41357421875, -15.3515625, -14.28955078125, -13.2275390625, -12.16552734375, -11.103515625, -10.04150390625, -8.9794921875, -7.91748046875, -6.85546875, -5.79345703125, -4.7314453125, -3.66943359375, -2.607421875, -1.54541015625, -0.4833984375, 0.57861328125, 1.640625, 2.70263671875, 3.7646484375, 4.82666015625, 5.888671875, 6.95068359375, 8.0126953125, 9.07470703125, 10.13671875, 11.19873046875, 12.2607421875, 13.32275390625, 14.384765625, 15.44677734375, 16.5087890625, 17.57080078125, 18.6328125, 19.69482421875, 20.7568359375, 21.81884765625, 22.880859375, 23.94287109375, 25.0048828125, 26.06689453125, 27.12890625, 28.19091796875, 29.2529296875, 30.31494140625, 31.376953125, 32.43896484375, 33.5009765625, 34.56298828125, 35.625]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 11.0, 24.0, 37.0, 58.0, 105.0, 182.0, 314.0, 576.0, 1061.0, 1796.0, 3141.0, 5255.0, 8995.0, 14810.0, 23542.0, 37715.0, 57690.0, 87580.0, 125035.0, 173995.0, 230552.0, 290179.0, 345954.0, 386996.0, 404723.0, 399495.0, 367766.0, 318629.0, 260263.0, 200640.0, 148161.0, 104890.0, 71260.0, 47225.0, 29624.0, 18448.0, 11273.0, 6827.0, 3992.0, 2247.0, 1417.0, 800.0, 470.0, 231.0, 150.0, 66.0, 39.0, 24.0, 12.0, 10.0, 1.0, 3.0, 0.0, 3.0, 2.0], "bins": [-24.015625, -23.303955078125, -22.59228515625, -21.880615234375, -21.1689453125, -20.457275390625, -19.74560546875, -19.033935546875, -18.322265625, -17.610595703125, -16.89892578125, -16.187255859375, -15.4755859375, -14.763916015625, -14.05224609375, -13.340576171875, -12.62890625, -11.917236328125, -11.20556640625, -10.493896484375, -9.7822265625, -9.070556640625, -8.35888671875, -7.647216796875, -6.935546875, -6.223876953125, -5.51220703125, -4.800537109375, -4.0888671875, -3.377197265625, -2.66552734375, -1.953857421875, -1.2421875, -0.530517578125, 0.18115234375, 0.892822265625, 1.6044921875, 2.316162109375, 3.02783203125, 3.739501953125, 4.451171875, 5.162841796875, 5.87451171875, 6.586181640625, 7.2978515625, 8.009521484375, 8.72119140625, 9.432861328125, 10.14453125, 10.856201171875, 11.56787109375, 12.279541015625, 12.9912109375, 13.702880859375, 14.41455078125, 15.126220703125, 15.837890625, 16.549560546875, 17.26123046875, 17.972900390625, 18.6845703125, 19.396240234375, 20.10791015625, 20.819580078125, 21.53125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 8.0, 9.0, 18.0, 18.0, 24.0, 24.0, 39.0, 40.0, 64.0, 70.0, 71.0, 103.0, 119.0, 132.0, 164.0, 172.0, 184.0, 192.0, 200.0, 205.0, 216.0, 194.0, 229.0, 198.0, 194.0, 168.0, 155.0, 131.0, 126.0, 116.0, 118.0, 88.0, 67.0, 55.0, 47.0, 32.0, 24.0, 13.0, 9.0, 7.0, 9.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.5703125, -14.0916748046875, -13.613037109375, -13.1343994140625, -12.65576171875, -12.1771240234375, -11.698486328125, -11.2198486328125, -10.7412109375, -10.2625732421875, -9.783935546875, -9.3052978515625, -8.82666015625, -8.3480224609375, -7.869384765625, -7.3907470703125, -6.912109375, -6.4334716796875, -5.954833984375, -5.4761962890625, -4.99755859375, -4.5189208984375, -4.040283203125, -3.5616455078125, -3.0830078125, -2.6043701171875, -2.125732421875, -1.6470947265625, -1.16845703125, -0.6898193359375, -0.211181640625, 0.2674560546875, 0.74609375, 1.2247314453125, 1.703369140625, 2.1820068359375, 2.66064453125, 3.1392822265625, 3.617919921875, 4.0965576171875, 4.5751953125, 5.0538330078125, 5.532470703125, 6.0111083984375, 6.48974609375, 6.9683837890625, 7.447021484375, 7.9256591796875, 8.404296875, 8.8829345703125, 9.361572265625, 9.8402099609375, 10.31884765625, 10.7974853515625, 11.276123046875, 11.7547607421875, 12.2333984375, 12.7120361328125, 13.190673828125, 13.6693115234375, 14.14794921875, 14.6265869140625, 15.105224609375, 15.5838623046875, 16.0625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 5.0, 0.0, 8.0, 3.0, 3.0, 6.0, 8.0, 11.0, 9.0, 8.0, 17.0, 15.0, 23.0, 27.0, 27.0, 30.0, 26.0, 27.0, 33.0, 36.0, 29.0, 38.0, 33.0, 46.0, 36.0, 39.0, 27.0, 45.0, 37.0, 29.0, 28.0, 40.0, 31.0, 41.0, 25.0, 18.0, 26.0, 19.0, 15.0, 14.0, 13.0, 10.0, 7.0, 5.0, 7.0, 7.0, 5.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.797842025756836, -24.91282844543457, -24.027814865112305, -23.14280128479004, -22.25778579711914, -21.372772216796875, -20.48775863647461, -19.602745056152344, -18.717731475830078, -17.832717895507812, -16.947704315185547, -16.06269073486328, -15.1776762008667, -14.292662620544434, -13.407648086547852, -12.522634506225586, -11.63762092590332, -10.752607345581055, -9.867593765258789, -8.982579231262207, -8.097565650939941, -7.212552070617676, -6.327538013458252, -5.442523956298828, -4.5575103759765625, -3.6724965572357178, -2.787482738494873, -1.9024689197540283, -1.0174551010131836, -0.13244152069091797, 0.7525725364685059, 1.6375865936279297, 2.5226001739501953, 3.40761399269104, 4.292627811431885, 5.177641868591309, 6.062655448913574, 6.94766902923584, 7.832683086395264, 8.717697143554688, 9.602710723876953, 10.487724304199219, 11.372737884521484, 12.257752418518066, 13.142765998840332, 14.027779579162598, 14.91279411315918, 15.797807693481445, 16.68282127380371, 17.567834854125977, 18.452848434448242, 19.337862014770508, 20.222877502441406, 21.107891082763672, 21.992904663085938, 22.877918243408203, 23.76293182373047, 24.647945404052734, 25.532958984375, 26.417972564697266, 27.30298614501953, 28.187999725341797, 29.073015213012695, 29.95802879333496, 30.843042373657227]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 0.0, 7.0, 8.0, 2.0, 13.0, 14.0, 16.0, 14.0, 21.0, 23.0, 22.0, 20.0, 21.0, 30.0, 29.0, 27.0, 31.0, 38.0, 35.0, 40.0, 40.0, 34.0, 40.0, 45.0, 49.0, 31.0, 33.0, 33.0, 39.0, 36.0, 19.0, 23.0, 29.0, 23.0, 17.0, 21.0, 14.0, 9.0, 10.0, 5.0, 9.0, 3.0, 9.0, 3.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-36.66719055175781, -35.495819091796875, -34.32444763183594, -33.153076171875, -31.981704711914062, -30.810333251953125, -29.63896369934082, -28.467592239379883, -27.296220779418945, -26.124849319458008, -24.95347785949707, -23.782106399536133, -22.610736846923828, -21.43936538696289, -20.267993927001953, -19.096622467041016, -17.925251007080078, -16.75387954711914, -15.582508087158203, -14.411137580871582, -13.239766120910645, -12.068394660949707, -10.897024154663086, -9.725652694702148, -8.554281234741211, -7.382909774780273, -6.211538791656494, -5.040167808532715, -3.8687963485717773, -2.69742488861084, -1.5260539054870605, -0.35468292236328125, 0.8166923522949219, 1.9880635738372803, 3.1594347953796387, 4.330805778503418, 5.5021772384643555, 6.673548698425293, 7.844919681549072, 9.016290664672852, 10.187662124633789, 11.359033584594727, 12.530405044555664, 13.701775550842285, 14.873147010803223, 16.044517517089844, 17.21588897705078, 18.38726043701172, 19.558631896972656, 20.730003356933594, 21.90137481689453, 23.07274627685547, 24.244117736816406, 25.415489196777344, 26.58685874938965, 27.758230209350586, 28.929601669311523, 30.10097312927246, 31.2723445892334, 32.4437141418457, 33.61508560180664, 34.78645706176758, 35.957828521728516, 37.12919998168945, 38.30057144165039]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 0.0, 5.0, 5.0, 5.0, 14.0, 16.0, 41.0, 40.0, 71.0, 94.0, 138.0, 253.0, 330.0, 487.0, 755.0, 1127.0, 1773.0, 2873.0, 4349.0, 6614.0, 9969.0, 15157.0, 22238.0, 32429.0, 45904.0, 62891.0, 81064.0, 99572.0, 112137.0, 113902.0, 105863.0, 88937.0, 70299.0, 52537.0, 37850.0, 26140.0, 17757.0, 11920.0, 7926.0, 5199.0, 3445.0, 2210.0, 1546.0, 946.0, 604.0, 393.0, 229.0, 167.0, 109.0, 81.0, 61.0, 21.0, 26.0, 21.0, 9.0, 7.0, 4.0, 6.0, 1.0, 2.0], "bins": [-5.13671875, -4.9820556640625, -4.827392578125, -4.6727294921875, -4.51806640625, -4.3634033203125, -4.208740234375, -4.0540771484375, -3.8994140625, -3.7447509765625, -3.590087890625, -3.4354248046875, -3.28076171875, -3.1260986328125, -2.971435546875, -2.8167724609375, -2.662109375, -2.5074462890625, -2.352783203125, -2.1981201171875, -2.04345703125, -1.8887939453125, -1.734130859375, -1.5794677734375, -1.4248046875, -1.2701416015625, -1.115478515625, -0.9608154296875, -0.80615234375, -0.6514892578125, -0.496826171875, -0.3421630859375, -0.1875, -0.0328369140625, 0.121826171875, 0.2764892578125, 0.43115234375, 0.5858154296875, 0.740478515625, 0.8951416015625, 1.0498046875, 1.2044677734375, 1.359130859375, 1.5137939453125, 1.66845703125, 1.8231201171875, 1.977783203125, 2.1324462890625, 2.287109375, 2.4417724609375, 2.596435546875, 2.7510986328125, 2.90576171875, 3.0604248046875, 3.215087890625, 3.3697509765625, 3.5244140625, 3.6790771484375, 3.833740234375, 3.9884033203125, 4.14306640625, 4.2977294921875, 4.452392578125, 4.6070556640625, 4.76171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 2.0, 5.0, 8.0, 5.0, 11.0, 18.0, 12.0, 15.0, 24.0, 24.0, 17.0, 24.0, 21.0, 32.0, 29.0, 28.0, 33.0, 35.0, 33.0, 41.0, 41.0, 37.0, 34.0, 49.0, 46.0, 31.0, 33.0, 39.0, 31.0, 37.0, 20.0, 19.0, 30.0, 23.0, 18.0, 21.0, 12.0, 9.0, 10.0, 4.0, 9.0, 4.0, 9.0, 3.0, 2.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-36.25, -35.07568359375, -33.9013671875, -32.72705078125, -31.552734375, -30.37841796875, -29.2041015625, -28.02978515625, -26.85546875, -25.68115234375, -24.5068359375, -23.33251953125, -22.158203125, -20.98388671875, -19.8095703125, -18.63525390625, -17.4609375, -16.28662109375, -15.1123046875, -13.93798828125, -12.763671875, -11.58935546875, -10.4150390625, -9.24072265625, -8.06640625, -6.89208984375, -5.7177734375, -4.54345703125, -3.369140625, -2.19482421875, -1.0205078125, 0.15380859375, 1.328125, 2.50244140625, 3.6767578125, 4.85107421875, 6.025390625, 7.19970703125, 8.3740234375, 9.54833984375, 10.72265625, 11.89697265625, 13.0712890625, 14.24560546875, 15.419921875, 16.59423828125, 17.7685546875, 18.94287109375, 20.1171875, 21.29150390625, 22.4658203125, 23.64013671875, 24.814453125, 25.98876953125, 27.1630859375, 28.33740234375, 29.51171875, 30.68603515625, 31.8603515625, 33.03466796875, 34.208984375, 35.38330078125, 36.5576171875, 37.73193359375, 38.90625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 8.0, 10.0, 11.0, 13.0, 22.0, 37.0, 48.0, 74.0, 107.0, 180.0, 252.0, 427.0, 611.0, 894.0, 1379.0, 2106.0, 3141.0, 4581.0, 6923.0, 10538.0, 17267.0, 31898.0, 349669.0, 531194.0, 35647.0, 18471.0, 11203.0, 7299.0, 4875.0, 3263.0, 2130.0, 1436.0, 952.0, 665.0, 420.0, 268.0, 185.0, 119.0, 71.0, 53.0, 41.0, 24.0, 18.0, 12.0, 9.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.015625, -11.640869140625, -11.26611328125, -10.891357421875, -10.5166015625, -10.141845703125, -9.76708984375, -9.392333984375, -9.017578125, -8.642822265625, -8.26806640625, -7.893310546875, -7.5185546875, -7.143798828125, -6.76904296875, -6.394287109375, -6.01953125, -5.644775390625, -5.27001953125, -4.895263671875, -4.5205078125, -4.145751953125, -3.77099609375, -3.396240234375, -3.021484375, -2.646728515625, -2.27197265625, -1.897216796875, -1.5224609375, -1.147705078125, -0.77294921875, -0.398193359375, -0.0234375, 0.351318359375, 0.72607421875, 1.100830078125, 1.4755859375, 1.850341796875, 2.22509765625, 2.599853515625, 2.974609375, 3.349365234375, 3.72412109375, 4.098876953125, 4.4736328125, 4.848388671875, 5.22314453125, 5.597900390625, 5.97265625, 6.347412109375, 6.72216796875, 7.096923828125, 7.4716796875, 7.846435546875, 8.22119140625, 8.595947265625, 8.970703125, 9.345458984375, 9.72021484375, 10.094970703125, 10.4697265625, 10.844482421875, 11.21923828125, 11.593994140625, 11.96875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 3.0, 7.0, 7.0, 10.0, 11.0, 17.0, 20.0, 18.0, 25.0, 15.0, 27.0, 22.0, 28.0, 31.0, 34.0, 37.0, 38.0, 44.0, 48.0, 55.0, 34.0, 46.0, 33.0, 23.0, 35.0, 33.0, 24.0, 19.0, 39.0, 27.0, 29.0, 25.0, 18.0, 17.0, 19.0, 9.0, 8.0, 12.0, 8.0, 8.0, 9.0, 3.0, 7.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-25.734375, -24.944580078125, -24.15478515625, -23.364990234375, -22.5751953125, -21.785400390625, -20.99560546875, -20.205810546875, -19.416015625, -18.626220703125, -17.83642578125, -17.046630859375, -16.2568359375, -15.467041015625, -14.67724609375, -13.887451171875, -13.09765625, -12.307861328125, -11.51806640625, -10.728271484375, -9.9384765625, -9.148681640625, -8.35888671875, -7.569091796875, -6.779296875, -5.989501953125, -5.19970703125, -4.409912109375, -3.6201171875, -2.830322265625, -2.04052734375, -1.250732421875, -0.4609375, 0.328857421875, 1.11865234375, 1.908447265625, 2.6982421875, 3.488037109375, 4.27783203125, 5.067626953125, 5.857421875, 6.647216796875, 7.43701171875, 8.226806640625, 9.0166015625, 9.806396484375, 10.59619140625, 11.385986328125, 12.17578125, 12.965576171875, 13.75537109375, 14.545166015625, 15.3349609375, 16.124755859375, 16.91455078125, 17.704345703125, 18.494140625, 19.283935546875, 20.07373046875, 20.863525390625, 21.6533203125, 22.443115234375, 23.23291015625, 24.022705078125, 24.8125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 7.0, 7.0, 11.0, 18.0, 10.0, 34.0, 53.0, 69.0, 99.0, 122.0, 200.0, 304.0, 426.0, 590.0, 966.0, 1405.0, 2178.0, 3287.0, 5240.0, 8033.0, 13060.0, 21221.0, 42021.0, 815539.0, 68973.0, 24390.0, 14453.0, 8983.0, 5782.0, 3758.0, 2491.0, 1621.0, 1008.0, 703.0, 499.0, 305.0, 223.0, 132.0, 119.0, 58.0, 53.0, 30.0, 23.0, 14.0, 15.0, 9.0, 8.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.3173828125, -1.275726318359375, -1.23406982421875, -1.192413330078125, -1.1507568359375, -1.109100341796875, -1.06744384765625, -1.025787353515625, -0.984130859375, -0.942474365234375, -0.90081787109375, -0.859161376953125, -0.8175048828125, -0.775848388671875, -0.73419189453125, -0.692535400390625, -0.65087890625, -0.609222412109375, -0.56756591796875, -0.525909423828125, -0.4842529296875, -0.442596435546875, -0.40093994140625, -0.359283447265625, -0.317626953125, -0.275970458984375, -0.23431396484375, -0.192657470703125, -0.1510009765625, -0.109344482421875, -0.06768798828125, -0.026031494140625, 0.015625, 0.057281494140625, 0.09893798828125, 0.140594482421875, 0.1822509765625, 0.223907470703125, 0.26556396484375, 0.307220458984375, 0.348876953125, 0.390533447265625, 0.43218994140625, 0.473846435546875, 0.5155029296875, 0.557159423828125, 0.59881591796875, 0.640472412109375, 0.68212890625, 0.723785400390625, 0.76544189453125, 0.807098388671875, 0.8487548828125, 0.890411376953125, 0.93206787109375, 0.973724365234375, 1.015380859375, 1.057037353515625, 1.09869384765625, 1.140350341796875, 1.1820068359375, 1.223663330078125, 1.26531982421875, 1.306976318359375, 1.3486328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 5.0, 6.0, 4.0, 8.0, 18.0, 22.0, 15.0, 27.0, 19.0, 27.0, 33.0, 34.0, 36.0, 37.0, 42.0, 50.0, 42.0, 51.0, 50.0, 57.0, 48.0, 47.0, 45.0, 41.0, 39.0, 31.0, 25.0, 25.0, 18.0, 19.0, 11.0, 15.0, 13.0, 7.0, 5.0, 5.0, 3.0, 7.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.3974647521972656e-05, -3.2806769013404846e-05, -3.1638890504837036e-05, -3.0471011996269226e-05, -2.9303133487701416e-05, -2.8135254979133606e-05, -2.6967376470565796e-05, -2.5799497961997986e-05, -2.4631619453430176e-05, -2.3463740944862366e-05, -2.2295862436294556e-05, -2.1127983927726746e-05, -1.9960105419158936e-05, -1.8792226910591125e-05, -1.7624348402023315e-05, -1.6456469893455505e-05, -1.5288591384887695e-05, -1.4120712876319885e-05, -1.2952834367752075e-05, -1.1784955859184265e-05, -1.0617077350616455e-05, -9.449198842048645e-06, -8.281320333480835e-06, -7.113441824913025e-06, -5.945563316345215e-06, -4.777684807777405e-06, -3.6098062992095947e-06, -2.4419277906417847e-06, -1.2740492820739746e-06, -1.0617077350616455e-07, 1.0617077350616455e-06, 2.2295862436294556e-06, 3.3974647521972656e-06, 4.565343260765076e-06, 5.733221769332886e-06, 6.901100277900696e-06, 8.068978786468506e-06, 9.236857295036316e-06, 1.0404735803604126e-05, 1.1572614312171936e-05, 1.2740492820739746e-05, 1.3908371329307556e-05, 1.5076249837875366e-05, 1.6244128346443176e-05, 1.7412006855010986e-05, 1.8579885363578796e-05, 1.9747763872146606e-05, 2.0915642380714417e-05, 2.2083520889282227e-05, 2.3251399397850037e-05, 2.4419277906417847e-05, 2.5587156414985657e-05, 2.6755034923553467e-05, 2.7922913432121277e-05, 2.9090791940689087e-05, 3.0258670449256897e-05, 3.142654895782471e-05, 3.259442746639252e-05, 3.376230597496033e-05, 3.493018448352814e-05, 3.609806299209595e-05, 3.726594150066376e-05, 3.843382000923157e-05, 3.960169851779938e-05, 4.076957702636719e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 7.0, 15.0, 19.0, 21.0, 38.0, 41.0, 80.0, 134.0, 186.0, 273.0, 500.0, 761.0, 1225.0, 1890.0, 3031.0, 4918.0, 7948.0, 12708.0, 20517.0, 32718.0, 51681.0, 80511.0, 120105.0, 158630.0, 165815.0, 132660.0, 91659.0, 59432.0, 37994.0, 23710.0, 14902.0, 9203.0, 5657.0, 3498.0, 2276.0, 1391.0, 841.0, 558.0, 366.0, 211.0, 144.0, 105.0, 56.0, 53.0, 25.0, 19.0, 8.0, 8.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-1.2998046875, -1.261749267578125, -1.22369384765625, -1.185638427734375, -1.1475830078125, -1.109527587890625, -1.07147216796875, -1.033416748046875, -0.995361328125, -0.957305908203125, -0.91925048828125, -0.881195068359375, -0.8431396484375, -0.805084228515625, -0.76702880859375, -0.728973388671875, -0.69091796875, -0.652862548828125, -0.61480712890625, -0.576751708984375, -0.5386962890625, -0.500640869140625, -0.46258544921875, -0.424530029296875, -0.386474609375, -0.348419189453125, -0.31036376953125, -0.272308349609375, -0.2342529296875, -0.196197509765625, -0.15814208984375, -0.120086669921875, -0.08203125, -0.043975830078125, -0.00592041015625, 0.032135009765625, 0.0701904296875, 0.108245849609375, 0.14630126953125, 0.184356689453125, 0.222412109375, 0.260467529296875, 0.29852294921875, 0.336578369140625, 0.3746337890625, 0.412689208984375, 0.45074462890625, 0.488800048828125, 0.52685546875, 0.564910888671875, 0.60296630859375, 0.641021728515625, 0.6790771484375, 0.717132568359375, 0.75518798828125, 0.793243408203125, 0.831298828125, 0.869354248046875, 0.90740966796875, 0.945465087890625, 0.9835205078125, 1.021575927734375, 1.05963134765625, 1.097686767578125, 1.1357421875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 6.0, 2.0, 4.0, 4.0, 5.0, 6.0, 6.0, 9.0, 8.0, 13.0, 20.0, 23.0, 31.0, 42.0, 50.0, 62.0, 67.0, 68.0, 71.0, 65.0, 86.0, 47.0, 54.0, 44.0, 41.0, 34.0, 24.0, 15.0, 28.0, 14.0, 9.0, 13.0, 7.0, 5.0, 3.0, 7.0, 0.0, 2.0, 0.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55859375, -0.537811279296875, -0.51702880859375, -0.496246337890625, -0.4754638671875, -0.454681396484375, -0.43389892578125, -0.413116455078125, -0.392333984375, -0.371551513671875, -0.35076904296875, -0.329986572265625, -0.3092041015625, -0.288421630859375, -0.26763916015625, -0.246856689453125, -0.22607421875, -0.205291748046875, -0.18450927734375, -0.163726806640625, -0.1429443359375, -0.122161865234375, -0.10137939453125, -0.080596923828125, -0.059814453125, -0.039031982421875, -0.01824951171875, 0.002532958984375, 0.0233154296875, 0.044097900390625, 0.06488037109375, 0.085662841796875, 0.1064453125, 0.127227783203125, 0.14801025390625, 0.168792724609375, 0.1895751953125, 0.210357666015625, 0.23114013671875, 0.251922607421875, 0.272705078125, 0.293487548828125, 0.31427001953125, 0.335052490234375, 0.3558349609375, 0.376617431640625, 0.39739990234375, 0.418182373046875, 0.43896484375, 0.459747314453125, 0.48052978515625, 0.501312255859375, 0.5220947265625, 0.542877197265625, 0.56365966796875, 0.584442138671875, 0.605224609375, 0.626007080078125, 0.64678955078125, 0.667572021484375, 0.6883544921875, 0.709136962890625, 0.72991943359375, 0.750701904296875, 0.771484375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 4.0, 6.0, 2.0, 7.0, 3.0, 6.0, 10.0, 11.0, 17.0, 14.0, 16.0, 30.0, 20.0, 34.0, 27.0, 28.0, 32.0, 27.0, 35.0, 44.0, 29.0, 41.0, 37.0, 39.0, 37.0, 36.0, 38.0, 36.0, 34.0, 34.0, 30.0, 38.0, 34.0, 23.0, 24.0, 17.0, 15.0, 20.0, 10.0, 7.0, 7.0, 6.0, 13.0, 5.0, 8.0, 2.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.750097274780273, -25.847896575927734, -24.945693969726562, -24.04349136352539, -23.14129066467285, -22.239089965820312, -21.33688735961914, -20.43468475341797, -19.53248405456543, -18.63028335571289, -17.72808074951172, -16.825878143310547, -15.923677444458008, -15.021475791931152, -14.119274139404297, -13.217072486877441, -12.314870834350586, -11.41266918182373, -10.510467529296875, -9.60826587677002, -8.706064224243164, -7.803862571716309, -6.901660919189453, -5.999459266662598, -5.097257614135742, -4.195055961608887, -3.2928543090820312, -2.390652656555176, -1.4884510040283203, -0.5862493515014648, 0.3159523010253906, 1.218153953552246, 2.1203575134277344, 3.02255916595459, 3.9247608184814453, 4.826962471008301, 5.729164123535156, 6.631365776062012, 7.533567428588867, 8.435769081115723, 9.337970733642578, 10.240172386169434, 11.142374038696289, 12.044575691223145, 12.94677734375, 13.848978996276855, 14.751180648803711, 15.653382301330566, 16.555583953857422, 17.457786560058594, 18.359987258911133, 19.262187957763672, 20.164390563964844, 21.066593170166016, 21.968793869018555, 22.870994567871094, 23.773197174072266, 24.675399780273438, 25.577600479125977, 26.479801177978516, 27.382003784179688, 28.28420639038086, 29.1864070892334, 30.088607788085938, 30.99081039428711]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 1.0, 6.0, 8.0, 2.0, 13.0, 17.0, 13.0, 14.0, 23.0, 23.0, 20.0, 21.0, 22.0, 31.0, 29.0, 26.0, 34.0, 37.0, 35.0, 38.0, 42.0, 36.0, 41.0, 49.0, 40.0, 34.0, 36.0, 34.0, 34.0, 33.0, 20.0, 23.0, 33.0, 18.0, 24.0, 16.0, 12.0, 9.0, 11.0, 5.0, 8.0, 4.0, 9.0, 2.0, 2.0, 8.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-36.592384338378906, -35.40847396850586, -34.22455978393555, -33.0406494140625, -31.856739044189453, -30.672826766967773, -29.488914489746094, -28.305004119873047, -27.121091842651367, -25.937179565429688, -24.75326919555664, -23.56935691833496, -22.38544464111328, -21.201534271240234, -20.017621994018555, -18.833709716796875, -17.649799346923828, -16.46588706970215, -15.281976699829102, -14.098064422607422, -12.914153099060059, -11.730241775512695, -10.546329498291016, -9.362418174743652, -8.178506851196289, -6.994595527648926, -5.810683727264404, -4.626771926879883, -3.4428606033325195, -2.2589492797851562, -1.0750374794006348, 0.10887432098388672, 1.2927818298339844, 2.4766933917999268, 3.660604953765869, 4.844516754150391, 6.028428077697754, 7.212339401245117, 8.396251678466797, 9.58016300201416, 10.764074325561523, 11.947985649108887, 13.13189697265625, 14.31580924987793, 15.499720573425293, 16.683631896972656, 17.867544174194336, 19.051456451416016, 20.235366821289062, 21.419279098510742, 22.60318946838379, 23.78710174560547, 24.971012115478516, 26.154924392700195, 27.338836669921875, 28.522747039794922, 29.7066593170166, 30.89057159423828, 32.07448196411133, 33.258392333984375, 34.44230651855469, 35.626216888427734, 36.81012725830078, 37.994041442871094, 39.17795181274414]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 20.0, 12.0, 34.0, 49.0, 67.0, 121.0, 158.0, 250.0, 416.0, 632.0, 1026.0, 1536.0, 2295.0, 3624.0, 5300.0, 8016.0, 11692.0, 16834.0, 23720.0, 31866.0, 41574.0, 53282.0, 64967.0, 76181.0, 84158.0, 89399.0, 89227.0, 85669.0, 77192.0, 66871.0, 55094.0, 43665.0, 33322.0, 24825.0, 17670.0, 12428.0, 8635.0, 5728.0, 3858.0, 2509.0, 1660.0, 1046.0, 656.0, 482.0, 267.0, 185.0, 151.0, 79.0, 38.0, 25.0, 23.0, 13.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-16.125, -15.606201171875, -15.08740234375, -14.568603515625, -14.0498046875, -13.531005859375, -13.01220703125, -12.493408203125, -11.974609375, -11.455810546875, -10.93701171875, -10.418212890625, -9.8994140625, -9.380615234375, -8.86181640625, -8.343017578125, -7.82421875, -7.305419921875, -6.78662109375, -6.267822265625, -5.7490234375, -5.230224609375, -4.71142578125, -4.192626953125, -3.673828125, -3.155029296875, -2.63623046875, -2.117431640625, -1.5986328125, -1.079833984375, -0.56103515625, -0.042236328125, 0.4765625, 0.995361328125, 1.51416015625, 2.032958984375, 2.5517578125, 3.070556640625, 3.58935546875, 4.108154296875, 4.626953125, 5.145751953125, 5.66455078125, 6.183349609375, 6.7021484375, 7.220947265625, 7.73974609375, 8.258544921875, 8.77734375, 9.296142578125, 9.81494140625, 10.333740234375, 10.8525390625, 11.371337890625, 11.89013671875, 12.408935546875, 12.927734375, 13.446533203125, 13.96533203125, 14.484130859375, 15.0029296875, 15.521728515625, 16.04052734375, 16.559326171875, 17.078125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 7.0, 7.0, 5.0, 10.0, 19.0, 14.0, 14.0, 23.0, 23.0, 18.0, 22.0, 27.0, 31.0, 28.0, 27.0, 33.0, 38.0, 32.0, 40.0, 44.0, 33.0, 44.0, 44.0, 40.0, 35.0, 37.0, 36.0, 30.0, 34.0, 20.0, 22.0, 30.0, 19.0, 24.0, 16.0, 11.0, 9.0, 10.0, 5.0, 10.0, 2.0, 9.0, 2.0, 2.0, 9.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-35.875, -34.708984375, -33.54296875, -32.376953125, -31.2109375, -30.044921875, -28.87890625, -27.712890625, -26.546875, -25.380859375, -24.21484375, -23.048828125, -21.8828125, -20.716796875, -19.55078125, -18.384765625, -17.21875, -16.052734375, -14.88671875, -13.720703125, -12.5546875, -11.388671875, -10.22265625, -9.056640625, -7.890625, -6.724609375, -5.55859375, -4.392578125, -3.2265625, -2.060546875, -0.89453125, 0.271484375, 1.4375, 2.603515625, 3.76953125, 4.935546875, 6.1015625, 7.267578125, 8.43359375, 9.599609375, 10.765625, 11.931640625, 13.09765625, 14.263671875, 15.4296875, 16.595703125, 17.76171875, 18.927734375, 20.09375, 21.259765625, 22.42578125, 23.591796875, 24.7578125, 25.923828125, 27.08984375, 28.255859375, 29.421875, 30.587890625, 31.75390625, 32.919921875, 34.0859375, 35.251953125, 36.41796875, 37.583984375, 38.75]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 12.0, 32.0, 47.0, 55.0, 73.0, 145.0, 208.0, 376.0, 585.0, 926.0, 1513.0, 2426.0, 3733.0, 5890.0, 9137.0, 14058.0, 20517.0, 30524.0, 43245.0, 58414.0, 75248.0, 90907.0, 102497.0, 106880.0, 104152.0, 93707.0, 78302.0, 61802.0, 45760.0, 32732.0, 22628.0, 15059.0, 9726.0, 6386.0, 4022.0, 2551.0, 1542.0, 1007.0, 642.0, 406.0, 229.0, 177.0, 98.0, 67.0, 33.0, 25.0, 15.0, 13.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-22.75, -22.052001953125, -21.35400390625, -20.656005859375, -19.9580078125, -19.260009765625, -18.56201171875, -17.864013671875, -17.166015625, -16.468017578125, -15.77001953125, -15.072021484375, -14.3740234375, -13.676025390625, -12.97802734375, -12.280029296875, -11.58203125, -10.884033203125, -10.18603515625, -9.488037109375, -8.7900390625, -8.092041015625, -7.39404296875, -6.696044921875, -5.998046875, -5.300048828125, -4.60205078125, -3.904052734375, -3.2060546875, -2.508056640625, -1.81005859375, -1.112060546875, -0.4140625, 0.283935546875, 0.98193359375, 1.679931640625, 2.3779296875, 3.075927734375, 3.77392578125, 4.471923828125, 5.169921875, 5.867919921875, 6.56591796875, 7.263916015625, 7.9619140625, 8.659912109375, 9.35791015625, 10.055908203125, 10.75390625, 11.451904296875, 12.14990234375, 12.847900390625, 13.5458984375, 14.243896484375, 14.94189453125, 15.639892578125, 16.337890625, 17.035888671875, 17.73388671875, 18.431884765625, 19.1298828125, 19.827880859375, 20.52587890625, 21.223876953125, 21.921875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 5.0, 13.0, 10.0, 10.0, 16.0, 18.0, 21.0, 20.0, 23.0, 42.0, 33.0, 35.0, 41.0, 40.0, 42.0, 49.0, 44.0, 35.0, 50.0, 35.0, 52.0, 51.0, 47.0, 39.0, 30.0, 29.0, 24.0, 19.0, 18.0, 20.0, 16.0, 21.0, 10.0, 13.0, 7.0, 7.0, 5.0, 1.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.546875, -28.582763671875, -27.61865234375, -26.654541015625, -25.6904296875, -24.726318359375, -23.76220703125, -22.798095703125, -21.833984375, -20.869873046875, -19.90576171875, -18.941650390625, -17.9775390625, -17.013427734375, -16.04931640625, -15.085205078125, -14.12109375, -13.156982421875, -12.19287109375, -11.228759765625, -10.2646484375, -9.300537109375, -8.33642578125, -7.372314453125, -6.408203125, -5.444091796875, -4.47998046875, -3.515869140625, -2.5517578125, -1.587646484375, -0.62353515625, 0.340576171875, 1.3046875, 2.268798828125, 3.23291015625, 4.197021484375, 5.1611328125, 6.125244140625, 7.08935546875, 8.053466796875, 9.017578125, 9.981689453125, 10.94580078125, 11.909912109375, 12.8740234375, 13.838134765625, 14.80224609375, 15.766357421875, 16.73046875, 17.694580078125, 18.65869140625, 19.622802734375, 20.5869140625, 21.551025390625, 22.51513671875, 23.479248046875, 24.443359375, 25.407470703125, 26.37158203125, 27.335693359375, 28.2998046875, 29.263916015625, 30.22802734375, 31.192138671875, 32.15625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 22.0, 35.0, 60.0, 60.0, 119.0, 207.0, 297.0, 508.0, 900.0, 1329.0, 2223.0, 3549.0, 5505.0, 8760.0, 13238.0, 20186.0, 28743.0, 40052.0, 54061.0, 68936.0, 83114.0, 94313.0, 100846.0, 100802.0, 94252.0, 82835.0, 67980.0, 52988.0, 39331.0, 27861.0, 19540.0, 13029.0, 8408.0, 5372.0, 3455.0, 2105.0, 1336.0, 857.0, 494.0, 347.0, 198.0, 120.0, 69.0, 39.0, 32.0, 18.0, 9.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.0, -6.76641845703125, -6.5328369140625, -6.29925537109375, -6.065673828125, -5.83209228515625, -5.5985107421875, -5.36492919921875, -5.13134765625, -4.89776611328125, -4.6641845703125, -4.43060302734375, -4.197021484375, -3.96343994140625, -3.7298583984375, -3.49627685546875, -3.2626953125, -3.02911376953125, -2.7955322265625, -2.56195068359375, -2.328369140625, -2.09478759765625, -1.8612060546875, -1.62762451171875, -1.39404296875, -1.16046142578125, -0.9268798828125, -0.69329833984375, -0.459716796875, -0.22613525390625, 0.0074462890625, 0.24102783203125, 0.474609375, 0.70819091796875, 0.9417724609375, 1.17535400390625, 1.408935546875, 1.64251708984375, 1.8760986328125, 2.10968017578125, 2.34326171875, 2.57684326171875, 2.8104248046875, 3.04400634765625, 3.277587890625, 3.51116943359375, 3.7447509765625, 3.97833251953125, 4.2119140625, 4.44549560546875, 4.6790771484375, 4.91265869140625, 5.146240234375, 5.37982177734375, 5.6134033203125, 5.84698486328125, 6.08056640625, 6.31414794921875, 6.5477294921875, 6.78131103515625, 7.014892578125, 7.24847412109375, 7.4820556640625, 7.71563720703125, 7.94921875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 6.0, 6.0, 7.0, 7.0, 13.0, 13.0, 10.0, 14.0, 15.0, 24.0, 28.0, 23.0, 30.0, 43.0, 35.0, 35.0, 44.0, 50.0, 58.0, 51.0, 46.0, 49.0, 45.0, 49.0, 46.0, 48.0, 27.0, 18.0, 24.0, 40.0, 15.0, 23.0, 18.0, 10.0, 6.0, 4.0, 5.0, 2.0, 6.0, 8.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.0011224746704101562, -0.001089334487915039, -0.0010561943054199219, -0.0010230541229248047, -0.0009899139404296875, -0.0009567737579345703, -0.0009236335754394531, -0.0008904933929443359, -0.0008573532104492188, -0.0008242130279541016, -0.0007910728454589844, -0.0007579326629638672, -0.00072479248046875, -0.0006916522979736328, -0.0006585121154785156, -0.0006253719329833984, -0.0005922317504882812, -0.0005590915679931641, -0.0005259513854980469, -0.0004928112030029297, -0.0004596710205078125, -0.0004265308380126953, -0.0003933906555175781, -0.00036025047302246094, -0.00032711029052734375, -0.00029397010803222656, -0.0002608299255371094, -0.0002276897430419922, -0.000194549560546875, -0.0001614093780517578, -0.00012826919555664062, -9.512901306152344e-05, -6.198883056640625e-05, -2.8848648071289062e-05, 4.291534423828125e-06, 3.743171691894531e-05, 7.05718994140625e-05, 0.00010371208190917969, 0.00013685226440429688, 0.00016999244689941406, 0.00020313262939453125, 0.00023627281188964844, 0.0002694129943847656, 0.0003025531768798828, 0.000335693359375, 0.0003688335418701172, 0.0004019737243652344, 0.00043511390686035156, 0.00046825408935546875, 0.0005013942718505859, 0.0005345344543457031, 0.0005676746368408203, 0.0006008148193359375, 0.0006339550018310547, 0.0006670951843261719, 0.0007002353668212891, 0.0007333755493164062, 0.0007665157318115234, 0.0007996559143066406, 0.0008327960968017578, 0.000865936279296875, 0.0008990764617919922, 0.0009322166442871094, 0.0009653568267822266, 0.0009984970092773438]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 8.0, 16.0, 16.0, 41.0, 60.0, 83.0, 161.0, 278.0, 484.0, 822.0, 1294.0, 1955.0, 3088.0, 4748.0, 7143.0, 10640.0, 15368.0, 21883.0, 29552.0, 38852.0, 50424.0, 61257.0, 71746.0, 80893.0, 86499.0, 88318.0, 85892.0, 79778.0, 70101.0, 59040.0, 48083.0, 37695.0, 28624.0, 20581.0, 14310.0, 10063.0, 6689.0, 4381.0, 2923.0, 1818.0, 1167.0, 755.0, 405.0, 255.0, 146.0, 81.0, 64.0, 30.0, 18.0, 12.0, 5.0, 9.0, 4.0, 2.0, 2.0, 1.0], "bins": [-7.08984375, -6.877685546875, -6.66552734375, -6.453369140625, -6.2412109375, -6.029052734375, -5.81689453125, -5.604736328125, -5.392578125, -5.180419921875, -4.96826171875, -4.756103515625, -4.5439453125, -4.331787109375, -4.11962890625, -3.907470703125, -3.6953125, -3.483154296875, -3.27099609375, -3.058837890625, -2.8466796875, -2.634521484375, -2.42236328125, -2.210205078125, -1.998046875, -1.785888671875, -1.57373046875, -1.361572265625, -1.1494140625, -0.937255859375, -0.72509765625, -0.512939453125, -0.30078125, -0.088623046875, 0.12353515625, 0.335693359375, 0.5478515625, 0.760009765625, 0.97216796875, 1.184326171875, 1.396484375, 1.608642578125, 1.82080078125, 2.032958984375, 2.2451171875, 2.457275390625, 2.66943359375, 2.881591796875, 3.09375, 3.305908203125, 3.51806640625, 3.730224609375, 3.9423828125, 4.154541015625, 4.36669921875, 4.578857421875, 4.791015625, 5.003173828125, 5.21533203125, 5.427490234375, 5.6396484375, 5.851806640625, 6.06396484375, 6.276123046875, 6.48828125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 8.0, 10.0, 7.0, 15.0, 8.0, 10.0, 19.0, 22.0, 16.0, 24.0, 32.0, 20.0, 32.0, 33.0, 33.0, 35.0, 35.0, 30.0, 36.0, 42.0, 32.0, 35.0, 41.0, 43.0, 39.0, 32.0, 30.0, 31.0, 32.0, 29.0, 16.0, 24.0, 18.0, 17.0, 11.0, 17.0, 19.0, 11.0, 10.0, 10.0, 12.0, 6.0, 3.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.5234375, -3.4136962890625, -3.303955078125, -3.1942138671875, -3.08447265625, -2.9747314453125, -2.864990234375, -2.7552490234375, -2.6455078125, -2.5357666015625, -2.426025390625, -2.3162841796875, -2.20654296875, -2.0968017578125, -1.987060546875, -1.8773193359375, -1.767578125, -1.6578369140625, -1.548095703125, -1.4383544921875, -1.32861328125, -1.2188720703125, -1.109130859375, -0.9993896484375, -0.8896484375, -0.7799072265625, -0.670166015625, -0.5604248046875, -0.45068359375, -0.3409423828125, -0.231201171875, -0.1214599609375, -0.01171875, 0.0980224609375, 0.207763671875, 0.3175048828125, 0.42724609375, 0.5369873046875, 0.646728515625, 0.7564697265625, 0.8662109375, 0.9759521484375, 1.085693359375, 1.1954345703125, 1.30517578125, 1.4149169921875, 1.524658203125, 1.6343994140625, 1.744140625, 1.8538818359375, 1.963623046875, 2.0733642578125, 2.18310546875, 2.2928466796875, 2.402587890625, 2.5123291015625, 2.6220703125, 2.7318115234375, 2.841552734375, 2.9512939453125, 3.06103515625, 3.1707763671875, 3.280517578125, 3.3902587890625, 3.5]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 7.0, 1.0, 1.0, 5.0, 8.0, 4.0, 9.0, 10.0, 13.0, 23.0, 16.0, 20.0, 29.0, 29.0, 35.0, 24.0, 37.0, 29.0, 39.0, 43.0, 42.0, 31.0, 32.0, 31.0, 39.0, 42.0, 34.0, 44.0, 38.0, 37.0, 39.0, 19.0, 29.0, 25.0, 16.0, 29.0, 15.0, 17.0, 10.0, 10.0, 11.0, 6.0, 6.0, 10.0, 3.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-29.699382781982422, -28.756195068359375, -27.813005447387695, -26.86981773376465, -25.9266300201416, -24.983440399169922, -24.040252685546875, -23.097064971923828, -22.15387725830078, -21.210689544677734, -20.267499923706055, -19.324312210083008, -18.38112449645996, -17.43793487548828, -16.494747161865234, -15.551559448242188, -14.608369827270508, -13.665181159973145, -12.721993446350098, -11.778804779052734, -10.835617065429688, -9.892428398132324, -8.949239730834961, -8.006052017211914, -7.062863349914551, -6.119675159454346, -5.176486968994141, -4.233298301696777, -3.2901101112365723, -2.346921920776367, -1.403733253479004, -0.46054506301879883, 0.48264122009277344, 1.425829529762268, 2.3690178394317627, 3.312206268310547, 4.255394458770752, 5.198582649230957, 6.14177131652832, 7.084959506988525, 8.02814769744873, 8.971336364746094, 9.91452407836914, 10.857712745666504, 11.800901412963867, 12.744089126586914, 13.687277793884277, 14.63046646118164, 15.573654174804688, 16.516841888427734, 17.460031509399414, 18.40321922302246, 19.346406936645508, 20.289596557617188, 21.232784271240234, 22.17597198486328, 23.119159698486328, 24.062347412109375, 25.005537033081055, 25.9487247467041, 26.89191246032715, 27.835102081298828, 28.778289794921875, 29.721477508544922, 30.6646671295166]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 1.0, 3.0, 3.0, 2.0, 2.0, 13.0, 12.0, 12.0, 18.0, 18.0, 27.0, 21.0, 16.0, 25.0, 26.0, 24.0, 53.0, 38.0, 38.0, 46.0, 38.0, 39.0, 33.0, 41.0, 31.0, 29.0, 44.0, 34.0, 41.0, 32.0, 29.0, 29.0, 22.0, 21.0, 20.0, 22.0, 13.0, 13.0, 14.0, 12.0, 9.0, 11.0, 4.0, 10.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-48.507598876953125, -47.037899017333984, -45.56820297241211, -44.09850311279297, -42.62880325317383, -41.15910339355469, -39.68940734863281, -38.21970748901367, -36.75000762939453, -35.28030776977539, -33.810611724853516, -32.340911865234375, -30.871212005615234, -29.401514053344727, -27.93181610107422, -26.462116241455078, -24.992420196533203, -23.522722244262695, -22.053022384643555, -20.583324432373047, -19.113624572753906, -17.6439266204834, -16.17422866821289, -14.704529762268066, -13.234830856323242, -11.765131950378418, -10.295433044433594, -8.825735092163086, -7.356036186218262, -5.8863372802734375, -4.41663932800293, -2.9469404220581055, -1.4772377014160156, -0.007539033889770508, 1.4621596336364746, 2.9318580627441406, 4.401556968688965, 5.871255874633789, 7.340953826904297, 8.810652732849121, 10.280351638793945, 11.75005054473877, 13.219749450683594, 14.689447402954102, 16.15914535522461, 17.62884521484375, 19.098543167114258, 20.568241119384766, 22.037940979003906, 23.507638931274414, 24.977338790893555, 26.447036743164062, 27.916736602783203, 29.38643455505371, 30.85613250732422, 32.32583236694336, 33.7955322265625, 35.26523208618164, 36.734928131103516, 38.204627990722656, 39.6743278503418, 41.14402770996094, 42.61372375488281, 44.08342361450195, 45.55311965942383]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 10.0, 13.0, 18.0, 23.0, 27.0, 40.0, 55.0, 84.0, 112.0, 113.0, 156.0, 234.0, 312.0, 396.0, 501.0, 668.0, 925.0, 1101.0, 1478.0, 1953.0, 2512.0, 3283.0, 4769.0, 6644.0, 998793.0, 6936.0, 4849.0, 3538.0, 2551.0, 1979.0, 1495.0, 1171.0, 906.0, 758.0, 550.0, 425.0, 300.0, 235.0, 161.0, 145.0, 113.0, 83.0, 47.0, 39.0, 30.0, 24.0, 13.0, 18.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-253.26527404785156, -245.48699951171875, -237.708740234375, -229.9304656982422, -222.15219116210938, -214.37393188476562, -206.5956573486328, -198.8173828125, -191.03912353515625, -183.26084899902344, -175.4825897216797, -167.70431518554688, -159.92605590820312, -152.1477813720703, -144.3695068359375, -136.59124755859375, -128.81297302246094, -121.03470611572266, -113.25643920898438, -105.47816467285156, -97.69989776611328, -89.921630859375, -82.14335632324219, -74.3650894165039, -66.58682250976562, -58.808555603027344, -51.0302848815918, -43.25201416015625, -35.47374725341797, -27.695480346679688, -19.91720962524414, -12.138938903808594, -4.360687255859375, 3.417581558227539, 11.195850372314453, 18.974119186401367, 26.75238800048828, 34.53065490722656, 42.30892562866211, 50.087196350097656, 57.86546325683594, 65.64373016357422, 73.4219970703125, 81.20027160644531, 88.9785385131836, 96.75680541992188, 104.53507995605469, 112.31334686279297, 120.09161376953125, 127.86988067626953, 135.6481475830078, 143.42642211914062, 151.20468139648438, 158.9829559326172, 166.76123046875, 174.53948974609375, 182.31776428222656, 190.09603881835938, 197.87429809570312, 205.65257263183594, 213.43084716796875, 221.2091064453125, 228.9873809814453, 236.76565551757812, 244.54391479492188]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 10.0, 9.0, 13.0, 10.0, 27.0, 46.0, 64.0, 71.0, 104.0, 144.0, 203.0, 271.0, 387.0, 467.0, 621.0, 840.0, 1105.0, 1487.0, 1928.0, 2588.0, 3425.0, 4996.0, 7646.0, 14104.0, 31745.0, 51302640.0, 48362.0, 18123.0, 9058.0, 5583.0, 3834.0, 2903.0, 2123.0, 1548.0, 1180.0, 933.0, 686.0, 550.0, 390.0, 290.0, 245.0, 174.0, 113.0, 96.0, 67.0, 50.0, 37.0, 19.0, 11.0, 14.0, 8.0, 7.0, 4.0, 1.0, 1.0], "bins": [-298.9438781738281, -290.31976318359375, -281.6956787109375, -273.0715637207031, -264.44744873046875, -255.82333374023438, -247.19923400878906, -238.57513427734375, -229.95101928710938, -221.326904296875, -212.7028045654297, -204.07870483398438, -195.45458984375, -186.83047485351562, -178.2063751220703, -169.582275390625, -160.95816040039062, -152.33404541015625, -143.70994567871094, -135.08584594726562, -126.46173095703125, -117.8376235961914, -109.21351623535156, -100.58940887451172, -91.96530151367188, -83.34119415283203, -74.71708679199219, -66.09297943115234, -57.4688720703125, -48.844764709472656, -40.22065734863281, -31.59654998779297, -22.972457885742188, -14.348350524902344, -5.7242431640625, 2.8998641967773438, 11.523971557617188, 20.14807891845703, 28.772186279296875, 37.39629364013672, 46.02040100097656, 54.644508361816406, 63.26861572265625, 71.8927230834961, 80.51683044433594, 89.14093780517578, 97.76504516601562, 106.38915252685547, 115.01325988769531, 123.63736724853516, 132.261474609375, 140.88558959960938, 149.5096893310547, 158.1337890625, 166.75790405273438, 175.38201904296875, 184.00611877441406, 192.63021850585938, 201.25433349609375, 209.87844848632812, 218.50254821777344, 227.12664794921875, 235.75076293945312, 244.3748779296875, 252.9989776611328]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 8.0, 6.0, 12.0, 6.0, 14.0, 18.0, 14.0, 18.0, 20.0, 28.0, 36.0, 34.0, 30.0, 48.0, 37.0, 49.0, 55.0, 56.0, 41.0, 50.0, 45.0, 41.0, 40.0, 40.0, 35.0, 26.0, 29.0, 20.0, 19.0, 18.0, 11.0, 10.0, 16.0, 9.0, 11.0, 7.0, 10.0, 4.0, 2.0, 2.0, 4.0, 3.0, 1.0], "bins": [-281.85919189453125, -274.5696716308594, -267.2801513671875, -259.9906311035156, -252.7011260986328, -245.41160583496094, -238.12210083007812, -230.83258056640625, -223.54306030273438, -216.2535400390625, -208.96401977539062, -201.6745147705078, -194.38499450683594, -187.09547424316406, -179.80596923828125, -172.51644897460938, -165.2269287109375, -157.93740844726562, -150.64788818359375, -143.35838317871094, -136.06886291503906, -128.7793426513672, -121.48983001708984, -114.2003173828125, -106.91079711914062, -99.62127685546875, -92.3317642211914, -85.04225158691406, -77.75273132324219, -70.46321105957031, -63.17369842529297, -55.88418197631836, -48.59468078613281, -41.3051643371582, -34.015647888183594, -26.726131439208984, -19.436614990234375, -12.147098541259766, -4.857582092285156, 2.431934356689453, 9.721450805664062, 17.010967254638672, 24.30048370361328, 31.59000015258789, 38.8795166015625, 46.16903305053711, 53.45854949951172, 60.74806594848633, 68.03758239746094, 75.32710266113281, 82.61661529541016, 89.9061279296875, 97.19564819335938, 104.48516845703125, 111.7746810913086, 119.06419372558594, 126.35371398925781, 133.6432342529297, 140.9327392578125, 148.22225952148438, 155.51177978515625, 162.80130004882812, 170.0908203125, 177.3803253173828, 184.6698455810547]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 0.0, 2.0, 3.0, 6.0, 7.0, 10.0, 4.0, 6.0, 15.0, 14.0, 11.0, 21.0, 16.0, 19.0, 25.0, 27.0, 40.0, 45.0, 40.0, 50.0, 52.0, 55.0, 80.0, 55.0, 43.0, 41.0, 42.0, 26.0, 35.0, 26.0, 26.0, 15.0, 26.0, 20.0, 9.0, 14.0, 13.0, 12.0, 14.0, 8.0, 8.0, 4.0, 3.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-339.97601318359375, -329.10198974609375, -318.22796630859375, -307.35394287109375, -296.4798889160156, -285.6058654785156, -274.7318420410156, -263.8578186035156, -252.98377990722656, -242.10975646972656, -231.2357177734375, -220.3616943359375, -209.4876708984375, -198.61363220214844, -187.73960876464844, -176.86557006835938, -165.99154663085938, -155.11752319335938, -144.2434844970703, -133.3694610595703, -122.49542999267578, -111.62139892578125, -100.74737548828125, -89.87334442138672, -78.99931335449219, -68.12528228759766, -57.25125503540039, -46.377227783203125, -35.503196716308594, -24.629165649414062, -13.755142211914062, -2.8811111450195312, 7.992919921875, 18.8669490814209, 29.740978240966797, 40.61500549316406, 51.489036560058594, 62.363067626953125, 73.23709106445312, 84.11112213134766, 94.98515319824219, 105.85918426513672, 116.73321533203125, 127.60723876953125, 138.48126220703125, 149.3553009033203, 160.2293243408203, 171.10336303710938, 181.97738647460938, 192.85140991210938, 203.72544860839844, 214.59947204589844, 225.4735107421875, 236.3475341796875, 247.2215576171875, 258.0955810546875, 268.9696044921875, 279.8436279296875, 290.7176513671875, 301.5916748046875, 312.4657287597656, 323.3397521972656, 334.2137756347656, 345.0877990722656, 355.96185302734375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 13.0, 24.0, 21.0, 28.0, 33.0, 46.0, 70.0, 100.0, 121.0, 173.0, 183.0, 278.0, 385.0, 514.0, 699.0, 1039.0, 1451.0, 2148.0, 3258.0, 5132.0, 8346.0, 14144.0, 26139.0, 51729.0, 116317.0, 350089.0, 2687356.0, 607702.0, 172616.0, 68434.0, 32045.0, 16948.0, 9517.0, 5820.0, 3585.0, 2508.0, 1611.0, 1119.0, 813.0, 559.0, 352.0, 277.0, 175.0, 126.0, 89.0, 48.0, 38.0, 30.0, 13.0, 8.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-11.4375, -11.097900390625, -10.75830078125, -10.418701171875, -10.0791015625, -9.739501953125, -9.39990234375, -9.060302734375, -8.720703125, -8.381103515625, -8.04150390625, -7.701904296875, -7.3623046875, -7.022705078125, -6.68310546875, -6.343505859375, -6.00390625, -5.664306640625, -5.32470703125, -4.985107421875, -4.6455078125, -4.305908203125, -3.96630859375, -3.626708984375, -3.287109375, -2.947509765625, -2.60791015625, -2.268310546875, -1.9287109375, -1.589111328125, -1.24951171875, -0.909912109375, -0.5703125, -0.230712890625, 0.10888671875, 0.448486328125, 0.7880859375, 1.127685546875, 1.46728515625, 1.806884765625, 2.146484375, 2.486083984375, 2.82568359375, 3.165283203125, 3.5048828125, 3.844482421875, 4.18408203125, 4.523681640625, 4.86328125, 5.202880859375, 5.54248046875, 5.882080078125, 6.2216796875, 6.561279296875, 6.90087890625, 7.240478515625, 7.580078125, 7.919677734375, 8.25927734375, 8.598876953125, 8.9384765625, 9.278076171875, 9.61767578125, 9.957275390625, 10.296875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 4.0, 10.0, 12.0, 12.0, 8.0, 15.0, 19.0, 25.0, 38.0, 47.0, 68.0, 75.0, 92.0, 123.0, 86.0, 92.0, 76.0, 54.0, 34.0, 29.0, 20.0, 17.0, 8.0, 3.0, 9.0, 1.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.57421875, -1.53094482421875, -1.4876708984375, -1.44439697265625, -1.401123046875, -1.35784912109375, -1.3145751953125, -1.27130126953125, -1.22802734375, -1.18475341796875, -1.1414794921875, -1.09820556640625, -1.054931640625, -1.01165771484375, -0.9683837890625, -0.92510986328125, -0.8818359375, -0.83856201171875, -0.7952880859375, -0.75201416015625, -0.708740234375, -0.66546630859375, -0.6221923828125, -0.57891845703125, -0.53564453125, -0.49237060546875, -0.4490966796875, -0.40582275390625, -0.362548828125, -0.31927490234375, -0.2760009765625, -0.23272705078125, -0.189453125, -0.14617919921875, -0.1029052734375, -0.05963134765625, -0.016357421875, 0.02691650390625, 0.0701904296875, 0.11346435546875, 0.15673828125, 0.20001220703125, 0.2432861328125, 0.28656005859375, 0.329833984375, 0.37310791015625, 0.4163818359375, 0.45965576171875, 0.5029296875, 0.54620361328125, 0.5894775390625, 0.63275146484375, 0.676025390625, 0.71929931640625, 0.7625732421875, 0.80584716796875, 0.84912109375, 0.89239501953125, 0.9356689453125, 0.97894287109375, 1.022216796875, 1.06549072265625, 1.1087646484375, 1.15203857421875, 1.1953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 10.0, 12.0, 20.0, 25.0, 57.0, 50.0, 92.0, 145.0, 247.0, 474.0, 1138.0, 3043.0, 9867.0, 41348.0, 226570.0, 2563696.0, 1157425.0, 148429.0, 29565.0, 7586.0, 2493.0, 931.0, 404.0, 228.0, 134.0, 82.0, 55.0, 40.0, 25.0, 22.0, 15.0, 8.0, 7.0, 6.0, 6.0, 7.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.1875, -15.645751953125, -15.10400390625, -14.562255859375, -14.0205078125, -13.478759765625, -12.93701171875, -12.395263671875, -11.853515625, -11.311767578125, -10.77001953125, -10.228271484375, -9.6865234375, -9.144775390625, -8.60302734375, -8.061279296875, -7.51953125, -6.977783203125, -6.43603515625, -5.894287109375, -5.3525390625, -4.810791015625, -4.26904296875, -3.727294921875, -3.185546875, -2.643798828125, -2.10205078125, -1.560302734375, -1.0185546875, -0.476806640625, 0.06494140625, 0.606689453125, 1.1484375, 1.690185546875, 2.23193359375, 2.773681640625, 3.3154296875, 3.857177734375, 4.39892578125, 4.940673828125, 5.482421875, 6.024169921875, 6.56591796875, 7.107666015625, 7.6494140625, 8.191162109375, 8.73291015625, 9.274658203125, 9.81640625, 10.358154296875, 10.89990234375, 11.441650390625, 11.9833984375, 12.525146484375, 13.06689453125, 13.608642578125, 14.150390625, 14.692138671875, 15.23388671875, 15.775634765625, 16.3173828125, 16.859130859375, 17.40087890625, 17.942626953125, 18.484375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 2.0, 6.0, 9.0, 14.0, 16.0, 12.0, 29.0, 31.0, 35.0, 39.0, 68.0, 76.0, 86.0, 131.0, 170.0, 268.0, 333.0, 828.0, 586.0, 315.0, 242.0, 185.0, 147.0, 102.0, 80.0, 61.0, 49.0, 28.0, 27.0, 30.0, 16.0, 11.0, 10.0, 12.0, 7.0, 6.0, 7.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4921875, -3.3790283203125, -3.265869140625, -3.1527099609375, -3.03955078125, -2.9263916015625, -2.813232421875, -2.7000732421875, -2.5869140625, -2.4737548828125, -2.360595703125, -2.2474365234375, -2.13427734375, -2.0211181640625, -1.907958984375, -1.7947998046875, -1.681640625, -1.5684814453125, -1.455322265625, -1.3421630859375, -1.22900390625, -1.1158447265625, -1.002685546875, -0.8895263671875, -0.7763671875, -0.6632080078125, -0.550048828125, -0.4368896484375, -0.32373046875, -0.2105712890625, -0.097412109375, 0.0157470703125, 0.12890625, 0.2420654296875, 0.355224609375, 0.4683837890625, 0.58154296875, 0.6947021484375, 0.807861328125, 0.9210205078125, 1.0341796875, 1.1473388671875, 1.260498046875, 1.3736572265625, 1.48681640625, 1.5999755859375, 1.713134765625, 1.8262939453125, 1.939453125, 2.0526123046875, 2.165771484375, 2.2789306640625, 2.39208984375, 2.5052490234375, 2.618408203125, 2.7315673828125, 2.8447265625, 2.9578857421875, 3.071044921875, 3.1842041015625, 3.29736328125, 3.4105224609375, 3.523681640625, 3.6368408203125, 3.75]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 15.0, 56.0, 147.0, 255.0, 268.0, 149.0, 77.0, 24.0, 11.0, 8.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.955406188964844, -23.580018997192383, -21.20462989807129, -18.829242706298828, -16.453853607177734, -14.078466415405273, -11.703079223632812, -9.327690124511719, -6.952302932739258, -4.5769147872924805, -2.2015271186828613, 0.1738605499267578, 2.549248695373535, 4.9246368408203125, 7.300024032592773, 9.675413131713867, 12.050800323486328, 14.426188468933105, 16.801576614379883, 19.176963806152344, 21.552352905273438, 23.9277400970459, 26.30312728881836, 28.678516387939453, 31.053903579711914, 33.429290771484375, 35.80467987060547, 38.18006896972656, 40.55545425415039, 42.930843353271484, 45.30622863769531, 47.681617736816406, 50.0570068359375, 52.432395935058594, 54.80778121948242, 57.183170318603516, 59.55855941772461, 61.93394470214844, 64.30933380126953, 66.68472290039062, 69.06011199951172, 71.43550109863281, 73.8108901977539, 76.186279296875, 78.56166076660156, 80.93704986572266, 83.31243896484375, 85.68782806396484, 88.06321716308594, 90.43860626220703, 92.81399536132812, 95.18937683105469, 97.56476593017578, 99.94015502929688, 102.31554412841797, 104.69093322753906, 107.06631469726562, 109.44170379638672, 111.81709289550781, 114.19247436523438, 116.56786346435547, 118.94325256347656, 121.31864166259766, 123.69403076171875, 126.06941986083984]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 6.0, 5.0, 7.0, 12.0, 8.0, 20.0, 12.0, 24.0, 30.0, 21.0, 27.0, 35.0, 37.0, 42.0, 36.0, 36.0, 50.0, 39.0, 57.0, 47.0, 38.0, 48.0, 42.0, 41.0, 38.0, 33.0, 25.0, 29.0, 21.0, 23.0, 16.0, 15.0, 11.0, 16.0, 11.0, 12.0, 8.0, 1.0, 5.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.200023651123047, -17.639678955078125, -17.079336166381836, -16.518991470336914, -15.958647727966309, -15.398303985595703, -14.837959289550781, -14.277615547180176, -13.71727180480957, -13.156928062438965, -12.596583366394043, -12.036239624023438, -11.475895881652832, -10.915552139282227, -10.355207443237305, -9.7948637008667, -9.234519004821777, -8.674175262451172, -8.11383056640625, -7.5534868240356445, -6.993143081665039, -6.432798862457275, -5.872454643249512, -5.312110900878906, -4.751766681671143, -4.191422462463379, -3.6310787200927734, -3.0707345008850098, -2.510390520095825, -1.9500465393066406, -1.389702320098877, -0.8293583393096924, -0.2690143585205078, 0.29132968187332153, 0.8516737222671509, 1.412017822265625, 1.9723618030548096, 2.532705783843994, 3.093050003051758, 3.6533939838409424, 4.213737964630127, 4.774082183837891, 5.334425926208496, 5.89477014541626, 6.455114364624023, 7.015458106994629, 7.575802326202393, 8.136146545410156, 8.696490287780762, 9.256834030151367, 9.817178726196289, 10.377522468566895, 10.9378662109375, 11.498210906982422, 12.058554649353027, 12.618898391723633, 13.179243087768555, 13.73958683013916, 14.299931526184082, 14.860275268554688, 15.420619010925293, 15.980962753295898, 16.54130744934082, 17.101652145385742, 17.66199493408203]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 5.0, 7.0, 11.0, 9.0, 21.0, 19.0, 40.0, 52.0, 79.0, 104.0, 173.0, 210.0, 312.0, 412.0, 573.0, 865.0, 1292.0, 1912.0, 3076.0, 5020.0, 8467.0, 16013.0, 31552.0, 68261.0, 158708.0, 297535.0, 242572.0, 109241.0, 48374.0, 23163.0, 11949.0, 6792.0, 4088.0, 2457.0, 1592.0, 1106.0, 731.0, 540.0, 358.0, 245.0, 189.0, 140.0, 86.0, 68.0, 38.0, 25.0, 28.0, 18.0, 7.0, 11.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.9921875, -9.6873779296875, -9.382568359375, -9.0777587890625, -8.77294921875, -8.4681396484375, -8.163330078125, -7.8585205078125, -7.5537109375, -7.2489013671875, -6.944091796875, -6.6392822265625, -6.33447265625, -6.0296630859375, -5.724853515625, -5.4200439453125, -5.115234375, -4.8104248046875, -4.505615234375, -4.2008056640625, -3.89599609375, -3.5911865234375, -3.286376953125, -2.9815673828125, -2.6767578125, -2.3719482421875, -2.067138671875, -1.7623291015625, -1.45751953125, -1.1527099609375, -0.847900390625, -0.5430908203125, -0.23828125, 0.0665283203125, 0.371337890625, 0.6761474609375, 0.98095703125, 1.2857666015625, 1.590576171875, 1.8953857421875, 2.2001953125, 2.5050048828125, 2.809814453125, 3.1146240234375, 3.41943359375, 3.7242431640625, 4.029052734375, 4.3338623046875, 4.638671875, 4.9434814453125, 5.248291015625, 5.5531005859375, 5.85791015625, 6.1627197265625, 6.467529296875, 6.7723388671875, 7.0771484375, 7.3819580078125, 7.686767578125, 7.9915771484375, 8.29638671875, 8.6011962890625, 8.906005859375, 9.2108154296875, 9.515625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 11.0, 13.0, 13.0, 26.0, 24.0, 34.0, 47.0, 59.0, 84.0, 96.0, 97.0, 95.0, 102.0, 74.0, 61.0, 52.0, 23.0, 23.0, 9.0, 11.0, 8.0, 5.0, 10.0, 3.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.126953125, -2.0718841552734375, -2.016815185546875, -1.9617462158203125, -1.90667724609375, -1.8516082763671875, -1.796539306640625, -1.7414703369140625, -1.6864013671875, -1.6313323974609375, -1.576263427734375, -1.5211944580078125, -1.46612548828125, -1.4110565185546875, -1.355987548828125, -1.3009185791015625, -1.245849609375, -1.1907806396484375, -1.135711669921875, -1.0806427001953125, -1.02557373046875, -0.9705047607421875, -0.915435791015625, -0.8603668212890625, -0.8052978515625, -0.7502288818359375, -0.695159912109375, -0.6400909423828125, -0.58502197265625, -0.5299530029296875, -0.474884033203125, -0.4198150634765625, -0.36474609375, -0.3096771240234375, -0.254608154296875, -0.1995391845703125, -0.14447021484375, -0.0894012451171875, -0.034332275390625, 0.0207366943359375, 0.0758056640625, 0.1308746337890625, 0.185943603515625, 0.2410125732421875, 0.29608154296875, 0.3511505126953125, 0.406219482421875, 0.4612884521484375, 0.516357421875, 0.5714263916015625, 0.626495361328125, 0.6815643310546875, 0.73663330078125, 0.7917022705078125, 0.846771240234375, 0.9018402099609375, 0.9569091796875, 1.0119781494140625, 1.067047119140625, 1.1221160888671875, 1.17718505859375, 1.2322540283203125, 1.287322998046875, 1.3423919677734375, 1.3974609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 15.0, 12.0, 16.0, 25.0, 33.0, 51.0, 72.0, 109.0, 252.0, 400.0, 778.0, 1478.0, 2957.0, 6326.0, 14603.0, 44449.0, 243129.0, 571886.0, 115213.0, 26931.0, 10272.0, 4696.0, 2262.0, 1155.0, 627.0, 321.0, 173.0, 115.0, 45.0, 41.0, 20.0, 17.0, 15.0, 12.0, 8.0, 6.0, 4.0, 5.0, 4.0, 1.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.59375, -17.049072265625, -16.50439453125, -15.959716796875, -15.4150390625, -14.870361328125, -14.32568359375, -13.781005859375, -13.236328125, -12.691650390625, -12.14697265625, -11.602294921875, -11.0576171875, -10.512939453125, -9.96826171875, -9.423583984375, -8.87890625, -8.334228515625, -7.78955078125, -7.244873046875, -6.7001953125, -6.155517578125, -5.61083984375, -5.066162109375, -4.521484375, -3.976806640625, -3.43212890625, -2.887451171875, -2.3427734375, -1.798095703125, -1.25341796875, -0.708740234375, -0.1640625, 0.380615234375, 0.92529296875, 1.469970703125, 2.0146484375, 2.559326171875, 3.10400390625, 3.648681640625, 4.193359375, 4.738037109375, 5.28271484375, 5.827392578125, 6.3720703125, 6.916748046875, 7.46142578125, 8.006103515625, 8.55078125, 9.095458984375, 9.64013671875, 10.184814453125, 10.7294921875, 11.274169921875, 11.81884765625, 12.363525390625, 12.908203125, 13.452880859375, 13.99755859375, 14.542236328125, 15.0869140625, 15.631591796875, 16.17626953125, 16.720947265625, 17.265625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 0.0, 4.0, 10.0, 6.0, 5.0, 11.0, 16.0, 10.0, 18.0, 24.0, 17.0, 23.0, 34.0, 25.0, 24.0, 31.0, 44.0, 33.0, 48.0, 42.0, 37.0, 39.0, 44.0, 47.0, 49.0, 34.0, 40.0, 36.0, 27.0, 31.0, 35.0, 21.0, 21.0, 20.0, 17.0, 11.0, 9.0, 12.0, 12.0, 1.0, 8.0, 4.0, 6.0, 3.0, 1.0, 0.0, 4.0, 0.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.5546875, -8.2862548828125, -8.017822265625, -7.7493896484375, -7.48095703125, -7.2125244140625, -6.944091796875, -6.6756591796875, -6.4072265625, -6.1387939453125, -5.870361328125, -5.6019287109375, -5.33349609375, -5.0650634765625, -4.796630859375, -4.5281982421875, -4.259765625, -3.9913330078125, -3.722900390625, -3.4544677734375, -3.18603515625, -2.9176025390625, -2.649169921875, -2.3807373046875, -2.1123046875, -1.8438720703125, -1.575439453125, -1.3070068359375, -1.03857421875, -0.7701416015625, -0.501708984375, -0.2332763671875, 0.03515625, 0.3035888671875, 0.572021484375, 0.8404541015625, 1.10888671875, 1.3773193359375, 1.645751953125, 1.9141845703125, 2.1826171875, 2.4510498046875, 2.719482421875, 2.9879150390625, 3.25634765625, 3.5247802734375, 3.793212890625, 4.0616455078125, 4.330078125, 4.5985107421875, 4.866943359375, 5.1353759765625, 5.40380859375, 5.6722412109375, 5.940673828125, 6.2091064453125, 6.4775390625, 6.7459716796875, 7.014404296875, 7.2828369140625, 7.55126953125, 7.8197021484375, 8.088134765625, 8.3565673828125, 8.625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 3.0, 4.0, 12.0, 14.0, 24.0, 39.0, 59.0, 79.0, 148.0, 200.0, 379.0, 593.0, 1118.0, 2244.0, 4933.0, 12559.0, 42811.0, 285708.0, 589483.0, 76172.0, 18930.0, 6839.0, 2819.0, 1455.0, 809.0, 433.0, 231.0, 157.0, 113.0, 68.0, 30.0, 28.0, 10.0, 11.0, 12.0, 6.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.0625, -24.232177734375, -23.40185546875, -22.571533203125, -21.7412109375, -20.910888671875, -20.08056640625, -19.250244140625, -18.419921875, -17.589599609375, -16.75927734375, -15.928955078125, -15.0986328125, -14.268310546875, -13.43798828125, -12.607666015625, -11.77734375, -10.947021484375, -10.11669921875, -9.286376953125, -8.4560546875, -7.625732421875, -6.79541015625, -5.965087890625, -5.134765625, -4.304443359375, -3.47412109375, -2.643798828125, -1.8134765625, -0.983154296875, -0.15283203125, 0.677490234375, 1.5078125, 2.338134765625, 3.16845703125, 3.998779296875, 4.8291015625, 5.659423828125, 6.48974609375, 7.320068359375, 8.150390625, 8.980712890625, 9.81103515625, 10.641357421875, 11.4716796875, 12.302001953125, 13.13232421875, 13.962646484375, 14.79296875, 15.623291015625, 16.45361328125, 17.283935546875, 18.1142578125, 18.944580078125, 19.77490234375, 20.605224609375, 21.435546875, 22.265869140625, 23.09619140625, 23.926513671875, 24.7568359375, 25.587158203125, 26.41748046875, 27.247802734375, 28.078125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 5.0, 2.0, 3.0, 8.0, 16.0, 17.0, 30.0, 34.0, 73.0, 112.0, 173.0, 184.0, 141.0, 69.0, 45.0, 26.0, 20.0, 11.0, 6.0, 12.0, 5.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00402069091796875, -0.003909289836883545, -0.00379788875579834, -0.0036864876747131348, -0.0035750865936279297, -0.0034636855125427246, -0.0033522844314575195, -0.0032408833503723145, -0.0031294822692871094, -0.0030180811882019043, -0.0029066801071166992, -0.002795279026031494, -0.002683877944946289, -0.002572476863861084, -0.002461075782775879, -0.002349674701690674, -0.0022382736206054688, -0.0021268725395202637, -0.0020154714584350586, -0.0019040703773498535, -0.0017926692962646484, -0.0016812682151794434, -0.0015698671340942383, -0.0014584660530090332, -0.0013470649719238281, -0.001235663890838623, -0.001124262809753418, -0.0010128617286682129, -0.0009014606475830078, -0.0007900595664978027, -0.0006786584854125977, -0.0005672574043273926, -0.0004558563232421875, -0.0003444552421569824, -0.00023305416107177734, -0.00012165307998657227, -1.0251998901367188e-05, 0.00010114908218383789, 0.00021255016326904297, 0.00032395124435424805, 0.0004353523254394531, 0.0005467534065246582, 0.0006581544876098633, 0.0007695555686950684, 0.0008809566497802734, 0.0009923577308654785, 0.0011037588119506836, 0.0012151598930358887, 0.0013265609741210938, 0.0014379620552062988, 0.001549363136291504, 0.001660764217376709, 0.001772165298461914, 0.0018835663795471191, 0.0019949674606323242, 0.0021063685417175293, 0.0022177696228027344, 0.0023291707038879395, 0.0024405717849731445, 0.0025519728660583496, 0.0026633739471435547, 0.0027747750282287598, 0.002886176109313965, 0.00299757719039917, 0.003108978271484375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 7.0, 8.0, 22.0, 29.0, 39.0, 68.0, 115.0, 205.0, 405.0, 778.0, 1648.0, 3674.0, 9445.0, 30815.0, 221249.0, 672411.0, 78970.0, 17413.0, 6252.0, 2568.0, 1195.0, 571.0, 275.0, 147.0, 98.0, 65.0, 27.0, 13.0, 13.0, 13.0, 4.0, 5.0, 0.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.765625, -24.021484375, -23.27734375, -22.533203125, -21.7890625, -21.044921875, -20.30078125, -19.556640625, -18.8125, -18.068359375, -17.32421875, -16.580078125, -15.8359375, -15.091796875, -14.34765625, -13.603515625, -12.859375, -12.115234375, -11.37109375, -10.626953125, -9.8828125, -9.138671875, -8.39453125, -7.650390625, -6.90625, -6.162109375, -5.41796875, -4.673828125, -3.9296875, -3.185546875, -2.44140625, -1.697265625, -0.953125, -0.208984375, 0.53515625, 1.279296875, 2.0234375, 2.767578125, 3.51171875, 4.255859375, 5.0, 5.744140625, 6.48828125, 7.232421875, 7.9765625, 8.720703125, 9.46484375, 10.208984375, 10.953125, 11.697265625, 12.44140625, 13.185546875, 13.9296875, 14.673828125, 15.41796875, 16.162109375, 16.90625, 17.650390625, 18.39453125, 19.138671875, 19.8828125, 20.626953125, 21.37109375, 22.115234375, 22.859375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 13.0, 7.0, 12.0, 17.0, 24.0, 31.0, 40.0, 50.0, 52.0, 55.0, 67.0, 62.0, 78.0, 88.0, 78.0, 54.0, 59.0, 46.0, 39.0, 29.0, 29.0, 15.0, 11.0, 14.0, 8.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3046875, -9.9866943359375, -9.668701171875, -9.3507080078125, -9.03271484375, -8.7147216796875, -8.396728515625, -8.0787353515625, -7.7607421875, -7.4427490234375, -7.124755859375, -6.8067626953125, -6.48876953125, -6.1707763671875, -5.852783203125, -5.5347900390625, -5.216796875, -4.8988037109375, -4.580810546875, -4.2628173828125, -3.94482421875, -3.6268310546875, -3.308837890625, -2.9908447265625, -2.6728515625, -2.3548583984375, -2.036865234375, -1.7188720703125, -1.40087890625, -1.0828857421875, -0.764892578125, -0.4468994140625, -0.12890625, 0.1890869140625, 0.507080078125, 0.8250732421875, 1.14306640625, 1.4610595703125, 1.779052734375, 2.0970458984375, 2.4150390625, 2.7330322265625, 3.051025390625, 3.3690185546875, 3.68701171875, 4.0050048828125, 4.322998046875, 4.6409912109375, 4.958984375, 5.2769775390625, 5.594970703125, 5.9129638671875, 6.23095703125, 6.5489501953125, 6.866943359375, 7.1849365234375, 7.5029296875, 7.8209228515625, 8.138916015625, 8.4569091796875, 8.77490234375, 9.0928955078125, 9.410888671875, 9.7288818359375, 10.046875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 11.0, 22.0, 18.0, 39.0, 153.0, 400.0, 225.0, 66.0, 24.0, 16.0, 11.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-353.36859130859375, -342.2578125, -331.14703369140625, -320.0362548828125, -308.9255065917969, -297.8147277832031, -286.7039489746094, -275.5931701660156, -264.4823913574219, -253.37161254882812, -242.26084899902344, -231.1500701904297, -220.03929138183594, -208.92852783203125, -197.8177490234375, -186.70697021484375, -175.59620666503906, -164.4854278564453, -153.37466430664062, -142.26388549804688, -131.15310668945312, -120.0423355102539, -108.93156433105469, -97.82078552246094, -86.71001434326172, -75.5992431640625, -64.48846435546875, -53.37769317626953, -42.26691818237305, -31.156143188476562, -20.045372009277344, -8.934593200683594, 2.176177978515625, 13.286952018737793, 24.39772605895996, 35.50849914550781, 46.6192741394043, 57.73004913330078, 68.8408203125, 79.95159912109375, 91.06237030029297, 102.17314147949219, 113.28392028808594, 124.39469146728516, 135.50546264648438, 146.61624145507812, 157.72702026367188, 168.83779907226562, 179.9485626220703, 191.05934143066406, 202.17010498046875, 213.2808837890625, 224.39166259765625, 235.50244140625, 246.6132049560547, 257.7239990234375, 268.8347473144531, 279.9455261230469, 291.0563049316406, 302.16705322265625, 313.27783203125, 324.38861083984375, 335.4993896484375, 346.61016845703125, 357.720947265625]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 6.0, 4.0, 7.0, 7.0, 10.0, 17.0, 20.0, 32.0, 46.0, 96.0, 128.0, 146.0, 128.0, 122.0, 71.0, 47.0, 19.0, 13.0, 17.0, 9.0, 6.0, 7.0, 3.0, 1.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.73660278320312, -150.3291778564453, -144.9217529296875, -139.51431274414062, -134.1068878173828, -128.699462890625, -123.29203796386719, -117.88461303710938, -112.47718811035156, -107.06976318359375, -101.6623306274414, -96.2549057006836, -90.84748077392578, -85.44004821777344, -80.03262329101562, -74.62519836425781, -69.21776580810547, -63.81033706665039, -58.40291213989258, -52.9954833984375, -47.58805847167969, -42.18062973022461, -36.77320098876953, -31.36577606201172, -25.95834732055664, -20.550920486450195, -15.143492698669434, -9.736064910888672, -4.328638076782227, 1.0787887573242188, 6.486217498779297, 11.89364242553711, 17.301071166992188, 22.708498001098633, 28.115924835205078, 33.523353576660156, 38.93077850341797, 44.33820724487305, 49.745635986328125, 55.15306091308594, 60.560489654541016, 65.9679183959961, 71.3753433227539, 76.78277587890625, 82.19020080566406, 87.59762573242188, 93.00505065917969, 98.4124755859375, 103.81990814208984, 109.22733306884766, 114.634765625, 120.04219055175781, 125.44961547851562, 130.85704040527344, 136.26446533203125, 141.67190551757812, 147.07933044433594, 152.48675537109375, 157.89418029785156, 163.30160522460938, 168.70904541015625, 174.11647033691406, 179.52389526367188, 184.9313201904297, 190.3387451171875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 5.0, 5.0, 16.0, 18.0, 42.0, 63.0, 108.0, 187.0, 265.0, 493.0, 965.0, 2008.0, 4697.0, 13668.0, 53639.0, 488710.0, 3491201.0, 104933.0, 21619.0, 6664.0, 2526.0, 1075.0, 583.0, 321.0, 162.0, 101.0, 76.0, 45.0, 29.0, 27.0, 11.0, 9.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.625, -40.09423828125, -38.5634765625, -37.03271484375, -35.501953125, -33.97119140625, -32.4404296875, -30.90966796875, -29.37890625, -27.84814453125, -26.3173828125, -24.78662109375, -23.255859375, -21.72509765625, -20.1943359375, -18.66357421875, -17.1328125, -15.60205078125, -14.0712890625, -12.54052734375, -11.009765625, -9.47900390625, -7.9482421875, -6.41748046875, -4.88671875, -3.35595703125, -1.8251953125, -0.29443359375, 1.236328125, 2.76708984375, 4.2978515625, 5.82861328125, 7.359375, 8.89013671875, 10.4208984375, 11.95166015625, 13.482421875, 15.01318359375, 16.5439453125, 18.07470703125, 19.60546875, 21.13623046875, 22.6669921875, 24.19775390625, 25.728515625, 27.25927734375, 28.7900390625, 30.32080078125, 31.8515625, 33.38232421875, 34.9130859375, 36.44384765625, 37.974609375, 39.50537109375, 41.0361328125, 42.56689453125, 44.09765625, 45.62841796875, 47.1591796875, 48.68994140625, 50.220703125, 51.75146484375, 53.2822265625, 54.81298828125, 56.34375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 9.0, 14.0, 9.0, 24.0, 17.0, 25.0, 40.0, 49.0, 62.0, 57.0, 94.0, 97.0, 77.0, 76.0, 78.0, 54.0, 64.0, 38.0, 26.0, 17.0, 15.0, 10.0, 6.0, 7.0, 9.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.9072265625, -1.8523101806640625, -1.797393798828125, -1.7424774169921875, -1.68756103515625, -1.6326446533203125, -1.577728271484375, -1.5228118896484375, -1.4678955078125, -1.4129791259765625, -1.358062744140625, -1.3031463623046875, -1.24822998046875, -1.1933135986328125, -1.138397216796875, -1.0834808349609375, -1.028564453125, -0.9736480712890625, -0.918731689453125, -0.8638153076171875, -0.80889892578125, -0.7539825439453125, -0.699066162109375, -0.6441497802734375, -0.5892333984375, -0.5343170166015625, -0.479400634765625, -0.4244842529296875, -0.36956787109375, -0.3146514892578125, -0.259735107421875, -0.2048187255859375, -0.14990234375, -0.0949859619140625, -0.040069580078125, 0.0148468017578125, 0.06976318359375, 0.1246795654296875, 0.179595947265625, 0.2345123291015625, 0.2894287109375, 0.3443450927734375, 0.399261474609375, 0.4541778564453125, 0.50909423828125, 0.5640106201171875, 0.618927001953125, 0.6738433837890625, 0.728759765625, 0.7836761474609375, 0.838592529296875, 0.8935089111328125, 0.94842529296875, 1.0033416748046875, 1.058258056640625, 1.1131744384765625, 1.1680908203125, 1.2230072021484375, 1.277923583984375, 1.3328399658203125, 1.38775634765625, 1.4426727294921875, 1.497589111328125, 1.5525054931640625, 1.607421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 6.0, 3.0, 11.0, 14.0, 21.0, 26.0, 37.0, 80.0, 103.0, 179.0, 338.0, 635.0, 1292.0, 2827.0, 7229.0, 21769.0, 81146.0, 425508.0, 2997040.0, 522910.0, 95006.0, 24379.0, 7778.0, 3017.0, 1384.0, 665.0, 337.0, 202.0, 126.0, 74.0, 42.0, 34.0, 21.0, 10.0, 8.0, 3.0, 3.0, 5.0, 1.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-29.8125, -28.996826171875, -28.18115234375, -27.365478515625, -26.5498046875, -25.734130859375, -24.91845703125, -24.102783203125, -23.287109375, -22.471435546875, -21.65576171875, -20.840087890625, -20.0244140625, -19.208740234375, -18.39306640625, -17.577392578125, -16.76171875, -15.946044921875, -15.13037109375, -14.314697265625, -13.4990234375, -12.683349609375, -11.86767578125, -11.052001953125, -10.236328125, -9.420654296875, -8.60498046875, -7.789306640625, -6.9736328125, -6.157958984375, -5.34228515625, -4.526611328125, -3.7109375, -2.895263671875, -2.07958984375, -1.263916015625, -0.4482421875, 0.367431640625, 1.18310546875, 1.998779296875, 2.814453125, 3.630126953125, 4.44580078125, 5.261474609375, 6.0771484375, 6.892822265625, 7.70849609375, 8.524169921875, 9.33984375, 10.155517578125, 10.97119140625, 11.786865234375, 12.6025390625, 13.418212890625, 14.23388671875, 15.049560546875, 15.865234375, 16.680908203125, 17.49658203125, 18.312255859375, 19.1279296875, 19.943603515625, 20.75927734375, 21.574951171875, 22.390625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 4.0, 6.0, 11.0, 16.0, 23.0, 39.0, 46.0, 62.0, 115.0, 174.0, 297.0, 558.0, 1278.0, 542.0, 301.0, 216.0, 140.0, 80.0, 50.0, 45.0, 13.0, 12.0, 13.0, 12.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.53125, -4.3828125, -4.234375, -4.0859375, -3.9375, -3.7890625, -3.640625, -3.4921875, -3.34375, -3.1953125, -3.046875, -2.8984375, -2.75, -2.6015625, -2.453125, -2.3046875, -2.15625, -2.0078125, -1.859375, -1.7109375, -1.5625, -1.4140625, -1.265625, -1.1171875, -0.96875, -0.8203125, -0.671875, -0.5234375, -0.375, -0.2265625, -0.078125, 0.0703125, 0.21875, 0.3671875, 0.515625, 0.6640625, 0.8125, 0.9609375, 1.109375, 1.2578125, 1.40625, 1.5546875, 1.703125, 1.8515625, 2.0, 2.1484375, 2.296875, 2.4453125, 2.59375, 2.7421875, 2.890625, 3.0390625, 3.1875, 3.3359375, 3.484375, 3.6328125, 3.78125, 3.9296875, 4.078125, 4.2265625, 4.375, 4.5234375, 4.671875, 4.8203125, 4.96875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 13.0, 32.0, 66.0, 167.0, 321.0, 250.0, 95.0, 33.0, 12.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.17215347290039, -51.10664749145508, -49.04114532470703, -46.97563934326172, -44.910133361816406, -42.844627380371094, -40.77912139892578, -38.713619232177734, -36.64811325073242, -34.58260726928711, -32.51710510253906, -30.45159912109375, -28.386093139648438, -26.320587158203125, -24.255083084106445, -22.189579010009766, -20.124073028564453, -18.05856704711914, -15.993062973022461, -13.927557945251465, -11.862052917480469, -9.796547889709473, -7.731042861938477, -5.6655378341674805, -3.6000328063964844, -1.5345277786254883, 0.5309772491455078, 2.596482276916504, 4.6619873046875, 6.727492332458496, 8.792997360229492, 10.858502388000488, 12.924003601074219, 14.989508628845215, 17.05501365661621, 19.12051773071289, 21.186023712158203, 23.251529693603516, 25.317033767700195, 27.382537841796875, 29.448043823242188, 31.5135498046875, 33.57905578613281, 35.64455795288086, 37.71006393432617, 39.775569915771484, 41.84107208251953, 43.906578063964844, 45.972084045410156, 48.03759002685547, 50.10309600830078, 52.16859817504883, 54.23410415649414, 56.29961013793945, 58.3651123046875, 60.43061828613281, 62.496124267578125, 64.56163024902344, 66.62713623046875, 68.69264221191406, 70.75814819335938, 72.82364654541016, 74.88915252685547, 76.95465850830078, 79.0201644897461]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 3.0, 7.0, 4.0, 14.0, 8.0, 19.0, 21.0, 32.0, 40.0, 51.0, 73.0, 57.0, 67.0, 77.0, 70.0, 70.0, 59.0, 69.0, 41.0, 46.0, 34.0, 26.0, 24.0, 21.0, 8.0, 12.0, 4.0, 6.0, 6.0, 5.0, 2.0, 3.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.335447311401367, -18.68726348876953, -18.039077758789062, -17.390893936157227, -16.74271011352539, -16.094524383544922, -15.446340560913086, -14.798155784606934, -14.149971008300781, -13.501786231994629, -12.853601455688477, -12.20541763305664, -11.557232856750488, -10.909048080444336, -10.2608642578125, -9.612679481506348, -8.964494705200195, -8.316309928894043, -7.668125629425049, -7.019941329956055, -6.371756553649902, -5.72357177734375, -5.075387477874756, -4.427203178405762, -3.7790184020996094, -3.130833864212036, -2.482649326324463, -1.8344647884368896, -1.1862802505493164, -0.5380957126617432, 0.11008882522583008, 0.7582731246948242, 1.4064559936523438, 2.054640531539917, 2.7028250694274902, 3.3510096073150635, 3.9991941452026367, 4.647378921508789, 5.295563220977783, 5.943747520446777, 6.59193229675293, 7.240117073059082, 7.888301372528076, 8.53648567199707, 9.184670448303223, 9.832855224609375, 10.481039047241211, 11.129223823547363, 11.777408599853516, 12.425593376159668, 13.07377815246582, 13.721961975097656, 14.370146751403809, 15.018331527709961, 15.666515350341797, 16.314701080322266, 16.9628849029541, 17.611068725585938, 18.259254455566406, 18.907438278198242, 19.555622100830078, 20.203807830810547, 20.851991653442383, 21.50017547607422, 22.148361206054688]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 8.0, 5.0, 14.0, 8.0, 9.0, 31.0, 26.0, 42.0, 52.0, 109.0, 280.0, 1797.0, 17639.0, 307383.0, 673021.0, 43483.0, 3767.0, 553.0, 136.0, 53.0, 29.0, 33.0, 16.0, 15.0, 15.0, 7.0, 7.0, 3.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-45.375, -44.154296875, -42.93359375, -41.712890625, -40.4921875, -39.271484375, -38.05078125, -36.830078125, -35.609375, -34.388671875, -33.16796875, -31.947265625, -30.7265625, -29.505859375, -28.28515625, -27.064453125, -25.84375, -24.623046875, -23.40234375, -22.181640625, -20.9609375, -19.740234375, -18.51953125, -17.298828125, -16.078125, -14.857421875, -13.63671875, -12.416015625, -11.1953125, -9.974609375, -8.75390625, -7.533203125, -6.3125, -5.091796875, -3.87109375, -2.650390625, -1.4296875, -0.208984375, 1.01171875, 2.232421875, 3.453125, 4.673828125, 5.89453125, 7.115234375, 8.3359375, 9.556640625, 10.77734375, 11.998046875, 13.21875, 14.439453125, 15.66015625, 16.880859375, 18.1015625, 19.322265625, 20.54296875, 21.763671875, 22.984375, 24.205078125, 25.42578125, 26.646484375, 27.8671875, 29.087890625, 30.30859375, 31.529296875, 32.75]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 5.0, 11.0, 11.0, 13.0, 33.0, 35.0, 43.0, 47.0, 61.0, 82.0, 78.0, 78.0, 108.0, 80.0, 75.0, 64.0, 61.0, 40.0, 28.0, 18.0, 13.0, 7.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2587890625, -1.2010040283203125, -1.143218994140625, -1.0854339599609375, -1.02764892578125, -0.9698638916015625, -0.912078857421875, -0.8542938232421875, -0.7965087890625, -0.7387237548828125, -0.680938720703125, -0.6231536865234375, -0.56536865234375, -0.5075836181640625, -0.449798583984375, -0.3920135498046875, -0.334228515625, -0.2764434814453125, -0.218658447265625, -0.1608734130859375, -0.10308837890625, -0.0453033447265625, 0.012481689453125, 0.0702667236328125, 0.1280517578125, 0.1858367919921875, 0.243621826171875, 0.3014068603515625, 0.35919189453125, 0.4169769287109375, 0.474761962890625, 0.5325469970703125, 0.59033203125, 0.6481170654296875, 0.705902099609375, 0.7636871337890625, 0.82147216796875, 0.8792572021484375, 0.937042236328125, 0.9948272705078125, 1.0526123046875, 1.1103973388671875, 1.168182373046875, 1.2259674072265625, 1.28375244140625, 1.3415374755859375, 1.399322509765625, 1.4571075439453125, 1.514892578125, 1.5726776123046875, 1.630462646484375, 1.6882476806640625, 1.74603271484375, 1.8038177490234375, 1.861602783203125, 1.9193878173828125, 1.9771728515625, 2.0349578857421875, 2.092742919921875, 2.1505279541015625, 2.20831298828125, 2.2660980224609375, 2.323883056640625, 2.3816680908203125, 2.439453125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 6.0, 16.0, 20.0, 27.0, 74.0, 175.0, 293.0, 718.0, 1884.0, 5455.0, 18714.0, 80539.0, 373433.0, 436505.0, 99056.0, 21930.0, 6202.0, 2083.0, 716.0, 345.0, 155.0, 84.0, 33.0, 33.0, 14.0, 5.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1171875, -11.6695556640625, -11.221923828125, -10.7742919921875, -10.32666015625, -9.8790283203125, -9.431396484375, -8.9837646484375, -8.5361328125, -8.0885009765625, -7.640869140625, -7.1932373046875, -6.74560546875, -6.2979736328125, -5.850341796875, -5.4027099609375, -4.955078125, -4.5074462890625, -4.059814453125, -3.6121826171875, -3.16455078125, -2.7169189453125, -2.269287109375, -1.8216552734375, -1.3740234375, -0.9263916015625, -0.478759765625, -0.0311279296875, 0.41650390625, 0.8641357421875, 1.311767578125, 1.7593994140625, 2.20703125, 2.6546630859375, 3.102294921875, 3.5499267578125, 3.99755859375, 4.4451904296875, 4.892822265625, 5.3404541015625, 5.7880859375, 6.2357177734375, 6.683349609375, 7.1309814453125, 7.57861328125, 8.0262451171875, 8.473876953125, 8.9215087890625, 9.369140625, 9.8167724609375, 10.264404296875, 10.7120361328125, 11.15966796875, 11.6072998046875, 12.054931640625, 12.5025634765625, 12.9501953125, 13.3978271484375, 13.845458984375, 14.2930908203125, 14.74072265625, 15.1883544921875, 15.635986328125, 16.0836181640625, 16.53125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 9.0, 4.0, 8.0, 13.0, 14.0, 8.0, 18.0, 26.0, 24.0, 29.0, 30.0, 39.0, 38.0, 39.0, 40.0, 50.0, 34.0, 51.0, 57.0, 51.0, 39.0, 38.0, 52.0, 44.0, 31.0, 25.0, 42.0, 30.0, 20.0, 19.0, 20.0, 9.0, 15.0, 11.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.109375, -5.9085693359375, -5.707763671875, -5.5069580078125, -5.30615234375, -5.1053466796875, -4.904541015625, -4.7037353515625, -4.5029296875, -4.3021240234375, -4.101318359375, -3.9005126953125, -3.69970703125, -3.4989013671875, -3.298095703125, -3.0972900390625, -2.896484375, -2.6956787109375, -2.494873046875, -2.2940673828125, -2.09326171875, -1.8924560546875, -1.691650390625, -1.4908447265625, -1.2900390625, -1.0892333984375, -0.888427734375, -0.6876220703125, -0.48681640625, -0.2860107421875, -0.085205078125, 0.1156005859375, 0.31640625, 0.5172119140625, 0.718017578125, 0.9188232421875, 1.11962890625, 1.3204345703125, 1.521240234375, 1.7220458984375, 1.9228515625, 2.1236572265625, 2.324462890625, 2.5252685546875, 2.72607421875, 2.9268798828125, 3.127685546875, 3.3284912109375, 3.529296875, 3.7301025390625, 3.930908203125, 4.1317138671875, 4.33251953125, 4.5333251953125, 4.734130859375, 4.9349365234375, 5.1357421875, 5.3365478515625, 5.537353515625, 5.7381591796875, 5.93896484375, 6.1397705078125, 6.340576171875, 6.5413818359375, 6.7421875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 10.0, 18.0, 28.0, 47.0, 89.0, 229.0, 420.0, 1258.0, 4130.0, 19607.0, 198796.0, 728111.0, 80707.0, 10904.0, 2689.0, 889.0, 312.0, 151.0, 84.0, 32.0, 16.0, 10.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.0625, -36.165771484375, -35.26904296875, -34.372314453125, -33.4755859375, -32.578857421875, -31.68212890625, -30.785400390625, -29.888671875, -28.991943359375, -28.09521484375, -27.198486328125, -26.3017578125, -25.405029296875, -24.50830078125, -23.611572265625, -22.71484375, -21.818115234375, -20.92138671875, -20.024658203125, -19.1279296875, -18.231201171875, -17.33447265625, -16.437744140625, -15.541015625, -14.644287109375, -13.74755859375, -12.850830078125, -11.9541015625, -11.057373046875, -10.16064453125, -9.263916015625, -8.3671875, -7.470458984375, -6.57373046875, -5.677001953125, -4.7802734375, -3.883544921875, -2.98681640625, -2.090087890625, -1.193359375, -0.296630859375, 0.60009765625, 1.496826171875, 2.3935546875, 3.290283203125, 4.18701171875, 5.083740234375, 5.98046875, 6.877197265625, 7.77392578125, 8.670654296875, 9.5673828125, 10.464111328125, 11.36083984375, 12.257568359375, 13.154296875, 14.051025390625, 14.94775390625, 15.844482421875, 16.7412109375, 17.637939453125, 18.53466796875, 19.431396484375, 20.328125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 5.0, 9.0, 6.0, 21.0, 11.0, 16.0, 30.0, 28.0, 33.0, 41.0, 55.0, 49.0, 70.0, 63.0, 98.0, 63.0, 78.0, 56.0, 51.0, 47.0, 24.0, 27.0, 16.0, 20.0, 13.0, 10.0, 6.0, 5.0, 6.0, 6.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.0007228851318359375, -0.0007006004452705383, -0.0006783157587051392, -0.00065603107213974, -0.0006337463855743408, -0.0006114616990089417, -0.0005891770124435425, -0.0005668923258781433, -0.0005446076393127441, -0.000522322952747345, -0.0005000382661819458, -0.00047775357961654663, -0.00045546889305114746, -0.0004331842064857483, -0.0004108995199203491, -0.00038861483335494995, -0.0003663301467895508, -0.0003440454602241516, -0.00032176077365875244, -0.00029947608709335327, -0.0002771914005279541, -0.00025490671396255493, -0.00023262202739715576, -0.0002103373408317566, -0.00018805265426635742, -0.00016576796770095825, -0.00014348328113555908, -0.00012119859457015991, -9.891390800476074e-05, -7.662922143936157e-05, -5.43445348739624e-05, -3.205984830856323e-05, -9.775161743164062e-06, 1.2509524822235107e-05, 3.479421138763428e-05, 5.707889795303345e-05, 7.936358451843262e-05, 0.00010164827108383179, 0.00012393295764923096, 0.00014621764421463013, 0.0001685023307800293, 0.00019078701734542847, 0.00021307170391082764, 0.0002353563904762268, 0.000257641077041626, 0.00027992576360702515, 0.0003022104501724243, 0.0003244951367378235, 0.00034677982330322266, 0.0003690645098686218, 0.000391349196434021, 0.00041363388299942017, 0.00043591856956481934, 0.0004582032561302185, 0.0004804879426956177, 0.0005027726292610168, 0.000525057315826416, 0.0005473420023918152, 0.0005696266889572144, 0.0005919113755226135, 0.0006141960620880127, 0.0006364807486534119, 0.000658765435218811, 0.0006810501217842102, 0.0007033348083496094]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 10.0, 14.0, 17.0, 27.0, 31.0, 55.0, 79.0, 104.0, 189.0, 306.0, 518.0, 959.0, 1824.0, 3751.0, 8369.0, 21800.0, 64982.0, 217440.0, 424899.0, 204985.0, 61878.0, 20578.0, 8171.0, 3521.0, 1791.0, 925.0, 511.0, 307.0, 183.0, 114.0, 61.0, 37.0, 26.0, 29.0, 16.0, 13.0, 7.0, 4.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.4375, -14.041748046875, -13.64599609375, -13.250244140625, -12.8544921875, -12.458740234375, -12.06298828125, -11.667236328125, -11.271484375, -10.875732421875, -10.47998046875, -10.084228515625, -9.6884765625, -9.292724609375, -8.89697265625, -8.501220703125, -8.10546875, -7.709716796875, -7.31396484375, -6.918212890625, -6.5224609375, -6.126708984375, -5.73095703125, -5.335205078125, -4.939453125, -4.543701171875, -4.14794921875, -3.752197265625, -3.3564453125, -2.960693359375, -2.56494140625, -2.169189453125, -1.7734375, -1.377685546875, -0.98193359375, -0.586181640625, -0.1904296875, 0.205322265625, 0.60107421875, 0.996826171875, 1.392578125, 1.788330078125, 2.18408203125, 2.579833984375, 2.9755859375, 3.371337890625, 3.76708984375, 4.162841796875, 4.55859375, 4.954345703125, 5.35009765625, 5.745849609375, 6.1416015625, 6.537353515625, 6.93310546875, 7.328857421875, 7.724609375, 8.120361328125, 8.51611328125, 8.911865234375, 9.3076171875, 9.703369140625, 10.09912109375, 10.494873046875, 10.890625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 2.0, 6.0, 11.0, 14.0, 20.0, 24.0, 32.0, 51.0, 77.0, 70.0, 78.0, 84.0, 91.0, 78.0, 75.0, 77.0, 45.0, 47.0, 33.0, 17.0, 14.0, 13.0, 10.0, 9.0, 5.0, 4.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0], "bins": [-10.84375, -10.60003662109375, -10.3563232421875, -10.11260986328125, -9.868896484375, -9.62518310546875, -9.3814697265625, -9.13775634765625, -8.89404296875, -8.65032958984375, -8.4066162109375, -8.16290283203125, -7.919189453125, -7.67547607421875, -7.4317626953125, -7.18804931640625, -6.9443359375, -6.70062255859375, -6.4569091796875, -6.21319580078125, -5.969482421875, -5.72576904296875, -5.4820556640625, -5.23834228515625, -4.99462890625, -4.75091552734375, -4.5072021484375, -4.26348876953125, -4.019775390625, -3.77606201171875, -3.5323486328125, -3.28863525390625, -3.044921875, -2.80120849609375, -2.5574951171875, -2.31378173828125, -2.070068359375, -1.82635498046875, -1.5826416015625, -1.33892822265625, -1.09521484375, -0.85150146484375, -0.6077880859375, -0.36407470703125, -0.120361328125, 0.12335205078125, 0.3670654296875, 0.61077880859375, 0.8544921875, 1.09820556640625, 1.3419189453125, 1.58563232421875, 1.829345703125, 2.07305908203125, 2.3167724609375, 2.56048583984375, 2.80419921875, 3.04791259765625, 3.2916259765625, 3.53533935546875, 3.779052734375, 4.02276611328125, 4.2664794921875, 4.51019287109375, 4.75390625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 1.0, 2.0, 4.0, 10.0, 21.0, 34.0, 64.0, 113.0, 176.0, 219.0, 170.0, 86.0, 45.0, 24.0, 13.0, 2.0, 2.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-116.05673217773438, -112.68064880371094, -109.30457305908203, -105.9284896850586, -102.55241394042969, -99.17633056640625, -95.80024719238281, -92.4241714477539, -89.04808807373047, -85.67200469970703, -82.29592895507812, -78.91984558105469, -75.54376983642578, -72.16768646240234, -68.79161071777344, -65.41552734375, -62.03944778442383, -58.663368225097656, -55.287288665771484, -51.91120910644531, -48.535125732421875, -45.1590461730957, -41.78296661376953, -38.406883239746094, -35.03080749511719, -31.654727935791016, -28.27864646911621, -24.90256690979004, -21.526485443115234, -18.150405883789062, -14.77432632446289, -11.398244857788086, -8.022163391113281, -4.646082878112793, -1.270002841949463, 2.106077194213867, 5.4821577072143555, 8.858238220214844, 12.234317779541016, 15.61039924621582, 18.986478805541992, 22.362558364868164, 25.73863983154297, 29.11471939086914, 32.49079895019531, 35.86688232421875, 39.242958068847656, 42.619041442871094, 45.995121002197266, 49.37120056152344, 52.74728012084961, 56.12335968017578, 59.49944305419922, 62.87552261352539, 66.25160217285156, 69.627685546875, 73.0037612915039, 76.37984466552734, 79.75592041015625, 83.13200378417969, 86.5080795288086, 89.88416290283203, 93.26023864746094, 96.63632202148438, 100.01240539550781]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 7.0, 6.0, 8.0, 7.0, 9.0, 13.0, 14.0, 19.0, 30.0, 38.0, 44.0, 46.0, 53.0, 77.0, 75.0, 68.0, 74.0, 73.0, 64.0, 58.0, 42.0, 44.0, 33.0, 24.0, 15.0, 13.0, 9.0, 2.0, 3.0, 5.0, 1.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.847251892089844, -42.85832214355469, -40.86939239501953, -38.88045883178711, -36.89152908325195, -34.9025993347168, -32.91366958618164, -30.92473793029785, -28.935806274414062, -26.946876525878906, -24.957944869995117, -22.96901512145996, -20.980083465576172, -18.991153717041016, -17.00222396850586, -15.01329231262207, -13.024362564086914, -11.035431861877441, -9.046501159667969, -7.057570934295654, -5.068640232086182, -3.079710006713867, -1.0907793045043945, 0.8981513977050781, 2.887082099914551, 4.876012802124023, 6.864943504333496, 8.853874206542969, 10.842803955078125, 12.831734657287598, 14.82066535949707, 16.80959701538086, 18.798526763916016, 20.787456512451172, 22.77638816833496, 24.765317916870117, 26.754249572753906, 28.743179321289062, 30.73210906982422, 32.721038818359375, 34.7099723815918, 36.69890213012695, 38.68783187866211, 40.67676544189453, 42.66569519042969, 44.654624938964844, 46.6435546875, 48.632484436035156, 50.62141418457031, 52.61034393310547, 54.599273681640625, 56.58820724487305, 58.5771369934082, 60.56606674194336, 62.554996490478516, 64.54393005371094, 66.5328598022461, 68.52178955078125, 70.5107192993164, 72.49964904785156, 74.48857879638672, 76.47750854492188, 78.46644592285156, 80.45537567138672, 82.44430541992188]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 7.0, 15.0, 41.0, 68.0, 131.0, 278.0, 586.0, 1390.0, 3717.0, 10570.0, 40658.0, 568541.0, 3484132.0, 62766.0, 14216.0, 4346.0, 1523.0, 619.0, 273.0, 135.0, 73.0, 39.0, 29.0, 25.0, 19.0, 12.0, 16.0, 6.0, 8.0, 8.0, 10.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.203125, -28.623779296875, -27.04443359375, -25.465087890625, -23.8857421875, -22.306396484375, -20.72705078125, -19.147705078125, -17.568359375, -15.989013671875, -14.40966796875, -12.830322265625, -11.2509765625, -9.671630859375, -8.09228515625, -6.512939453125, -4.93359375, -3.354248046875, -1.77490234375, -0.195556640625, 1.3837890625, 2.963134765625, 4.54248046875, 6.121826171875, 7.701171875, 9.280517578125, 10.85986328125, 12.439208984375, 14.0185546875, 15.597900390625, 17.17724609375, 18.756591796875, 20.3359375, 21.915283203125, 23.49462890625, 25.073974609375, 26.6533203125, 28.232666015625, 29.81201171875, 31.391357421875, 32.970703125, 34.550048828125, 36.12939453125, 37.708740234375, 39.2880859375, 40.867431640625, 42.44677734375, 44.026123046875, 45.60546875, 47.184814453125, 48.76416015625, 50.343505859375, 51.9228515625, 53.502197265625, 55.08154296875, 56.660888671875, 58.240234375, 59.819580078125, 61.39892578125, 62.978271484375, 64.5576171875, 66.136962890625, 67.71630859375, 69.295654296875, 70.875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 11.0, 14.0, 11.0, 14.0, 18.0, 12.0, 37.0, 54.0, 44.0, 47.0, 52.0, 92.0, 72.0, 73.0, 64.0, 67.0, 54.0, 51.0, 48.0, 42.0, 34.0, 23.0, 15.0, 12.0, 11.0, 7.0, 6.0, 4.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4921875, -1.4427642822265625, -1.393341064453125, -1.3439178466796875, -1.29449462890625, -1.2450714111328125, -1.195648193359375, -1.1462249755859375, -1.0968017578125, -1.0473785400390625, -0.997955322265625, -0.9485321044921875, -0.89910888671875, -0.8496856689453125, -0.800262451171875, -0.7508392333984375, -0.701416015625, -0.6519927978515625, -0.602569580078125, -0.5531463623046875, -0.50372314453125, -0.4542999267578125, -0.404876708984375, -0.3554534912109375, -0.3060302734375, -0.2566070556640625, -0.207183837890625, -0.1577606201171875, -0.10833740234375, -0.0589141845703125, -0.009490966796875, 0.0399322509765625, 0.08935546875, 0.1387786865234375, 0.188201904296875, 0.2376251220703125, 0.28704833984375, 0.3364715576171875, 0.385894775390625, 0.4353179931640625, 0.4847412109375, 0.5341644287109375, 0.583587646484375, 0.6330108642578125, 0.68243408203125, 0.7318572998046875, 0.781280517578125, 0.8307037353515625, 0.880126953125, 0.9295501708984375, 0.978973388671875, 1.0283966064453125, 1.07781982421875, 1.1272430419921875, 1.176666259765625, 1.2260894775390625, 1.2755126953125, 1.3249359130859375, 1.374359130859375, 1.4237823486328125, 1.47320556640625, 1.5226287841796875, 1.572052001953125, 1.6214752197265625, 1.6708984375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 0.0, 2.0, 4.0, 17.0, 11.0, 22.0, 36.0, 52.0, 72.0, 100.0, 206.0, 346.0, 820.0, 2163.0, 6472.0, 23386.0, 120471.0, 2937008.0, 998626.0, 79762.0, 16779.0, 4796.0, 1690.0, 667.0, 341.0, 152.0, 84.0, 61.0, 42.0, 22.0, 27.0, 9.0, 9.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-29.796875, -28.688720703125, -27.58056640625, -26.472412109375, -25.3642578125, -24.256103515625, -23.14794921875, -22.039794921875, -20.931640625, -19.823486328125, -18.71533203125, -17.607177734375, -16.4990234375, -15.390869140625, -14.28271484375, -13.174560546875, -12.06640625, -10.958251953125, -9.85009765625, -8.741943359375, -7.6337890625, -6.525634765625, -5.41748046875, -4.309326171875, -3.201171875, -2.093017578125, -0.98486328125, 0.123291015625, 1.2314453125, 2.339599609375, 3.44775390625, 4.555908203125, 5.6640625, 6.772216796875, 7.88037109375, 8.988525390625, 10.0966796875, 11.204833984375, 12.31298828125, 13.421142578125, 14.529296875, 15.637451171875, 16.74560546875, 17.853759765625, 18.9619140625, 20.070068359375, 21.17822265625, 22.286376953125, 23.39453125, 24.502685546875, 25.61083984375, 26.718994140625, 27.8271484375, 28.935302734375, 30.04345703125, 31.151611328125, 32.259765625, 33.367919921875, 34.47607421875, 35.584228515625, 36.6923828125, 37.800537109375, 38.90869140625, 40.016845703125, 41.125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 8.0, 6.0, 9.0, 9.0, 7.0, 18.0, 30.0, 29.0, 42.0, 47.0, 98.0, 140.0, 200.0, 318.0, 703.0, 1172.0, 460.0, 261.0, 141.0, 91.0, 67.0, 40.0, 37.0, 27.0, 20.0, 17.0, 23.0, 10.0, 8.0, 9.0, 6.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.0546875, -3.94549560546875, -3.8363037109375, -3.72711181640625, -3.617919921875, -3.50872802734375, -3.3995361328125, -3.29034423828125, -3.18115234375, -3.07196044921875, -2.9627685546875, -2.85357666015625, -2.744384765625, -2.63519287109375, -2.5260009765625, -2.41680908203125, -2.3076171875, -2.19842529296875, -2.0892333984375, -1.98004150390625, -1.870849609375, -1.76165771484375, -1.6524658203125, -1.54327392578125, -1.43408203125, -1.32489013671875, -1.2156982421875, -1.10650634765625, -0.997314453125, -0.88812255859375, -0.7789306640625, -0.66973876953125, -0.560546875, -0.45135498046875, -0.3421630859375, -0.23297119140625, -0.123779296875, -0.01458740234375, 0.0946044921875, 0.20379638671875, 0.31298828125, 0.42218017578125, 0.5313720703125, 0.64056396484375, 0.749755859375, 0.85894775390625, 0.9681396484375, 1.07733154296875, 1.1865234375, 1.29571533203125, 1.4049072265625, 1.51409912109375, 1.623291015625, 1.73248291015625, 1.8416748046875, 1.95086669921875, 2.06005859375, 2.16925048828125, 2.2784423828125, 2.38763427734375, 2.496826171875, 2.60601806640625, 2.7152099609375, 2.82440185546875, 2.93359375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 5.0, 16.0, 30.0, 41.0, 68.0, 107.0, 161.0, 162.0, 159.0, 97.0, 63.0, 36.0, 16.0, 19.0, 10.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.286975860595703, -18.184234619140625, -17.081491470336914, -15.978750228881836, -14.876008033752441, -13.773265838623047, -12.670524597167969, -11.567782402038574, -10.46504020690918, -9.362298011779785, -8.25955581665039, -7.1568145751953125, -6.054072380065918, -4.951330184936523, -3.848588466644287, -2.745846748352051, -1.6431045532226562, -0.5403625965118408, 0.5623793601989746, 1.66512131690979, 2.7678632736206055, 3.87060546875, 4.973347187042236, 6.076088905334473, 7.178831100463867, 8.281573295593262, 9.384315490722656, 10.487056732177734, 11.589798927307129, 12.692541122436523, 13.795282363891602, 14.898024559020996, 16.000762939453125, 17.103504180908203, 18.206247329711914, 19.308988571166992, 20.411731719970703, 21.51447296142578, 22.61721420288086, 23.719955444335938, 24.82269859313965, 25.925439834594727, 27.028182983398438, 28.130924224853516, 29.233665466308594, 30.336408615112305, 31.439149856567383, 32.541893005371094, 33.64463424682617, 34.74737548828125, 35.85011672973633, 36.95286178588867, 38.05560302734375, 39.15834426879883, 40.261085510253906, 41.363826751708984, 42.46656799316406, 43.56930923461914, 44.67205047607422, 45.77479553222656, 46.87753677368164, 47.98027801513672, 49.0830192565918, 50.185760498046875, 51.28850555419922]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 12.0, 13.0, 15.0, 25.0, 27.0, 45.0, 39.0, 37.0, 60.0, 90.0, 82.0, 76.0, 94.0, 77.0, 67.0, 44.0, 43.0, 34.0, 32.0, 20.0, 20.0, 14.0, 9.0, 8.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.44953155517578, -22.775856018066406, -22.1021785736084, -21.428503036499023, -20.754825592041016, -20.08115005493164, -19.407474517822266, -18.73379898071289, -18.060121536254883, -17.386445999145508, -16.7127685546875, -16.039093017578125, -15.365416526794434, -14.691740036010742, -14.018064498901367, -13.344388008117676, -12.670711517333984, -11.997035026550293, -11.323358535766602, -10.649682998657227, -9.976006507873535, -9.302330017089844, -8.628654479980469, -7.954977989196777, -7.281301498413086, -6.6076250076293945, -5.933948993682861, -5.260272979736328, -4.586596488952637, -3.9129202365875244, -3.239243984222412, -2.565567970275879, -1.8918914794921875, -1.2182152271270752, -0.5445389747619629, 0.12913727760314941, 0.8028135299682617, 1.476489782333374, 2.1501660346984863, 2.8238420486450195, 3.497518539428711, 4.171195030212402, 4.8448710441589355, 5.518547058105469, 6.19222354888916, 6.865900039672852, 7.539576053619385, 8.213252067565918, 8.88692855834961, 9.5606050491333, 10.234281539916992, 10.907957077026367, 11.581633567810059, 12.25531005859375, 12.928985595703125, 13.602662086486816, 14.276338577270508, 14.9500150680542, 15.62369155883789, 16.297367095947266, 16.97104263305664, 17.64472007751465, 18.318395614624023, 18.99207305908203, 19.665748596191406]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 7.0, 12.0, 10.0, 26.0, 30.0, 51.0, 86.0, 114.0, 226.0, 419.0, 742.0, 1590.0, 3302.0, 7652.0, 17321.0, 42701.0, 106163.0, 238174.0, 314821.0, 183482.0, 77032.0, 30896.0, 12853.0, 5557.0, 2607.0, 1202.0, 665.0, 341.0, 175.0, 106.0, 62.0, 47.0, 22.0, 18.0, 14.0, 10.0, 5.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.6015625, -12.223388671875, -11.84521484375, -11.467041015625, -11.0888671875, -10.710693359375, -10.33251953125, -9.954345703125, -9.576171875, -9.197998046875, -8.81982421875, -8.441650390625, -8.0634765625, -7.685302734375, -7.30712890625, -6.928955078125, -6.55078125, -6.172607421875, -5.79443359375, -5.416259765625, -5.0380859375, -4.659912109375, -4.28173828125, -3.903564453125, -3.525390625, -3.147216796875, -2.76904296875, -2.390869140625, -2.0126953125, -1.634521484375, -1.25634765625, -0.878173828125, -0.5, -0.121826171875, 0.25634765625, 0.634521484375, 1.0126953125, 1.390869140625, 1.76904296875, 2.147216796875, 2.525390625, 2.903564453125, 3.28173828125, 3.659912109375, 4.0380859375, 4.416259765625, 4.79443359375, 5.172607421875, 5.55078125, 5.928955078125, 6.30712890625, 6.685302734375, 7.0634765625, 7.441650390625, 7.81982421875, 8.197998046875, 8.576171875, 8.954345703125, 9.33251953125, 9.710693359375, 10.0888671875, 10.467041015625, 10.84521484375, 11.223388671875, 11.6015625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 4.0, 5.0, 10.0, 8.0, 11.0, 14.0, 17.0, 15.0, 21.0, 24.0, 36.0, 33.0, 43.0, 53.0, 50.0, 59.0, 74.0, 75.0, 66.0, 62.0, 55.0, 48.0, 44.0, 40.0, 35.0, 24.0, 23.0, 20.0, 14.0, 6.0, 8.0, 4.0, 4.0, 4.0, 1.0, 0.0, 3.0], "bins": [-1.830078125, -1.7885208129882812, -1.7469635009765625, -1.7054061889648438, -1.663848876953125, -1.6222915649414062, -1.5807342529296875, -1.5391769409179688, -1.49761962890625, -1.4560623168945312, -1.4145050048828125, -1.3729476928710938, -1.331390380859375, -1.2898330688476562, -1.2482757568359375, -1.2067184448242188, -1.1651611328125, -1.1236038208007812, -1.0820465087890625, -1.0404891967773438, -0.998931884765625, -0.9573745727539062, -0.9158172607421875, -0.8742599487304688, -0.83270263671875, -0.7911453247070312, -0.7495880126953125, -0.7080307006835938, -0.666473388671875, -0.6249160766601562, -0.5833587646484375, -0.5418014526367188, -0.500244140625, -0.45868682861328125, -0.4171295166015625, -0.37557220458984375, -0.334014892578125, -0.29245758056640625, -0.2509002685546875, -0.20934295654296875, -0.16778564453125, -0.12622833251953125, -0.0846710205078125, -0.04311370849609375, -0.001556396484375, 0.04000091552734375, 0.0815582275390625, 0.12311553955078125, 0.1646728515625, 0.20623016357421875, 0.2477874755859375, 0.28934478759765625, 0.330902099609375, 0.37245941162109375, 0.4140167236328125, 0.45557403564453125, 0.49713134765625, 0.5386886596679688, 0.5802459716796875, 0.6218032836914062, 0.663360595703125, 0.7049179077148438, 0.7464752197265625, 0.7880325317382812, 0.82958984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 6.0, 8.0, 11.0, 9.0, 18.0, 21.0, 26.0, 44.0, 58.0, 79.0, 106.0, 146.0, 163.0, 246.0, 324.0, 496.0, 798.0, 1311.0, 2794.0, 6703.0, 18423.0, 53402.0, 158667.0, 337764.0, 289079.0, 115973.0, 37978.0, 13157.0, 5060.0, 2246.0, 1141.0, 684.0, 437.0, 305.0, 222.0, 182.0, 121.0, 90.0, 68.0, 55.0, 40.0, 17.0, 26.0, 13.0, 12.0, 10.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.8671875, -13.45751953125, -13.0478515625, -12.63818359375, -12.228515625, -11.81884765625, -11.4091796875, -10.99951171875, -10.58984375, -10.18017578125, -9.7705078125, -9.36083984375, -8.951171875, -8.54150390625, -8.1318359375, -7.72216796875, -7.3125, -6.90283203125, -6.4931640625, -6.08349609375, -5.673828125, -5.26416015625, -4.8544921875, -4.44482421875, -4.03515625, -3.62548828125, -3.2158203125, -2.80615234375, -2.396484375, -1.98681640625, -1.5771484375, -1.16748046875, -0.7578125, -0.34814453125, 0.0615234375, 0.47119140625, 0.880859375, 1.29052734375, 1.7001953125, 2.10986328125, 2.51953125, 2.92919921875, 3.3388671875, 3.74853515625, 4.158203125, 4.56787109375, 4.9775390625, 5.38720703125, 5.796875, 6.20654296875, 6.6162109375, 7.02587890625, 7.435546875, 7.84521484375, 8.2548828125, 8.66455078125, 9.07421875, 9.48388671875, 9.8935546875, 10.30322265625, 10.712890625, 11.12255859375, 11.5322265625, 11.94189453125, 12.3515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 5.0, 4.0, 11.0, 5.0, 7.0, 12.0, 12.0, 15.0, 16.0, 22.0, 22.0, 24.0, 30.0, 26.0, 36.0, 35.0, 32.0, 46.0, 41.0, 41.0, 41.0, 42.0, 33.0, 34.0, 49.0, 39.0, 39.0, 39.0, 28.0, 30.0, 24.0, 22.0, 15.0, 19.0, 21.0, 20.0, 11.0, 13.0, 9.0, 4.0, 8.0, 7.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8046875, -5.615234375, -5.42578125, -5.236328125, -5.046875, -4.857421875, -4.66796875, -4.478515625, -4.2890625, -4.099609375, -3.91015625, -3.720703125, -3.53125, -3.341796875, -3.15234375, -2.962890625, -2.7734375, -2.583984375, -2.39453125, -2.205078125, -2.015625, -1.826171875, -1.63671875, -1.447265625, -1.2578125, -1.068359375, -0.87890625, -0.689453125, -0.5, -0.310546875, -0.12109375, 0.068359375, 0.2578125, 0.447265625, 0.63671875, 0.826171875, 1.015625, 1.205078125, 1.39453125, 1.583984375, 1.7734375, 1.962890625, 2.15234375, 2.341796875, 2.53125, 2.720703125, 2.91015625, 3.099609375, 3.2890625, 3.478515625, 3.66796875, 3.857421875, 4.046875, 4.236328125, 4.42578125, 4.615234375, 4.8046875, 4.994140625, 5.18359375, 5.373046875, 5.5625, 5.751953125, 5.94140625, 6.130859375, 6.3203125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 8.0, 10.0, 6.0, 20.0, 33.0, 38.0, 68.0, 107.0, 187.0, 277.0, 592.0, 1269.0, 3362.0, 10131.0, 37018.0, 174068.0, 520893.0, 232276.0, 48684.0, 12539.0, 3917.0, 1553.0, 615.0, 388.0, 180.0, 96.0, 81.0, 41.0, 23.0, 27.0, 12.0, 13.0, 9.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.546875, -19.896484375, -19.24609375, -18.595703125, -17.9453125, -17.294921875, -16.64453125, -15.994140625, -15.34375, -14.693359375, -14.04296875, -13.392578125, -12.7421875, -12.091796875, -11.44140625, -10.791015625, -10.140625, -9.490234375, -8.83984375, -8.189453125, -7.5390625, -6.888671875, -6.23828125, -5.587890625, -4.9375, -4.287109375, -3.63671875, -2.986328125, -2.3359375, -1.685546875, -1.03515625, -0.384765625, 0.265625, 0.916015625, 1.56640625, 2.216796875, 2.8671875, 3.517578125, 4.16796875, 4.818359375, 5.46875, 6.119140625, 6.76953125, 7.419921875, 8.0703125, 8.720703125, 9.37109375, 10.021484375, 10.671875, 11.322265625, 11.97265625, 12.623046875, 13.2734375, 13.923828125, 14.57421875, 15.224609375, 15.875, 16.525390625, 17.17578125, 17.826171875, 18.4765625, 19.126953125, 19.77734375, 20.427734375, 21.078125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 10.0, 3.0, 4.0, 11.0, 10.0, 12.0, 21.0, 22.0, 31.0, 31.0, 43.0, 60.0, 68.0, 84.0, 72.0, 79.0, 88.0, 60.0, 52.0, 47.0, 38.0, 24.0, 22.0, 27.0, 22.0, 13.0, 17.0, 10.0, 7.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014448165893554688, -0.0014014095067977905, -0.0013580024242401123, -0.001314595341682434, -0.0012711882591247559, -0.0012277811765670776, -0.0011843740940093994, -0.0011409670114517212, -0.001097559928894043, -0.0010541528463363647, -0.0010107457637786865, -0.0009673386812210083, -0.0009239315986633301, -0.0008805245161056519, -0.0008371174335479736, -0.0007937103509902954, -0.0007503032684326172, -0.000706896185874939, -0.0006634891033172607, -0.0006200820207595825, -0.0005766749382019043, -0.0005332678556442261, -0.0004898607730865479, -0.00044645369052886963, -0.0004030466079711914, -0.0003596395254135132, -0.00031623244285583496, -0.00027282536029815674, -0.00022941827774047852, -0.0001860111951828003, -0.00014260411262512207, -9.919703006744385e-05, -5.5789947509765625e-05, -1.2382864952087402e-05, 3.102421760559082e-05, 7.443130016326904e-05, 0.00011783838272094727, 0.0001612454652786255, 0.0002046525478363037, 0.00024805963039398193, 0.00029146671295166016, 0.0003348737955093384, 0.0003782808780670166, 0.0004216879606246948, 0.00046509504318237305, 0.0005085021257400513, 0.0005519092082977295, 0.0005953162908554077, 0.0006387233734130859, 0.0006821304559707642, 0.0007255375385284424, 0.0007689446210861206, 0.0008123517036437988, 0.000855758786201477, 0.0008991658687591553, 0.0009425729513168335, 0.0009859800338745117, 0.00102938711643219, 0.0010727941989898682, 0.0011162012815475464, 0.0011596083641052246, 0.0012030154466629028, 0.001246422529220581, 0.0012898296117782593, 0.0013332366943359375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 9.0, 4.0, 10.0, 12.0, 32.0, 38.0, 62.0, 97.0, 186.0, 331.0, 643.0, 1272.0, 3150.0, 8796.0, 33634.0, 188015.0, 582798.0, 181612.0, 33354.0, 8720.0, 3091.0, 1332.0, 605.0, 322.0, 162.0, 109.0, 50.0, 31.0, 28.0, 20.0, 6.0, 9.0, 5.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-27.734375, -26.952880859375, -26.17138671875, -25.389892578125, -24.6083984375, -23.826904296875, -23.04541015625, -22.263916015625, -21.482421875, -20.700927734375, -19.91943359375, -19.137939453125, -18.3564453125, -17.574951171875, -16.79345703125, -16.011962890625, -15.23046875, -14.448974609375, -13.66748046875, -12.885986328125, -12.1044921875, -11.322998046875, -10.54150390625, -9.760009765625, -8.978515625, -8.197021484375, -7.41552734375, -6.634033203125, -5.8525390625, -5.071044921875, -4.28955078125, -3.508056640625, -2.7265625, -1.945068359375, -1.16357421875, -0.382080078125, 0.3994140625, 1.180908203125, 1.96240234375, 2.743896484375, 3.525390625, 4.306884765625, 5.08837890625, 5.869873046875, 6.6513671875, 7.432861328125, 8.21435546875, 8.995849609375, 9.77734375, 10.558837890625, 11.34033203125, 12.121826171875, 12.9033203125, 13.684814453125, 14.46630859375, 15.247802734375, 16.029296875, 16.810791015625, 17.59228515625, 18.373779296875, 19.1552734375, 19.936767578125, 20.71826171875, 21.499755859375, 22.28125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 2.0, 4.0, 7.0, 7.0, 14.0, 14.0, 17.0, 25.0, 31.0, 43.0, 62.0, 74.0, 63.0, 84.0, 98.0, 83.0, 75.0, 56.0, 64.0, 31.0, 27.0, 28.0, 28.0, 20.0, 11.0, 7.0, 6.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-11.9609375, -11.6561279296875, -11.351318359375, -11.0465087890625, -10.74169921875, -10.4368896484375, -10.132080078125, -9.8272705078125, -9.5224609375, -9.2176513671875, -8.912841796875, -8.6080322265625, -8.30322265625, -7.9984130859375, -7.693603515625, -7.3887939453125, -7.083984375, -6.7791748046875, -6.474365234375, -6.1695556640625, -5.86474609375, -5.5599365234375, -5.255126953125, -4.9503173828125, -4.6455078125, -4.3406982421875, -4.035888671875, -3.7310791015625, -3.42626953125, -3.1214599609375, -2.816650390625, -2.5118408203125, -2.20703125, -1.9022216796875, -1.597412109375, -1.2926025390625, -0.98779296875, -0.6829833984375, -0.378173828125, -0.0733642578125, 0.2314453125, 0.5362548828125, 0.841064453125, 1.1458740234375, 1.45068359375, 1.7554931640625, 2.060302734375, 2.3651123046875, 2.669921875, 2.9747314453125, 3.279541015625, 3.5843505859375, 3.88916015625, 4.1939697265625, 4.498779296875, 4.8035888671875, 5.1083984375, 5.4132080078125, 5.718017578125, 6.0228271484375, 6.32763671875, 6.6324462890625, 6.937255859375, 7.2420654296875, 7.546875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 8.0, 24.0, 29.0, 67.0, 140.0, 201.0, 207.0, 171.0, 86.0, 39.0, 15.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-150.872802734375, -145.87551879882812, -140.8782501220703, -135.88096618652344, -130.88369750976562, -125.88641357421875, -120.88912963867188, -115.89185333251953, -110.89457702636719, -105.89730072021484, -100.9000244140625, -95.90274047851562, -90.90546417236328, -85.90818786621094, -80.91090393066406, -75.91362762451172, -70.91635131835938, -65.91907501220703, -60.92179489135742, -55.92451477050781, -50.92723846435547, -45.929962158203125, -40.932682037353516, -35.935401916503906, -30.938125610351562, -25.940847396850586, -20.94356918334961, -15.946290969848633, -10.949012756347656, -5.95173454284668, -0.9544563293457031, 4.042823791503906, 9.040115356445312, 14.037393569946289, 19.034671783447266, 24.031949996948242, 29.02922821044922, 34.02650451660156, 39.02378463745117, 44.02106475830078, 49.018341064453125, 54.01561737060547, 59.01289749145508, 64.01017761230469, 69.00745391845703, 74.00473022460938, 79.00201416015625, 83.9992904663086, 88.99656677246094, 93.99384307861328, 98.99111938476562, 103.9884033203125, 108.98567962646484, 113.98295593261719, 118.98023986816406, 123.9775161743164, 128.97479248046875, 133.97207641601562, 138.96934509277344, 143.9666290283203, 148.96389770507812, 153.961181640625, 158.95846557617188, 163.95574951171875, 168.95301818847656]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 8.0, 6.0, 12.0, 9.0, 13.0, 25.0, 35.0, 37.0, 44.0, 40.0, 44.0, 66.0, 62.0, 49.0, 58.0, 64.0, 64.0, 67.0, 49.0, 44.0, 42.0, 35.0, 27.0, 16.0, 21.0, 16.0, 8.0, 13.0, 10.0, 6.0, 7.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.16239929199219, -47.096717834472656, -45.031036376953125, -42.965354919433594, -40.89967346191406, -38.83399200439453, -36.768310546875, -34.70262908935547, -32.63694763183594, -30.571266174316406, -28.505584716796875, -26.439903259277344, -24.374221801757812, -22.30854034423828, -20.24285888671875, -18.17717742919922, -16.111495971679688, -14.045814514160156, -11.980133056640625, -9.914451599121094, -7.8487701416015625, -5.783088684082031, -3.7174072265625, -1.6517257690429688, 0.4139556884765625, 2.4796371459960938, 4.545318603515625, 6.611000061035156, 8.676681518554688, 10.742362976074219, 12.80804443359375, 14.873725891113281, 16.939407348632812, 19.005088806152344, 21.070770263671875, 23.136451721191406, 25.202133178710938, 27.26781463623047, 29.33349609375, 31.39917755126953, 33.46485900878906, 35.530540466308594, 37.596221923828125, 39.661903381347656, 41.72758483886719, 43.79326629638672, 45.85894775390625, 47.92462921142578, 49.99031066894531, 52.055992126464844, 54.121673583984375, 56.187355041503906, 58.25303649902344, 60.31871795654297, 62.3843994140625, 64.45008087158203, 66.51576232910156, 68.5814437866211, 70.64712524414062, 72.71280670166016, 74.77848815917969, 76.84416961669922, 78.90985107421875, 80.97553253173828, 83.04121398925781]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 7.0, 7.0, 6.0, 19.0, 13.0, 19.0, 33.0, 46.0, 85.0, 137.0, 441.0, 2633.0, 32719.0, 3941370.0, 207385.0, 7946.0, 911.0, 207.0, 107.0, 48.0, 53.0, 27.0, 22.0, 10.0, 14.0, 11.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.75, -66.3583984375, -63.966796875, -61.5751953125, -59.18359375, -56.7919921875, -54.400390625, -52.0087890625, -49.6171875, -47.2255859375, -44.833984375, -42.4423828125, -40.05078125, -37.6591796875, -35.267578125, -32.8759765625, -30.484375, -28.0927734375, -25.701171875, -23.3095703125, -20.91796875, -18.5263671875, -16.134765625, -13.7431640625, -11.3515625, -8.9599609375, -6.568359375, -4.1767578125, -1.78515625, 0.6064453125, 2.998046875, 5.3896484375, 7.78125, 10.1728515625, 12.564453125, 14.9560546875, 17.34765625, 19.7392578125, 22.130859375, 24.5224609375, 26.9140625, 29.3056640625, 31.697265625, 34.0888671875, 36.48046875, 38.8720703125, 41.263671875, 43.6552734375, 46.046875, 48.4384765625, 50.830078125, 53.2216796875, 55.61328125, 58.0048828125, 60.396484375, 62.7880859375, 65.1796875, 67.5712890625, 69.962890625, 72.3544921875, 74.74609375, 77.1376953125, 79.529296875, 81.9208984375, 84.3125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 11.0, 14.0, 18.0, 22.0, 28.0, 40.0, 67.0, 73.0, 61.0, 77.0, 82.0, 75.0, 73.0, 87.0, 64.0, 57.0, 42.0, 35.0, 15.0, 22.0, 12.0, 14.0, 5.0, 3.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0078125, -1.936309814453125, -1.86480712890625, -1.793304443359375, -1.7218017578125, -1.650299072265625, -1.57879638671875, -1.507293701171875, -1.435791015625, -1.364288330078125, -1.29278564453125, -1.221282958984375, -1.1497802734375, -1.078277587890625, -1.00677490234375, -0.935272216796875, -0.86376953125, -0.792266845703125, -0.72076416015625, -0.649261474609375, -0.5777587890625, -0.506256103515625, -0.43475341796875, -0.363250732421875, -0.291748046875, -0.220245361328125, -0.14874267578125, -0.077239990234375, -0.0057373046875, 0.065765380859375, 0.13726806640625, 0.208770751953125, 0.2802734375, 0.351776123046875, 0.42327880859375, 0.494781494140625, 0.5662841796875, 0.637786865234375, 0.70928955078125, 0.780792236328125, 0.852294921875, 0.923797607421875, 0.99530029296875, 1.066802978515625, 1.1383056640625, 1.209808349609375, 1.28131103515625, 1.352813720703125, 1.42431640625, 1.495819091796875, 1.56732177734375, 1.638824462890625, 1.7103271484375, 1.781829833984375, 1.85333251953125, 1.924835205078125, 1.996337890625, 2.067840576171875, 2.13934326171875, 2.210845947265625, 2.2823486328125, 2.353851318359375, 2.42535400390625, 2.496856689453125, 2.568359375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 9.0, 13.0, 4.0, 9.0, 19.0, 21.0, 27.0, 51.0, 66.0, 134.0, 241.0, 670.0, 2157.0, 8714.0, 48394.0, 500016.0, 3433894.0, 170537.0, 22736.0, 4622.0, 1171.0, 386.0, 156.0, 73.0, 50.0, 30.0, 14.0, 9.0, 14.0, 10.0, 7.0, 7.0, 7.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.828125, -26.633544921875, -25.43896484375, -24.244384765625, -23.0498046875, -21.855224609375, -20.66064453125, -19.466064453125, -18.271484375, -17.076904296875, -15.88232421875, -14.687744140625, -13.4931640625, -12.298583984375, -11.10400390625, -9.909423828125, -8.71484375, -7.520263671875, -6.32568359375, -5.131103515625, -3.9365234375, -2.741943359375, -1.54736328125, -0.352783203125, 0.841796875, 2.036376953125, 3.23095703125, 4.425537109375, 5.6201171875, 6.814697265625, 8.00927734375, 9.203857421875, 10.3984375, 11.593017578125, 12.78759765625, 13.982177734375, 15.1767578125, 16.371337890625, 17.56591796875, 18.760498046875, 19.955078125, 21.149658203125, 22.34423828125, 23.538818359375, 24.7333984375, 25.927978515625, 27.12255859375, 28.317138671875, 29.51171875, 30.706298828125, 31.90087890625, 33.095458984375, 34.2900390625, 35.484619140625, 36.67919921875, 37.873779296875, 39.068359375, 40.262939453125, 41.45751953125, 42.652099609375, 43.8466796875, 45.041259765625, 46.23583984375, 47.430419921875, 48.625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 8.0, 5.0, 11.0, 14.0, 17.0, 31.0, 29.0, 56.0, 87.0, 133.0, 241.0, 508.0, 1603.0, 599.0, 283.0, 158.0, 92.0, 57.0, 49.0, 31.0, 17.0, 14.0, 13.0, 13.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.4609375, -8.2752685546875, -8.089599609375, -7.9039306640625, -7.71826171875, -7.5325927734375, -7.346923828125, -7.1612548828125, -6.9755859375, -6.7899169921875, -6.604248046875, -6.4185791015625, -6.23291015625, -6.0472412109375, -5.861572265625, -5.6759033203125, -5.490234375, -5.3045654296875, -5.118896484375, -4.9332275390625, -4.74755859375, -4.5618896484375, -4.376220703125, -4.1905517578125, -4.0048828125, -3.8192138671875, -3.633544921875, -3.4478759765625, -3.26220703125, -3.0765380859375, -2.890869140625, -2.7052001953125, -2.51953125, -2.3338623046875, -2.148193359375, -1.9625244140625, -1.77685546875, -1.5911865234375, -1.405517578125, -1.2198486328125, -1.0341796875, -0.8485107421875, -0.662841796875, -0.4771728515625, -0.29150390625, -0.1058349609375, 0.079833984375, 0.2655029296875, 0.451171875, 0.6368408203125, 0.822509765625, 1.0081787109375, 1.19384765625, 1.3795166015625, 1.565185546875, 1.7508544921875, 1.9365234375, 2.1221923828125, 2.307861328125, 2.4935302734375, 2.67919921875, 2.8648681640625, 3.050537109375, 3.2362060546875, 3.421875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 10.0, 12.0, 27.0, 58.0, 83.0, 101.0, 131.0, 162.0, 138.0, 97.0, 65.0, 45.0, 26.0, 17.0, 13.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-42.3389892578125, -41.02665328979492, -39.71432113647461, -38.40198516845703, -37.08964920043945, -35.777313232421875, -34.46498107910156, -33.152645111083984, -31.840309143066406, -30.52797508239746, -29.215639114379883, -27.903305053710938, -26.59096908569336, -25.278635025024414, -23.96630096435547, -22.65396499633789, -21.341630935668945, -20.029296875, -18.716960906982422, -17.404626846313477, -16.0922908782959, -14.779956817626953, -13.467621803283691, -12.15528678894043, -10.842951774597168, -9.530616760253906, -8.218281745910645, -6.905947208404541, -5.593612194061279, -4.281277179718018, -2.968942642211914, -1.6566076278686523, -0.3442726135253906, 0.9680622816085815, 2.2803971767425537, 3.5927319526672363, 4.905066967010498, 6.21740198135376, 7.529736518859863, 8.842071533203125, 10.154406547546387, 11.466741561889648, 12.77907657623291, 14.091411590576172, 15.403745651245117, 16.716081619262695, 18.02841567993164, 19.34075164794922, 20.653085708618164, 21.96541976928711, 23.277755737304688, 24.590089797973633, 25.90242576599121, 27.214759826660156, 28.527095794677734, 29.83942985534668, 31.151763916015625, 32.4640998840332, 33.776432037353516, 35.088768005371094, 36.40110397338867, 37.71343994140625, 39.02577209472656, 40.33810806274414, 41.65044403076172]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 6.0, 3.0, 6.0, 18.0, 16.0, 16.0, 17.0, 13.0, 19.0, 27.0, 26.0, 31.0, 26.0, 34.0, 42.0, 39.0, 37.0, 41.0, 41.0, 35.0, 39.0, 47.0, 38.0, 30.0, 35.0, 34.0, 41.0, 30.0, 38.0, 21.0, 22.0, 19.0, 11.0, 21.0, 15.0, 10.0, 10.0, 7.0, 7.0, 9.0, 2.0, 5.0, 2.0, 2.0, 7.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.81633758544922, -16.284326553344727, -15.752313613891602, -15.220301628112793, -14.688289642333984, -14.156278610229492, -13.624266624450684, -13.092254638671875, -12.560242652893066, -12.028230667114258, -11.49621868133545, -10.96420669555664, -10.432195663452148, -9.900182723999023, -9.368171691894531, -8.836159706115723, -8.304147720336914, -7.7721357345581055, -7.240123748779297, -6.7081122398376465, -6.176100254058838, -5.644088268280029, -5.112076759338379, -4.58006477355957, -4.048052787780762, -3.516040802001953, -2.9840290546417236, -2.452017307281494, -1.9200053215026855, -1.387993335723877, -0.8559815883636475, -0.32396984100341797, 0.20804405212402344, 0.7400559186935425, 1.2720677852630615, 1.8040796518325806, 2.3360915184020996, 2.868103504180908, 3.4001152515411377, 3.932126998901367, 4.464138984680176, 4.996150970458984, 5.528162956237793, 6.060174465179443, 6.592186450958252, 7.1241984367370605, 7.656209945678711, 8.18822193145752, 8.720233917236328, 9.252245903015137, 9.784257888793945, 10.316269874572754, 10.848281860351562, 11.380292892456055, 11.912304878234863, 12.444316864013672, 12.97632884979248, 13.508340835571289, 14.040352821350098, 14.572364807128906, 15.104375839233398, 15.636388778686523, 16.168399810791016, 16.70041275024414, 17.232423782348633]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 9.0, 3.0, 8.0, 14.0, 16.0, 12.0, 8.0, 44.0, 68.0, 104.0, 145.0, 247.0, 469.0, 939.0, 2210.0, 5174.0, 13987.0, 41164.0, 119723.0, 302380.0, 340103.0, 143780.0, 49620.0, 17221.0, 6343.0, 2441.0, 1073.0, 516.0, 262.0, 155.0, 99.0, 60.0, 54.0, 24.0, 18.0, 14.0, 10.0, 17.0, 5.0, 6.0, 4.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5390625, -12.1357421875, -11.732421875, -11.3291015625, -10.92578125, -10.5224609375, -10.119140625, -9.7158203125, -9.3125, -8.9091796875, -8.505859375, -8.1025390625, -7.69921875, -7.2958984375, -6.892578125, -6.4892578125, -6.0859375, -5.6826171875, -5.279296875, -4.8759765625, -4.47265625, -4.0693359375, -3.666015625, -3.2626953125, -2.859375, -2.4560546875, -2.052734375, -1.6494140625, -1.24609375, -0.8427734375, -0.439453125, -0.0361328125, 0.3671875, 0.7705078125, 1.173828125, 1.5771484375, 1.98046875, 2.3837890625, 2.787109375, 3.1904296875, 3.59375, 3.9970703125, 4.400390625, 4.8037109375, 5.20703125, 5.6103515625, 6.013671875, 6.4169921875, 6.8203125, 7.2236328125, 7.626953125, 8.0302734375, 8.43359375, 8.8369140625, 9.240234375, 9.6435546875, 10.046875, 10.4501953125, 10.853515625, 11.2568359375, 11.66015625, 12.0634765625, 12.466796875, 12.8701171875, 13.2734375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 8.0, 13.0, 17.0, 31.0, 35.0, 54.0, 61.0, 64.0, 73.0, 95.0, 98.0, 94.0, 71.0, 75.0, 66.0, 49.0, 40.0, 18.0, 14.0, 9.0, 5.0, 7.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0625, -1.9815673828125, -1.900634765625, -1.8197021484375, -1.73876953125, -1.6578369140625, -1.576904296875, -1.4959716796875, -1.4150390625, -1.3341064453125, -1.253173828125, -1.1722412109375, -1.09130859375, -1.0103759765625, -0.929443359375, -0.8485107421875, -0.767578125, -0.6866455078125, -0.605712890625, -0.5247802734375, -0.44384765625, -0.3629150390625, -0.281982421875, -0.2010498046875, -0.1201171875, -0.0391845703125, 0.041748046875, 0.1226806640625, 0.20361328125, 0.2845458984375, 0.365478515625, 0.4464111328125, 0.52734375, 0.6082763671875, 0.689208984375, 0.7701416015625, 0.85107421875, 0.9320068359375, 1.012939453125, 1.0938720703125, 1.1748046875, 1.2557373046875, 1.336669921875, 1.4176025390625, 1.49853515625, 1.5794677734375, 1.660400390625, 1.7413330078125, 1.822265625, 1.9031982421875, 1.984130859375, 2.0650634765625, 2.14599609375, 2.2269287109375, 2.307861328125, 2.3887939453125, 2.4697265625, 2.5506591796875, 2.631591796875, 2.7125244140625, 2.79345703125, 2.8743896484375, 2.955322265625, 3.0362548828125, 3.1171875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 10.0, 14.0, 16.0, 12.0, 20.0, 30.0, 31.0, 45.0, 61.0, 69.0, 124.0, 141.0, 207.0, 319.0, 491.0, 809.0, 1569.0, 3738.0, 10683.0, 38376.0, 152949.0, 467765.0, 273298.0, 68733.0, 18259.0, 5747.0, 2162.0, 1019.0, 610.0, 354.0, 262.0, 161.0, 123.0, 95.0, 66.0, 54.0, 29.0, 21.0, 16.0, 16.0, 12.0, 8.0, 3.0, 7.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.71875, -14.223388671875, -13.72802734375, -13.232666015625, -12.7373046875, -12.241943359375, -11.74658203125, -11.251220703125, -10.755859375, -10.260498046875, -9.76513671875, -9.269775390625, -8.7744140625, -8.279052734375, -7.78369140625, -7.288330078125, -6.79296875, -6.297607421875, -5.80224609375, -5.306884765625, -4.8115234375, -4.316162109375, -3.82080078125, -3.325439453125, -2.830078125, -2.334716796875, -1.83935546875, -1.343994140625, -0.8486328125, -0.353271484375, 0.14208984375, 0.637451171875, 1.1328125, 1.628173828125, 2.12353515625, 2.618896484375, 3.1142578125, 3.609619140625, 4.10498046875, 4.600341796875, 5.095703125, 5.591064453125, 6.08642578125, 6.581787109375, 7.0771484375, 7.572509765625, 8.06787109375, 8.563232421875, 9.05859375, 9.553955078125, 10.04931640625, 10.544677734375, 11.0400390625, 11.535400390625, 12.03076171875, 12.526123046875, 13.021484375, 13.516845703125, 14.01220703125, 14.507568359375, 15.0029296875, 15.498291015625, 15.99365234375, 16.489013671875, 16.984375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 13.0, 4.0, 6.0, 6.0, 5.0, 7.0, 9.0, 15.0, 24.0, 16.0, 20.0, 26.0, 30.0, 27.0, 33.0, 31.0, 43.0, 38.0, 49.0, 42.0, 36.0, 48.0, 42.0, 50.0, 41.0, 41.0, 37.0, 33.0, 19.0, 28.0, 28.0, 30.0, 19.0, 22.0, 17.0, 13.0, 16.0, 14.0, 4.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.44921875, -7.2177734375, -6.986328125, -6.7548828125, -6.5234375, -6.2919921875, -6.060546875, -5.8291015625, -5.59765625, -5.3662109375, -5.134765625, -4.9033203125, -4.671875, -4.4404296875, -4.208984375, -3.9775390625, -3.74609375, -3.5146484375, -3.283203125, -3.0517578125, -2.8203125, -2.5888671875, -2.357421875, -2.1259765625, -1.89453125, -1.6630859375, -1.431640625, -1.2001953125, -0.96875, -0.7373046875, -0.505859375, -0.2744140625, -0.04296875, 0.1884765625, 0.419921875, 0.6513671875, 0.8828125, 1.1142578125, 1.345703125, 1.5771484375, 1.80859375, 2.0400390625, 2.271484375, 2.5029296875, 2.734375, 2.9658203125, 3.197265625, 3.4287109375, 3.66015625, 3.8916015625, 4.123046875, 4.3544921875, 4.5859375, 4.8173828125, 5.048828125, 5.2802734375, 5.51171875, 5.7431640625, 5.974609375, 6.2060546875, 6.4375, 6.6689453125, 6.900390625, 7.1318359375, 7.36328125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 7.0, 13.0, 16.0, 21.0, 32.0, 52.0, 64.0, 112.0, 181.0, 329.0, 520.0, 1023.0, 2149.0, 4861.0, 12306.0, 35475.0, 112198.0, 324873.0, 361553.0, 128021.0, 40654.0, 13880.0, 5337.0, 2214.0, 1188.0, 579.0, 335.0, 202.0, 117.0, 76.0, 43.0, 38.0, 13.0, 11.0, 14.0, 7.0, 7.0, 3.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.7734375, -8.4815673828125, -8.189697265625, -7.8978271484375, -7.60595703125, -7.3140869140625, -7.022216796875, -6.7303466796875, -6.4384765625, -6.1466064453125, -5.854736328125, -5.5628662109375, -5.27099609375, -4.9791259765625, -4.687255859375, -4.3953857421875, -4.103515625, -3.8116455078125, -3.519775390625, -3.2279052734375, -2.93603515625, -2.6441650390625, -2.352294921875, -2.0604248046875, -1.7685546875, -1.4766845703125, -1.184814453125, -0.8929443359375, -0.60107421875, -0.3092041015625, -0.017333984375, 0.2745361328125, 0.56640625, 0.8582763671875, 1.150146484375, 1.4420166015625, 1.73388671875, 2.0257568359375, 2.317626953125, 2.6094970703125, 2.9013671875, 3.1932373046875, 3.485107421875, 3.7769775390625, 4.06884765625, 4.3607177734375, 4.652587890625, 4.9444580078125, 5.236328125, 5.5281982421875, 5.820068359375, 6.1119384765625, 6.40380859375, 6.6956787109375, 6.987548828125, 7.2794189453125, 7.5712890625, 7.8631591796875, 8.155029296875, 8.4468994140625, 8.73876953125, 9.0306396484375, 9.322509765625, 9.6143798828125, 9.90625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 11.0, 7.0, 12.0, 10.0, 8.0, 11.0, 20.0, 30.0, 30.0, 38.0, 54.0, 60.0, 111.0, 90.0, 94.0, 91.0, 76.0, 58.0, 28.0, 37.0, 24.0, 25.0, 24.0, 10.0, 11.0, 7.0, 4.0, 4.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.001331329345703125, -0.0012964680790901184, -0.0012616068124771118, -0.0012267455458641052, -0.0011918842792510986, -0.001157023012638092, -0.0011221617460250854, -0.0010873004794120789, -0.0010524392127990723, -0.0010175779461860657, -0.000982716679573059, -0.0009478554129600525, -0.0009129941463470459, -0.0008781328797340393, -0.0008432716131210327, -0.0008084103465080261, -0.0007735490798950195, -0.0007386878132820129, -0.0007038265466690063, -0.0006689652800559998, -0.0006341040134429932, -0.0005992427468299866, -0.00056438148021698, -0.0005295202136039734, -0.0004946589469909668, -0.0004597976803779602, -0.0004249364137649536, -0.000390075147151947, -0.00035521388053894043, -0.00032035261392593384, -0.00028549134731292725, -0.00025063008069992065, -0.00021576881408691406, -0.00018090754747390747, -0.00014604628086090088, -0.00011118501424789429, -7.63237476348877e-05, -4.1462481021881104e-05, -6.601214408874512e-06, 2.826005220413208e-05, 6.312131881713867e-05, 9.798258543014526e-05, 0.00013284385204315186, 0.00016770511865615845, 0.00020256638526916504, 0.00023742765188217163, 0.0002722889184951782, 0.0003071501851081848, 0.0003420114517211914, 0.000376872718334198, 0.0004117339849472046, 0.0004465952515602112, 0.0004814565181732178, 0.0005163177847862244, 0.000551179051399231, 0.0005860403180122375, 0.0006209015846252441, 0.0006557628512382507, 0.0006906241178512573, 0.0007254853844642639, 0.0007603466510772705, 0.0007952079176902771, 0.0008300691843032837, 0.0008649304509162903, 0.0008997917175292969]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 6.0, 6.0, 11.0, 20.0, 37.0, 33.0, 88.0, 111.0, 154.0, 299.0, 502.0, 961.0, 2217.0, 5635.0, 17559.0, 66949.0, 291122.0, 479982.0, 134288.0, 32328.0, 9537.0, 3523.0, 1490.0, 683.0, 394.0, 220.0, 120.0, 87.0, 56.0, 35.0, 22.0, 18.0, 10.0, 11.0, 6.0, 4.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.421875, -11.9970703125, -11.572265625, -11.1474609375, -10.72265625, -10.2978515625, -9.873046875, -9.4482421875, -9.0234375, -8.5986328125, -8.173828125, -7.7490234375, -7.32421875, -6.8994140625, -6.474609375, -6.0498046875, -5.625, -5.2001953125, -4.775390625, -4.3505859375, -3.92578125, -3.5009765625, -3.076171875, -2.6513671875, -2.2265625, -1.8017578125, -1.376953125, -0.9521484375, -0.52734375, -0.1025390625, 0.322265625, 0.7470703125, 1.171875, 1.5966796875, 2.021484375, 2.4462890625, 2.87109375, 3.2958984375, 3.720703125, 4.1455078125, 4.5703125, 4.9951171875, 5.419921875, 5.8447265625, 6.26953125, 6.6943359375, 7.119140625, 7.5439453125, 7.96875, 8.3935546875, 8.818359375, 9.2431640625, 9.66796875, 10.0927734375, 10.517578125, 10.9423828125, 11.3671875, 11.7919921875, 12.216796875, 12.6416015625, 13.06640625, 13.4912109375, 13.916015625, 14.3408203125, 14.765625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 2.0, 0.0, 0.0, 7.0, 6.0, 3.0, 6.0, 8.0, 11.0, 6.0, 19.0, 11.0, 18.0, 23.0, 27.0, 22.0, 30.0, 31.0, 39.0, 40.0, 56.0, 75.0, 68.0, 58.0, 62.0, 65.0, 38.0, 40.0, 36.0, 36.0, 31.0, 26.0, 23.0, 18.0, 9.0, 15.0, 8.0, 5.0, 9.0, 2.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.6953125, -4.54022216796875, -4.3851318359375, -4.23004150390625, -4.074951171875, -3.91986083984375, -3.7647705078125, -3.60968017578125, -3.45458984375, -3.29949951171875, -3.1444091796875, -2.98931884765625, -2.834228515625, -2.67913818359375, -2.5240478515625, -2.36895751953125, -2.2138671875, -2.05877685546875, -1.9036865234375, -1.74859619140625, -1.593505859375, -1.43841552734375, -1.2833251953125, -1.12823486328125, -0.97314453125, -0.81805419921875, -0.6629638671875, -0.50787353515625, -0.352783203125, -0.19769287109375, -0.0426025390625, 0.11248779296875, 0.267578125, 0.42266845703125, 0.5777587890625, 0.73284912109375, 0.887939453125, 1.04302978515625, 1.1981201171875, 1.35321044921875, 1.50830078125, 1.66339111328125, 1.8184814453125, 1.97357177734375, 2.128662109375, 2.28375244140625, 2.4388427734375, 2.59393310546875, 2.7490234375, 2.90411376953125, 3.0592041015625, 3.21429443359375, 3.369384765625, 3.52447509765625, 3.6795654296875, 3.83465576171875, 3.98974609375, 4.14483642578125, 4.2999267578125, 4.45501708984375, 4.610107421875, 4.76519775390625, 4.9202880859375, 5.07537841796875, 5.23046875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 15.0, 40.0, 72.0, 123.0, 185.0, 183.0, 177.0, 80.0, 54.0, 33.0, 10.0, 12.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.84677124023438, -113.82637786865234, -109.80599212646484, -105.78559875488281, -101.76521301269531, -97.74481964111328, -93.72442626953125, -89.70404052734375, -85.68364715576172, -81.66325378417969, -77.64286804199219, -73.62247467041016, -69.60208129882812, -65.58169555664062, -61.561302185058594, -57.54091262817383, -53.52052307128906, -49.5001335144043, -45.47974395751953, -41.4593505859375, -37.438961029052734, -33.41857147216797, -29.39818000793457, -25.377788543701172, -21.357398986816406, -17.33700942993164, -13.316617965698242, -9.29622745513916, -5.275836944580078, -1.2554473876953125, 2.764944076538086, 6.785335540771484, 10.805709838867188, 14.82610034942627, 18.84649085998535, 22.86688232421875, 26.887271881103516, 30.90766143798828, 34.92805480957031, 38.94844436645508, 42.968833923339844, 46.98922348022461, 51.009613037109375, 55.030006408691406, 59.05039596557617, 63.07078552246094, 67.09117889404297, 71.111572265625, 75.1319580078125, 79.15235137939453, 83.17273712158203, 87.19313049316406, 91.21351623535156, 95.2339096069336, 99.25430297851562, 103.27468872070312, 107.29508209228516, 111.31547546386719, 115.33586120605469, 119.35625457763672, 123.37664794921875, 127.39703369140625, 131.41741943359375, 135.4378204345703, 139.4582061767578]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 5.0, 9.0, 9.0, 17.0, 14.0, 24.0, 22.0, 22.0, 24.0, 43.0, 38.0, 43.0, 38.0, 53.0, 54.0, 66.0, 45.0, 52.0, 50.0, 60.0, 45.0, 40.0, 34.0, 36.0, 29.0, 20.0, 14.0, 17.0, 25.0, 15.0, 4.0, 3.0, 3.0, 8.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-68.23907470703125, -66.34447479248047, -64.44987487792969, -62.55527877807617, -60.66067886352539, -58.76607894897461, -56.871482849121094, -54.97688293457031, -53.08228302001953, -51.18768310546875, -49.29308319091797, -47.39848709106445, -45.50388717651367, -43.60928726196289, -41.714691162109375, -39.820091247558594, -37.92549133300781, -36.03089141845703, -34.13629150390625, -32.241695404052734, -30.347095489501953, -28.452495574951172, -26.557897567749023, -24.663299560546875, -22.768699645996094, -20.874099731445312, -18.979501724243164, -17.084903717041016, -15.190303802490234, -13.29570484161377, -11.401105880737305, -9.50650691986084, -7.611907958984375, -5.71730899810791, -3.8227100372314453, -1.9281110763549805, -0.033512115478515625, 1.8610868453979492, 3.755685806274414, 5.650284767150879, 7.544883728027344, 9.439482688903809, 11.334081649780273, 13.228680610656738, 15.123279571533203, 17.017879486083984, 18.912477493286133, 20.80707550048828, 22.701675415039062, 24.596275329589844, 26.490873336791992, 28.38547134399414, 30.280071258544922, 32.1746711730957, 34.06926727294922, 35.9638671875, 37.85846710205078, 39.75306701660156, 41.647666931152344, 43.54226303100586, 45.43686294555664, 47.33146286010742, 49.22605895996094, 51.12065887451172, 53.0152587890625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 8.0, 8.0, 13.0, 15.0, 27.0, 29.0, 55.0, 87.0, 151.0, 308.0, 637.0, 1824.0, 6064.0, 27112.0, 253274.0, 3762829.0, 118261.0, 17117.0, 4207.0, 1281.0, 477.0, 198.0, 89.0, 70.0, 44.0, 34.0, 18.0, 16.0, 15.0, 2.0, 3.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.109375, -28.045654296875, -26.98193359375, -25.918212890625, -24.8544921875, -23.790771484375, -22.72705078125, -21.663330078125, -20.599609375, -19.535888671875, -18.47216796875, -17.408447265625, -16.3447265625, -15.281005859375, -14.21728515625, -13.153564453125, -12.08984375, -11.026123046875, -9.96240234375, -8.898681640625, -7.8349609375, -6.771240234375, -5.70751953125, -4.643798828125, -3.580078125, -2.516357421875, -1.45263671875, -0.388916015625, 0.6748046875, 1.738525390625, 2.80224609375, 3.865966796875, 4.9296875, 5.993408203125, 7.05712890625, 8.120849609375, 9.1845703125, 10.248291015625, 11.31201171875, 12.375732421875, 13.439453125, 14.503173828125, 15.56689453125, 16.630615234375, 17.6943359375, 18.758056640625, 19.82177734375, 20.885498046875, 21.94921875, 23.012939453125, 24.07666015625, 25.140380859375, 26.2041015625, 27.267822265625, 28.33154296875, 29.395263671875, 30.458984375, 31.522705078125, 32.58642578125, 33.650146484375, 34.7138671875, 35.777587890625, 36.84130859375, 37.905029296875, 38.96875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 14.0, 15.0, 10.0, 24.0, 30.0, 41.0, 50.0, 45.0, 33.0, 56.0, 53.0, 50.0, 62.0, 63.0, 70.0, 60.0, 55.0, 47.0, 47.0, 33.0, 37.0, 23.0, 15.0, 17.0, 9.0, 7.0, 10.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.38671875, -2.3218231201171875, -2.256927490234375, -2.1920318603515625, -2.12713623046875, -2.0622406005859375, -1.997344970703125, -1.9324493408203125, -1.8675537109375, -1.8026580810546875, -1.737762451171875, -1.6728668212890625, -1.60797119140625, -1.5430755615234375, -1.478179931640625, -1.4132843017578125, -1.348388671875, -1.2834930419921875, -1.218597412109375, -1.1537017822265625, -1.08880615234375, -1.0239105224609375, -0.959014892578125, -0.8941192626953125, -0.8292236328125, -0.7643280029296875, -0.699432373046875, -0.6345367431640625, -0.56964111328125, -0.5047454833984375, -0.439849853515625, -0.3749542236328125, -0.31005859375, -0.2451629638671875, -0.180267333984375, -0.1153717041015625, -0.05047607421875, 0.0144195556640625, 0.079315185546875, 0.1442108154296875, 0.2091064453125, 0.2740020751953125, 0.338897705078125, 0.4037933349609375, 0.46868896484375, 0.5335845947265625, 0.598480224609375, 0.6633758544921875, 0.728271484375, 0.7931671142578125, 0.858062744140625, 0.9229583740234375, 0.98785400390625, 1.0527496337890625, 1.117645263671875, 1.1825408935546875, 1.2474365234375, 1.3123321533203125, 1.377227783203125, 1.4421234130859375, 1.50701904296875, 1.5719146728515625, 1.636810302734375, 1.7017059326171875, 1.7666015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 7.0, 10.0, 10.0, 6.0, 8.0, 19.0, 18.0, 35.0, 53.0, 88.0, 137.0, 249.0, 465.0, 980.0, 2491.0, 6795.0, 23141.0, 104052.0, 1000910.0, 2838159.0, 166190.0, 34065.0, 9949.0, 3483.0, 1458.0, 663.0, 350.0, 176.0, 98.0, 70.0, 45.0, 27.0, 25.0, 17.0, 9.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.515625, -23.85546875, -23.1953125, -22.53515625, -21.875, -21.21484375, -20.5546875, -19.89453125, -19.234375, -18.57421875, -17.9140625, -17.25390625, -16.59375, -15.93359375, -15.2734375, -14.61328125, -13.953125, -13.29296875, -12.6328125, -11.97265625, -11.3125, -10.65234375, -9.9921875, -9.33203125, -8.671875, -8.01171875, -7.3515625, -6.69140625, -6.03125, -5.37109375, -4.7109375, -4.05078125, -3.390625, -2.73046875, -2.0703125, -1.41015625, -0.75, -0.08984375, 0.5703125, 1.23046875, 1.890625, 2.55078125, 3.2109375, 3.87109375, 4.53125, 5.19140625, 5.8515625, 6.51171875, 7.171875, 7.83203125, 8.4921875, 9.15234375, 9.8125, 10.47265625, 11.1328125, 11.79296875, 12.453125, 13.11328125, 13.7734375, 14.43359375, 15.09375, 15.75390625, 16.4140625, 17.07421875, 17.734375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 4.0, 3.0, 19.0, 23.0, 25.0, 58.0, 79.0, 144.0, 221.0, 427.0, 1384.0, 906.0, 346.0, 161.0, 80.0, 46.0, 49.0, 26.0, 20.0, 12.0, 10.0, 6.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.46875, -6.29327392578125, -6.1177978515625, -5.94232177734375, -5.766845703125, -5.59136962890625, -5.4158935546875, -5.24041748046875, -5.06494140625, -4.88946533203125, -4.7139892578125, -4.53851318359375, -4.363037109375, -4.18756103515625, -4.0120849609375, -3.83660888671875, -3.6611328125, -3.48565673828125, -3.3101806640625, -3.13470458984375, -2.959228515625, -2.78375244140625, -2.6082763671875, -2.43280029296875, -2.25732421875, -2.08184814453125, -1.9063720703125, -1.73089599609375, -1.555419921875, -1.37994384765625, -1.2044677734375, -1.02899169921875, -0.853515625, -0.67803955078125, -0.5025634765625, -0.32708740234375, -0.151611328125, 0.02386474609375, 0.1993408203125, 0.37481689453125, 0.55029296875, 0.72576904296875, 0.9012451171875, 1.07672119140625, 1.252197265625, 1.42767333984375, 1.6031494140625, 1.77862548828125, 1.9541015625, 2.12957763671875, 2.3050537109375, 2.48052978515625, 2.656005859375, 2.83148193359375, 3.0069580078125, 3.18243408203125, 3.35791015625, 3.53338623046875, 3.7088623046875, 3.88433837890625, 4.059814453125, 4.23529052734375, 4.4107666015625, 4.58624267578125, 4.76171875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 9.0, 27.0, 53.0, 92.0, 213.0, 205.0, 209.0, 119.0, 46.0, 20.0, 6.0, 6.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.61383056640625, -63.76617431640625, -61.91851806640625, -60.07086181640625, -58.22320556640625, -56.37554931640625, -54.52789306640625, -52.68023681640625, -50.83258056640625, -48.98492431640625, -47.13726806640625, -45.28961181640625, -43.44195556640625, -41.59429931640625, -39.74664306640625, -37.89898681640625, -36.051326751708984, -34.203670501708984, -32.356014251708984, -30.508358001708984, -28.660701751708984, -26.813045501708984, -24.96538734436035, -23.11773109436035, -21.27007484436035, -19.42241859436035, -17.57476234436035, -15.727105140686035, -13.879448890686035, -12.031792640686035, -10.184135437011719, -8.336479187011719, -6.488822937011719, -4.641166687011719, -2.7935099601745605, -0.9458532333374023, 0.9018030166625977, 2.7494592666625977, 4.597116470336914, 6.444772720336914, 8.292428970336914, 10.140085220336914, 11.987741470336914, 13.83539867401123, 15.68305492401123, 17.530712127685547, 19.378368377685547, 21.226024627685547, 23.073680877685547, 24.921337127685547, 26.768993377685547, 28.616649627685547, 30.464305877685547, 32.31196212768555, 34.15962219238281, 36.00727844238281, 37.85493469238281, 39.70259094238281, 41.55024719238281, 43.39790344238281, 45.24555969238281, 47.09321594238281, 48.94087219238281, 50.78852844238281, 52.63618469238281]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 9.0, 4.0, 6.0, 5.0, 7.0, 8.0, 9.0, 13.0, 14.0, 17.0, 20.0, 18.0, 19.0, 27.0, 32.0, 29.0, 28.0, 37.0, 44.0, 47.0, 47.0, 42.0, 49.0, 45.0, 39.0, 34.0, 36.0, 37.0, 36.0, 31.0, 31.0, 20.0, 31.0, 21.0, 20.0, 19.0, 12.0, 12.0, 10.0, 5.0, 10.0, 3.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0], "bins": [-14.771269798278809, -14.335227012634277, -13.899185180664062, -13.463142395019531, -13.027100563049316, -12.591057777404785, -12.15501594543457, -11.718973159790039, -11.282930374145508, -10.846887588500977, -10.410845756530762, -9.97480297088623, -9.538761138916016, -9.102718353271484, -8.666675567626953, -8.230633735656738, -7.794591426849365, -7.358549118041992, -6.922506809234619, -6.486464500427246, -6.050421714782715, -5.614379405975342, -5.178337097167969, -4.7422943115234375, -4.306252479553223, -3.8702101707458496, -3.4341676235198975, -2.9981253147125244, -2.5620827674865723, -2.126040458679199, -1.6899981498718262, -1.253955602645874, -0.8179130554199219, -0.38187065720558167, 0.054171741008758545, 0.49021410942077637, 0.926256537437439, 1.3622989654541016, 1.7983412742614746, 2.2343838214874268, 2.6704261302948, 3.106468439102173, 3.542510986328125, 3.978553295135498, 4.414595603942871, 4.850638389587402, 5.286680221557617, 5.722723007202148, 6.1587653160095215, 6.5948076248168945, 7.030849933624268, 7.466892242431641, 7.902935028076172, 8.338977813720703, 8.775019645690918, 9.21106243133545, 9.647104263305664, 10.083147048950195, 10.51918888092041, 10.955231666564941, 11.391273498535156, 11.827316284179688, 12.263359069824219, 12.699400901794434, 13.135443687438965]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 4.0, 7.0, 10.0, 12.0, 20.0, 39.0, 59.0, 88.0, 145.0, 274.0, 495.0, 891.0, 1698.0, 3577.0, 7621.0, 17938.0, 46357.0, 118692.0, 261328.0, 312422.0, 165382.0, 66190.0, 25412.0, 10368.0, 4698.0, 2229.0, 1208.0, 579.0, 346.0, 161.0, 118.0, 74.0, 48.0, 16.0, 14.0, 15.0, 8.0, 2.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0546875, -9.7322998046875, -9.409912109375, -9.0875244140625, -8.76513671875, -8.4427490234375, -8.120361328125, -7.7979736328125, -7.4755859375, -7.1531982421875, -6.830810546875, -6.5084228515625, -6.18603515625, -5.8636474609375, -5.541259765625, -5.2188720703125, -4.896484375, -4.5740966796875, -4.251708984375, -3.9293212890625, -3.60693359375, -3.2845458984375, -2.962158203125, -2.6397705078125, -2.3173828125, -1.9949951171875, -1.672607421875, -1.3502197265625, -1.02783203125, -0.7054443359375, -0.383056640625, -0.0606689453125, 0.26171875, 0.5841064453125, 0.906494140625, 1.2288818359375, 1.55126953125, 1.8736572265625, 2.196044921875, 2.5184326171875, 2.8408203125, 3.1632080078125, 3.485595703125, 3.8079833984375, 4.13037109375, 4.4527587890625, 4.775146484375, 5.0975341796875, 5.419921875, 5.7423095703125, 6.064697265625, 6.3870849609375, 6.70947265625, 7.0318603515625, 7.354248046875, 7.6766357421875, 7.9990234375, 8.3214111328125, 8.643798828125, 8.9661865234375, 9.28857421875, 9.6109619140625, 9.933349609375, 10.2557373046875, 10.578125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 9.0, 7.0, 15.0, 9.0, 15.0, 22.0, 22.0, 17.0, 33.0, 35.0, 42.0, 39.0, 55.0, 53.0, 47.0, 55.0, 55.0, 44.0, 61.0, 59.0, 50.0, 36.0, 32.0, 29.0, 35.0, 26.0, 27.0, 12.0, 13.0, 8.0, 9.0, 6.0, 5.0, 11.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.810546875, -1.7529296875, -1.6953125, -1.6376953125, -1.580078125, -1.5224609375, -1.46484375, -1.4072265625, -1.349609375, -1.2919921875, -1.234375, -1.1767578125, -1.119140625, -1.0615234375, -1.00390625, -0.9462890625, -0.888671875, -0.8310546875, -0.7734375, -0.7158203125, -0.658203125, -0.6005859375, -0.54296875, -0.4853515625, -0.427734375, -0.3701171875, -0.3125, -0.2548828125, -0.197265625, -0.1396484375, -0.08203125, -0.0244140625, 0.033203125, 0.0908203125, 0.1484375, 0.2060546875, 0.263671875, 0.3212890625, 0.37890625, 0.4365234375, 0.494140625, 0.5517578125, 0.609375, 0.6669921875, 0.724609375, 0.7822265625, 0.83984375, 0.8974609375, 0.955078125, 1.0126953125, 1.0703125, 1.1279296875, 1.185546875, 1.2431640625, 1.30078125, 1.3583984375, 1.416015625, 1.4736328125, 1.53125, 1.5888671875, 1.646484375, 1.7041015625, 1.76171875, 1.8193359375, 1.876953125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 1.0, 7.0, 9.0, 14.0, 15.0, 19.0, 43.0, 54.0, 76.0, 98.0, 145.0, 169.0, 215.0, 427.0, 667.0, 1181.0, 2577.0, 6331.0, 18961.0, 61972.0, 197811.0, 399272.0, 242117.0, 78520.0, 23409.0, 7904.0, 2976.0, 1409.0, 715.0, 471.0, 279.0, 170.0, 142.0, 116.0, 70.0, 50.0, 46.0, 31.0, 17.0, 12.0, 13.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.7421875, -11.3927001953125, -11.043212890625, -10.6937255859375, -10.34423828125, -9.9947509765625, -9.645263671875, -9.2957763671875, -8.9462890625, -8.5968017578125, -8.247314453125, -7.8978271484375, -7.54833984375, -7.1988525390625, -6.849365234375, -6.4998779296875, -6.150390625, -5.8009033203125, -5.451416015625, -5.1019287109375, -4.75244140625, -4.4029541015625, -4.053466796875, -3.7039794921875, -3.3544921875, -3.0050048828125, -2.655517578125, -2.3060302734375, -1.95654296875, -1.6070556640625, -1.257568359375, -0.9080810546875, -0.55859375, -0.2091064453125, 0.140380859375, 0.4898681640625, 0.83935546875, 1.1888427734375, 1.538330078125, 1.8878173828125, 2.2373046875, 2.5867919921875, 2.936279296875, 3.2857666015625, 3.63525390625, 3.9847412109375, 4.334228515625, 4.6837158203125, 5.033203125, 5.3826904296875, 5.732177734375, 6.0816650390625, 6.43115234375, 6.7806396484375, 7.130126953125, 7.4796142578125, 7.8291015625, 8.1785888671875, 8.528076171875, 8.8775634765625, 9.22705078125, 9.5765380859375, 9.926025390625, 10.2755126953125, 10.625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 6.0, 2.0, 9.0, 14.0, 9.0, 10.0, 23.0, 15.0, 14.0, 27.0, 23.0, 27.0, 26.0, 30.0, 32.0, 30.0, 55.0, 48.0, 39.0, 44.0, 35.0, 36.0, 38.0, 42.0, 33.0, 32.0, 38.0, 27.0, 29.0, 22.0, 29.0, 30.0, 23.0, 18.0, 15.0, 12.0, 10.0, 16.0, 7.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.73828125, -6.509033203125, -6.27978515625, -6.050537109375, -5.8212890625, -5.592041015625, -5.36279296875, -5.133544921875, -4.904296875, -4.675048828125, -4.44580078125, -4.216552734375, -3.9873046875, -3.758056640625, -3.52880859375, -3.299560546875, -3.0703125, -2.841064453125, -2.61181640625, -2.382568359375, -2.1533203125, -1.924072265625, -1.69482421875, -1.465576171875, -1.236328125, -1.007080078125, -0.77783203125, -0.548583984375, -0.3193359375, -0.090087890625, 0.13916015625, 0.368408203125, 0.59765625, 0.826904296875, 1.05615234375, 1.285400390625, 1.5146484375, 1.743896484375, 1.97314453125, 2.202392578125, 2.431640625, 2.660888671875, 2.89013671875, 3.119384765625, 3.3486328125, 3.577880859375, 3.80712890625, 4.036376953125, 4.265625, 4.494873046875, 4.72412109375, 4.953369140625, 5.1826171875, 5.411865234375, 5.64111328125, 5.870361328125, 6.099609375, 6.328857421875, 6.55810546875, 6.787353515625, 7.0166015625, 7.245849609375, 7.47509765625, 7.704345703125, 7.93359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 6.0, 3.0, 10.0, 15.0, 22.0, 30.0, 37.0, 68.0, 93.0, 139.0, 236.0, 452.0, 839.0, 1591.0, 3411.0, 7620.0, 18394.0, 52057.0, 163761.0, 388181.0, 271563.0, 89143.0, 29841.0, 11297.0, 4812.0, 2282.0, 1135.0, 595.0, 350.0, 199.0, 140.0, 61.0, 48.0, 28.0, 27.0, 12.0, 12.0, 10.0, 8.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.9453125, -5.75189208984375, -5.5584716796875, -5.36505126953125, -5.171630859375, -4.97821044921875, -4.7847900390625, -4.59136962890625, -4.39794921875, -4.20452880859375, -4.0111083984375, -3.81768798828125, -3.624267578125, -3.43084716796875, -3.2374267578125, -3.04400634765625, -2.8505859375, -2.65716552734375, -2.4637451171875, -2.27032470703125, -2.076904296875, -1.88348388671875, -1.6900634765625, -1.49664306640625, -1.30322265625, -1.10980224609375, -0.9163818359375, -0.72296142578125, -0.529541015625, -0.33612060546875, -0.1427001953125, 0.05072021484375, 0.244140625, 0.43756103515625, 0.6309814453125, 0.82440185546875, 1.017822265625, 1.21124267578125, 1.4046630859375, 1.59808349609375, 1.79150390625, 1.98492431640625, 2.1783447265625, 2.37176513671875, 2.565185546875, 2.75860595703125, 2.9520263671875, 3.14544677734375, 3.3388671875, 3.53228759765625, 3.7257080078125, 3.91912841796875, 4.112548828125, 4.30596923828125, 4.4993896484375, 4.69281005859375, 4.88623046875, 5.07965087890625, 5.2730712890625, 5.46649169921875, 5.659912109375, 5.85333251953125, 6.0467529296875, 6.24017333984375, 6.43359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 8.0, 8.0, 21.0, 33.0, 35.0, 39.0, 51.0, 58.0, 99.0, 140.0, 128.0, 97.0, 60.0, 56.0, 49.0, 31.0, 21.0, 16.0, 9.0, 9.0, 8.0, 7.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007333755493164062, -0.0007014721632003784, -0.0006695687770843506, -0.0006376653909683228, -0.0006057620048522949, -0.0005738586187362671, -0.0005419552326202393, -0.0005100518465042114, -0.0004781484603881836, -0.00044624507427215576, -0.00041434168815612793, -0.0003824383020401001, -0.00035053491592407227, -0.00031863152980804443, -0.0002867281436920166, -0.00025482475757598877, -0.00022292137145996094, -0.0001910179853439331, -0.00015911459922790527, -0.00012721121311187744, -9.530782699584961e-05, -6.340444087982178e-05, -3.1501054763793945e-05, 4.023313522338867e-07, 3.230571746826172e-05, 6.420910358428955e-05, 9.611248970031738e-05, 0.00012801587581634521, 0.00015991926193237305, 0.00019182264804840088, 0.0002237260341644287, 0.00025562942028045654, 0.0002875328063964844, 0.0003194361925125122, 0.00035133957862854004, 0.00038324296474456787, 0.0004151463508605957, 0.00044704973697662354, 0.00047895312309265137, 0.0005108565092086792, 0.000542759895324707, 0.0005746632814407349, 0.0006065666675567627, 0.0006384700536727905, 0.0006703734397888184, 0.0007022768259048462, 0.000734180212020874, 0.0007660835981369019, 0.0007979869842529297, 0.0008298903703689575, 0.0008617937564849854, 0.0008936971426010132, 0.000925600528717041, 0.0009575039148330688, 0.0009894073009490967, 0.0010213106870651245, 0.0010532140731811523, 0.0010851174592971802, 0.001117020845413208, 0.0011489242315292358, 0.0011808276176452637, 0.0012127310037612915, 0.0012446343898773193, 0.0012765377759933472, 0.001308441162109375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 10.0, 7.0, 7.0, 14.0, 20.0, 35.0, 62.0, 69.0, 153.0, 205.0, 440.0, 887.0, 1980.0, 5328.0, 19398.0, 109608.0, 578463.0, 276354.0, 40649.0, 9212.0, 3009.0, 1232.0, 610.0, 325.0, 188.0, 93.0, 62.0, 44.0, 28.0, 23.0, 13.0, 13.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-10.7890625, -10.43798828125, -10.0869140625, -9.73583984375, -9.384765625, -9.03369140625, -8.6826171875, -8.33154296875, -7.98046875, -7.62939453125, -7.2783203125, -6.92724609375, -6.576171875, -6.22509765625, -5.8740234375, -5.52294921875, -5.171875, -4.82080078125, -4.4697265625, -4.11865234375, -3.767578125, -3.41650390625, -3.0654296875, -2.71435546875, -2.36328125, -2.01220703125, -1.6611328125, -1.31005859375, -0.958984375, -0.60791015625, -0.2568359375, 0.09423828125, 0.4453125, 0.79638671875, 1.1474609375, 1.49853515625, 1.849609375, 2.20068359375, 2.5517578125, 2.90283203125, 3.25390625, 3.60498046875, 3.9560546875, 4.30712890625, 4.658203125, 5.00927734375, 5.3603515625, 5.71142578125, 6.0625, 6.41357421875, 6.7646484375, 7.11572265625, 7.466796875, 7.81787109375, 8.1689453125, 8.52001953125, 8.87109375, 9.22216796875, 9.5732421875, 9.92431640625, 10.275390625, 10.62646484375, 10.9775390625, 11.32861328125, 11.6796875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 13.0, 6.0, 16.0, 7.0, 21.0, 47.0, 40.0, 78.0, 81.0, 93.0, 116.0, 105.0, 94.0, 82.0, 51.0, 33.0, 37.0, 17.0, 16.0, 11.0, 10.0, 8.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.859375, -8.63079833984375, -8.4022216796875, -8.17364501953125, -7.945068359375, -7.71649169921875, -7.4879150390625, -7.25933837890625, -7.03076171875, -6.80218505859375, -6.5736083984375, -6.34503173828125, -6.116455078125, -5.88787841796875, -5.6593017578125, -5.43072509765625, -5.2021484375, -4.97357177734375, -4.7449951171875, -4.51641845703125, -4.287841796875, -4.05926513671875, -3.8306884765625, -3.60211181640625, -3.37353515625, -3.14495849609375, -2.9163818359375, -2.68780517578125, -2.459228515625, -2.23065185546875, -2.0020751953125, -1.77349853515625, -1.544921875, -1.31634521484375, -1.0877685546875, -0.85919189453125, -0.630615234375, -0.40203857421875, -0.1734619140625, 0.05511474609375, 0.28369140625, 0.51226806640625, 0.7408447265625, 0.96942138671875, 1.197998046875, 1.42657470703125, 1.6551513671875, 1.88372802734375, 2.1123046875, 2.34088134765625, 2.5694580078125, 2.79803466796875, 3.026611328125, 3.25518798828125, 3.4837646484375, 3.71234130859375, 3.94091796875, 4.16949462890625, 4.3980712890625, 4.62664794921875, 4.855224609375, 5.08380126953125, 5.3123779296875, 5.54095458984375, 5.76953125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 2.0, 13.0, 11.0, 28.0, 64.0, 154.0, 189.0, 197.0, 162.0, 95.0, 40.0, 27.0, 9.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.34928512573242, -53.4930305480957, -49.63677215576172, -45.780517578125, -41.924259185791016, -38.0680046081543, -34.21174621582031, -30.355491638183594, -26.499235153198242, -22.64297866821289, -18.78672218322754, -14.930466651916504, -11.074210166931152, -7.217954635620117, -3.3616981506347656, 0.49455833435058594, 4.3508148193359375, 8.207071304321289, 12.06332778930664, 15.919583320617676, 19.775840759277344, 23.632095336914062, 27.488351821899414, 31.344608306884766, 35.20086669921875, 39.05712127685547, 42.91337966918945, 46.76963424682617, 50.625892639160156, 54.482147216796875, 58.338401794433594, 62.19466018676758, 66.05091094970703, 69.90716552734375, 73.76342010498047, 77.61968231201172, 81.47593688964844, 85.33219146728516, 89.18844604492188, 93.04470825195312, 96.90096282958984, 100.75721740722656, 104.61347198486328, 108.46973419189453, 112.32598876953125, 116.18224334716797, 120.03849792480469, 123.89476013183594, 127.75100708007812, 131.60726928710938, 135.46351623535156, 139.3197784423828, 143.176025390625, 147.03228759765625, 150.8885498046875, 154.7447967529297, 158.60105895996094, 162.4573211669922, 166.31356811523438, 170.16983032226562, 174.0260772705078, 177.88233947753906, 181.7386016845703, 185.5948486328125, 189.45111083984375]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 1.0, 9.0, 19.0, 18.0, 15.0, 17.0, 31.0, 38.0, 46.0, 39.0, 56.0, 48.0, 55.0, 76.0, 73.0, 59.0, 55.0, 52.0, 57.0, 41.0, 38.0, 41.0, 20.0, 27.0, 14.0, 19.0, 6.0, 13.0, 4.0, 4.0, 6.0, 5.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.7430534362793, -56.71745300292969, -54.691856384277344, -52.666259765625, -50.64065933227539, -48.61505889892578, -46.58946228027344, -44.563865661621094, -42.538265228271484, -40.512664794921875, -38.48706817626953, -36.46147155761719, -34.43587112426758, -32.41027069091797, -30.384674072265625, -28.35907554626465, -26.333477020263672, -24.307878494262695, -22.28227996826172, -20.256681442260742, -18.231082916259766, -16.20548439025879, -14.179885864257812, -12.154287338256836, -10.12868881225586, -8.103090286254883, -6.077491760253906, -4.05189323425293, -2.026294708251953, -0.0006961822509765625, 2.02490234375, 4.050500869750977, 6.0760955810546875, 8.101694107055664, 10.12729263305664, 12.152891159057617, 14.178489685058594, 16.20408821105957, 18.229686737060547, 20.255285263061523, 22.2808837890625, 24.306482315063477, 26.332080841064453, 28.35767936706543, 30.383277893066406, 32.40887451171875, 34.43447494506836, 36.46007537841797, 38.48567199707031, 40.511268615722656, 42.536869049072266, 44.562469482421875, 46.58806610107422, 48.61366271972656, 50.63926315307617, 52.66486358642578, 54.690460205078125, 56.71605682373047, 58.74165725708008, 60.76725769042969, 62.79285430908203, 64.81845092773438, 66.84405517578125, 68.8696517944336, 70.89524841308594]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 8.0, 2.0, 9.0, 8.0, 9.0, 19.0, 28.0, 36.0, 54.0, 70.0, 131.0, 175.0, 298.0, 446.0, 707.0, 1127.0, 2190.0, 4158.0, 8377.0, 20382.0, 59040.0, 275136.0, 3428045.0, 294209.0, 61284.0, 20883.0, 8513.0, 3941.0, 2027.0, 1102.0, 672.0, 387.0, 255.0, 183.0, 119.0, 69.0, 58.0, 39.0, 20.0, 19.0, 17.0, 8.0, 3.0, 10.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.6328125, -12.23193359375, -11.8310546875, -11.43017578125, -11.029296875, -10.62841796875, -10.2275390625, -9.82666015625, -9.42578125, -9.02490234375, -8.6240234375, -8.22314453125, -7.822265625, -7.42138671875, -7.0205078125, -6.61962890625, -6.21875, -5.81787109375, -5.4169921875, -5.01611328125, -4.615234375, -4.21435546875, -3.8134765625, -3.41259765625, -3.01171875, -2.61083984375, -2.2099609375, -1.80908203125, -1.408203125, -1.00732421875, -0.6064453125, -0.20556640625, 0.1953125, 0.59619140625, 0.9970703125, 1.39794921875, 1.798828125, 2.19970703125, 2.6005859375, 3.00146484375, 3.40234375, 3.80322265625, 4.2041015625, 4.60498046875, 5.005859375, 5.40673828125, 5.8076171875, 6.20849609375, 6.609375, 7.01025390625, 7.4111328125, 7.81201171875, 8.212890625, 8.61376953125, 9.0146484375, 9.41552734375, 9.81640625, 10.21728515625, 10.6181640625, 11.01904296875, 11.419921875, 11.82080078125, 12.2216796875, 12.62255859375, 13.0234375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 6.0, 9.0, 14.0, 19.0, 19.0, 30.0, 18.0, 35.0, 27.0, 46.0, 59.0, 65.0, 65.0, 59.0, 69.0, 56.0, 59.0, 63.0, 57.0, 45.0, 36.0, 38.0, 18.0, 16.0, 15.0, 16.0, 10.0, 6.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.248046875, -2.1822662353515625, -2.116485595703125, -2.0507049560546875, -1.98492431640625, -1.9191436767578125, -1.853363037109375, -1.7875823974609375, -1.7218017578125, -1.6560211181640625, -1.590240478515625, -1.5244598388671875, -1.45867919921875, -1.3928985595703125, -1.327117919921875, -1.2613372802734375, -1.195556640625, -1.1297760009765625, -1.063995361328125, -0.9982147216796875, -0.93243408203125, -0.8666534423828125, -0.800872802734375, -0.7350921630859375, -0.6693115234375, -0.6035308837890625, -0.537750244140625, -0.4719696044921875, -0.40618896484375, -0.3404083251953125, -0.274627685546875, -0.2088470458984375, -0.14306640625, -0.0772857666015625, -0.011505126953125, 0.0542755126953125, 0.12005615234375, 0.1858367919921875, 0.251617431640625, 0.3173980712890625, 0.3831787109375, 0.4489593505859375, 0.514739990234375, 0.5805206298828125, 0.64630126953125, 0.7120819091796875, 0.777862548828125, 0.8436431884765625, 0.909423828125, 0.9752044677734375, 1.040985107421875, 1.1067657470703125, 1.17254638671875, 1.2383270263671875, 1.304107666015625, 1.3698883056640625, 1.4356689453125, 1.5014495849609375, 1.567230224609375, 1.6330108642578125, 1.69879150390625, 1.7645721435546875, 1.830352783203125, 1.8961334228515625, 1.9619140625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 13.0, 14.0, 36.0, 27.0, 42.0, 71.0, 117.0, 157.0, 272.0, 492.0, 777.0, 1392.0, 2726.0, 5150.0, 11017.0, 26416.0, 71085.0, 245670.0, 2413950.0, 1133827.0, 183747.0, 56165.0, 21279.0, 9388.0, 4556.0, 2361.0, 1410.0, 820.0, 446.0, 314.0, 183.0, 118.0, 85.0, 54.0, 38.0, 26.0, 12.0, 11.0, 7.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.375, -10.0496826171875, -9.724365234375, -9.3990478515625, -9.07373046875, -8.7484130859375, -8.423095703125, -8.0977783203125, -7.7724609375, -7.4471435546875, -7.121826171875, -6.7965087890625, -6.47119140625, -6.1458740234375, -5.820556640625, -5.4952392578125, -5.169921875, -4.8446044921875, -4.519287109375, -4.1939697265625, -3.86865234375, -3.5433349609375, -3.218017578125, -2.8927001953125, -2.5673828125, -2.2420654296875, -1.916748046875, -1.5914306640625, -1.26611328125, -0.9407958984375, -0.615478515625, -0.2901611328125, 0.03515625, 0.3604736328125, 0.685791015625, 1.0111083984375, 1.33642578125, 1.6617431640625, 1.987060546875, 2.3123779296875, 2.6376953125, 2.9630126953125, 3.288330078125, 3.6136474609375, 3.93896484375, 4.2642822265625, 4.589599609375, 4.9149169921875, 5.240234375, 5.5655517578125, 5.890869140625, 6.2161865234375, 6.54150390625, 6.8668212890625, 7.192138671875, 7.5174560546875, 7.8427734375, 8.1680908203125, 8.493408203125, 8.8187255859375, 9.14404296875, 9.4693603515625, 9.794677734375, 10.1199951171875, 10.4453125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 5.0, 4.0, 4.0, 15.0, 19.0, 22.0, 31.0, 27.0, 51.0, 58.0, 84.0, 102.0, 188.0, 340.0, 793.0, 1163.0, 431.0, 238.0, 162.0, 95.0, 68.0, 36.0, 28.0, 21.0, 17.0, 11.0, 7.0, 15.0, 7.0, 3.0, 1.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.5703125, -3.46246337890625, -3.3546142578125, -3.24676513671875, -3.138916015625, -3.03106689453125, -2.9232177734375, -2.81536865234375, -2.70751953125, -2.59967041015625, -2.4918212890625, -2.38397216796875, -2.276123046875, -2.16827392578125, -2.0604248046875, -1.95257568359375, -1.8447265625, -1.73687744140625, -1.6290283203125, -1.52117919921875, -1.413330078125, -1.30548095703125, -1.1976318359375, -1.08978271484375, -0.98193359375, -0.87408447265625, -0.7662353515625, -0.65838623046875, -0.550537109375, -0.44268798828125, -0.3348388671875, -0.22698974609375, -0.119140625, -0.01129150390625, 0.0965576171875, 0.20440673828125, 0.312255859375, 0.42010498046875, 0.5279541015625, 0.63580322265625, 0.74365234375, 0.85150146484375, 0.9593505859375, 1.06719970703125, 1.175048828125, 1.28289794921875, 1.3907470703125, 1.49859619140625, 1.6064453125, 1.71429443359375, 1.8221435546875, 1.92999267578125, 2.037841796875, 2.14569091796875, 2.2535400390625, 2.36138916015625, 2.46923828125, 2.57708740234375, 2.6849365234375, 2.79278564453125, 2.900634765625, 3.00848388671875, 3.1163330078125, 3.22418212890625, 3.33203125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 9.0, 5.0, 17.0, 25.0, 63.0, 86.0, 123.0, 151.0, 144.0, 130.0, 97.0, 79.0, 35.0, 13.0, 13.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-49.85492706298828, -48.840660095214844, -47.82638931274414, -46.81211853027344, -45.7978515625, -44.78358459472656, -43.76931381225586, -42.755043029785156, -41.74077606201172, -40.72650909423828, -39.71223831176758, -38.697967529296875, -37.68370056152344, -36.66943359375, -35.6551628112793, -34.640892028808594, -33.626625061035156, -32.61235809326172, -31.598087310791016, -30.583818435668945, -29.569549560546875, -28.555280685424805, -27.541011810302734, -26.526742935180664, -25.512474060058594, -24.498205184936523, -23.483936309814453, -22.469667434692383, -21.455398559570312, -20.441129684448242, -19.426860809326172, -18.4125919342041, -17.39832305908203, -16.38405418395996, -15.36978530883789, -14.35551643371582, -13.34124755859375, -12.32697868347168, -11.31270980834961, -10.298440933227539, -9.284172058105469, -8.269903182983398, -7.255634307861328, -6.241365432739258, -5.2270965576171875, -4.212827682495117, -3.198558807373047, -2.1842899322509766, -1.1700210571289062, -0.15575218200683594, 0.8585166931152344, 1.8727855682373047, 2.887054443359375, 3.9013233184814453, 4.915592193603516, 5.929861068725586, 6.944129943847656, 7.958398818969727, 8.972667694091797, 9.986936569213867, 11.001205444335938, 12.015474319458008, 13.029743194580078, 14.044012069702148, 15.058280944824219]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 6.0, 3.0, 11.0, 16.0, 19.0, 34.0, 29.0, 31.0, 35.0, 52.0, 48.0, 59.0, 59.0, 59.0, 66.0, 55.0, 69.0, 55.0, 62.0, 51.0, 34.0, 38.0, 27.0, 19.0, 27.0, 12.0, 6.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.20915985107422, -23.619915008544922, -23.030668258666992, -22.441423416137695, -21.8521785736084, -21.2629337310791, -20.673686981201172, -20.084442138671875, -19.495197296142578, -18.90595245361328, -18.31670570373535, -17.727460861206055, -17.138216018676758, -16.54897117614746, -15.959724426269531, -15.370479583740234, -14.781233787536621, -14.191987991333008, -13.602743148803711, -13.013497352600098, -12.4242525100708, -11.835006713867188, -11.24576187133789, -10.656516075134277, -10.067270278930664, -9.47802448272705, -8.888779640197754, -8.29953384399414, -7.710289001464844, -7.1210432052612305, -6.531797885894775, -5.94255256652832, -5.353307723999023, -4.764062404632568, -4.174817085266113, -3.585571527481079, -2.996326208114624, -2.407080888748169, -1.8178353309631348, -1.2285900115966797, -0.6393446922302246, -0.050099313259124756, 0.5391460657119751, 1.1283915042877197, 1.7176368236541748, 2.30688214302063, 2.896127700805664, 3.485373020172119, 4.074618339538574, 4.663863658905029, 5.253108978271484, 5.842354774475098, 6.4315996170043945, 7.020845413208008, 7.610090732574463, 8.199336051940918, 8.788581848144531, 9.377827644348145, 9.967072486877441, 10.556318283081055, 11.145563125610352, 11.734808921813965, 12.324054718017578, 12.913299560546875, 13.502544403076172]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 6.0, 11.0, 7.0, 11.0, 19.0, 34.0, 40.0, 82.0, 118.0, 178.0, 274.0, 471.0, 816.0, 1451.0, 2513.0, 4575.0, 9051.0, 18303.0, 39898.0, 85764.0, 175518.0, 267942.0, 219913.0, 116496.0, 54529.0, 25034.0, 11878.0, 6078.0, 3153.0, 1804.0, 1017.0, 580.0, 359.0, 237.0, 155.0, 91.0, 45.0, 33.0, 19.0, 12.0, 10.0, 6.0, 4.0, 8.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.09375, -6.8699951171875, -6.646240234375, -6.4224853515625, -6.19873046875, -5.9749755859375, -5.751220703125, -5.5274658203125, -5.3037109375, -5.0799560546875, -4.856201171875, -4.6324462890625, -4.40869140625, -4.1849365234375, -3.961181640625, -3.7374267578125, -3.513671875, -3.2899169921875, -3.066162109375, -2.8424072265625, -2.61865234375, -2.3948974609375, -2.171142578125, -1.9473876953125, -1.7236328125, -1.4998779296875, -1.276123046875, -1.0523681640625, -0.82861328125, -0.6048583984375, -0.381103515625, -0.1573486328125, 0.06640625, 0.2901611328125, 0.513916015625, 0.7376708984375, 0.96142578125, 1.1851806640625, 1.408935546875, 1.6326904296875, 1.8564453125, 2.0802001953125, 2.303955078125, 2.5277099609375, 2.75146484375, 2.9752197265625, 3.198974609375, 3.4227294921875, 3.646484375, 3.8702392578125, 4.093994140625, 4.3177490234375, 4.54150390625, 4.7652587890625, 4.989013671875, 5.2127685546875, 5.4365234375, 5.6602783203125, 5.884033203125, 6.1077880859375, 6.33154296875, 6.5552978515625, 6.779052734375, 7.0028076171875, 7.2265625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 8.0, 6.0, 12.0, 6.0, 13.0, 19.0, 23.0, 22.0, 15.0, 27.0, 40.0, 40.0, 39.0, 47.0, 61.0, 57.0, 48.0, 51.0, 64.0, 56.0, 52.0, 44.0, 34.0, 36.0, 37.0, 31.0, 24.0, 16.0, 19.0, 9.0, 8.0, 12.0, 5.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0], "bins": [-2.068359375, -2.01104736328125, -1.9537353515625, -1.89642333984375, -1.839111328125, -1.78179931640625, -1.7244873046875, -1.66717529296875, -1.60986328125, -1.55255126953125, -1.4952392578125, -1.43792724609375, -1.380615234375, -1.32330322265625, -1.2659912109375, -1.20867919921875, -1.1513671875, -1.09405517578125, -1.0367431640625, -0.97943115234375, -0.922119140625, -0.86480712890625, -0.8074951171875, -0.75018310546875, -0.69287109375, -0.63555908203125, -0.5782470703125, -0.52093505859375, -0.463623046875, -0.40631103515625, -0.3489990234375, -0.29168701171875, -0.234375, -0.17706298828125, -0.1197509765625, -0.06243896484375, -0.005126953125, 0.05218505859375, 0.1094970703125, 0.16680908203125, 0.22412109375, 0.28143310546875, 0.3387451171875, 0.39605712890625, 0.453369140625, 0.51068115234375, 0.5679931640625, 0.62530517578125, 0.6826171875, 0.73992919921875, 0.7972412109375, 0.85455322265625, 0.911865234375, 0.96917724609375, 1.0264892578125, 1.08380126953125, 1.14111328125, 1.19842529296875, 1.2557373046875, 1.31304931640625, 1.370361328125, 1.42767333984375, 1.4849853515625, 1.54229736328125, 1.599609375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 5.0, 8.0, 9.0, 7.0, 11.0, 8.0, 20.0, 25.0, 24.0, 49.0, 71.0, 99.0, 120.0, 159.0, 209.0, 275.0, 462.0, 711.0, 1291.0, 2642.0, 6015.0, 15805.0, 45176.0, 133180.0, 313255.0, 317818.0, 136205.0, 46561.0, 16087.0, 6129.0, 2567.0, 1312.0, 710.0, 457.0, 301.0, 195.0, 150.0, 119.0, 79.0, 50.0, 45.0, 36.0, 22.0, 23.0, 18.0, 14.0, 5.0, 7.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-8.453125, -8.1805419921875, -7.907958984375, -7.6353759765625, -7.36279296875, -7.0902099609375, -6.817626953125, -6.5450439453125, -6.2724609375, -5.9998779296875, -5.727294921875, -5.4547119140625, -5.18212890625, -4.9095458984375, -4.636962890625, -4.3643798828125, -4.091796875, -3.8192138671875, -3.546630859375, -3.2740478515625, -3.00146484375, -2.7288818359375, -2.456298828125, -2.1837158203125, -1.9111328125, -1.6385498046875, -1.365966796875, -1.0933837890625, -0.82080078125, -0.5482177734375, -0.275634765625, -0.0030517578125, 0.26953125, 0.5421142578125, 0.814697265625, 1.0872802734375, 1.35986328125, 1.6324462890625, 1.905029296875, 2.1776123046875, 2.4501953125, 2.7227783203125, 2.995361328125, 3.2679443359375, 3.54052734375, 3.8131103515625, 4.085693359375, 4.3582763671875, 4.630859375, 4.9034423828125, 5.176025390625, 5.4486083984375, 5.72119140625, 5.9937744140625, 6.266357421875, 6.5389404296875, 6.8115234375, 7.0841064453125, 7.356689453125, 7.6292724609375, 7.90185546875, 8.1744384765625, 8.447021484375, 8.7196044921875, 8.9921875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 6.0, 3.0, 10.0, 8.0, 13.0, 15.0, 20.0, 19.0, 20.0, 20.0, 27.0, 32.0, 43.0, 34.0, 39.0, 39.0, 48.0, 42.0, 46.0, 37.0, 51.0, 37.0, 37.0, 34.0, 37.0, 32.0, 29.0, 29.0, 36.0, 29.0, 13.0, 24.0, 20.0, 10.0, 21.0, 13.0, 5.0, 8.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0703125, -6.83978271484375, -6.6092529296875, -6.37872314453125, -6.148193359375, -5.91766357421875, -5.6871337890625, -5.45660400390625, -5.22607421875, -4.99554443359375, -4.7650146484375, -4.53448486328125, -4.303955078125, -4.07342529296875, -3.8428955078125, -3.61236572265625, -3.3818359375, -3.15130615234375, -2.9207763671875, -2.69024658203125, -2.459716796875, -2.22918701171875, -1.9986572265625, -1.76812744140625, -1.53759765625, -1.30706787109375, -1.0765380859375, -0.84600830078125, -0.615478515625, -0.38494873046875, -0.1544189453125, 0.07611083984375, 0.306640625, 0.53717041015625, 0.7677001953125, 0.99822998046875, 1.228759765625, 1.45928955078125, 1.6898193359375, 1.92034912109375, 2.15087890625, 2.38140869140625, 2.6119384765625, 2.84246826171875, 3.072998046875, 3.30352783203125, 3.5340576171875, 3.76458740234375, 3.9951171875, 4.22564697265625, 4.4561767578125, 4.68670654296875, 4.917236328125, 5.14776611328125, 5.3782958984375, 5.60882568359375, 5.83935546875, 6.06988525390625, 6.3004150390625, 6.53094482421875, 6.761474609375, 6.99200439453125, 7.2225341796875, 7.45306396484375, 7.68359375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 6.0, 8.0, 20.0, 12.0, 16.0, 25.0, 32.0, 46.0, 97.0, 110.0, 230.0, 332.0, 620.0, 1195.0, 2501.0, 6187.0, 16943.0, 57421.0, 226527.0, 461882.0, 198050.0, 50509.0, 15345.0, 5418.0, 2378.0, 1102.0, 592.0, 351.0, 217.0, 110.0, 78.0, 56.0, 37.0, 23.0, 15.0, 15.0, 11.0, 10.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.31640625, -6.133056640625, -5.94970703125, -5.766357421875, -5.5830078125, -5.399658203125, -5.21630859375, -5.032958984375, -4.849609375, -4.666259765625, -4.48291015625, -4.299560546875, -4.1162109375, -3.932861328125, -3.74951171875, -3.566162109375, -3.3828125, -3.199462890625, -3.01611328125, -2.832763671875, -2.6494140625, -2.466064453125, -2.28271484375, -2.099365234375, -1.916015625, -1.732666015625, -1.54931640625, -1.365966796875, -1.1826171875, -0.999267578125, -0.81591796875, -0.632568359375, -0.44921875, -0.265869140625, -0.08251953125, 0.100830078125, 0.2841796875, 0.467529296875, 0.65087890625, 0.834228515625, 1.017578125, 1.200927734375, 1.38427734375, 1.567626953125, 1.7509765625, 1.934326171875, 2.11767578125, 2.301025390625, 2.484375, 2.667724609375, 2.85107421875, 3.034423828125, 3.2177734375, 3.401123046875, 3.58447265625, 3.767822265625, 3.951171875, 4.134521484375, 4.31787109375, 4.501220703125, 4.6845703125, 4.867919921875, 5.05126953125, 5.234619140625, 5.41796875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 3.0, 2.0, 6.0, 4.0, 1.0, 6.0, 9.0, 4.0, 12.0, 15.0, 18.0, 28.0, 45.0, 60.0, 90.0, 100.0, 129.0, 119.0, 89.0, 67.0, 52.0, 36.0, 25.0, 21.0, 17.0, 10.0, 9.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0010824203491210938, -0.0010512322187423706, -0.0010200440883636475, -0.0009888559579849243, -0.0009576678276062012, -0.000926479697227478, -0.0008952915668487549, -0.0008641034364700317, -0.0008329153060913086, -0.0008017271757125854, -0.0007705390453338623, -0.0007393509149551392, -0.000708162784576416, -0.0006769746541976929, -0.0006457865238189697, -0.0006145983934402466, -0.0005834102630615234, -0.0005522221326828003, -0.0005210340023040771, -0.000489845871925354, -0.00045865774154663086, -0.0004274696111679077, -0.00039628148078918457, -0.0003650933504104614, -0.0003339052200317383, -0.00030271708965301514, -0.000271528959274292, -0.00024034082889556885, -0.0002091526985168457, -0.00017796456813812256, -0.00014677643775939941, -0.00011558830738067627, -8.440017700195312e-05, -5.321204662322998e-05, -2.2023916244506836e-05, 9.164214134216309e-06, 4.035234451293945e-05, 7.15404748916626e-05, 0.00010272860527038574, 0.0001339167356491089, 0.00016510486602783203, 0.00019629299640655518, 0.00022748112678527832, 0.00025866925716400146, 0.0002898573875427246, 0.00032104551792144775, 0.0003522336483001709, 0.00038342177867889404, 0.0004146099090576172, 0.00044579803943634033, 0.0004769861698150635, 0.0005081743001937866, 0.0005393624305725098, 0.0005705505609512329, 0.0006017386913299561, 0.0006329268217086792, 0.0006641149520874023, 0.0006953030824661255, 0.0007264912128448486, 0.0007576793432235718, 0.0007888674736022949, 0.0008200556039810181, 0.0008512437343597412, 0.0008824318647384644, 0.0009136199951171875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 5.0, 14.0, 17.0, 29.0, 69.0, 156.0, 432.0, 1366.0, 6219.0, 62667.0, 798406.0, 164916.0, 11173.0, 2031.0, 633.0, 208.0, 102.0, 42.0, 27.0, 19.0, 8.0, 9.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0078125, -13.5189208984375, -13.030029296875, -12.5411376953125, -12.05224609375, -11.5633544921875, -11.074462890625, -10.5855712890625, -10.0966796875, -9.6077880859375, -9.118896484375, -8.6300048828125, -8.14111328125, -7.6522216796875, -7.163330078125, -6.6744384765625, -6.185546875, -5.6966552734375, -5.207763671875, -4.7188720703125, -4.22998046875, -3.7410888671875, -3.252197265625, -2.7633056640625, -2.2744140625, -1.7855224609375, -1.296630859375, -0.8077392578125, -0.31884765625, 0.1700439453125, 0.658935546875, 1.1478271484375, 1.63671875, 2.1256103515625, 2.614501953125, 3.1033935546875, 3.59228515625, 4.0811767578125, 4.570068359375, 5.0589599609375, 5.5478515625, 6.0367431640625, 6.525634765625, 7.0145263671875, 7.50341796875, 7.9923095703125, 8.481201171875, 8.9700927734375, 9.458984375, 9.9478759765625, 10.436767578125, 10.9256591796875, 11.41455078125, 11.9034423828125, 12.392333984375, 12.8812255859375, 13.3701171875, 13.8590087890625, 14.347900390625, 14.8367919921875, 15.32568359375, 15.8145751953125, 16.303466796875, 16.7923583984375, 17.28125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 9.0, 14.0, 9.0, 8.0, 26.0, 36.0, 43.0, 62.0, 80.0, 80.0, 85.0, 110.0, 91.0, 70.0, 84.0, 45.0, 38.0, 28.0, 21.0, 10.0, 10.0, 11.0, 5.0, 4.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.67578125, -4.50274658203125, -4.3297119140625, -4.15667724609375, -3.983642578125, -3.81060791015625, -3.6375732421875, -3.46453857421875, -3.29150390625, -3.11846923828125, -2.9454345703125, -2.77239990234375, -2.599365234375, -2.42633056640625, -2.2532958984375, -2.08026123046875, -1.9072265625, -1.73419189453125, -1.5611572265625, -1.38812255859375, -1.215087890625, -1.04205322265625, -0.8690185546875, -0.69598388671875, -0.52294921875, -0.34991455078125, -0.1768798828125, -0.00384521484375, 0.169189453125, 0.34222412109375, 0.5152587890625, 0.68829345703125, 0.861328125, 1.03436279296875, 1.2073974609375, 1.38043212890625, 1.553466796875, 1.72650146484375, 1.8995361328125, 2.07257080078125, 2.24560546875, 2.41864013671875, 2.5916748046875, 2.76470947265625, 2.937744140625, 3.11077880859375, 3.2838134765625, 3.45684814453125, 3.6298828125, 3.80291748046875, 3.9759521484375, 4.14898681640625, 4.322021484375, 4.49505615234375, 4.6680908203125, 4.84112548828125, 5.01416015625, 5.18719482421875, 5.3602294921875, 5.53326416015625, 5.706298828125, 5.87933349609375, 6.0523681640625, 6.22540283203125, 6.3984375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 16.0, 14.0, 19.0, 27.0, 44.0, 64.0, 102.0, 121.0, 120.0, 119.0, 109.0, 86.0, 53.0, 38.0, 21.0, 15.0, 15.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-60.699615478515625, -58.52817153930664, -56.35673141479492, -54.18528747558594, -52.01384735107422, -49.842403411865234, -47.67095947265625, -45.49951934814453, -43.32807922363281, -41.15663528442383, -38.98519515991211, -36.813751220703125, -34.642311096191406, -32.47086715698242, -30.29942512512207, -28.12798309326172, -25.956539154052734, -23.785097122192383, -21.61365509033203, -19.442211151123047, -17.270771026611328, -15.09932804107666, -12.927885055541992, -10.75644302368164, -8.585000991821289, -6.4135589599609375, -4.242116451263428, -2.070673942565918, 0.1007680892944336, 2.272210121154785, 4.443653106689453, 6.615095138549805, 8.786537170410156, 10.957979202270508, 13.12942123413086, 15.300864219665527, 17.472305297851562, 19.643749237060547, 21.8151912689209, 23.98663330078125, 26.1580753326416, 28.329517364501953, 30.500959396362305, 32.672401428222656, 34.84384536743164, 37.01528549194336, 39.186729431152344, 41.35816955566406, 43.52961349487305, 45.70105743408203, 47.87249755859375, 50.043941497802734, 52.21538162231445, 54.38682556152344, 56.558265686035156, 58.72970962524414, 60.901153564453125, 63.07259750366211, 65.2440414428711, 67.41548156738281, 69.58692169189453, 71.75836181640625, 73.9298095703125, 76.10124969482422, 78.27268981933594]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 7.0, 6.0, 10.0, 17.0, 15.0, 22.0, 16.0, 26.0, 41.0, 46.0, 43.0, 50.0, 47.0, 61.0, 49.0, 61.0, 51.0, 42.0, 54.0, 60.0, 52.0, 34.0, 31.0, 35.0, 35.0, 18.0, 17.0, 10.0, 23.0, 1.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-58.58982467651367, -56.99394989013672, -55.3980712890625, -53.80219650268555, -52.206321716308594, -50.610443115234375, -49.01456832885742, -47.41869354248047, -45.82281494140625, -44.2269401550293, -42.63106155395508, -41.035186767578125, -39.43931198120117, -37.84343719482422, -36.24755859375, -34.65168380737305, -33.055809020996094, -31.459932327270508, -29.864057540893555, -28.26818084716797, -26.672306060791016, -25.07642936706543, -23.480552673339844, -21.88467788696289, -20.288801193237305, -18.69292449951172, -17.097049713134766, -15.50117301940918, -13.90529727935791, -12.30942153930664, -10.713544845581055, -9.117669105529785, -7.521797180175781, -5.925921440124512, -4.330045223236084, -2.7341690063476562, -1.1382932662963867, 0.4575824737548828, 2.0534591674804688, 3.6493349075317383, 5.245210647583008, 6.841086387634277, 8.436962127685547, 10.032838821411133, 11.628714561462402, 13.224590301513672, 14.820466995239258, 16.416343688964844, 18.012218475341797, 19.608095169067383, 21.203969955444336, 22.799846649169922, 24.395721435546875, 25.99159812927246, 27.587474822998047, 29.183349609375, 30.779226303100586, 32.37510299682617, 33.970977783203125, 35.566856384277344, 37.1627311706543, 38.75860595703125, 40.35448455810547, 41.95035934448242, 43.546234130859375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 5.0, 7.0, 20.0, 15.0, 21.0, 34.0, 52.0, 72.0, 111.0, 174.0, 276.0, 498.0, 886.0, 1595.0, 3173.0, 6736.0, 15876.0, 43251.0, 157655.0, 1889351.0, 1845506.0, 157224.0, 42761.0, 15632.0, 6533.0, 3185.0, 1593.0, 784.0, 455.0, 281.0, 193.0, 123.0, 68.0, 42.0, 23.0, 20.0, 17.0, 15.0, 6.0, 5.0, 8.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.8359375, -12.4793701171875, -12.122802734375, -11.7662353515625, -11.40966796875, -11.0531005859375, -10.696533203125, -10.3399658203125, -9.9833984375, -9.6268310546875, -9.270263671875, -8.9136962890625, -8.55712890625, -8.2005615234375, -7.843994140625, -7.4874267578125, -7.130859375, -6.7742919921875, -6.417724609375, -6.0611572265625, -5.70458984375, -5.3480224609375, -4.991455078125, -4.6348876953125, -4.2783203125, -3.9217529296875, -3.565185546875, -3.2086181640625, -2.85205078125, -2.4954833984375, -2.138916015625, -1.7823486328125, -1.42578125, -1.0692138671875, -0.712646484375, -0.3560791015625, 0.00048828125, 0.3570556640625, 0.713623046875, 1.0701904296875, 1.4267578125, 1.7833251953125, 2.139892578125, 2.4964599609375, 2.85302734375, 3.2095947265625, 3.566162109375, 3.9227294921875, 4.279296875, 4.6358642578125, 4.992431640625, 5.3489990234375, 5.70556640625, 6.0621337890625, 6.418701171875, 6.7752685546875, 7.1318359375, 7.4884033203125, 7.844970703125, 8.2015380859375, 8.55810546875, 8.9146728515625, 9.271240234375, 9.6278076171875, 9.984375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 9.0, 4.0, 13.0, 14.0, 20.0, 12.0, 18.0, 42.0, 37.0, 29.0, 27.0, 35.0, 53.0, 54.0, 62.0, 65.0, 64.0, 56.0, 62.0, 45.0, 40.0, 35.0, 38.0, 44.0, 16.0, 25.0, 12.0, 14.0, 11.0, 14.0, 5.0, 5.0, 6.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.013671875, -1.95428466796875, -1.8948974609375, -1.83551025390625, -1.776123046875, -1.71673583984375, -1.6573486328125, -1.59796142578125, -1.53857421875, -1.47918701171875, -1.4197998046875, -1.36041259765625, -1.301025390625, -1.24163818359375, -1.1822509765625, -1.12286376953125, -1.0634765625, -1.00408935546875, -0.9447021484375, -0.88531494140625, -0.825927734375, -0.76654052734375, -0.7071533203125, -0.64776611328125, -0.58837890625, -0.52899169921875, -0.4696044921875, -0.41021728515625, -0.350830078125, -0.29144287109375, -0.2320556640625, -0.17266845703125, -0.11328125, -0.05389404296875, 0.0054931640625, 0.06488037109375, 0.124267578125, 0.18365478515625, 0.2430419921875, 0.30242919921875, 0.36181640625, 0.42120361328125, 0.4805908203125, 0.53997802734375, 0.599365234375, 0.65875244140625, 0.7181396484375, 0.77752685546875, 0.8369140625, 0.89630126953125, 0.9556884765625, 1.01507568359375, 1.074462890625, 1.13385009765625, 1.1932373046875, 1.25262451171875, 1.31201171875, 1.37139892578125, 1.4307861328125, 1.49017333984375, 1.549560546875, 1.60894775390625, 1.6683349609375, 1.72772216796875, 1.787109375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 10.0, 6.0, 16.0, 18.0, 12.0, 21.0, 35.0, 60.0, 69.0, 118.0, 215.0, 354.0, 600.0, 1062.0, 2406.0, 6875.0, 25685.0, 132507.0, 1690068.0, 2149963.0, 144573.0, 27174.0, 7183.0, 2493.0, 1081.0, 583.0, 362.0, 230.0, 144.0, 119.0, 58.0, 54.0, 38.0, 23.0, 17.0, 12.0, 8.0, 6.0, 8.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.9140625, -12.4691162109375, -12.024169921875, -11.5792236328125, -11.13427734375, -10.6893310546875, -10.244384765625, -9.7994384765625, -9.3544921875, -8.9095458984375, -8.464599609375, -8.0196533203125, -7.57470703125, -7.1297607421875, -6.684814453125, -6.2398681640625, -5.794921875, -5.3499755859375, -4.905029296875, -4.4600830078125, -4.01513671875, -3.5701904296875, -3.125244140625, -2.6802978515625, -2.2353515625, -1.7904052734375, -1.345458984375, -0.9005126953125, -0.45556640625, -0.0106201171875, 0.434326171875, 0.8792724609375, 1.32421875, 1.7691650390625, 2.214111328125, 2.6590576171875, 3.10400390625, 3.5489501953125, 3.993896484375, 4.4388427734375, 4.8837890625, 5.3287353515625, 5.773681640625, 6.2186279296875, 6.66357421875, 7.1085205078125, 7.553466796875, 7.9984130859375, 8.443359375, 8.8883056640625, 9.333251953125, 9.7781982421875, 10.22314453125, 10.6680908203125, 11.113037109375, 11.5579833984375, 12.0029296875, 12.4478759765625, 12.892822265625, 13.3377685546875, 13.78271484375, 14.2276611328125, 14.672607421875, 15.1175537109375, 15.5625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 11.0, 20.0, 20.0, 46.0, 65.0, 109.0, 186.0, 396.0, 989.0, 1270.0, 459.0, 208.0, 124.0, 68.0, 32.0, 28.0, 20.0, 7.0, 8.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.234375, -5.0172119140625, -4.800048828125, -4.5828857421875, -4.36572265625, -4.1485595703125, -3.931396484375, -3.7142333984375, -3.4970703125, -3.2799072265625, -3.062744140625, -2.8455810546875, -2.62841796875, -2.4112548828125, -2.194091796875, -1.9769287109375, -1.759765625, -1.5426025390625, -1.325439453125, -1.1082763671875, -0.89111328125, -0.6739501953125, -0.456787109375, -0.2396240234375, -0.0224609375, 0.1947021484375, 0.411865234375, 0.6290283203125, 0.84619140625, 1.0633544921875, 1.280517578125, 1.4976806640625, 1.71484375, 1.9320068359375, 2.149169921875, 2.3663330078125, 2.58349609375, 2.8006591796875, 3.017822265625, 3.2349853515625, 3.4521484375, 3.6693115234375, 3.886474609375, 4.1036376953125, 4.32080078125, 4.5379638671875, 4.755126953125, 4.9722900390625, 5.189453125, 5.4066162109375, 5.623779296875, 5.8409423828125, 6.05810546875, 6.2752685546875, 6.492431640625, 6.7095947265625, 6.9267578125, 7.1439208984375, 7.361083984375, 7.5782470703125, 7.79541015625, 8.0125732421875, 8.229736328125, 8.4468994140625, 8.6640625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 17.0, 20.0, 31.0, 48.0, 72.0, 120.0, 133.0, 156.0, 154.0, 98.0, 63.0, 33.0, 26.0, 9.0, 3.0, 4.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.974544525146484, -38.56621551513672, -37.15789031982422, -35.74956512451172, -34.34123611450195, -32.93290710449219, -31.524581909179688, -30.116254806518555, -28.707927703857422, -27.29960060119629, -25.891273498535156, -24.482946395874023, -23.07461929321289, -21.666292190551758, -20.257965087890625, -18.849637985229492, -17.44131088256836, -16.032983779907227, -14.624656677246094, -13.216329574584961, -11.808002471923828, -10.399675369262695, -8.991348266601562, -7.58302116394043, -6.174694061279297, -4.766366958618164, -3.3580398559570312, -1.9497127532958984, -0.5413856506347656, 0.8669414520263672, 2.2752685546875, 3.683595657348633, 5.091926574707031, 6.500253677368164, 7.908580780029297, 9.31690788269043, 10.725234985351562, 12.133562088012695, 13.541889190673828, 14.950216293334961, 16.358543395996094, 17.766870498657227, 19.17519760131836, 20.583524703979492, 21.991851806640625, 23.400178909301758, 24.80850601196289, 26.216833114624023, 27.625160217285156, 29.03348731994629, 30.441814422607422, 31.850141525268555, 33.25846862792969, 34.66679382324219, 36.07512283325195, 37.48345184326172, 38.89177703857422, 40.30010223388672, 41.708431243896484, 43.11676025390625, 44.52508544921875, 45.93341064453125, 47.341739654541016, 48.75006866455078, 50.15839385986328]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 2.0, 7.0, 8.0, 5.0, 13.0, 14.0, 15.0, 18.0, 14.0, 17.0, 32.0, 28.0, 34.0, 42.0, 35.0, 53.0, 31.0, 43.0, 32.0, 55.0, 42.0, 60.0, 55.0, 40.0, 39.0, 30.0, 33.0, 30.0, 28.0, 20.0, 19.0, 23.0, 13.0, 16.0, 12.0, 8.0, 8.0, 10.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.589323043823242, -16.017658233642578, -15.44599437713623, -14.874330520629883, -14.302665710449219, -13.731000900268555, -13.159337043762207, -12.58767318725586, -12.016008377075195, -11.444343566894531, -10.872679710388184, -10.301015853881836, -9.729351043701172, -9.157686233520508, -8.58602237701416, -8.014358520507812, -7.442693710327148, -6.871029376983643, -6.299365043640137, -5.727700710296631, -5.156036376953125, -4.584372043609619, -4.012707710266113, -3.4410433769226074, -2.8693790435791016, -2.2977147102355957, -1.7260503768920898, -1.154386043548584, -0.5827217102050781, -0.011057376861572266, 0.5606069564819336, 1.1322712898254395, 1.7039375305175781, 2.275601863861084, 2.84726619720459, 3.4189305305480957, 3.9905948638916016, 4.562259197235107, 5.133923530578613, 5.705587863922119, 6.277252197265625, 6.848916530609131, 7.420580863952637, 7.992245197296143, 8.563909530639648, 9.135574340820312, 9.70723819732666, 10.278902053833008, 10.850566864013672, 11.422231674194336, 11.993895530700684, 12.565559387207031, 13.137224197387695, 13.70888900756836, 14.280552864074707, 14.852216720581055, 15.423881530761719, 15.995546340942383, 16.567211151123047, 17.138874053955078, 17.710538864135742, 18.282203674316406, 18.853866577148438, 19.4255313873291, 19.997196197509766]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 8.0, 12.0, 25.0, 36.0, 69.0, 97.0, 180.0, 325.0, 644.0, 1231.0, 2746.0, 6725.0, 17982.0, 51486.0, 150126.0, 388346.0, 278851.0, 96531.0, 32949.0, 11659.0, 4592.0, 1908.0, 904.0, 502.0, 260.0, 138.0, 78.0, 48.0, 31.0, 28.0, 13.0, 5.0, 10.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.1640625, -13.80810546875, -13.4521484375, -13.09619140625, -12.740234375, -12.38427734375, -12.0283203125, -11.67236328125, -11.31640625, -10.96044921875, -10.6044921875, -10.24853515625, -9.892578125, -9.53662109375, -9.1806640625, -8.82470703125, -8.46875, -8.11279296875, -7.7568359375, -7.40087890625, -7.044921875, -6.68896484375, -6.3330078125, -5.97705078125, -5.62109375, -5.26513671875, -4.9091796875, -4.55322265625, -4.197265625, -3.84130859375, -3.4853515625, -3.12939453125, -2.7734375, -2.41748046875, -2.0615234375, -1.70556640625, -1.349609375, -0.99365234375, -0.6376953125, -0.28173828125, 0.07421875, 0.43017578125, 0.7861328125, 1.14208984375, 1.498046875, 1.85400390625, 2.2099609375, 2.56591796875, 2.921875, 3.27783203125, 3.6337890625, 3.98974609375, 4.345703125, 4.70166015625, 5.0576171875, 5.41357421875, 5.76953125, 6.12548828125, 6.4814453125, 6.83740234375, 7.193359375, 7.54931640625, 7.9052734375, 8.26123046875, 8.6171875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 8.0, 9.0, 7.0, 11.0, 14.0, 14.0, 17.0, 22.0, 24.0, 35.0, 34.0, 45.0, 38.0, 54.0, 56.0, 47.0, 48.0, 53.0, 58.0, 43.0, 53.0, 52.0, 41.0, 41.0, 22.0, 26.0, 23.0, 19.0, 22.0, 15.0, 10.0, 8.0, 4.0, 5.0, 1.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6806640625, -1.6247711181640625, -1.568878173828125, -1.5129852294921875, -1.45709228515625, -1.4011993408203125, -1.345306396484375, -1.2894134521484375, -1.2335205078125, -1.1776275634765625, -1.121734619140625, -1.0658416748046875, -1.00994873046875, -0.9540557861328125, -0.898162841796875, -0.8422698974609375, -0.786376953125, -0.7304840087890625, -0.674591064453125, -0.6186981201171875, -0.56280517578125, -0.5069122314453125, -0.451019287109375, -0.3951263427734375, -0.3392333984375, -0.2833404541015625, -0.227447509765625, -0.1715545654296875, -0.11566162109375, -0.0597686767578125, -0.003875732421875, 0.0520172119140625, 0.10791015625, 0.1638031005859375, 0.219696044921875, 0.2755889892578125, 0.33148193359375, 0.3873748779296875, 0.443267822265625, 0.4991607666015625, 0.5550537109375, 0.6109466552734375, 0.666839599609375, 0.7227325439453125, 0.77862548828125, 0.8345184326171875, 0.890411376953125, 0.9463043212890625, 1.002197265625, 1.0580902099609375, 1.113983154296875, 1.1698760986328125, 1.22576904296875, 1.2816619873046875, 1.337554931640625, 1.3934478759765625, 1.4493408203125, 1.5052337646484375, 1.561126708984375, 1.6170196533203125, 1.67291259765625, 1.7288055419921875, 1.784698486328125, 1.8405914306640625, 1.896484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 8.0, 7.0, 8.0, 16.0, 20.0, 23.0, 41.0, 40.0, 65.0, 79.0, 120.0, 156.0, 265.0, 407.0, 639.0, 1025.0, 1996.0, 4000.0, 8615.0, 20133.0, 49137.0, 117932.0, 273958.0, 317045.0, 146545.0, 60440.0, 25108.0, 10564.0, 4616.0, 2287.0, 1186.0, 754.0, 426.0, 265.0, 194.0, 122.0, 94.0, 49.0, 42.0, 37.0, 34.0, 17.0, 12.0, 11.0, 10.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.24609375, -7.0205078125, -6.794921875, -6.5693359375, -6.34375, -6.1181640625, -5.892578125, -5.6669921875, -5.44140625, -5.2158203125, -4.990234375, -4.7646484375, -4.5390625, -4.3134765625, -4.087890625, -3.8623046875, -3.63671875, -3.4111328125, -3.185546875, -2.9599609375, -2.734375, -2.5087890625, -2.283203125, -2.0576171875, -1.83203125, -1.6064453125, -1.380859375, -1.1552734375, -0.9296875, -0.7041015625, -0.478515625, -0.2529296875, -0.02734375, 0.1982421875, 0.423828125, 0.6494140625, 0.875, 1.1005859375, 1.326171875, 1.5517578125, 1.77734375, 2.0029296875, 2.228515625, 2.4541015625, 2.6796875, 2.9052734375, 3.130859375, 3.3564453125, 3.58203125, 3.8076171875, 4.033203125, 4.2587890625, 4.484375, 4.7099609375, 4.935546875, 5.1611328125, 5.38671875, 5.6123046875, 5.837890625, 6.0634765625, 6.2890625, 6.5146484375, 6.740234375, 6.9658203125, 7.19140625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 3.0, 3.0, 8.0, 8.0, 10.0, 15.0, 19.0, 17.0, 29.0, 25.0, 30.0, 35.0, 44.0, 30.0, 39.0, 50.0, 46.0, 44.0, 46.0, 45.0, 46.0, 45.0, 46.0, 44.0, 37.0, 41.0, 34.0, 33.0, 23.0, 24.0, 16.0, 14.0, 12.0, 5.0, 12.0, 6.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0], "bins": [-8.4453125, -8.20184326171875, -7.9583740234375, -7.71490478515625, -7.471435546875, -7.22796630859375, -6.9844970703125, -6.74102783203125, -6.49755859375, -6.25408935546875, -6.0106201171875, -5.76715087890625, -5.523681640625, -5.28021240234375, -5.0367431640625, -4.79327392578125, -4.5498046875, -4.30633544921875, -4.0628662109375, -3.81939697265625, -3.575927734375, -3.33245849609375, -3.0889892578125, -2.84552001953125, -2.60205078125, -2.35858154296875, -2.1151123046875, -1.87164306640625, -1.628173828125, -1.38470458984375, -1.1412353515625, -0.89776611328125, -0.654296875, -0.41082763671875, -0.1673583984375, 0.07611083984375, 0.319580078125, 0.56304931640625, 0.8065185546875, 1.04998779296875, 1.29345703125, 1.53692626953125, 1.7803955078125, 2.02386474609375, 2.267333984375, 2.51080322265625, 2.7542724609375, 2.99774169921875, 3.2412109375, 3.48468017578125, 3.7281494140625, 3.97161865234375, 4.215087890625, 4.45855712890625, 4.7020263671875, 4.94549560546875, 5.18896484375, 5.43243408203125, 5.6759033203125, 5.91937255859375, 6.162841796875, 6.40631103515625, 6.6497802734375, 6.89324951171875, 7.13671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 6.0, 16.0, 11.0, 15.0, 28.0, 31.0, 51.0, 61.0, 90.0, 131.0, 189.0, 335.0, 513.0, 883.0, 1681.0, 3164.0, 6885.0, 15546.0, 39867.0, 108398.0, 286047.0, 347353.0, 146058.0, 53318.0, 20671.0, 8580.0, 3901.0, 1991.0, 1003.0, 604.0, 371.0, 253.0, 160.0, 111.0, 60.0, 60.0, 31.0, 20.0, 23.0, 9.0, 6.0, 9.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.982421875, -3.862274169921875, -3.74212646484375, -3.621978759765625, -3.5018310546875, -3.381683349609375, -3.26153564453125, -3.141387939453125, -3.021240234375, -2.901092529296875, -2.78094482421875, -2.660797119140625, -2.5406494140625, -2.420501708984375, -2.30035400390625, -2.180206298828125, -2.06005859375, -1.939910888671875, -1.81976318359375, -1.699615478515625, -1.5794677734375, -1.459320068359375, -1.33917236328125, -1.219024658203125, -1.098876953125, -0.978729248046875, -0.85858154296875, -0.738433837890625, -0.6182861328125, -0.498138427734375, -0.37799072265625, -0.257843017578125, -0.1376953125, -0.017547607421875, 0.10260009765625, 0.222747802734375, 0.3428955078125, 0.463043212890625, 0.58319091796875, 0.703338623046875, 0.823486328125, 0.943634033203125, 1.06378173828125, 1.183929443359375, 1.3040771484375, 1.424224853515625, 1.54437255859375, 1.664520263671875, 1.78466796875, 1.904815673828125, 2.02496337890625, 2.145111083984375, 2.2652587890625, 2.385406494140625, 2.50555419921875, 2.625701904296875, 2.745849609375, 2.865997314453125, 2.98614501953125, 3.106292724609375, 3.2264404296875, 3.346588134765625, 3.46673583984375, 3.586883544921875, 3.70703125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 10.0, 7.0, 16.0, 12.0, 27.0, 22.0, 33.0, 45.0, 59.0, 102.0, 130.0, 148.0, 103.0, 75.0, 34.0, 34.0, 28.0, 29.0, 16.0, 11.0, 13.0, 8.0, 8.0, 7.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00084686279296875, -0.0008221343159675598, -0.0007974058389663696, -0.0007726773619651794, -0.0007479488849639893, -0.0007232204079627991, -0.0006984919309616089, -0.0006737634539604187, -0.0006490349769592285, -0.0006243064999580383, -0.0005995780229568481, -0.000574849545955658, -0.0005501210689544678, -0.0005253925919532776, -0.0005006641149520874, -0.0004759356379508972, -0.00045120716094970703, -0.00042647868394851685, -0.00040175020694732666, -0.0003770217299461365, -0.0003522932529449463, -0.0003275647759437561, -0.0003028362989425659, -0.00027810782194137573, -0.00025337934494018555, -0.00022865086793899536, -0.00020392239093780518, -0.000179193913936615, -0.0001544654369354248, -0.00012973695993423462, -0.00010500848293304443, -8.028000593185425e-05, -5.555152893066406e-05, -3.082305192947388e-05, -6.094574928283691e-06, 1.8633902072906494e-05, 4.336237907409668e-05, 6.809085607528687e-05, 9.281933307647705e-05, 0.00011754781007766724, 0.00014227628707885742, 0.0001670047640800476, 0.0001917332410812378, 0.00021646171808242798, 0.00024119019508361816, 0.00026591867208480835, 0.00029064714908599854, 0.0003153756260871887, 0.0003401041030883789, 0.0003648325800895691, 0.0003895610570907593, 0.00041428953409194946, 0.00043901801109313965, 0.00046374648809432983, 0.00048847496509552, 0.0005132034420967102, 0.0005379319190979004, 0.0005626603960990906, 0.0005873888731002808, 0.000612117350101471, 0.0006368458271026611, 0.0006615743041038513, 0.0006863027811050415, 0.0007110312581062317, 0.0007357597351074219]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 7.0, 7.0, 16.0, 11.0, 26.0, 25.0, 44.0, 54.0, 89.0, 135.0, 240.0, 361.0, 592.0, 1066.0, 1820.0, 3710.0, 8037.0, 20179.0, 58492.0, 188818.0, 416795.0, 231820.0, 72578.0, 24580.0, 9592.0, 4209.0, 2230.0, 1215.0, 678.0, 373.0, 237.0, 156.0, 96.0, 79.0, 48.0, 39.0, 25.0, 21.0, 17.0, 10.0, 7.0, 5.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-4.53125, -4.3878173828125, -4.244384765625, -4.1009521484375, -3.95751953125, -3.8140869140625, -3.670654296875, -3.5272216796875, -3.3837890625, -3.2403564453125, -3.096923828125, -2.9534912109375, -2.81005859375, -2.6666259765625, -2.523193359375, -2.3797607421875, -2.236328125, -2.0928955078125, -1.949462890625, -1.8060302734375, -1.66259765625, -1.5191650390625, -1.375732421875, -1.2322998046875, -1.0888671875, -0.9454345703125, -0.802001953125, -0.6585693359375, -0.51513671875, -0.3717041015625, -0.228271484375, -0.0848388671875, 0.05859375, 0.2020263671875, 0.345458984375, 0.4888916015625, 0.63232421875, 0.7757568359375, 0.919189453125, 1.0626220703125, 1.2060546875, 1.3494873046875, 1.492919921875, 1.6363525390625, 1.77978515625, 1.9232177734375, 2.066650390625, 2.2100830078125, 2.353515625, 2.4969482421875, 2.640380859375, 2.7838134765625, 2.92724609375, 3.0706787109375, 3.214111328125, 3.3575439453125, 3.5009765625, 3.6444091796875, 3.787841796875, 3.9312744140625, 4.07470703125, 4.2181396484375, 4.361572265625, 4.5050048828125, 4.6484375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 10.0, 12.0, 14.0, 23.0, 24.0, 20.0, 20.0, 36.0, 55.0, 53.0, 77.0, 89.0, 79.0, 90.0, 84.0, 62.0, 60.0, 48.0, 33.0, 26.0, 24.0, 16.0, 12.0, 8.0, 7.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.07421875, -4.940765380859375, -4.80731201171875, -4.673858642578125, -4.5404052734375, -4.406951904296875, -4.27349853515625, -4.140045166015625, -4.006591796875, -3.873138427734375, -3.73968505859375, -3.606231689453125, -3.4727783203125, -3.339324951171875, -3.20587158203125, -3.072418212890625, -2.93896484375, -2.805511474609375, -2.67205810546875, -2.538604736328125, -2.4051513671875, -2.271697998046875, -2.13824462890625, -2.004791259765625, -1.871337890625, -1.737884521484375, -1.60443115234375, -1.470977783203125, -1.3375244140625, -1.204071044921875, -1.07061767578125, -0.937164306640625, -0.8037109375, -0.670257568359375, -0.53680419921875, -0.403350830078125, -0.2698974609375, -0.136444091796875, -0.00299072265625, 0.130462646484375, 0.263916015625, 0.397369384765625, 0.53082275390625, 0.664276123046875, 0.7977294921875, 0.931182861328125, 1.06463623046875, 1.198089599609375, 1.33154296875, 1.464996337890625, 1.59844970703125, 1.731903076171875, 1.8653564453125, 1.998809814453125, 2.13226318359375, 2.265716552734375, 2.399169921875, 2.532623291015625, 2.66607666015625, 2.799530029296875, 2.9329833984375, 3.066436767578125, 3.19989013671875, 3.333343505859375, 3.466796875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 9.0, 10.0, 15.0, 31.0, 38.0, 46.0, 80.0, 82.0, 105.0, 109.0, 106.0, 108.0, 66.0, 67.0, 37.0, 37.0, 16.0, 11.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.15516662597656, -63.38795471191406, -61.62074661254883, -59.85353469848633, -58.086326599121094, -56.319114685058594, -54.551902770996094, -52.78469467163086, -51.01748275756836, -49.25027084350586, -47.483062744140625, -45.715850830078125, -43.94864273071289, -42.18143081665039, -40.414222717285156, -38.647010803222656, -36.879798889160156, -35.112586975097656, -33.34537887573242, -31.578166961669922, -29.810956954956055, -28.043746948242188, -26.27653694152832, -24.509326934814453, -22.74211883544922, -20.97490882873535, -19.207698822021484, -17.440486907958984, -15.673276901245117, -13.90606689453125, -12.138856887817383, -10.3716459274292, -8.604434967041016, -6.83722448348999, -5.070013999938965, -3.3028039932250977, -1.5355935096740723, 0.23161697387695312, 1.9988269805908203, 3.766037940979004, 5.533247947692871, 7.3004584312438965, 9.067668914794922, 10.834878921508789, 12.602088928222656, 14.36929988861084, 16.13650894165039, 17.90372085571289, 19.670930862426758, 21.438140869140625, 23.205350875854492, 24.97256088256836, 26.73977279663086, 28.506982803344727, 30.274192810058594, 32.041404724121094, 33.80861282348633, 35.57582473754883, 37.34303283691406, 39.11024475097656, 40.8774528503418, 42.6446647644043, 44.41187286376953, 46.17908477783203, 47.94629669189453]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 2.0, 4.0, 9.0, 8.0, 6.0, 9.0, 11.0, 17.0, 20.0, 15.0, 24.0, 29.0, 34.0, 27.0, 34.0, 33.0, 39.0, 35.0, 44.0, 35.0, 46.0, 39.0, 36.0, 42.0, 33.0, 38.0, 32.0, 30.0, 34.0, 28.0, 34.0, 17.0, 20.0, 20.0, 21.0, 17.0, 14.0, 14.0, 10.0, 6.0, 11.0, 7.0, 5.0, 4.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.24681854248047, -32.092681884765625, -30.938547134399414, -29.784412384033203, -28.63027572631836, -27.476139068603516, -26.322004318237305, -25.167869567871094, -24.01373291015625, -22.859596252441406, -21.705461502075195, -20.551326751708984, -19.39719009399414, -18.243053436279297, -17.088918685913086, -15.934782981872559, -14.780647277832031, -13.626511573791504, -12.472375869750977, -11.31824016571045, -10.164104461669922, -9.009968757629395, -7.855833053588867, -6.70169734954834, -5.5475616455078125, -4.393425941467285, -3.239290237426758, -2.0851545333862305, -0.9310188293457031, 0.22311687469482422, 1.3772525787353516, 2.531388282775879, 3.685527801513672, 4.839663505554199, 5.993799209594727, 7.147934913635254, 8.302070617675781, 9.456206321716309, 10.610342025756836, 11.764477729797363, 12.91861343383789, 14.072749137878418, 15.226884841918945, 16.381019592285156, 17.53515625, 18.689292907714844, 19.843427658081055, 20.997562408447266, 22.15169906616211, 23.305835723876953, 24.459970474243164, 25.614105224609375, 26.76824188232422, 27.922378540039062, 29.076513290405273, 30.230648040771484, 31.384784698486328, 32.53892135620117, 33.69305419921875, 34.847190856933594, 36.00132751464844, 37.15546417236328, 38.309600830078125, 39.4637336730957, 40.61787033081055]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 4.0, 3.0, 7.0, 11.0, 14.0, 17.0, 22.0, 46.0, 58.0, 63.0, 105.0, 140.0, 248.0, 335.0, 558.0, 901.0, 1477.0, 2442.0, 4428.0, 8619.0, 18928.0, 50633.0, 196520.0, 3246779.0, 520062.0, 86979.0, 28487.0, 12065.0, 5995.0, 3132.0, 1889.0, 1202.0, 669.0, 439.0, 315.0, 196.0, 136.0, 99.0, 64.0, 46.0, 35.0, 24.0, 21.0, 15.0, 15.0, 13.0, 5.0, 4.0, 0.0, 1.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0], "bins": [-8.640625, -8.3499755859375, -8.059326171875, -7.7686767578125, -7.47802734375, -7.1873779296875, -6.896728515625, -6.6060791015625, -6.3154296875, -6.0247802734375, -5.734130859375, -5.4434814453125, -5.15283203125, -4.8621826171875, -4.571533203125, -4.2808837890625, -3.990234375, -3.6995849609375, -3.408935546875, -3.1182861328125, -2.82763671875, -2.5369873046875, -2.246337890625, -1.9556884765625, -1.6650390625, -1.3743896484375, -1.083740234375, -0.7930908203125, -0.50244140625, -0.2117919921875, 0.078857421875, 0.3695068359375, 0.66015625, 0.9508056640625, 1.241455078125, 1.5321044921875, 1.82275390625, 2.1134033203125, 2.404052734375, 2.6947021484375, 2.9853515625, 3.2760009765625, 3.566650390625, 3.8572998046875, 4.14794921875, 4.4385986328125, 4.729248046875, 5.0198974609375, 5.310546875, 5.6011962890625, 5.891845703125, 6.1824951171875, 6.47314453125, 6.7637939453125, 7.054443359375, 7.3450927734375, 7.6357421875, 7.9263916015625, 8.217041015625, 8.5076904296875, 8.79833984375, 9.0889892578125, 9.379638671875, 9.6702880859375, 9.9609375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 1.0, 3.0, 5.0, 8.0, 6.0, 8.0, 13.0, 15.0, 15.0, 22.0, 26.0, 31.0, 30.0, 30.0, 32.0, 53.0, 50.0, 50.0, 56.0, 46.0, 49.0, 57.0, 52.0, 49.0, 40.0, 30.0, 40.0, 37.0, 22.0, 21.0, 19.0, 16.0, 13.0, 16.0, 12.0, 7.0, 4.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.67578125, -1.6198272705078125, -1.563873291015625, -1.5079193115234375, -1.45196533203125, -1.3960113525390625, -1.340057373046875, -1.2841033935546875, -1.2281494140625, -1.1721954345703125, -1.116241455078125, -1.0602874755859375, -1.00433349609375, -0.9483795166015625, -0.892425537109375, -0.8364715576171875, -0.780517578125, -0.7245635986328125, -0.668609619140625, -0.6126556396484375, -0.55670166015625, -0.5007476806640625, -0.444793701171875, -0.3888397216796875, -0.3328857421875, -0.2769317626953125, -0.220977783203125, -0.1650238037109375, -0.10906982421875, -0.0531158447265625, 0.002838134765625, 0.0587921142578125, 0.11474609375, 0.1707000732421875, 0.226654052734375, 0.2826080322265625, 0.33856201171875, 0.3945159912109375, 0.450469970703125, 0.5064239501953125, 0.5623779296875, 0.6183319091796875, 0.674285888671875, 0.7302398681640625, 0.78619384765625, 0.8421478271484375, 0.898101806640625, 0.9540557861328125, 1.010009765625, 1.0659637451171875, 1.121917724609375, 1.1778717041015625, 1.23382568359375, 1.2897796630859375, 1.345733642578125, 1.4016876220703125, 1.4576416015625, 1.5135955810546875, 1.569549560546875, 1.6255035400390625, 1.68145751953125, 1.7374114990234375, 1.793365478515625, 1.8493194580078125, 1.9052734375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 3.0, 5.0, 8.0, 5.0, 7.0, 10.0, 16.0, 15.0, 27.0, 24.0, 36.0, 48.0, 54.0, 80.0, 115.0, 261.0, 635.0, 1764.0, 5655.0, 22868.0, 131629.0, 3098176.0, 841639.0, 71412.0, 13894.0, 3571.0, 1200.0, 485.0, 239.0, 114.0, 73.0, 63.0, 41.0, 21.0, 24.0, 20.0, 14.0, 3.0, 8.0, 5.0, 1.0, 5.0, 5.0, 2.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.3359375, -11.8929443359375, -11.449951171875, -11.0069580078125, -10.56396484375, -10.1209716796875, -9.677978515625, -9.2349853515625, -8.7919921875, -8.3489990234375, -7.906005859375, -7.4630126953125, -7.02001953125, -6.5770263671875, -6.134033203125, -5.6910400390625, -5.248046875, -4.8050537109375, -4.362060546875, -3.9190673828125, -3.47607421875, -3.0330810546875, -2.590087890625, -2.1470947265625, -1.7041015625, -1.2611083984375, -0.818115234375, -0.3751220703125, 0.06787109375, 0.5108642578125, 0.953857421875, 1.3968505859375, 1.83984375, 2.2828369140625, 2.725830078125, 3.1688232421875, 3.61181640625, 4.0548095703125, 4.497802734375, 4.9407958984375, 5.3837890625, 5.8267822265625, 6.269775390625, 6.7127685546875, 7.15576171875, 7.5987548828125, 8.041748046875, 8.4847412109375, 8.927734375, 9.3707275390625, 9.813720703125, 10.2567138671875, 10.69970703125, 11.1427001953125, 11.585693359375, 12.0286865234375, 12.4716796875, 12.9146728515625, 13.357666015625, 13.8006591796875, 14.24365234375, 14.6866455078125, 15.129638671875, 15.5726318359375, 16.015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 11.0, 7.0, 10.0, 16.0, 28.0, 52.0, 90.0, 152.0, 303.0, 1026.0, 1641.0, 398.0, 148.0, 92.0, 44.0, 25.0, 17.0, 10.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.58984375, -7.39569091796875, -7.2015380859375, -7.00738525390625, -6.813232421875, -6.61907958984375, -6.4249267578125, -6.23077392578125, -6.03662109375, -5.84246826171875, -5.6483154296875, -5.45416259765625, -5.260009765625, -5.06585693359375, -4.8717041015625, -4.67755126953125, -4.4833984375, -4.28924560546875, -4.0950927734375, -3.90093994140625, -3.706787109375, -3.51263427734375, -3.3184814453125, -3.12432861328125, -2.93017578125, -2.73602294921875, -2.5418701171875, -2.34771728515625, -2.153564453125, -1.95941162109375, -1.7652587890625, -1.57110595703125, -1.376953125, -1.18280029296875, -0.9886474609375, -0.79449462890625, -0.600341796875, -0.40618896484375, -0.2120361328125, -0.01788330078125, 0.17626953125, 0.37042236328125, 0.5645751953125, 0.75872802734375, 0.952880859375, 1.14703369140625, 1.3411865234375, 1.53533935546875, 1.7294921875, 1.92364501953125, 2.1177978515625, 2.31195068359375, 2.506103515625, 2.70025634765625, 2.8944091796875, 3.08856201171875, 3.28271484375, 3.47686767578125, 3.6710205078125, 3.86517333984375, 4.059326171875, 4.25347900390625, 4.4476318359375, 4.64178466796875, 4.8359375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 15.0, 30.0, 46.0, 76.0, 104.0, 141.0, 141.0, 136.0, 110.0, 74.0, 53.0, 34.0, 8.0, 13.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.1578369140625, -34.22833251953125, -33.298828125, -32.369327545166016, -31.439823150634766, -30.510318756103516, -29.580814361572266, -28.651309967041016, -27.7218074798584, -26.79230308532715, -25.86280059814453, -24.93329620361328, -24.00379180908203, -23.074289321899414, -22.144784927368164, -21.215282440185547, -20.285778045654297, -19.356273651123047, -18.42677116394043, -17.49726676940918, -16.567764282226562, -15.638259887695312, -14.708755493164062, -13.779252052307129, -12.849748611450195, -11.920245170593262, -10.990741729736328, -10.061237335205078, -9.131733894348145, -8.202230453491211, -7.272726535797119, -6.343222618103027, -5.413719177246094, -4.48421573638916, -3.5547118186950684, -2.6252081394195557, -1.695704460144043, -0.7662010192871094, 0.16330289840698242, 1.0928068161010742, 2.022310256958008, 2.9518139362335205, 3.881317615509033, 4.810821533203125, 5.740324974060059, 6.669828414916992, 7.599332332611084, 8.528836250305176, 9.45833969116211, 10.387843132019043, 11.317346572875977, 12.246850967407227, 13.17635440826416, 14.105857849121094, 15.035362243652344, 15.964865684509277, 16.89436912536621, 17.82387351989746, 18.753376007080078, 19.682880401611328, 20.612384796142578, 21.541887283325195, 22.471391677856445, 23.400894165039062, 24.330398559570312]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 9.0, 9.0, 9.0, 18.0, 23.0, 31.0, 39.0, 34.0, 46.0, 38.0, 45.0, 40.0, 55.0, 53.0, 54.0, 40.0, 65.0, 52.0, 54.0, 42.0, 47.0, 33.0, 35.0, 32.0, 23.0, 18.0, 10.0, 14.0, 11.0, 7.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.483598709106445, -18.97551155090332, -18.467424392700195, -17.95933723449707, -17.451250076293945, -16.94316291809082, -16.435075759887695, -15.92698860168457, -15.418901443481445, -14.91081428527832, -14.402727127075195, -13.89463996887207, -13.386552810668945, -12.87846565246582, -12.370378494262695, -11.86229133605957, -11.354205131530762, -10.846117973327637, -10.338030815124512, -9.829943656921387, -9.321856498718262, -8.813769340515137, -8.305683135986328, -7.797595500946045, -7.28950834274292, -6.781421184539795, -6.27333402633667, -5.765247344970703, -5.257160186767578, -4.749073028564453, -4.240985870361328, -3.732898712158203, -3.2248125076293945, -2.7167253494262695, -2.2086381912231445, -1.7005512714385986, -1.1924641132354736, -0.6843769550323486, -0.17629003524780273, 0.33179712295532227, 0.8398842811584473, 1.3479714393615723, 1.8560584783554077, 2.364145517349243, 2.872232675552368, 3.380319833755493, 3.888406753540039, 4.396493911743164, 4.904581069946289, 5.412668228149414, 5.920755386352539, 6.428842544555664, 6.936929702758789, 7.445016860961914, 7.953103542327881, 8.461191177368164, 8.969278335571289, 9.477365493774414, 9.985452651977539, 10.493539810180664, 11.001626968383789, 11.509714126586914, 12.017801284790039, 12.525888442993164, 13.033974647521973]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 8.0, 6.0, 32.0, 44.0, 59.0, 118.0, 211.0, 417.0, 724.0, 1474.0, 3367.0, 9005.0, 25506.0, 80244.0, 255167.0, 423416.0, 167964.0, 52592.0, 17155.0, 6146.0, 2503.0, 1110.0, 576.0, 281.0, 156.0, 100.0, 65.0, 38.0, 29.0, 17.0, 10.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1640625, -11.775634765625, -11.38720703125, -10.998779296875, -10.6103515625, -10.221923828125, -9.83349609375, -9.445068359375, -9.056640625, -8.668212890625, -8.27978515625, -7.891357421875, -7.5029296875, -7.114501953125, -6.72607421875, -6.337646484375, -5.94921875, -5.560791015625, -5.17236328125, -4.783935546875, -4.3955078125, -4.007080078125, -3.61865234375, -3.230224609375, -2.841796875, -2.453369140625, -2.06494140625, -1.676513671875, -1.2880859375, -0.899658203125, -0.51123046875, -0.122802734375, 0.265625, 0.654052734375, 1.04248046875, 1.430908203125, 1.8193359375, 2.207763671875, 2.59619140625, 2.984619140625, 3.373046875, 3.761474609375, 4.14990234375, 4.538330078125, 4.9267578125, 5.315185546875, 5.70361328125, 6.092041015625, 6.48046875, 6.868896484375, 7.25732421875, 7.645751953125, 8.0341796875, 8.422607421875, 8.81103515625, 9.199462890625, 9.587890625, 9.976318359375, 10.36474609375, 10.753173828125, 11.1416015625, 11.530029296875, 11.91845703125, 12.306884765625, 12.6953125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 5.0, 8.0, 13.0, 17.0, 16.0, 27.0, 20.0, 22.0, 30.0, 40.0, 43.0, 38.0, 50.0, 52.0, 47.0, 54.0, 57.0, 58.0, 38.0, 59.0, 53.0, 26.0, 28.0, 33.0, 16.0, 26.0, 24.0, 12.0, 13.0, 12.0, 14.0, 10.0, 5.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.662109375, -1.6068115234375, -1.551513671875, -1.4962158203125, -1.44091796875, -1.3856201171875, -1.330322265625, -1.2750244140625, -1.2197265625, -1.1644287109375, -1.109130859375, -1.0538330078125, -0.99853515625, -0.9432373046875, -0.887939453125, -0.8326416015625, -0.77734375, -0.7220458984375, -0.666748046875, -0.6114501953125, -0.55615234375, -0.5008544921875, -0.445556640625, -0.3902587890625, -0.3349609375, -0.2796630859375, -0.224365234375, -0.1690673828125, -0.11376953125, -0.0584716796875, -0.003173828125, 0.0521240234375, 0.107421875, 0.1627197265625, 0.218017578125, 0.2733154296875, 0.32861328125, 0.3839111328125, 0.439208984375, 0.4945068359375, 0.5498046875, 0.6051025390625, 0.660400390625, 0.7156982421875, 0.77099609375, 0.8262939453125, 0.881591796875, 0.9368896484375, 0.9921875, 1.0474853515625, 1.102783203125, 1.1580810546875, 1.21337890625, 1.2686767578125, 1.323974609375, 1.3792724609375, 1.4345703125, 1.4898681640625, 1.545166015625, 1.6004638671875, 1.65576171875, 1.7110595703125, 1.766357421875, 1.8216552734375, 1.876953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 11.0, 15.0, 13.0, 14.0, 35.0, 45.0, 51.0, 77.0, 93.0, 126.0, 179.0, 224.0, 335.0, 557.0, 1054.0, 2069.0, 5115.0, 14131.0, 45575.0, 152977.0, 404537.0, 287158.0, 90903.0, 27261.0, 8877.0, 3373.0, 1496.0, 752.0, 438.0, 297.0, 196.0, 154.0, 118.0, 78.0, 53.0, 37.0, 38.0, 27.0, 28.0, 9.0, 15.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.58984375, -7.30645751953125, -7.0230712890625, -6.73968505859375, -6.456298828125, -6.17291259765625, -5.8895263671875, -5.60614013671875, -5.32275390625, -5.03936767578125, -4.7559814453125, -4.47259521484375, -4.189208984375, -3.90582275390625, -3.6224365234375, -3.33905029296875, -3.0556640625, -2.77227783203125, -2.4888916015625, -2.20550537109375, -1.922119140625, -1.63873291015625, -1.3553466796875, -1.07196044921875, -0.78857421875, -0.50518798828125, -0.2218017578125, 0.06158447265625, 0.344970703125, 0.62835693359375, 0.9117431640625, 1.19512939453125, 1.478515625, 1.76190185546875, 2.0452880859375, 2.32867431640625, 2.612060546875, 2.89544677734375, 3.1788330078125, 3.46221923828125, 3.74560546875, 4.02899169921875, 4.3123779296875, 4.59576416015625, 4.879150390625, 5.16253662109375, 5.4459228515625, 5.72930908203125, 6.0126953125, 6.29608154296875, 6.5794677734375, 6.86285400390625, 7.146240234375, 7.42962646484375, 7.7130126953125, 7.99639892578125, 8.27978515625, 8.56317138671875, 8.8465576171875, 9.12994384765625, 9.413330078125, 9.69671630859375, 9.9801025390625, 10.26348876953125, 10.546875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 6.0, 5.0, 10.0, 9.0, 6.0, 6.0, 10.0, 9.0, 11.0, 12.0, 15.0, 16.0, 26.0, 29.0, 34.0, 30.0, 21.0, 26.0, 34.0, 36.0, 39.0, 51.0, 43.0, 41.0, 37.0, 42.0, 40.0, 30.0, 39.0, 29.0, 30.0, 20.0, 25.0, 27.0, 15.0, 20.0, 7.0, 25.0, 15.0, 16.0, 12.0, 4.0, 3.0, 11.0, 8.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-6.23828125, -6.0538330078125, -5.869384765625, -5.6849365234375, -5.50048828125, -5.3160400390625, -5.131591796875, -4.9471435546875, -4.7626953125, -4.5782470703125, -4.393798828125, -4.2093505859375, -4.02490234375, -3.8404541015625, -3.656005859375, -3.4715576171875, -3.287109375, -3.1026611328125, -2.918212890625, -2.7337646484375, -2.54931640625, -2.3648681640625, -2.180419921875, -1.9959716796875, -1.8115234375, -1.6270751953125, -1.442626953125, -1.2581787109375, -1.07373046875, -0.8892822265625, -0.704833984375, -0.5203857421875, -0.3359375, -0.1514892578125, 0.032958984375, 0.2174072265625, 0.40185546875, 0.5863037109375, 0.770751953125, 0.9552001953125, 1.1396484375, 1.3240966796875, 1.508544921875, 1.6929931640625, 1.87744140625, 2.0618896484375, 2.246337890625, 2.4307861328125, 2.615234375, 2.7996826171875, 2.984130859375, 3.1685791015625, 3.35302734375, 3.5374755859375, 3.721923828125, 3.9063720703125, 4.0908203125, 4.2752685546875, 4.459716796875, 4.6441650390625, 4.82861328125, 5.0130615234375, 5.197509765625, 5.3819580078125, 5.56640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 1.0, 3.0, 7.0, 11.0, 14.0, 26.0, 34.0, 47.0, 60.0, 142.0, 251.0, 479.0, 920.0, 1964.0, 4926.0, 14872.0, 60206.0, 348255.0, 496320.0, 88784.0, 20093.0, 6408.0, 2335.0, 1124.0, 561.0, 302.0, 146.0, 82.0, 63.0, 37.0, 18.0, 14.0, 10.0, 8.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.65234375, -7.4344482421875, -7.216552734375, -6.9986572265625, -6.78076171875, -6.5628662109375, -6.344970703125, -6.1270751953125, -5.9091796875, -5.6912841796875, -5.473388671875, -5.2554931640625, -5.03759765625, -4.8197021484375, -4.601806640625, -4.3839111328125, -4.166015625, -3.9481201171875, -3.730224609375, -3.5123291015625, -3.29443359375, -3.0765380859375, -2.858642578125, -2.6407470703125, -2.4228515625, -2.2049560546875, -1.987060546875, -1.7691650390625, -1.55126953125, -1.3333740234375, -1.115478515625, -0.8975830078125, -0.6796875, -0.4617919921875, -0.243896484375, -0.0260009765625, 0.19189453125, 0.4097900390625, 0.627685546875, 0.8455810546875, 1.0634765625, 1.2813720703125, 1.499267578125, 1.7171630859375, 1.93505859375, 2.1529541015625, 2.370849609375, 2.5887451171875, 2.806640625, 3.0245361328125, 3.242431640625, 3.4603271484375, 3.67822265625, 3.8961181640625, 4.114013671875, 4.3319091796875, 4.5498046875, 4.7677001953125, 4.985595703125, 5.2034912109375, 5.42138671875, 5.6392822265625, 5.857177734375, 6.0750732421875, 6.29296875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 4.0, 2.0, 4.0, 6.0, 4.0, 5.0, 15.0, 14.0, 16.0, 21.0, 23.0, 19.0, 46.0, 48.0, 63.0, 99.0, 115.0, 118.0, 77.0, 65.0, 47.0, 25.0, 36.0, 22.0, 20.0, 13.0, 14.0, 9.0, 9.0, 6.0, 12.0, 3.0, 2.0, 2.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007076263427734375, -0.0006838887929916382, -0.0006601512432098389, -0.0006364136934280396, -0.0006126761436462402, -0.0005889385938644409, -0.0005652010440826416, -0.0005414634943008423, -0.000517725944519043, -0.0004939883947372437, -0.00047025084495544434, -0.000446513295173645, -0.0004227757453918457, -0.0003990381956100464, -0.00037530064582824707, -0.00035156309604644775, -0.00032782554626464844, -0.0003040879964828491, -0.0002803504467010498, -0.0002566128969192505, -0.00023287534713745117, -0.00020913779735565186, -0.00018540024757385254, -0.00016166269779205322, -0.0001379251480102539, -0.00011418759822845459, -9.045004844665527e-05, -6.671249866485596e-05, -4.297494888305664e-05, -1.9237399101257324e-05, 4.500150680541992e-06, 2.823770046234131e-05, 5.1975250244140625e-05, 7.571280002593994e-05, 9.945034980773926e-05, 0.00012318789958953857, 0.0001469254493713379, 0.0001706629991531372, 0.00019440054893493652, 0.00021813809871673584, 0.00024187564849853516, 0.00026561319828033447, 0.0002893507480621338, 0.0003130882978439331, 0.0003368258476257324, 0.00036056339740753174, 0.00038430094718933105, 0.00040803849697113037, 0.0004317760467529297, 0.000455513596534729, 0.0004792511463165283, 0.0005029886960983276, 0.000526726245880127, 0.0005504637956619263, 0.0005742013454437256, 0.0005979388952255249, 0.0006216764450073242, 0.0006454139947891235, 0.0006691515445709229, 0.0006928890943527222, 0.0007166266441345215, 0.0007403641939163208, 0.0007641017436981201, 0.0007878392934799194, 0.0008115768432617188]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 6.0, 0.0, 6.0, 9.0, 7.0, 11.0, 15.0, 17.0, 26.0, 39.0, 73.0, 133.0, 178.0, 369.0, 687.0, 1380.0, 3723.0, 12357.0, 66040.0, 614306.0, 302259.0, 34307.0, 7503.0, 2653.0, 1146.0, 591.0, 302.0, 145.0, 107.0, 44.0, 37.0, 23.0, 11.0, 9.0, 7.0, 8.0, 3.0, 9.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.515625, -8.2095947265625, -7.903564453125, -7.5975341796875, -7.29150390625, -6.9854736328125, -6.679443359375, -6.3734130859375, -6.0673828125, -5.7613525390625, -5.455322265625, -5.1492919921875, -4.84326171875, -4.5372314453125, -4.231201171875, -3.9251708984375, -3.619140625, -3.3131103515625, -3.007080078125, -2.7010498046875, -2.39501953125, -2.0889892578125, -1.782958984375, -1.4769287109375, -1.1708984375, -0.8648681640625, -0.558837890625, -0.2528076171875, 0.05322265625, 0.3592529296875, 0.665283203125, 0.9713134765625, 1.27734375, 1.5833740234375, 1.889404296875, 2.1954345703125, 2.50146484375, 2.8074951171875, 3.113525390625, 3.4195556640625, 3.7255859375, 4.0316162109375, 4.337646484375, 4.6436767578125, 4.94970703125, 5.2557373046875, 5.561767578125, 5.8677978515625, 6.173828125, 6.4798583984375, 6.785888671875, 7.0919189453125, 7.39794921875, 7.7039794921875, 8.010009765625, 8.3160400390625, 8.6220703125, 8.9281005859375, 9.234130859375, 9.5401611328125, 9.84619140625, 10.1522216796875, 10.458251953125, 10.7642822265625, 11.0703125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 8.0, 8.0, 11.0, 23.0, 33.0, 37.0, 57.0, 82.0, 125.0, 148.0, 117.0, 114.0, 80.0, 35.0, 31.0, 27.0, 14.0, 13.0, 11.0, 5.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.14453125, -6.9388427734375, -6.733154296875, -6.5274658203125, -6.32177734375, -6.1160888671875, -5.910400390625, -5.7047119140625, -5.4990234375, -5.2933349609375, -5.087646484375, -4.8819580078125, -4.67626953125, -4.4705810546875, -4.264892578125, -4.0592041015625, -3.853515625, -3.6478271484375, -3.442138671875, -3.2364501953125, -3.03076171875, -2.8250732421875, -2.619384765625, -2.4136962890625, -2.2080078125, -2.0023193359375, -1.796630859375, -1.5909423828125, -1.38525390625, -1.1795654296875, -0.973876953125, -0.7681884765625, -0.5625, -0.3568115234375, -0.151123046875, 0.0545654296875, 0.26025390625, 0.4659423828125, 0.671630859375, 0.8773193359375, 1.0830078125, 1.2886962890625, 1.494384765625, 1.7000732421875, 1.90576171875, 2.1114501953125, 2.317138671875, 2.5228271484375, 2.728515625, 2.9342041015625, 3.139892578125, 3.3455810546875, 3.55126953125, 3.7569580078125, 3.962646484375, 4.1683349609375, 4.3740234375, 4.5797119140625, 4.785400390625, 4.9910888671875, 5.19677734375, 5.4024658203125, 5.608154296875, 5.8138427734375, 6.01953125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 19.0, 54.0, 127.0, 215.0, 218.0, 191.0, 89.0, 38.0, 22.0, 11.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.28690338134766, -106.39412689208984, -102.5013427734375, -98.60856628417969, -94.71578216552734, -90.82300567626953, -86.93022155761719, -83.03744506835938, -79.14466857910156, -75.25189208984375, -71.3591079711914, -67.4663314819336, -63.57354736328125, -59.68077087402344, -55.78799057006836, -51.89521026611328, -48.00242614746094, -44.10964584350586, -40.21686553955078, -36.32408905029297, -32.431304931640625, -28.53852653503418, -24.645748138427734, -20.752967834472656, -16.860187530517578, -12.9674072265625, -9.074627876281738, -5.181848526000977, -1.2890682220458984, 2.6037120819091797, 6.496490478515625, 10.389270782470703, 14.282058715820312, 18.17483901977539, 22.06761932373047, 25.960397720336914, 29.853178024291992, 33.74595642089844, 37.638736724853516, 41.531517028808594, 45.42429733276367, 49.31707763671875, 53.20985794067383, 57.102638244628906, 60.99541473388672, 64.88819885253906, 68.78097534179688, 72.67375183105469, 76.56653594970703, 80.45931243896484, 84.35209655761719, 88.244873046875, 92.13765716552734, 96.03043365478516, 99.9232177734375, 103.81599426269531, 107.70877075195312, 111.60154724121094, 115.49433135986328, 119.3871078491211, 123.27989196777344, 127.17266845703125, 131.06544494628906, 134.95822143554688, 138.85101318359375]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 6.0, 6.0, 2.0, 8.0, 9.0, 13.0, 14.0, 14.0, 20.0, 30.0, 18.0, 22.0, 27.0, 29.0, 26.0, 41.0, 36.0, 34.0, 47.0, 30.0, 36.0, 36.0, 54.0, 38.0, 36.0, 29.0, 34.0, 32.0, 28.0, 25.0, 26.0, 25.0, 24.0, 19.0, 28.0, 18.0, 13.0, 10.0, 10.0, 5.0, 9.0, 5.0, 10.0, 2.0, 5.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0], "bins": [-32.232086181640625, -31.216745376586914, -30.20140266418457, -29.18606185913086, -28.17072105407715, -27.155380249023438, -26.140037536621094, -25.124696731567383, -24.109355926513672, -23.09401512145996, -22.078672409057617, -21.063331604003906, -20.047990798950195, -19.032649993896484, -18.01730728149414, -17.00196647644043, -15.986623764038086, -14.971282005310059, -13.955941200256348, -12.94059944152832, -11.92525863647461, -10.909916877746582, -9.894575119018555, -8.879234313964844, -7.863892555236816, -6.848551273345947, -5.833209991455078, -4.817868232727051, -3.8025269508361816, -2.7871856689453125, -1.7718439102172852, -0.756502628326416, 0.2588386535644531, 1.2741800546646118, 2.2895214557647705, 3.3048629760742188, 4.320204257965088, 5.335545539855957, 6.350887298583984, 7.3662285804748535, 8.381569862365723, 9.39691162109375, 10.412252426147461, 11.427594184875488, 12.442935943603516, 13.458276748657227, 14.473618507385254, 15.488960266113281, 16.504301071166992, 17.519641876220703, 18.534984588623047, 19.550325393676758, 20.56566619873047, 21.581008911132812, 22.596349716186523, 23.611690521240234, 24.627033233642578, 25.64237403869629, 26.657716751098633, 27.673057556152344, 28.688398361206055, 29.703739166259766, 30.71908187866211, 31.73442268371582, 32.74976348876953]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 8.0, 7.0, 13.0, 16.0, 30.0, 33.0, 40.0, 66.0, 109.0, 152.0, 213.0, 290.0, 512.0, 705.0, 1219.0, 1996.0, 3675.0, 7423.0, 15352.0, 39644.0, 138888.0, 1448404.0, 2307405.0, 152852.0, 41890.0, 16195.0, 7458.0, 3819.0, 2158.0, 1287.0, 816.0, 532.0, 341.0, 216.0, 148.0, 104.0, 74.0, 52.0, 40.0, 27.0, 16.0, 13.0, 11.0, 8.0, 14.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.5078125, -9.201416015625, -8.89501953125, -8.588623046875, -8.2822265625, -7.975830078125, -7.66943359375, -7.363037109375, -7.056640625, -6.750244140625, -6.44384765625, -6.137451171875, -5.8310546875, -5.524658203125, -5.21826171875, -4.911865234375, -4.60546875, -4.299072265625, -3.99267578125, -3.686279296875, -3.3798828125, -3.073486328125, -2.76708984375, -2.460693359375, -2.154296875, -1.847900390625, -1.54150390625, -1.235107421875, -0.9287109375, -0.622314453125, -0.31591796875, -0.009521484375, 0.296875, 0.603271484375, 0.90966796875, 1.216064453125, 1.5224609375, 1.828857421875, 2.13525390625, 2.441650390625, 2.748046875, 3.054443359375, 3.36083984375, 3.667236328125, 3.9736328125, 4.280029296875, 4.58642578125, 4.892822265625, 5.19921875, 5.505615234375, 5.81201171875, 6.118408203125, 6.4248046875, 6.731201171875, 7.03759765625, 7.343994140625, 7.650390625, 7.956787109375, 8.26318359375, 8.569580078125, 8.8759765625, 9.182373046875, 9.48876953125, 9.795166015625, 10.1015625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 0.0, 0.0, 3.0, 10.0, 4.0, 4.0, 11.0, 15.0, 11.0, 18.0, 18.0, 30.0, 36.0, 39.0, 44.0, 48.0, 51.0, 46.0, 68.0, 41.0, 61.0, 53.0, 49.0, 55.0, 32.0, 37.0, 41.0, 35.0, 20.0, 25.0, 17.0, 14.0, 17.0, 10.0, 10.0, 4.0, 3.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8251953125, -1.766265869140625, -1.70733642578125, -1.648406982421875, -1.5894775390625, -1.530548095703125, -1.47161865234375, -1.412689208984375, -1.353759765625, -1.294830322265625, -1.23590087890625, -1.176971435546875, -1.1180419921875, -1.059112548828125, -1.00018310546875, -0.941253662109375, -0.88232421875, -0.823394775390625, -0.76446533203125, -0.705535888671875, -0.6466064453125, -0.587677001953125, -0.52874755859375, -0.469818115234375, -0.410888671875, -0.351959228515625, -0.29302978515625, -0.234100341796875, -0.1751708984375, -0.116241455078125, -0.05731201171875, 0.001617431640625, 0.060546875, 0.119476318359375, 0.17840576171875, 0.237335205078125, 0.2962646484375, 0.355194091796875, 0.41412353515625, 0.473052978515625, 0.531982421875, 0.590911865234375, 0.64984130859375, 0.708770751953125, 0.7677001953125, 0.826629638671875, 0.88555908203125, 0.944488525390625, 1.00341796875, 1.062347412109375, 1.12127685546875, 1.180206298828125, 1.2391357421875, 1.298065185546875, 1.35699462890625, 1.415924072265625, 1.474853515625, 1.533782958984375, 1.59271240234375, 1.651641845703125, 1.7105712890625, 1.769500732421875, 1.82843017578125, 1.887359619140625, 1.9462890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 5.0, 8.0, 9.0, 3.0, 19.0, 16.0, 41.0, 51.0, 88.0, 109.0, 206.0, 307.0, 569.0, 1137.0, 2476.0, 5722.0, 16424.0, 55370.0, 260046.0, 2930399.0, 762927.0, 111972.0, 29282.0, 9588.0, 3884.0, 1668.0, 794.0, 419.0, 253.0, 166.0, 94.0, 73.0, 40.0, 44.0, 22.0, 19.0, 11.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.7734375, -9.465576171875, -9.15771484375, -8.849853515625, -8.5419921875, -8.234130859375, -7.92626953125, -7.618408203125, -7.310546875, -7.002685546875, -6.69482421875, -6.386962890625, -6.0791015625, -5.771240234375, -5.46337890625, -5.155517578125, -4.84765625, -4.539794921875, -4.23193359375, -3.924072265625, -3.6162109375, -3.308349609375, -3.00048828125, -2.692626953125, -2.384765625, -2.076904296875, -1.76904296875, -1.461181640625, -1.1533203125, -0.845458984375, -0.53759765625, -0.229736328125, 0.078125, 0.385986328125, 0.69384765625, 1.001708984375, 1.3095703125, 1.617431640625, 1.92529296875, 2.233154296875, 2.541015625, 2.848876953125, 3.15673828125, 3.464599609375, 3.7724609375, 4.080322265625, 4.38818359375, 4.696044921875, 5.00390625, 5.311767578125, 5.61962890625, 5.927490234375, 6.2353515625, 6.543212890625, 6.85107421875, 7.158935546875, 7.466796875, 7.774658203125, 8.08251953125, 8.390380859375, 8.6982421875, 9.006103515625, 9.31396484375, 9.621826171875, 9.9296875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 4.0, 13.0, 9.0, 10.0, 27.0, 37.0, 62.0, 95.0, 185.0, 382.0, 1125.0, 1231.0, 413.0, 193.0, 98.0, 57.0, 49.0, 27.0, 22.0, 8.0, 12.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2265625, -5.04010009765625, -4.8536376953125, -4.66717529296875, -4.480712890625, -4.29425048828125, -4.1077880859375, -3.92132568359375, -3.73486328125, -3.54840087890625, -3.3619384765625, -3.17547607421875, -2.989013671875, -2.80255126953125, -2.6160888671875, -2.42962646484375, -2.2431640625, -2.05670166015625, -1.8702392578125, -1.68377685546875, -1.497314453125, -1.31085205078125, -1.1243896484375, -0.93792724609375, -0.75146484375, -0.56500244140625, -0.3785400390625, -0.19207763671875, -0.005615234375, 0.18084716796875, 0.3673095703125, 0.55377197265625, 0.740234375, 0.92669677734375, 1.1131591796875, 1.29962158203125, 1.486083984375, 1.67254638671875, 1.8590087890625, 2.04547119140625, 2.23193359375, 2.41839599609375, 2.6048583984375, 2.79132080078125, 2.977783203125, 3.16424560546875, 3.3507080078125, 3.53717041015625, 3.7236328125, 3.91009521484375, 4.0965576171875, 4.28302001953125, 4.469482421875, 4.65594482421875, 4.8424072265625, 5.02886962890625, 5.21533203125, 5.40179443359375, 5.5882568359375, 5.77471923828125, 5.961181640625, 6.14764404296875, 6.3341064453125, 6.52056884765625, 6.70703125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 11.0, 8.0, 19.0, 46.0, 73.0, 120.0, 170.0, 184.0, 137.0, 93.0, 64.0, 37.0, 20.0, 9.0, 7.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.404075622558594, -60.989295959472656, -59.57451248168945, -58.15972900390625, -56.74494934082031, -55.330169677734375, -53.91538619995117, -52.50060272216797, -51.08582305908203, -49.671043395996094, -48.25625991821289, -46.84147644042969, -45.42669677734375, -44.01191711425781, -42.59713363647461, -41.182350158691406, -39.76757049560547, -38.35279083251953, -36.93800735473633, -35.523223876953125, -34.10844421386719, -32.69366455078125, -31.278881072998047, -29.864099502563477, -28.449317932128906, -27.034536361694336, -25.619754791259766, -24.204973220825195, -22.790191650390625, -21.375410079956055, -19.960628509521484, -18.545846939086914, -17.131061553955078, -15.716279983520508, -14.301498413085938, -12.886716842651367, -11.471935272216797, -10.057153701782227, -8.642372131347656, -7.227590560913086, -5.812808990478516, -4.398027420043945, -2.983245849609375, -1.5684642791748047, -0.15368270874023438, 1.261098861694336, 2.6758804321289062, 4.090662002563477, 5.505443572998047, 6.920225143432617, 8.335006713867188, 9.749788284301758, 11.164569854736328, 12.579351425170898, 13.994132995605469, 15.408914566040039, 16.82369613647461, 18.23847770690918, 19.65325927734375, 21.06804084777832, 22.48282241821289, 23.89760398864746, 25.31238555908203, 26.7271671295166, 28.141948699951172]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 10.0, 19.0, 17.0, 11.0, 18.0, 27.0, 25.0, 39.0, 35.0, 42.0, 60.0, 56.0, 50.0, 61.0, 59.0, 53.0, 43.0, 47.0, 41.0, 44.0, 39.0, 43.0, 30.0, 23.0, 24.0, 12.0, 12.0, 16.0, 11.0, 6.0, 11.0, 1.0, 3.0, 7.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.431673049926758, -22.79859161376953, -22.165510177612305, -21.532428741455078, -20.899349212646484, -20.266267776489258, -19.63318634033203, -19.000104904174805, -18.367023468017578, -17.73394203186035, -17.100860595703125, -16.4677791595459, -15.834698677062988, -15.201617240905762, -14.568536758422852, -13.935455322265625, -13.302373886108398, -12.669292449951172, -12.036211013793945, -11.403130531311035, -10.770049095153809, -10.136967658996582, -9.503887176513672, -8.870805740356445, -8.237724304199219, -7.604642868041992, -6.971561908721924, -6.3384809494018555, -5.705399513244629, -5.072318077087402, -4.439237117767334, -3.8061561584472656, -3.173074722290039, -2.5399935245513916, -1.9069123268127441, -1.2738311290740967, -0.6407499313354492, -0.007668733596801758, 0.6254124641418457, 1.258493423461914, 1.8915748596191406, 2.524656057357788, 3.1577372550964355, 3.790818452835083, 4.4238996505737305, 5.056981086730957, 5.690062046051025, 6.323143005371094, 6.95622444152832, 7.589305877685547, 8.222387313842773, 8.855467796325684, 9.48854923248291, 10.121630668640137, 10.754711151123047, 11.387792587280273, 12.0208740234375, 12.653955459594727, 13.287036895751953, 13.920117378234863, 14.55319881439209, 15.186280250549316, 15.819360733032227, 16.452442169189453, 17.08552360534668]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 6.0, 11.0, 15.0, 20.0, 28.0, 42.0, 65.0, 93.0, 174.0, 257.0, 430.0, 831.0, 1576.0, 3087.0, 6709.0, 16127.0, 40776.0, 121133.0, 504450.0, 241195.0, 67518.0, 24984.0, 10014.0, 4350.0, 2057.0, 1107.0, 601.0, 366.0, 203.0, 113.0, 74.0, 49.0, 19.0, 20.0, 17.0, 19.0, 8.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.578125, -8.244873046875, -7.91162109375, -7.578369140625, -7.2451171875, -6.911865234375, -6.57861328125, -6.245361328125, -5.912109375, -5.578857421875, -5.24560546875, -4.912353515625, -4.5791015625, -4.245849609375, -3.91259765625, -3.579345703125, -3.24609375, -2.912841796875, -2.57958984375, -2.246337890625, -1.9130859375, -1.579833984375, -1.24658203125, -0.913330078125, -0.580078125, -0.246826171875, 0.08642578125, 0.419677734375, 0.7529296875, 1.086181640625, 1.41943359375, 1.752685546875, 2.0859375, 2.419189453125, 2.75244140625, 3.085693359375, 3.4189453125, 3.752197265625, 4.08544921875, 4.418701171875, 4.751953125, 5.085205078125, 5.41845703125, 5.751708984375, 6.0849609375, 6.418212890625, 6.75146484375, 7.084716796875, 7.41796875, 7.751220703125, 8.08447265625, 8.417724609375, 8.7509765625, 9.084228515625, 9.41748046875, 9.750732421875, 10.083984375, 10.417236328125, 10.75048828125, 11.083740234375, 11.4169921875, 11.750244140625, 12.08349609375, 12.416748046875, 12.75]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 3.0, 4.0, 9.0, 10.0, 13.0, 24.0, 21.0, 35.0, 30.0, 34.0, 61.0, 55.0, 56.0, 61.0, 63.0, 57.0, 58.0, 57.0, 62.0, 36.0, 39.0, 38.0, 41.0, 20.0, 24.0, 19.0, 17.0, 14.0, 6.0, 6.0, 7.0, 3.0, 6.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.955078125, -1.888519287109375, -1.82196044921875, -1.755401611328125, -1.6888427734375, -1.622283935546875, -1.55572509765625, -1.489166259765625, -1.422607421875, -1.356048583984375, -1.28948974609375, -1.222930908203125, -1.1563720703125, -1.089813232421875, -1.02325439453125, -0.956695556640625, -0.89013671875, -0.823577880859375, -0.75701904296875, -0.690460205078125, -0.6239013671875, -0.557342529296875, -0.49078369140625, -0.424224853515625, -0.357666015625, -0.291107177734375, -0.22454833984375, -0.157989501953125, -0.0914306640625, -0.024871826171875, 0.04168701171875, 0.108245849609375, 0.1748046875, 0.241363525390625, 0.30792236328125, 0.374481201171875, 0.4410400390625, 0.507598876953125, 0.57415771484375, 0.640716552734375, 0.707275390625, 0.773834228515625, 0.84039306640625, 0.906951904296875, 0.9735107421875, 1.040069580078125, 1.10662841796875, 1.173187255859375, 1.23974609375, 1.306304931640625, 1.37286376953125, 1.439422607421875, 1.5059814453125, 1.572540283203125, 1.63909912109375, 1.705657958984375, 1.772216796875, 1.838775634765625, 1.90533447265625, 1.971893310546875, 2.0384521484375, 2.105010986328125, 2.17156982421875, 2.238128662109375, 2.3046875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 9.0, 9.0, 13.0, 22.0, 25.0, 25.0, 44.0, 73.0, 96.0, 107.0, 175.0, 280.0, 425.0, 811.0, 1691.0, 4735.0, 16285.0, 66500.0, 354950.0, 487204.0, 84732.0, 20413.0, 5745.0, 1967.0, 865.0, 459.0, 257.0, 207.0, 125.0, 91.0, 59.0, 42.0, 29.0, 22.0, 17.0, 10.0, 7.0, 9.0, 1.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-12.125, -11.7794189453125, -11.433837890625, -11.0882568359375, -10.74267578125, -10.3970947265625, -10.051513671875, -9.7059326171875, -9.3603515625, -9.0147705078125, -8.669189453125, -8.3236083984375, -7.97802734375, -7.6324462890625, -7.286865234375, -6.9412841796875, -6.595703125, -6.2501220703125, -5.904541015625, -5.5589599609375, -5.21337890625, -4.8677978515625, -4.522216796875, -4.1766357421875, -3.8310546875, -3.4854736328125, -3.139892578125, -2.7943115234375, -2.44873046875, -2.1031494140625, -1.757568359375, -1.4119873046875, -1.06640625, -0.7208251953125, -0.375244140625, -0.0296630859375, 0.31591796875, 0.6614990234375, 1.007080078125, 1.3526611328125, 1.6982421875, 2.0438232421875, 2.389404296875, 2.7349853515625, 3.08056640625, 3.4261474609375, 3.771728515625, 4.1173095703125, 4.462890625, 4.8084716796875, 5.154052734375, 5.4996337890625, 5.84521484375, 6.1907958984375, 6.536376953125, 6.8819580078125, 7.2275390625, 7.5731201171875, 7.918701171875, 8.2642822265625, 8.60986328125, 8.9554443359375, 9.301025390625, 9.6466064453125, 9.9921875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 6.0, 10.0, 10.0, 12.0, 19.0, 22.0, 23.0, 18.0, 31.0, 34.0, 49.0, 31.0, 47.0, 39.0, 48.0, 51.0, 45.0, 44.0, 52.0, 48.0, 31.0, 49.0, 50.0, 47.0, 39.0, 24.0, 23.0, 16.0, 16.0, 13.0, 17.0, 7.0, 13.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.3671875, -8.11865234375, -7.8701171875, -7.62158203125, -7.373046875, -7.12451171875, -6.8759765625, -6.62744140625, -6.37890625, -6.13037109375, -5.8818359375, -5.63330078125, -5.384765625, -5.13623046875, -4.8876953125, -4.63916015625, -4.390625, -4.14208984375, -3.8935546875, -3.64501953125, -3.396484375, -3.14794921875, -2.8994140625, -2.65087890625, -2.40234375, -2.15380859375, -1.9052734375, -1.65673828125, -1.408203125, -1.15966796875, -0.9111328125, -0.66259765625, -0.4140625, -0.16552734375, 0.0830078125, 0.33154296875, 0.580078125, 0.82861328125, 1.0771484375, 1.32568359375, 1.57421875, 1.82275390625, 2.0712890625, 2.31982421875, 2.568359375, 2.81689453125, 3.0654296875, 3.31396484375, 3.5625, 3.81103515625, 4.0595703125, 4.30810546875, 4.556640625, 4.80517578125, 5.0537109375, 5.30224609375, 5.55078125, 5.79931640625, 6.0478515625, 6.29638671875, 6.544921875, 6.79345703125, 7.0419921875, 7.29052734375, 7.5390625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 9.0, 13.0, 7.0, 27.0, 40.0, 47.0, 115.0, 199.0, 445.0, 1179.0, 4266.0, 23192.0, 191657.0, 741442.0, 71036.0, 10980.0, 2487.0, 750.0, 300.0, 157.0, 80.0, 43.0, 21.0, 22.0, 14.0, 12.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.015625, -9.7396240234375, -9.463623046875, -9.1876220703125, -8.91162109375, -8.6356201171875, -8.359619140625, -8.0836181640625, -7.8076171875, -7.5316162109375, -7.255615234375, -6.9796142578125, -6.70361328125, -6.4276123046875, -6.151611328125, -5.8756103515625, -5.599609375, -5.3236083984375, -5.047607421875, -4.7716064453125, -4.49560546875, -4.2196044921875, -3.943603515625, -3.6676025390625, -3.3916015625, -3.1156005859375, -2.839599609375, -2.5635986328125, -2.28759765625, -2.0115966796875, -1.735595703125, -1.4595947265625, -1.18359375, -0.9075927734375, -0.631591796875, -0.3555908203125, -0.07958984375, 0.1964111328125, 0.472412109375, 0.7484130859375, 1.0244140625, 1.3004150390625, 1.576416015625, 1.8524169921875, 2.12841796875, 2.4044189453125, 2.680419921875, 2.9564208984375, 3.232421875, 3.5084228515625, 3.784423828125, 4.0604248046875, 4.33642578125, 4.6124267578125, 4.888427734375, 5.1644287109375, 5.4404296875, 5.7164306640625, 5.992431640625, 6.2684326171875, 6.54443359375, 6.8204345703125, 7.096435546875, 7.3724365234375, 7.6484375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 9.0, 6.0, 16.0, 6.0, 10.0, 9.0, 20.0, 15.0, 19.0, 23.0, 29.0, 66.0, 168.0, 221.0, 118.0, 51.0, 34.0, 25.0, 24.0, 19.0, 14.0, 16.0, 17.0, 18.0, 10.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007333755493164062, -0.0007106810808181763, -0.0006879866123199463, -0.0006652921438217163, -0.0006425976753234863, -0.0006199032068252563, -0.0005972087383270264, -0.0005745142698287964, -0.0005518198013305664, -0.0005291253328323364, -0.0005064308643341064, -0.00048373639583587646, -0.0004610419273376465, -0.0004383474588394165, -0.0004156529903411865, -0.00039295852184295654, -0.00037026405334472656, -0.0003475695848464966, -0.0003248751163482666, -0.0003021806478500366, -0.00027948617935180664, -0.00025679171085357666, -0.00023409724235534668, -0.0002114027738571167, -0.00018870830535888672, -0.00016601383686065674, -0.00014331936836242676, -0.00012062489986419678, -9.79304313659668e-05, -7.523596286773682e-05, -5.2541494369506836e-05, -2.9847025871276855e-05, -7.152557373046875e-06, 1.5541911125183105e-05, 3.8236379623413086e-05, 6.0930848121643066e-05, 8.362531661987305e-05, 0.00010631978511810303, 0.000129014253616333, 0.000151708722114563, 0.00017440319061279297, 0.00019709765911102295, 0.00021979212760925293, 0.0002424865961074829, 0.0002651810646057129, 0.00028787553310394287, 0.00031057000160217285, 0.00033326447010040283, 0.0003559589385986328, 0.0003786534070968628, 0.0004013478755950928, 0.00042404234409332275, 0.00044673681259155273, 0.0004694312810897827, 0.0004921257495880127, 0.0005148202180862427, 0.0005375146865844727, 0.0005602091550827026, 0.0005829036235809326, 0.0006055980920791626, 0.0006282925605773926, 0.0006509870290756226, 0.0006736814975738525, 0.0006963759660720825, 0.0007190704345703125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 10.0, 14.0, 11.0, 16.0, 30.0, 32.0, 70.0, 86.0, 164.0, 285.0, 483.0, 992.0, 2500.0, 8375.0, 43579.0, 427824.0, 501678.0, 48472.0, 9051.0, 2540.0, 1075.0, 536.0, 290.0, 168.0, 71.0, 70.0, 37.0, 25.0, 17.0, 12.0, 8.0, 7.0, 4.0, 5.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-10.4140625, -10.1328125, -9.8515625, -9.5703125, -9.2890625, -9.0078125, -8.7265625, -8.4453125, -8.1640625, -7.8828125, -7.6015625, -7.3203125, -7.0390625, -6.7578125, -6.4765625, -6.1953125, -5.9140625, -5.6328125, -5.3515625, -5.0703125, -4.7890625, -4.5078125, -4.2265625, -3.9453125, -3.6640625, -3.3828125, -3.1015625, -2.8203125, -2.5390625, -2.2578125, -1.9765625, -1.6953125, -1.4140625, -1.1328125, -0.8515625, -0.5703125, -0.2890625, -0.0078125, 0.2734375, 0.5546875, 0.8359375, 1.1171875, 1.3984375, 1.6796875, 1.9609375, 2.2421875, 2.5234375, 2.8046875, 3.0859375, 3.3671875, 3.6484375, 3.9296875, 4.2109375, 4.4921875, 4.7734375, 5.0546875, 5.3359375, 5.6171875, 5.8984375, 6.1796875, 6.4609375, 6.7421875, 7.0234375, 7.3046875, 7.5859375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 6.0, 6.0, 3.0, 7.0, 9.0, 11.0, 10.0, 19.0, 23.0, 33.0, 36.0, 58.0, 80.0, 95.0, 106.0, 127.0, 100.0, 63.0, 49.0, 33.0, 28.0, 21.0, 14.0, 21.0, 12.0, 8.0, 10.0, 5.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.33203125, -5.18798828125, -5.0439453125, -4.89990234375, -4.755859375, -4.61181640625, -4.4677734375, -4.32373046875, -4.1796875, -4.03564453125, -3.8916015625, -3.74755859375, -3.603515625, -3.45947265625, -3.3154296875, -3.17138671875, -3.02734375, -2.88330078125, -2.7392578125, -2.59521484375, -2.451171875, -2.30712890625, -2.1630859375, -2.01904296875, -1.875, -1.73095703125, -1.5869140625, -1.44287109375, -1.298828125, -1.15478515625, -1.0107421875, -0.86669921875, -0.72265625, -0.57861328125, -0.4345703125, -0.29052734375, -0.146484375, -0.00244140625, 0.1416015625, 0.28564453125, 0.4296875, 0.57373046875, 0.7177734375, 0.86181640625, 1.005859375, 1.14990234375, 1.2939453125, 1.43798828125, 1.58203125, 1.72607421875, 1.8701171875, 2.01416015625, 2.158203125, 2.30224609375, 2.4462890625, 2.59033203125, 2.734375, 2.87841796875, 3.0224609375, 3.16650390625, 3.310546875, 3.45458984375, 3.5986328125, 3.74267578125, 3.88671875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 31.0, 145.0, 360.0, 303.0, 118.0, 28.0, 6.0, 2.0, 1.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.74913024902344, -107.72673034667969, -101.70433044433594, -95.68193054199219, -89.65953063964844, -83.63713073730469, -77.61473846435547, -71.59233856201172, -65.56993865966797, -59.54753875732422, -53.52513885498047, -47.502742767333984, -41.480342864990234, -35.457942962646484, -29.435546875, -23.41314697265625, -17.3907470703125, -11.368348121643066, -5.345949172973633, 0.6764488220214844, 6.698848724365234, 12.721248626708984, 18.74364471435547, 24.76604461669922, 30.78844451904297, 36.81084442138672, 42.83324432373047, 48.85564041137695, 54.8780403137207, 60.90044021606445, 66.92283630371094, 72.94523620605469, 78.96762084960938, 84.99002075195312, 91.01242065429688, 97.03482055664062, 103.05722045898438, 109.07962036132812, 115.10201263427734, 121.1244125366211, 127.14681243896484, 133.16920471191406, 139.1916046142578, 145.21400451660156, 151.2364044189453, 157.25880432128906, 163.2812042236328, 169.30360412597656, 175.3260040283203, 181.34840393066406, 187.3708038330078, 193.39320373535156, 199.4156036376953, 205.43800354003906, 211.46038818359375, 217.4827880859375, 223.50518798828125, 229.527587890625, 235.54998779296875, 241.5723876953125, 247.59478759765625, 253.6171875, 259.63958740234375, 265.6619873046875, 271.68438720703125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 6.0, 9.0, 3.0, 8.0, 12.0, 19.0, 16.0, 14.0, 21.0, 24.0, 29.0, 27.0, 24.0, 34.0, 34.0, 34.0, 31.0, 37.0, 40.0, 34.0, 40.0, 36.0, 37.0, 32.0, 30.0, 31.0, 34.0, 38.0, 31.0, 40.0, 23.0, 21.0, 27.0, 18.0, 22.0, 12.0, 11.0, 14.0, 8.0, 5.0, 4.0, 10.0, 2.0, 6.0, 1.0, 3.0, 1.0, 5.0, 1.0, 4.0], "bins": [-35.04864501953125, -34.04417037963867, -33.03969192504883, -32.03521728515625, -31.03074073791504, -30.026264190673828, -29.02178955078125, -28.01731300354004, -27.012836456298828, -26.008359909057617, -25.003883361816406, -23.999408721923828, -22.994932174682617, -21.990455627441406, -20.985980987548828, -19.981504440307617, -18.977027893066406, -17.972551345825195, -16.968074798583984, -15.963600158691406, -14.959123611450195, -13.954647064208984, -12.95017147064209, -11.945695877075195, -10.941219329833984, -9.936742782592773, -8.932267189025879, -7.927791118621826, -6.923315048217773, -5.918838977813721, -4.914362907409668, -3.9098868370056152, -2.905406951904297, -1.9009308815002441, -0.8964548110961914, 0.10802125930786133, 1.112497329711914, 2.116973400115967, 3.1214494705200195, 4.125925540924072, 5.130401611328125, 6.134877681732178, 7.1393537521362305, 8.143829345703125, 9.148305892944336, 10.152782440185547, 11.157258033752441, 12.161733627319336, 13.166210174560547, 14.170686721801758, 15.175162315368652, 16.179637908935547, 17.184114456176758, 18.18859100341797, 19.193065643310547, 20.197542190551758, 21.20201873779297, 22.20649528503418, 23.21097183227539, 24.21544647216797, 25.21992301940918, 26.22439956665039, 27.22887420654297, 28.23335075378418, 29.23782730102539]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 7.0, 7.0, 5.0, 14.0, 20.0, 15.0, 23.0, 38.0, 51.0, 120.0, 168.0, 319.0, 720.0, 1606.0, 4665.0, 17145.0, 102341.0, 3710296.0, 313140.0, 31516.0, 7464.0, 2490.0, 1033.0, 445.0, 220.0, 142.0, 81.0, 54.0, 41.0, 20.0, 18.0, 14.0, 7.0, 8.0, 9.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.703125, -22.0087890625, -21.314453125, -20.6201171875, -19.92578125, -19.2314453125, -18.537109375, -17.8427734375, -17.1484375, -16.4541015625, -15.759765625, -15.0654296875, -14.37109375, -13.6767578125, -12.982421875, -12.2880859375, -11.59375, -10.8994140625, -10.205078125, -9.5107421875, -8.81640625, -8.1220703125, -7.427734375, -6.7333984375, -6.0390625, -5.3447265625, -4.650390625, -3.9560546875, -3.26171875, -2.5673828125, -1.873046875, -1.1787109375, -0.484375, 0.2099609375, 0.904296875, 1.5986328125, 2.29296875, 2.9873046875, 3.681640625, 4.3759765625, 5.0703125, 5.7646484375, 6.458984375, 7.1533203125, 7.84765625, 8.5419921875, 9.236328125, 9.9306640625, 10.625, 11.3193359375, 12.013671875, 12.7080078125, 13.40234375, 14.0966796875, 14.791015625, 15.4853515625, 16.1796875, 16.8740234375, 17.568359375, 18.2626953125, 18.95703125, 19.6513671875, 20.345703125, 21.0400390625, 21.734375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 3.0, 11.0, 15.0, 14.0, 14.0, 18.0, 23.0, 29.0, 23.0, 39.0, 52.0, 51.0, 50.0, 49.0, 46.0, 72.0, 68.0, 54.0, 33.0, 40.0, 51.0, 51.0, 30.0, 25.0, 22.0, 17.0, 24.0, 16.0, 9.0, 8.0, 6.0, 6.0, 7.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9873046875, -1.9262237548828125, -1.865142822265625, -1.8040618896484375, -1.74298095703125, -1.6819000244140625, -1.620819091796875, -1.5597381591796875, -1.4986572265625, -1.4375762939453125, -1.376495361328125, -1.3154144287109375, -1.25433349609375, -1.1932525634765625, -1.132171630859375, -1.0710906982421875, -1.010009765625, -0.9489288330078125, -0.887847900390625, -0.8267669677734375, -0.76568603515625, -0.7046051025390625, -0.643524169921875, -0.5824432373046875, -0.5213623046875, -0.4602813720703125, -0.399200439453125, -0.3381195068359375, -0.27703857421875, -0.2159576416015625, -0.154876708984375, -0.0937957763671875, -0.03271484375, 0.0283660888671875, 0.089447021484375, 0.1505279541015625, 0.21160888671875, 0.2726898193359375, 0.333770751953125, 0.3948516845703125, 0.4559326171875, 0.5170135498046875, 0.578094482421875, 0.6391754150390625, 0.70025634765625, 0.7613372802734375, 0.822418212890625, 0.8834991455078125, 0.944580078125, 1.0056610107421875, 1.066741943359375, 1.1278228759765625, 1.18890380859375, 1.2499847412109375, 1.311065673828125, 1.3721466064453125, 1.4332275390625, 1.4943084716796875, 1.555389404296875, 1.6164703369140625, 1.67755126953125, 1.7386322021484375, 1.799713134765625, 1.8607940673828125, 1.921875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 11.0, 12.0, 15.0, 22.0, 41.0, 52.0, 80.0, 133.0, 203.0, 407.0, 853.0, 2087.0, 6042.0, 19968.0, 87870.0, 1059606.0, 2844683.0, 132911.0, 26641.0, 7781.0, 2673.0, 1043.0, 500.0, 255.0, 150.0, 77.0, 51.0, 38.0, 20.0, 25.0, 15.0, 7.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6484375, -11.248291015625, -10.84814453125, -10.447998046875, -10.0478515625, -9.647705078125, -9.24755859375, -8.847412109375, -8.447265625, -8.047119140625, -7.64697265625, -7.246826171875, -6.8466796875, -6.446533203125, -6.04638671875, -5.646240234375, -5.24609375, -4.845947265625, -4.44580078125, -4.045654296875, -3.6455078125, -3.245361328125, -2.84521484375, -2.445068359375, -2.044921875, -1.644775390625, -1.24462890625, -0.844482421875, -0.4443359375, -0.044189453125, 0.35595703125, 0.756103515625, 1.15625, 1.556396484375, 1.95654296875, 2.356689453125, 2.7568359375, 3.156982421875, 3.55712890625, 3.957275390625, 4.357421875, 4.757568359375, 5.15771484375, 5.557861328125, 5.9580078125, 6.358154296875, 6.75830078125, 7.158447265625, 7.55859375, 7.958740234375, 8.35888671875, 8.759033203125, 9.1591796875, 9.559326171875, 9.95947265625, 10.359619140625, 10.759765625, 11.159912109375, 11.56005859375, 11.960205078125, 12.3603515625, 12.760498046875, 13.16064453125, 13.560791015625, 13.9609375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 0.0, 2.0, 5.0, 7.0, 11.0, 7.0, 12.0, 22.0, 19.0, 12.0, 33.0, 36.0, 64.0, 102.0, 161.0, 285.0, 535.0, 1313.0, 634.0, 292.0, 170.0, 98.0, 66.0, 48.0, 33.0, 30.0, 15.0, 10.0, 15.0, 10.0, 7.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.005859375, -2.892608642578125, -2.77935791015625, -2.666107177734375, -2.5528564453125, -2.439605712890625, -2.32635498046875, -2.213104248046875, -2.099853515625, -1.986602783203125, -1.87335205078125, -1.760101318359375, -1.6468505859375, -1.533599853515625, -1.42034912109375, -1.307098388671875, -1.19384765625, -1.080596923828125, -0.96734619140625, -0.854095458984375, -0.7408447265625, -0.627593994140625, -0.51434326171875, -0.401092529296875, -0.287841796875, -0.174591064453125, -0.06134033203125, 0.051910400390625, 0.1651611328125, 0.278411865234375, 0.39166259765625, 0.504913330078125, 0.6181640625, 0.731414794921875, 0.84466552734375, 0.957916259765625, 1.0711669921875, 1.184417724609375, 1.29766845703125, 1.410919189453125, 1.524169921875, 1.637420654296875, 1.75067138671875, 1.863922119140625, 1.9771728515625, 2.090423583984375, 2.20367431640625, 2.316925048828125, 2.43017578125, 2.543426513671875, 2.65667724609375, 2.769927978515625, 2.8831787109375, 2.996429443359375, 3.10968017578125, 3.222930908203125, 3.336181640625, 3.449432373046875, 3.56268310546875, 3.675933837890625, 3.7891845703125, 3.902435302734375, 4.01568603515625, 4.128936767578125, 4.2421875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 13.0, 18.0, 36.0, 52.0, 69.0, 85.0, 102.0, 112.0, 110.0, 97.0, 84.0, 70.0, 46.0, 23.0, 28.0, 14.0, 14.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.307350158691406, -26.50409698486328, -25.70084571838379, -24.897592544555664, -24.09433937072754, -23.291088104248047, -22.487834930419922, -21.684581756591797, -20.881328582763672, -20.078075408935547, -19.274824142456055, -18.47157096862793, -17.668317794799805, -16.865066528320312, -16.061813354492188, -15.258560180664062, -14.45530891418457, -13.652056694030762, -12.848803520202637, -12.045551300048828, -11.242298126220703, -10.439045906066895, -9.635793685913086, -8.832540512084961, -8.029288291931152, -7.2260355949401855, -6.422782897949219, -5.61953067779541, -4.816277980804443, -4.013025283813477, -3.209773063659668, -2.406520366668701, -1.6032676696777344, -0.8000150918960571, 0.003237485885620117, 0.8064899444580078, 1.6097426414489746, 2.4129953384399414, 3.21624755859375, 4.019500255584717, 4.822752952575684, 5.62600564956665, 6.429258346557617, 7.232510566711426, 8.035762786865234, 8.83901596069336, 9.642268180847168, 10.445520401000977, 11.248773574829102, 12.05202579498291, 12.855278968811035, 13.658531188964844, 14.461784362792969, 15.265036582946777, 16.068288803100586, 16.87154197692871, 17.674793243408203, 18.478046417236328, 19.28129768371582, 20.084550857543945, 20.88780403137207, 21.691055297851562, 22.494308471679688, 23.297561645507812, 24.100814819335938]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 10.0, 9.0, 19.0, 15.0, 19.0, 16.0, 33.0, 28.0, 27.0, 56.0, 45.0, 33.0, 41.0, 48.0, 47.0, 46.0, 64.0, 53.0, 44.0, 47.0, 57.0, 37.0, 41.0, 38.0, 35.0, 22.0, 18.0, 11.0, 12.0, 12.0, 8.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.987573623657227, -14.501357078552246, -14.01513957977295, -13.528923034667969, -13.042705535888672, -12.556488990783691, -12.070271492004395, -11.584054946899414, -11.097837448120117, -10.611620903015137, -10.12540340423584, -9.63918685913086, -9.152969360351562, -8.666752815246582, -8.180535316467285, -7.694318771362305, -7.208101749420166, -6.721884727478027, -6.235667705535889, -5.74945068359375, -5.263233661651611, -4.777016639709473, -4.290800094604492, -3.8045828342437744, -3.3183658123016357, -2.832148790359497, -2.3459317684173584, -1.8597148656845093, -1.3734978437423706, -0.8872809410095215, -0.4010639190673828, 0.08515310287475586, 0.5713701248168945, 1.0575871467590332, 1.5438041687011719, 2.0300211906433105, 2.516238212585449, 3.002454996109009, 3.4886720180511475, 3.974889039993286, 4.461106300354004, 4.947323322296143, 5.433540344238281, 5.91975736618042, 6.405974388122559, 6.892190933227539, 7.378408432006836, 7.864624977111816, 8.350841522216797, 8.837058067321777, 9.323275566101074, 9.809492111206055, 10.295709609985352, 10.781926155090332, 11.268143653869629, 11.75436019897461, 12.240577697753906, 12.726794242858887, 13.213011741638184, 13.699228286743164, 14.185445785522461, 14.671662330627441, 15.157879829406738, 15.644096374511719, 16.130313873291016]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 6.0, 5.0, 11.0, 17.0, 23.0, 37.0, 55.0, 102.0, 196.0, 328.0, 718.0, 1545.0, 3911.0, 12302.0, 44446.0, 199308.0, 629482.0, 113290.0, 29141.0, 8392.0, 2872.0, 1109.0, 576.0, 296.0, 155.0, 88.0, 44.0, 34.0, 16.0, 14.0, 14.0, 8.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1171875, -11.6571044921875, -11.197021484375, -10.7369384765625, -10.27685546875, -9.8167724609375, -9.356689453125, -8.8966064453125, -8.4365234375, -7.9764404296875, -7.516357421875, -7.0562744140625, -6.59619140625, -6.1361083984375, -5.676025390625, -5.2159423828125, -4.755859375, -4.2957763671875, -3.835693359375, -3.3756103515625, -2.91552734375, -2.4554443359375, -1.995361328125, -1.5352783203125, -1.0751953125, -0.6151123046875, -0.155029296875, 0.3050537109375, 0.76513671875, 1.2252197265625, 1.685302734375, 2.1453857421875, 2.60546875, 3.0655517578125, 3.525634765625, 3.9857177734375, 4.44580078125, 4.9058837890625, 5.365966796875, 5.8260498046875, 6.2861328125, 6.7462158203125, 7.206298828125, 7.6663818359375, 8.12646484375, 8.5865478515625, 9.046630859375, 9.5067138671875, 9.966796875, 10.4268798828125, 10.886962890625, 11.3470458984375, 11.80712890625, 12.2672119140625, 12.727294921875, 13.1873779296875, 13.6474609375, 14.1075439453125, 14.567626953125, 15.0277099609375, 15.48779296875, 15.9478759765625, 16.407958984375, 16.8680419921875, 17.328125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 1.0, 5.0, 8.0, 6.0, 15.0, 7.0, 13.0, 23.0, 20.0, 28.0, 30.0, 35.0, 41.0, 57.0, 42.0, 64.0, 55.0, 48.0, 60.0, 61.0, 50.0, 44.0, 34.0, 50.0, 42.0, 25.0, 24.0, 20.0, 18.0, 17.0, 11.0, 9.0, 5.0, 11.0, 2.0, 3.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9794921875, -1.9173736572265625, -1.855255126953125, -1.7931365966796875, -1.73101806640625, -1.6688995361328125, -1.606781005859375, -1.5446624755859375, -1.4825439453125, -1.4204254150390625, -1.358306884765625, -1.2961883544921875, -1.23406982421875, -1.1719512939453125, -1.109832763671875, -1.0477142333984375, -0.985595703125, -0.9234771728515625, -0.861358642578125, -0.7992401123046875, -0.73712158203125, -0.6750030517578125, -0.612884521484375, -0.5507659912109375, -0.4886474609375, -0.4265289306640625, -0.364410400390625, -0.3022918701171875, -0.24017333984375, -0.1780548095703125, -0.115936279296875, -0.0538177490234375, 0.00830078125, 0.0704193115234375, 0.132537841796875, 0.1946563720703125, 0.25677490234375, 0.3188934326171875, 0.381011962890625, 0.4431304931640625, 0.5052490234375, 0.5673675537109375, 0.629486083984375, 0.6916046142578125, 0.75372314453125, 0.8158416748046875, 0.877960205078125, 0.9400787353515625, 1.002197265625, 1.0643157958984375, 1.126434326171875, 1.1885528564453125, 1.25067138671875, 1.3127899169921875, 1.374908447265625, 1.4370269775390625, 1.4991455078125, 1.5612640380859375, 1.623382568359375, 1.6855010986328125, 1.74761962890625, 1.8097381591796875, 1.871856689453125, 1.9339752197265625, 1.99609375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 10.0, 6.0, 10.0, 13.0, 20.0, 16.0, 38.0, 43.0, 63.0, 100.0, 143.0, 228.0, 391.0, 790.0, 1610.0, 3395.0, 7831.0, 18768.0, 45849.0, 124923.0, 456732.0, 257153.0, 77229.0, 30222.0, 12639.0, 5399.0, 2361.0, 1113.0, 623.0, 288.0, 176.0, 132.0, 60.0, 56.0, 33.0, 29.0, 25.0, 15.0, 5.0, 7.0, 8.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.21875, -7.9952392578125, -7.771728515625, -7.5482177734375, -7.32470703125, -7.1011962890625, -6.877685546875, -6.6541748046875, -6.4306640625, -6.2071533203125, -5.983642578125, -5.7601318359375, -5.53662109375, -5.3131103515625, -5.089599609375, -4.8660888671875, -4.642578125, -4.4190673828125, -4.195556640625, -3.9720458984375, -3.74853515625, -3.5250244140625, -3.301513671875, -3.0780029296875, -2.8544921875, -2.6309814453125, -2.407470703125, -2.1839599609375, -1.96044921875, -1.7369384765625, -1.513427734375, -1.2899169921875, -1.06640625, -0.8428955078125, -0.619384765625, -0.3958740234375, -0.17236328125, 0.0511474609375, 0.274658203125, 0.4981689453125, 0.7216796875, 0.9451904296875, 1.168701171875, 1.3922119140625, 1.61572265625, 1.8392333984375, 2.062744140625, 2.2862548828125, 2.509765625, 2.7332763671875, 2.956787109375, 3.1802978515625, 3.40380859375, 3.6273193359375, 3.850830078125, 4.0743408203125, 4.2978515625, 4.5213623046875, 4.744873046875, 4.9683837890625, 5.19189453125, 5.4154052734375, 5.638916015625, 5.8624267578125, 6.0859375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 10.0, 7.0, 11.0, 12.0, 13.0, 14.0, 17.0, 14.0, 19.0, 23.0, 23.0, 34.0, 29.0, 44.0, 38.0, 39.0, 37.0, 37.0, 47.0, 47.0, 38.0, 40.0, 31.0, 51.0, 25.0, 34.0, 24.0, 36.0, 26.0, 29.0, 23.0, 16.0, 21.0, 23.0, 17.0, 7.0, 9.0, 6.0, 9.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.30859375, -6.1004638671875, -5.892333984375, -5.6842041015625, -5.47607421875, -5.2679443359375, -5.059814453125, -4.8516845703125, -4.6435546875, -4.4354248046875, -4.227294921875, -4.0191650390625, -3.81103515625, -3.6029052734375, -3.394775390625, -3.1866455078125, -2.978515625, -2.7703857421875, -2.562255859375, -2.3541259765625, -2.14599609375, -1.9378662109375, -1.729736328125, -1.5216064453125, -1.3134765625, -1.1053466796875, -0.897216796875, -0.6890869140625, -0.48095703125, -0.2728271484375, -0.064697265625, 0.1434326171875, 0.3515625, 0.5596923828125, 0.767822265625, 0.9759521484375, 1.18408203125, 1.3922119140625, 1.600341796875, 1.8084716796875, 2.0166015625, 2.2247314453125, 2.432861328125, 2.6409912109375, 2.84912109375, 3.0572509765625, 3.265380859375, 3.4735107421875, 3.681640625, 3.8897705078125, 4.097900390625, 4.3060302734375, 4.51416015625, 4.7222900390625, 4.930419921875, 5.1385498046875, 5.3466796875, 5.5548095703125, 5.762939453125, 5.9710693359375, 6.17919921875, 6.3873291015625, 6.595458984375, 6.8035888671875, 7.01171875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 4.0, 7.0, 15.0, 12.0, 38.0, 53.0, 92.0, 154.0, 352.0, 723.0, 2168.0, 7270.0, 31433.0, 189267.0, 676538.0, 111457.0, 20957.0, 5127.0, 1635.0, 596.0, 287.0, 172.0, 81.0, 44.0, 28.0, 18.0, 8.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.234375, -5.0775146484375, -4.920654296875, -4.7637939453125, -4.60693359375, -4.4500732421875, -4.293212890625, -4.1363525390625, -3.9794921875, -3.8226318359375, -3.665771484375, -3.5089111328125, -3.35205078125, -3.1951904296875, -3.038330078125, -2.8814697265625, -2.724609375, -2.5677490234375, -2.410888671875, -2.2540283203125, -2.09716796875, -1.9403076171875, -1.783447265625, -1.6265869140625, -1.4697265625, -1.3128662109375, -1.156005859375, -0.9991455078125, -0.84228515625, -0.6854248046875, -0.528564453125, -0.3717041015625, -0.21484375, -0.0579833984375, 0.098876953125, 0.2557373046875, 0.41259765625, 0.5694580078125, 0.726318359375, 0.8831787109375, 1.0400390625, 1.1968994140625, 1.353759765625, 1.5106201171875, 1.66748046875, 1.8243408203125, 1.981201171875, 2.1380615234375, 2.294921875, 2.4517822265625, 2.608642578125, 2.7655029296875, 2.92236328125, 3.0792236328125, 3.236083984375, 3.3929443359375, 3.5498046875, 3.7066650390625, 3.863525390625, 4.0203857421875, 4.17724609375, 4.3341064453125, 4.490966796875, 4.6478271484375, 4.8046875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 5.0, 3.0, 5.0, 5.0, 9.0, 8.0, 16.0, 15.0, 12.0, 19.0, 38.0, 65.0, 126.0, 259.0, 172.0, 95.0, 43.0, 20.0, 11.0, 17.0, 17.0, 9.0, 9.0, 3.0, 2.0, 10.0, 2.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005159378051757812, -0.0004931986331939697, -0.0004704594612121582, -0.0004477202892303467, -0.00042498111724853516, -0.00040224194526672363, -0.0003795027732849121, -0.0003567636013031006, -0.00033402442932128906, -0.00031128525733947754, -0.000288546085357666, -0.0002658069133758545, -0.00024306774139404297, -0.00022032856941223145, -0.00019758939743041992, -0.0001748502254486084, -0.00015211105346679688, -0.00012937188148498535, -0.00010663270950317383, -8.38935375213623e-05, -6.115436553955078e-05, -3.841519355773926e-05, -1.5676021575927734e-05, 7.063150405883789e-06, 2.9802322387695312e-05, 5.2541494369506836e-05, 7.528066635131836e-05, 9.801983833312988e-05, 0.0001207590103149414, 0.00014349818229675293, 0.00016623735427856445, 0.00018897652626037598, 0.0002117156982421875, 0.00023445487022399902, 0.00025719404220581055, 0.00027993321418762207, 0.0003026723861694336, 0.0003254115581512451, 0.00034815073013305664, 0.00037088990211486816, 0.0003936290740966797, 0.0004163682460784912, 0.00043910741806030273, 0.00046184659004211426, 0.0004845857620239258, 0.0005073249340057373, 0.0005300641059875488, 0.0005528032779693604, 0.0005755424499511719, 0.0005982816219329834, 0.0006210207939147949, 0.0006437599658966064, 0.000666499137878418, 0.0006892383098602295, 0.000711977481842041, 0.0007347166538238525, 0.0007574558258056641, 0.0007801949977874756, 0.0008029341697692871, 0.0008256733417510986, 0.0008484125137329102, 0.0008711516857147217, 0.0008938908576965332, 0.0009166300296783447, 0.0009393692016601562]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 0.0, 4.0, 3.0, 5.0, 3.0, 5.0, 8.0, 14.0, 22.0, 21.0, 36.0, 62.0, 83.0, 167.0, 295.0, 567.0, 1028.0, 2192.0, 4719.0, 10633.0, 28625.0, 89029.0, 359700.0, 400845.0, 98501.0, 30683.0, 11530.0, 4972.0, 2326.0, 1090.0, 603.0, 300.0, 161.0, 104.0, 75.0, 45.0, 23.0, 19.0, 12.0, 16.0, 13.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.380859375, -3.268310546875, -3.15576171875, -3.043212890625, -2.9306640625, -2.818115234375, -2.70556640625, -2.593017578125, -2.48046875, -2.367919921875, -2.25537109375, -2.142822265625, -2.0302734375, -1.917724609375, -1.80517578125, -1.692626953125, -1.580078125, -1.467529296875, -1.35498046875, -1.242431640625, -1.1298828125, -1.017333984375, -0.90478515625, -0.792236328125, -0.6796875, -0.567138671875, -0.45458984375, -0.342041015625, -0.2294921875, -0.116943359375, -0.00439453125, 0.108154296875, 0.220703125, 0.333251953125, 0.44580078125, 0.558349609375, 0.6708984375, 0.783447265625, 0.89599609375, 1.008544921875, 1.12109375, 1.233642578125, 1.34619140625, 1.458740234375, 1.5712890625, 1.683837890625, 1.79638671875, 1.908935546875, 2.021484375, 2.134033203125, 2.24658203125, 2.359130859375, 2.4716796875, 2.584228515625, 2.69677734375, 2.809326171875, 2.921875, 3.034423828125, 3.14697265625, 3.259521484375, 3.3720703125, 3.484619140625, 3.59716796875, 3.709716796875, 3.822265625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 6.0, 8.0, 12.0, 5.0, 11.0, 11.0, 28.0, 25.0, 41.0, 42.0, 54.0, 41.0, 65.0, 80.0, 91.0, 80.0, 65.0, 52.0, 48.0, 43.0, 25.0, 27.0, 17.0, 15.0, 6.0, 8.0, 9.0, 10.0, 13.0, 5.0, 4.0, 3.0, 7.0, 6.0, 5.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.140625, -3.0496826171875, -2.958740234375, -2.8677978515625, -2.77685546875, -2.6859130859375, -2.594970703125, -2.5040283203125, -2.4130859375, -2.3221435546875, -2.231201171875, -2.1402587890625, -2.04931640625, -1.9583740234375, -1.867431640625, -1.7764892578125, -1.685546875, -1.5946044921875, -1.503662109375, -1.4127197265625, -1.32177734375, -1.2308349609375, -1.139892578125, -1.0489501953125, -0.9580078125, -0.8670654296875, -0.776123046875, -0.6851806640625, -0.59423828125, -0.5032958984375, -0.412353515625, -0.3214111328125, -0.23046875, -0.1395263671875, -0.048583984375, 0.0423583984375, 0.13330078125, 0.2242431640625, 0.315185546875, 0.4061279296875, 0.4970703125, 0.5880126953125, 0.678955078125, 0.7698974609375, 0.86083984375, 0.9517822265625, 1.042724609375, 1.1336669921875, 1.224609375, 1.3155517578125, 1.406494140625, 1.4974365234375, 1.58837890625, 1.6793212890625, 1.770263671875, 1.8612060546875, 1.9521484375, 2.0430908203125, 2.134033203125, 2.2249755859375, 2.31591796875, 2.4068603515625, 2.497802734375, 2.5887451171875, 2.6796875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 8.0, 23.0, 44.0, 90.0, 170.0, 198.0, 219.0, 120.0, 71.0, 44.0, 10.0, 9.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.873268127441406, -57.943050384521484, -55.0128288269043, -52.082611083984375, -49.15238952636719, -46.222171783447266, -43.291954040527344, -40.361732482910156, -37.431514739990234, -34.50129699707031, -31.571075439453125, -28.640857696533203, -25.71063804626465, -22.780418395996094, -19.850200653076172, -16.919981002807617, -13.989761352539062, -11.059541702270508, -8.12932300567627, -5.199104309082031, -2.2688846588134766, 0.6613349914550781, 3.591552734375, 6.521772384643555, 9.45199203491211, 12.382211685180664, 15.312430381774902, 18.24264907836914, 21.172868728637695, 24.10308837890625, 27.033306121826172, 29.963525772094727, 32.89374542236328, 35.8239631652832, 38.75418472290039, 41.68440246582031, 44.6146240234375, 47.54484176635742, 50.475059509277344, 53.40528106689453, 56.33549880981445, 59.265716552734375, 62.19593811035156, 65.12615966796875, 68.0563735961914, 70.9865951538086, 73.91680908203125, 76.84703063964844, 79.77725219726562, 82.70747375488281, 85.63768768310547, 88.56790924072266, 91.49813079833984, 94.4283447265625, 97.35856628417969, 100.28878784179688, 103.21900939941406, 106.14923095703125, 109.0794448852539, 112.0096664428711, 114.93988800048828, 117.87010192871094, 120.80032348632812, 123.73054504394531, 126.66075897216797]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 11.0, 7.0, 12.0, 9.0, 12.0, 11.0, 12.0, 11.0, 13.0, 17.0, 18.0, 38.0, 18.0, 23.0, 28.0, 33.0, 36.0, 35.0, 37.0, 27.0, 44.0, 47.0, 36.0, 36.0, 37.0, 37.0, 38.0, 42.0, 46.0, 33.0, 24.0, 29.0, 11.0, 17.0, 17.0, 17.0, 13.0, 15.0, 12.0, 12.0, 2.0, 3.0, 3.0, 7.0, 1.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-28.655441284179688, -27.728147506713867, -26.80085563659668, -25.87356185913086, -24.94626808166504, -24.01897430419922, -23.09168243408203, -22.16438865661621, -21.23709487915039, -20.30980110168457, -19.382509231567383, -18.455215454101562, -17.527921676635742, -16.600627899169922, -15.673336029052734, -14.746042251586914, -13.818750381469727, -12.891457557678223, -11.964163780212402, -11.036870956420898, -10.109577178955078, -9.182284355163574, -8.25499153137207, -7.327698230743408, -6.400404930114746, -5.473111629486084, -4.545818328857422, -3.618525505065918, -2.691232204437256, -1.7639389038085938, -0.8366460800170898, 0.09064722061157227, 1.0179405212402344, 1.945233702659607, 2.8725268840789795, 3.7998199462890625, 4.727113246917725, 5.654406547546387, 6.581699371337891, 7.508992671966553, 8.436285972595215, 9.363578796386719, 10.290872573852539, 11.218165397644043, 12.145458221435547, 13.072751998901367, 14.000044822692871, 14.927337646484375, 15.854631423950195, 16.781925201416016, 17.709217071533203, 18.636510848999023, 19.563804626464844, 20.49109649658203, 21.41839027404785, 22.345684051513672, 23.27297592163086, 24.20026969909668, 25.127561569213867, 26.054855346679688, 26.982149124145508, 27.909442901611328, 28.836734771728516, 29.764028549194336, 30.691322326660156]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 7.0, 12.0, 18.0, 23.0, 25.0, 45.0, 70.0, 123.0, 220.0, 350.0, 676.0, 1365.0, 2986.0, 6890.0, 18902.0, 73868.0, 794071.0, 3144522.0, 109212.0, 25052.0, 8468.0, 3681.0, 1678.0, 850.0, 455.0, 263.0, 150.0, 99.0, 67.0, 42.0, 27.0, 18.0, 12.0, 13.0, 8.0, 4.0, 10.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.078125, -13.5390625, -13.0, -12.4609375, -11.921875, -11.3828125, -10.84375, -10.3046875, -9.765625, -9.2265625, -8.6875, -8.1484375, -7.609375, -7.0703125, -6.53125, -5.9921875, -5.453125, -4.9140625, -4.375, -3.8359375, -3.296875, -2.7578125, -2.21875, -1.6796875, -1.140625, -0.6015625, -0.0625, 0.4765625, 1.015625, 1.5546875, 2.09375, 2.6328125, 3.171875, 3.7109375, 4.25, 4.7890625, 5.328125, 5.8671875, 6.40625, 6.9453125, 7.484375, 8.0234375, 8.5625, 9.1015625, 9.640625, 10.1796875, 10.71875, 11.2578125, 11.796875, 12.3359375, 12.875, 13.4140625, 13.953125, 14.4921875, 15.03125, 15.5703125, 16.109375, 16.6484375, 17.1875, 17.7265625, 18.265625, 18.8046875, 19.34375, 19.8828125, 20.421875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 4.0, 13.0, 5.0, 13.0, 18.0, 24.0, 15.0, 23.0, 41.0, 27.0, 49.0, 55.0, 47.0, 55.0, 50.0, 63.0, 49.0, 64.0, 50.0, 36.0, 40.0, 33.0, 34.0, 37.0, 29.0, 14.0, 15.0, 19.0, 14.0, 12.0, 6.0, 7.0, 6.0, 4.0, 4.0, 5.0, 0.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.90625, -1.8463134765625, -1.786376953125, -1.7264404296875, -1.66650390625, -1.6065673828125, -1.546630859375, -1.4866943359375, -1.4267578125, -1.3668212890625, -1.306884765625, -1.2469482421875, -1.18701171875, -1.1270751953125, -1.067138671875, -1.0072021484375, -0.947265625, -0.8873291015625, -0.827392578125, -0.7674560546875, -0.70751953125, -0.6475830078125, -0.587646484375, -0.5277099609375, -0.4677734375, -0.4078369140625, -0.347900390625, -0.2879638671875, -0.22802734375, -0.1680908203125, -0.108154296875, -0.0482177734375, 0.01171875, 0.0716552734375, 0.131591796875, 0.1915283203125, 0.25146484375, 0.3114013671875, 0.371337890625, 0.4312744140625, 0.4912109375, 0.5511474609375, 0.611083984375, 0.6710205078125, 0.73095703125, 0.7908935546875, 0.850830078125, 0.9107666015625, 0.970703125, 1.0306396484375, 1.090576171875, 1.1505126953125, 1.21044921875, 1.2703857421875, 1.330322265625, 1.3902587890625, 1.4501953125, 1.5101318359375, 1.570068359375, 1.6300048828125, 1.68994140625, 1.7498779296875, 1.809814453125, 1.8697509765625, 1.9296875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 7.0, 9.0, 15.0, 21.0, 27.0, 38.0, 62.0, 80.0, 115.0, 179.0, 310.0, 485.0, 732.0, 1283.0, 2245.0, 4075.0, 8057.0, 16474.0, 37682.0, 98521.0, 339314.0, 2824601.0, 621842.0, 143635.0, 51216.0, 21585.0, 10193.0, 5022.0, 2679.0, 1510.0, 852.0, 501.0, 317.0, 198.0, 140.0, 88.0, 46.0, 40.0, 21.0, 20.0, 17.0, 14.0, 4.0, 6.0, 6.0, 5.0, 1.0], "bins": [-8.546875, -8.32586669921875, -8.1048583984375, -7.88385009765625, -7.662841796875, -7.44183349609375, -7.2208251953125, -6.99981689453125, -6.77880859375, -6.55780029296875, -6.3367919921875, -6.11578369140625, -5.894775390625, -5.67376708984375, -5.4527587890625, -5.23175048828125, -5.0107421875, -4.78973388671875, -4.5687255859375, -4.34771728515625, -4.126708984375, -3.90570068359375, -3.6846923828125, -3.46368408203125, -3.24267578125, -3.02166748046875, -2.8006591796875, -2.57965087890625, -2.358642578125, -2.13763427734375, -1.9166259765625, -1.69561767578125, -1.474609375, -1.25360107421875, -1.0325927734375, -0.81158447265625, -0.590576171875, -0.36956787109375, -0.1485595703125, 0.07244873046875, 0.29345703125, 0.51446533203125, 0.7354736328125, 0.95648193359375, 1.177490234375, 1.39849853515625, 1.6195068359375, 1.84051513671875, 2.0615234375, 2.28253173828125, 2.5035400390625, 2.72454833984375, 2.945556640625, 3.16656494140625, 3.3875732421875, 3.60858154296875, 3.82958984375, 4.05059814453125, 4.2716064453125, 4.49261474609375, 4.713623046875, 4.93463134765625, 5.1556396484375, 5.37664794921875, 5.59765625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 0.0, 4.0, 3.0, 10.0, 7.0, 14.0, 18.0, 23.0, 16.0, 44.0, 65.0, 75.0, 94.0, 160.0, 326.0, 616.0, 1503.0, 410.0, 229.0, 154.0, 89.0, 60.0, 37.0, 26.0, 20.0, 26.0, 10.0, 10.0, 7.0, 3.0, 1.0, 6.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.21875, -4.10260009765625, -3.9864501953125, -3.87030029296875, -3.754150390625, -3.63800048828125, -3.5218505859375, -3.40570068359375, -3.28955078125, -3.17340087890625, -3.0572509765625, -2.94110107421875, -2.824951171875, -2.70880126953125, -2.5926513671875, -2.47650146484375, -2.3603515625, -2.24420166015625, -2.1280517578125, -2.01190185546875, -1.895751953125, -1.77960205078125, -1.6634521484375, -1.54730224609375, -1.43115234375, -1.31500244140625, -1.1988525390625, -1.08270263671875, -0.966552734375, -0.85040283203125, -0.7342529296875, -0.61810302734375, -0.501953125, -0.38580322265625, -0.2696533203125, -0.15350341796875, -0.037353515625, 0.07879638671875, 0.1949462890625, 0.31109619140625, 0.42724609375, 0.54339599609375, 0.6595458984375, 0.77569580078125, 0.891845703125, 1.00799560546875, 1.1241455078125, 1.24029541015625, 1.3564453125, 1.47259521484375, 1.5887451171875, 1.70489501953125, 1.821044921875, 1.93719482421875, 2.0533447265625, 2.16949462890625, 2.28564453125, 2.40179443359375, 2.5179443359375, 2.63409423828125, 2.750244140625, 2.86639404296875, 2.9825439453125, 3.09869384765625, 3.21484375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 8.0, 7.0, 10.0, 22.0, 40.0, 68.0, 129.0, 151.0, 161.0, 163.0, 115.0, 60.0, 43.0, 15.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.11037063598633, -40.98886489868164, -39.86736297607422, -38.74585723876953, -37.624351501464844, -36.50284957885742, -35.381343841552734, -34.25984191894531, -33.138336181640625, -32.01683044433594, -30.895328521728516, -29.773822784423828, -28.652318954467773, -27.53081512451172, -26.40930938720703, -25.287805557250977, -24.166301727294922, -23.044797897338867, -21.923294067382812, -20.801788330078125, -19.68028450012207, -18.558780670166016, -17.437274932861328, -16.315771102905273, -15.194267272949219, -14.072763442993164, -12.951258659362793, -11.829753875732422, -10.708250045776367, -9.586746215820312, -8.465241432189941, -7.3437371253967285, -6.222236633300781, -5.100732326507568, -3.9792280197143555, -2.8577237129211426, -1.7362194061279297, -0.6147150993347168, 0.5067892074584961, 1.628293514251709, 2.749797821044922, 3.8713021278381348, 4.992806434631348, 6.1143107414245605, 7.235815048217773, 8.357318878173828, 9.4788236618042, 10.60032844543457, 11.721832275390625, 12.84333610534668, 13.96484088897705, 15.086345672607422, 16.207849502563477, 17.32935333251953, 18.45085906982422, 19.572362899780273, 20.693866729736328, 21.815370559692383, 22.936874389648438, 24.058380126953125, 25.17988395690918, 26.301387786865234, 27.422893524169922, 28.544397354125977, 29.66590118408203]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 6.0, 3.0, 3.0, 3.0, 3.0, 6.0, 5.0, 6.0, 9.0, 11.0, 11.0, 10.0, 21.0, 25.0, 16.0, 25.0, 27.0, 24.0, 43.0, 33.0, 37.0, 39.0, 38.0, 42.0, 41.0, 43.0, 33.0, 45.0, 32.0, 25.0, 41.0, 34.0, 27.0, 37.0, 32.0, 19.0, 16.0, 22.0, 21.0, 15.0, 19.0, 14.0, 6.0, 11.0, 7.0, 9.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.666410446166992, -9.317983627319336, -8.96955680847168, -8.621129989624023, -8.272703170776367, -7.924276351928711, -7.575850009918213, -7.227423191070557, -6.8789963722229, -6.530569553375244, -6.182142734527588, -5.83371639251709, -5.485289573669434, -5.136862754821777, -4.788435935974121, -4.440009117126465, -4.091582298278809, -3.7431554794311523, -3.394728660583496, -3.046302080154419, -2.6978752613067627, -2.3494484424591064, -2.0010218620300293, -1.652595043182373, -1.3041682243347168, -0.9557414650917053, -0.6073147058486938, -0.25888800621032715, 0.0895388126373291, 0.43796563148498535, 0.7863922119140625, 1.1348190307617188, 1.483245849609375, 1.8316726684570312, 2.1800994873046875, 2.5285260677337646, 2.876952886581421, 3.225379705429077, 3.5738062858581543, 3.9222331047058105, 4.270659923553467, 4.619086742401123, 4.967513561248779, 5.315939903259277, 5.664366722106934, 6.01279354095459, 6.361220359802246, 6.709647178649902, 7.058073997497559, 7.406500816345215, 7.754927635192871, 8.103354454040527, 8.451781272888184, 8.80020809173584, 9.14863395690918, 9.497060775756836, 9.845487594604492, 10.193914413452148, 10.542341232299805, 10.890768051147461, 11.239194869995117, 11.587621688842773, 11.93604850769043, 12.284475326538086, 12.632902145385742]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 7.0, 13.0, 20.0, 21.0, 31.0, 52.0, 56.0, 111.0, 209.0, 348.0, 544.0, 1129.0, 2076.0, 4519.0, 10475.0, 28450.0, 77314.0, 202670.0, 387776.0, 205715.0, 78002.0, 28929.0, 10947.0, 4569.0, 2081.0, 1038.0, 575.0, 361.0, 193.0, 130.0, 67.0, 35.0, 27.0, 23.0, 6.0, 5.0, 2.0, 9.0, 5.0, 8.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.421875, -10.11083984375, -9.7998046875, -9.48876953125, -9.177734375, -8.86669921875, -8.5556640625, -8.24462890625, -7.93359375, -7.62255859375, -7.3115234375, -7.00048828125, -6.689453125, -6.37841796875, -6.0673828125, -5.75634765625, -5.4453125, -5.13427734375, -4.8232421875, -4.51220703125, -4.201171875, -3.89013671875, -3.5791015625, -3.26806640625, -2.95703125, -2.64599609375, -2.3349609375, -2.02392578125, -1.712890625, -1.40185546875, -1.0908203125, -0.77978515625, -0.46875, -0.15771484375, 0.1533203125, 0.46435546875, 0.775390625, 1.08642578125, 1.3974609375, 1.70849609375, 2.01953125, 2.33056640625, 2.6416015625, 2.95263671875, 3.263671875, 3.57470703125, 3.8857421875, 4.19677734375, 4.5078125, 4.81884765625, 5.1298828125, 5.44091796875, 5.751953125, 6.06298828125, 6.3740234375, 6.68505859375, 6.99609375, 7.30712890625, 7.6181640625, 7.92919921875, 8.240234375, 8.55126953125, 8.8623046875, 9.17333984375, 9.484375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 8.0, 7.0, 9.0, 17.0, 17.0, 26.0, 30.0, 38.0, 41.0, 37.0, 44.0, 48.0, 55.0, 52.0, 42.0, 43.0, 57.0, 52.0, 50.0, 48.0, 42.0, 36.0, 32.0, 25.0, 23.0, 15.0, 23.0, 14.0, 10.0, 11.0, 9.0, 10.0, 2.0, 0.0, 4.0, 5.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.119140625, -2.05718994140625, -1.9952392578125, -1.93328857421875, -1.871337890625, -1.80938720703125, -1.7474365234375, -1.68548583984375, -1.62353515625, -1.56158447265625, -1.4996337890625, -1.43768310546875, -1.375732421875, -1.31378173828125, -1.2518310546875, -1.18988037109375, -1.1279296875, -1.06597900390625, -1.0040283203125, -0.94207763671875, -0.880126953125, -0.81817626953125, -0.7562255859375, -0.69427490234375, -0.63232421875, -0.57037353515625, -0.5084228515625, -0.44647216796875, -0.384521484375, -0.32257080078125, -0.2606201171875, -0.19866943359375, -0.13671875, -0.07476806640625, -0.0128173828125, 0.04913330078125, 0.111083984375, 0.17303466796875, 0.2349853515625, 0.29693603515625, 0.35888671875, 0.42083740234375, 0.4827880859375, 0.54473876953125, 0.606689453125, 0.66864013671875, 0.7305908203125, 0.79254150390625, 0.8544921875, 0.91644287109375, 0.9783935546875, 1.04034423828125, 1.102294921875, 1.16424560546875, 1.2261962890625, 1.28814697265625, 1.35009765625, 1.41204833984375, 1.4739990234375, 1.53594970703125, 1.597900390625, 1.65985107421875, 1.7218017578125, 1.78375244140625, 1.845703125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 5.0, 3.0, 6.0, 10.0, 6.0, 21.0, 27.0, 30.0, 52.0, 50.0, 94.0, 128.0, 192.0, 242.0, 334.0, 556.0, 1075.0, 2511.0, 10934.0, 70083.0, 448922.0, 431655.0, 66259.0, 10225.0, 2338.0, 991.0, 563.0, 352.0, 240.0, 168.0, 122.0, 101.0, 79.0, 54.0, 43.0, 19.0, 18.0, 19.0, 10.0, 8.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.390625, -12.95849609375, -12.5263671875, -12.09423828125, -11.662109375, -11.22998046875, -10.7978515625, -10.36572265625, -9.93359375, -9.50146484375, -9.0693359375, -8.63720703125, -8.205078125, -7.77294921875, -7.3408203125, -6.90869140625, -6.4765625, -6.04443359375, -5.6123046875, -5.18017578125, -4.748046875, -4.31591796875, -3.8837890625, -3.45166015625, -3.01953125, -2.58740234375, -2.1552734375, -1.72314453125, -1.291015625, -0.85888671875, -0.4267578125, 0.00537109375, 0.4375, 0.86962890625, 1.3017578125, 1.73388671875, 2.166015625, 2.59814453125, 3.0302734375, 3.46240234375, 3.89453125, 4.32666015625, 4.7587890625, 5.19091796875, 5.623046875, 6.05517578125, 6.4873046875, 6.91943359375, 7.3515625, 7.78369140625, 8.2158203125, 8.64794921875, 9.080078125, 9.51220703125, 9.9443359375, 10.37646484375, 10.80859375, 11.24072265625, 11.6728515625, 12.10498046875, 12.537109375, 12.96923828125, 13.4013671875, 13.83349609375, 14.265625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 4.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 8.0, 10.0, 8.0, 10.0, 8.0, 17.0, 14.0, 14.0, 22.0, 28.0, 21.0, 25.0, 34.0, 37.0, 31.0, 40.0, 45.0, 51.0, 50.0, 41.0, 37.0, 46.0, 37.0, 27.0, 28.0, 33.0, 35.0, 29.0, 37.0, 27.0, 26.0, 18.0, 17.0, 18.0, 16.0, 11.0, 5.0, 9.0, 6.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.9453125, -6.71484375, -6.484375, -6.25390625, -6.0234375, -5.79296875, -5.5625, -5.33203125, -5.1015625, -4.87109375, -4.640625, -4.41015625, -4.1796875, -3.94921875, -3.71875, -3.48828125, -3.2578125, -3.02734375, -2.796875, -2.56640625, -2.3359375, -2.10546875, -1.875, -1.64453125, -1.4140625, -1.18359375, -0.953125, -0.72265625, -0.4921875, -0.26171875, -0.03125, 0.19921875, 0.4296875, 0.66015625, 0.890625, 1.12109375, 1.3515625, 1.58203125, 1.8125, 2.04296875, 2.2734375, 2.50390625, 2.734375, 2.96484375, 3.1953125, 3.42578125, 3.65625, 3.88671875, 4.1171875, 4.34765625, 4.578125, 4.80859375, 5.0390625, 5.26953125, 5.5, 5.73046875, 5.9609375, 6.19140625, 6.421875, 6.65234375, 6.8828125, 7.11328125, 7.34375, 7.57421875, 7.8046875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 8.0, 8.0, 13.0, 25.0, 37.0, 88.0, 206.0, 776.0, 17348.0, 1005975.0, 22775.0, 887.0, 217.0, 93.0, 42.0, 11.0, 15.0, 10.0, 11.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.25, -16.40966796875, -15.5693359375, -14.72900390625, -13.888671875, -13.04833984375, -12.2080078125, -11.36767578125, -10.52734375, -9.68701171875, -8.8466796875, -8.00634765625, -7.166015625, -6.32568359375, -5.4853515625, -4.64501953125, -3.8046875, -2.96435546875, -2.1240234375, -1.28369140625, -0.443359375, 0.39697265625, 1.2373046875, 2.07763671875, 2.91796875, 3.75830078125, 4.5986328125, 5.43896484375, 6.279296875, 7.11962890625, 7.9599609375, 8.80029296875, 9.640625, 10.48095703125, 11.3212890625, 12.16162109375, 13.001953125, 13.84228515625, 14.6826171875, 15.52294921875, 16.36328125, 17.20361328125, 18.0439453125, 18.88427734375, 19.724609375, 20.56494140625, 21.4052734375, 22.24560546875, 23.0859375, 23.92626953125, 24.7666015625, 25.60693359375, 26.447265625, 27.28759765625, 28.1279296875, 28.96826171875, 29.80859375, 30.64892578125, 31.4892578125, 32.32958984375, 33.169921875, 34.01025390625, 34.8505859375, 35.69091796875, 36.53125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 4.0, 6.0, 4.0, 8.0, 14.0, 11.0, 22.0, 22.0, 31.0, 43.0, 43.0, 62.0, 92.0, 163.0, 129.0, 82.0, 58.0, 51.0, 32.0, 36.0, 20.0, 22.0, 11.0, 6.0, 7.0, 4.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0010175704956054688, -0.0009913444519042969, -0.000965118408203125, -0.0009388923645019531, -0.0009126663208007812, -0.0008864402770996094, -0.0008602142333984375, -0.0008339881896972656, -0.0008077621459960938, -0.0007815361022949219, -0.00075531005859375, -0.0007290840148925781, -0.0007028579711914062, -0.0006766319274902344, -0.0006504058837890625, -0.0006241798400878906, -0.0005979537963867188, -0.0005717277526855469, -0.000545501708984375, -0.0005192756652832031, -0.0004930496215820312, -0.0004668235778808594, -0.0004405975341796875, -0.0004143714904785156, -0.00038814544677734375, -0.0003619194030761719, -0.000335693359375, -0.0003094673156738281, -0.00028324127197265625, -0.0002570152282714844, -0.0002307891845703125, -0.00020456314086914062, -0.00017833709716796875, -0.00015211105346679688, -0.000125885009765625, -9.965896606445312e-05, -7.343292236328125e-05, -4.7206878662109375e-05, -2.09808349609375e-05, 5.245208740234375e-06, 3.147125244140625e-05, 5.7697296142578125e-05, 8.392333984375e-05, 0.00011014938354492188, 0.00013637542724609375, 0.00016260147094726562, 0.0001888275146484375, 0.00021505355834960938, 0.00024127960205078125, 0.0002675056457519531, 0.000293731689453125, 0.0003199577331542969, 0.00034618377685546875, 0.0003724098205566406, 0.0003986358642578125, 0.0004248619079589844, 0.00045108795166015625, 0.0004773139953613281, 0.0005035400390625, 0.0005297660827636719, 0.0005559921264648438, 0.0005822181701660156, 0.0006084442138671875, 0.0006346702575683594, 0.0006608963012695312]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 10.0, 17.0, 36.0, 73.0, 102.0, 277.0, 1274.0, 35294.0, 1003835.0, 6586.0, 609.0, 207.0, 100.0, 46.0, 34.0, 28.0, 18.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.0, -38.92822265625, -37.8564453125, -36.78466796875, -35.712890625, -34.64111328125, -33.5693359375, -32.49755859375, -31.42578125, -30.35400390625, -29.2822265625, -28.21044921875, -27.138671875, -26.06689453125, -24.9951171875, -23.92333984375, -22.8515625, -21.77978515625, -20.7080078125, -19.63623046875, -18.564453125, -17.49267578125, -16.4208984375, -15.34912109375, -14.27734375, -13.20556640625, -12.1337890625, -11.06201171875, -9.990234375, -8.91845703125, -7.8466796875, -6.77490234375, -5.703125, -4.63134765625, -3.5595703125, -2.48779296875, -1.416015625, -0.34423828125, 0.7275390625, 1.79931640625, 2.87109375, 3.94287109375, 5.0146484375, 6.08642578125, 7.158203125, 8.22998046875, 9.3017578125, 10.37353515625, 11.4453125, 12.51708984375, 13.5888671875, 14.66064453125, 15.732421875, 16.80419921875, 17.8759765625, 18.94775390625, 20.01953125, 21.09130859375, 22.1630859375, 23.23486328125, 24.306640625, 25.37841796875, 26.4501953125, 27.52197265625, 28.59375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 17.0, 30.0, 80.0, 188.0, 299.0, 214.0, 96.0, 42.0, 18.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.546875, -9.003173828125, -8.45947265625, -7.915771484375, -7.3720703125, -6.828369140625, -6.28466796875, -5.740966796875, -5.197265625, -4.653564453125, -4.10986328125, -3.566162109375, -3.0224609375, -2.478759765625, -1.93505859375, -1.391357421875, -0.84765625, -0.303955078125, 0.23974609375, 0.783447265625, 1.3271484375, 1.870849609375, 2.41455078125, 2.958251953125, 3.501953125, 4.045654296875, 4.58935546875, 5.133056640625, 5.6767578125, 6.220458984375, 6.76416015625, 7.307861328125, 7.8515625, 8.395263671875, 8.93896484375, 9.482666015625, 10.0263671875, 10.570068359375, 11.11376953125, 11.657470703125, 12.201171875, 12.744873046875, 13.28857421875, 13.832275390625, 14.3759765625, 14.919677734375, 15.46337890625, 16.007080078125, 16.55078125, 17.094482421875, 17.63818359375, 18.181884765625, 18.7255859375, 19.269287109375, 19.81298828125, 20.356689453125, 20.900390625, 21.444091796875, 21.98779296875, 22.531494140625, 23.0751953125, 23.618896484375, 24.16259765625, 24.706298828125, 25.25]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 7.0, 90.0, 504.0, 368.0, 34.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-264.66839599609375, -253.05661010742188, -241.44482421875, -229.83303833007812, -218.22125244140625, -206.60946655273438, -194.9976806640625, -183.38589477539062, -171.77410888671875, -160.16232299804688, -148.550537109375, -136.93875122070312, -125.32696533203125, -113.71517944335938, -102.1033935546875, -90.49160766601562, -78.87982177734375, -67.26803588867188, -55.65625, -44.044464111328125, -32.43267822265625, -20.820892333984375, -9.2091064453125, 2.402679443359375, 14.01446533203125, 25.626251220703125, 37.238037109375, 48.849822998046875, 60.46160888671875, 72.07339477539062, 83.6851806640625, 95.29696655273438, 106.90875244140625, 118.52053833007812, 130.13232421875, 141.74411010742188, 153.35589599609375, 164.96768188476562, 176.5794677734375, 188.19125366210938, 199.80303955078125, 211.41482543945312, 223.026611328125, 234.63839721679688, 246.25018310546875, 257.8619689941406, 269.4737548828125, 281.0855407714844, 292.69732666015625, 304.3091125488281, 315.9208984375, 327.5326843261719, 339.14447021484375, 350.7562561035156, 362.3680419921875, 373.9798278808594, 385.59161376953125, 397.2033996582031, 408.815185546875, 420.4269714355469, 432.03875732421875, 443.6505432128906, 455.2623291015625, 466.8741149902344, 478.48590087890625]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 5.0, 7.0, 6.0, 2.0, 8.0, 16.0, 6.0, 15.0, 20.0, 17.0, 36.0, 23.0, 27.0, 28.0, 37.0, 29.0, 39.0, 30.0, 29.0, 53.0, 34.0, 36.0, 42.0, 30.0, 45.0, 42.0, 41.0, 25.0, 32.0, 27.0, 21.0, 36.0, 24.0, 22.0, 14.0, 15.0, 20.0, 10.0, 9.0, 6.0, 13.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.45487976074219, -34.274147033691406, -33.09341049194336, -31.912677764892578, -30.731945037841797, -29.551210403442383, -28.37047576904297, -27.189743041992188, -26.009010314941406, -24.828275680541992, -23.64754295349121, -22.466808319091797, -21.286075592041016, -20.1053409576416, -18.924606323242188, -17.743873596191406, -16.563138961791992, -15.382405281066895, -14.201671600341797, -13.020936965942383, -11.840204238891602, -10.659469604492188, -9.47873592376709, -8.298002243041992, -7.1172685623168945, -5.936534881591797, -4.755801200866699, -3.5750670433044434, -2.3943333625793457, -1.213599681854248, -0.03286552429199219, 1.1478681564331055, 2.328601837158203, 3.509335517883301, 4.690069198608398, 5.870803356170654, 7.051537036895752, 8.232271194458008, 9.413004875183105, 10.593738555908203, 11.7744722366333, 12.955205917358398, 14.135939598083496, 15.316673278808594, 16.497407913208008, 17.67814064025879, 18.858875274658203, 20.039608001708984, 21.2203426361084, 22.401077270507812, 23.581809997558594, 24.762544631958008, 25.94327735900879, 27.124011993408203, 28.304744720458984, 29.4854793548584, 30.666213989257812, 31.846948623657227, 33.02768325805664, 34.20841598510742, 35.3891487121582, 36.569881439208984, 37.75061798095703, 38.93135070800781, 40.112083435058594]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 9.0, 11.0, 11.0, 27.0, 33.0, 71.0, 94.0, 162.0, 314.0, 580.0, 1201.0, 2641.0, 6613.0, 19846.0, 79733.0, 633219.0, 3194755.0, 196299.0, 38902.0, 11431.0, 4367.0, 1854.0, 931.0, 446.0, 258.0, 164.0, 98.0, 60.0, 42.0, 21.0, 23.0, 20.0, 12.0, 8.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.0234375, -10.6190185546875, -10.214599609375, -9.8101806640625, -9.40576171875, -9.0013427734375, -8.596923828125, -8.1925048828125, -7.7880859375, -7.3836669921875, -6.979248046875, -6.5748291015625, -6.17041015625, -5.7659912109375, -5.361572265625, -4.9571533203125, -4.552734375, -4.1483154296875, -3.743896484375, -3.3394775390625, -2.93505859375, -2.5306396484375, -2.126220703125, -1.7218017578125, -1.3173828125, -0.9129638671875, -0.508544921875, -0.1041259765625, 0.30029296875, 0.7047119140625, 1.109130859375, 1.5135498046875, 1.91796875, 2.3223876953125, 2.726806640625, 3.1312255859375, 3.53564453125, 3.9400634765625, 4.344482421875, 4.7489013671875, 5.1533203125, 5.5577392578125, 5.962158203125, 6.3665771484375, 6.77099609375, 7.1754150390625, 7.579833984375, 7.9842529296875, 8.388671875, 8.7930908203125, 9.197509765625, 9.6019287109375, 10.00634765625, 10.4107666015625, 10.815185546875, 11.2196044921875, 11.6240234375, 12.0284423828125, 12.432861328125, 12.8372802734375, 13.24169921875, 13.6461181640625, 14.050537109375, 14.4549560546875, 14.859375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 7.0, 4.0, 4.0, 5.0, 3.0, 10.0, 15.0, 16.0, 29.0, 14.0, 35.0, 43.0, 36.0, 44.0, 53.0, 52.0, 52.0, 65.0, 57.0, 49.0, 45.0, 49.0, 53.0, 35.0, 44.0, 35.0, 26.0, 25.0, 13.0, 16.0, 15.0, 11.0, 10.0, 8.0, 7.0, 3.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.36328125, -2.2966461181640625, -2.230010986328125, -2.1633758544921875, -2.09674072265625, -2.0301055908203125, -1.963470458984375, -1.8968353271484375, -1.8302001953125, -1.7635650634765625, -1.696929931640625, -1.6302947998046875, -1.56365966796875, -1.4970245361328125, -1.430389404296875, -1.3637542724609375, -1.297119140625, -1.2304840087890625, -1.163848876953125, -1.0972137451171875, -1.03057861328125, -0.9639434814453125, -0.897308349609375, -0.8306732177734375, -0.7640380859375, -0.6974029541015625, -0.630767822265625, -0.5641326904296875, -0.49749755859375, -0.4308624267578125, -0.364227294921875, -0.2975921630859375, -0.23095703125, -0.1643218994140625, -0.097686767578125, -0.0310516357421875, 0.03558349609375, 0.1022186279296875, 0.168853759765625, 0.2354888916015625, 0.3021240234375, 0.3687591552734375, 0.435394287109375, 0.5020294189453125, 0.56866455078125, 0.6352996826171875, 0.701934814453125, 0.7685699462890625, 0.835205078125, 0.9018402099609375, 0.968475341796875, 1.0351104736328125, 1.10174560546875, 1.1683807373046875, 1.235015869140625, 1.3016510009765625, 1.3682861328125, 1.4349212646484375, 1.501556396484375, 1.5681915283203125, 1.63482666015625, 1.7014617919921875, 1.768096923828125, 1.8347320556640625, 1.9013671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 4.0, 5.0, 13.0, 11.0, 26.0, 33.0, 42.0, 63.0, 78.0, 154.0, 226.0, 335.0, 548.0, 921.0, 1628.0, 3058.0, 6295.0, 14281.0, 36835.0, 112637.0, 476376.0, 2752271.0, 585670.0, 131035.0, 41635.0, 15707.0, 6723.0, 3252.0, 1766.0, 947.0, 597.0, 374.0, 257.0, 152.0, 91.0, 67.0, 50.0, 33.0, 22.0, 16.0, 8.0, 11.0, 7.0, 9.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.87890625, -6.64617919921875, -6.4134521484375, -6.18072509765625, -5.947998046875, -5.71527099609375, -5.4825439453125, -5.24981689453125, -5.01708984375, -4.78436279296875, -4.5516357421875, -4.31890869140625, -4.086181640625, -3.85345458984375, -3.6207275390625, -3.38800048828125, -3.1552734375, -2.92254638671875, -2.6898193359375, -2.45709228515625, -2.224365234375, -1.99163818359375, -1.7589111328125, -1.52618408203125, -1.29345703125, -1.06072998046875, -0.8280029296875, -0.59527587890625, -0.362548828125, -0.12982177734375, 0.1029052734375, 0.33563232421875, 0.568359375, 0.80108642578125, 1.0338134765625, 1.26654052734375, 1.499267578125, 1.73199462890625, 1.9647216796875, 2.19744873046875, 2.43017578125, 2.66290283203125, 2.8956298828125, 3.12835693359375, 3.361083984375, 3.59381103515625, 3.8265380859375, 4.05926513671875, 4.2919921875, 4.52471923828125, 4.7574462890625, 4.99017333984375, 5.222900390625, 5.45562744140625, 5.6883544921875, 5.92108154296875, 6.15380859375, 6.38653564453125, 6.6192626953125, 6.85198974609375, 7.084716796875, 7.31744384765625, 7.5501708984375, 7.78289794921875, 8.015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 7.0, 3.0, 6.0, 6.0, 9.0, 20.0, 13.0, 38.0, 45.0, 69.0, 95.0, 196.0, 360.0, 706.0, 1268.0, 523.0, 261.0, 162.0, 97.0, 62.0, 36.0, 25.0, 31.0, 13.0, 7.0, 7.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3515625, -4.18621826171875, -4.0208740234375, -3.85552978515625, -3.690185546875, -3.52484130859375, -3.3594970703125, -3.19415283203125, -3.02880859375, -2.86346435546875, -2.6981201171875, -2.53277587890625, -2.367431640625, -2.20208740234375, -2.0367431640625, -1.87139892578125, -1.7060546875, -1.54071044921875, -1.3753662109375, -1.21002197265625, -1.044677734375, -0.87933349609375, -0.7139892578125, -0.54864501953125, -0.38330078125, -0.21795654296875, -0.0526123046875, 0.11273193359375, 0.278076171875, 0.44342041015625, 0.6087646484375, 0.77410888671875, 0.939453125, 1.10479736328125, 1.2701416015625, 1.43548583984375, 1.600830078125, 1.76617431640625, 1.9315185546875, 2.09686279296875, 2.26220703125, 2.42755126953125, 2.5928955078125, 2.75823974609375, 2.923583984375, 3.08892822265625, 3.2542724609375, 3.41961669921875, 3.5849609375, 3.75030517578125, 3.9156494140625, 4.08099365234375, 4.246337890625, 4.41168212890625, 4.5770263671875, 4.74237060546875, 4.90771484375, 5.07305908203125, 5.2384033203125, 5.40374755859375, 5.569091796875, 5.73443603515625, 5.8997802734375, 6.06512451171875, 6.23046875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 17.0, 64.0, 141.0, 206.0, 222.0, 173.0, 100.0, 41.0, 22.0, 9.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.925148010253906, -52.00737380981445, -50.089599609375, -48.17182159423828, -46.25404739379883, -44.336273193359375, -42.41849899291992, -40.50072479248047, -38.582950592041016, -36.66517639160156, -34.74740219116211, -32.829627990722656, -30.91185188293457, -28.994075775146484, -27.07630157470703, -25.158527374267578, -23.240751266479492, -21.32297706604004, -19.405200958251953, -17.4874267578125, -15.569652557373047, -13.651877403259277, -11.734102249145508, -9.816328048706055, -7.898552894592285, -5.980778217315674, -4.0630035400390625, -2.145228385925293, -0.22745370864868164, 1.6903209686279297, 3.608096122741699, 5.525870323181152, 7.443645477294922, 9.361420631408691, 11.279194831848145, 13.196969985961914, 15.114744186401367, 17.032520294189453, 18.950294494628906, 20.86806869506836, 22.785842895507812, 24.703617095947266, 26.62139320373535, 28.539167404174805, 30.456941604614258, 32.374717712402344, 34.2924919128418, 36.21026611328125, 38.12804412841797, 40.04581832885742, 41.963592529296875, 43.881370544433594, 45.79914474487305, 47.7169189453125, 49.63469314575195, 51.552467346191406, 53.47024154663086, 55.38801574707031, 57.305789947509766, 59.22356414794922, 61.14134216308594, 63.05911636352539, 64.97689056396484, 66.89466857910156, 68.81243896484375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 4.0, 9.0, 9.0, 12.0, 16.0, 17.0, 19.0, 28.0, 23.0, 35.0, 33.0, 35.0, 42.0, 42.0, 47.0, 55.0, 40.0, 49.0, 48.0, 45.0, 58.0, 27.0, 43.0, 24.0, 30.0, 28.0, 29.0, 29.0, 27.0, 19.0, 16.0, 12.0, 10.0, 6.0, 7.0, 4.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.17355728149414, -15.631606101989746, -15.089654922485352, -14.547703742980957, -14.005752563476562, -13.463801383972168, -12.921850204467773, -12.379898071289062, -11.837947845458984, -11.29599666595459, -10.754045486450195, -10.2120943069458, -9.670143127441406, -9.128191947937012, -8.586240768432617, -8.044288635253906, -7.502337455749512, -6.960386276245117, -6.418435096740723, -5.876483917236328, -5.334532737731934, -4.792581558227539, -4.250629901885986, -3.708678722381592, -3.1667275428771973, -2.6247763633728027, -2.082825183868408, -1.5408737659454346, -0.99892258644104, -0.4569714069366455, 0.08498001098632812, 0.6269311904907227, 1.1688823699951172, 1.7108335494995117, 2.2527847290039062, 2.79473614692688, 3.3366873264312744, 3.878638505935669, 4.420589923858643, 4.962541103363037, 5.504492282867432, 6.046443462371826, 6.588394641876221, 7.130346298217773, 7.672297477722168, 8.214248657226562, 8.756199836730957, 9.298151016235352, 9.840102195739746, 10.38205337524414, 10.924004554748535, 11.46595573425293, 12.007906913757324, 12.549858093261719, 13.09181022644043, 13.633760452270508, 14.175712585449219, 14.717663764953613, 15.259614944458008, 15.801566123962402, 16.343517303466797, 16.885469436645508, 17.427419662475586, 17.969371795654297, 18.511322021484375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 3.0, 10.0, 9.0, 7.0, 11.0, 32.0, 36.0, 58.0, 100.0, 161.0, 273.0, 427.0, 909.0, 1897.0, 4312.0, 10912.0, 30168.0, 91742.0, 258401.0, 372018.0, 181608.0, 60736.0, 20778.0, 7653.0, 3148.0, 1438.0, 717.0, 393.0, 224.0, 134.0, 85.0, 48.0, 38.0, 24.0, 10.0, 17.0, 2.0, 7.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4296875, -8.12109375, -7.8125, -7.50390625, -7.1953125, -6.88671875, -6.578125, -6.26953125, -5.9609375, -5.65234375, -5.34375, -5.03515625, -4.7265625, -4.41796875, -4.109375, -3.80078125, -3.4921875, -3.18359375, -2.875, -2.56640625, -2.2578125, -1.94921875, -1.640625, -1.33203125, -1.0234375, -0.71484375, -0.40625, -0.09765625, 0.2109375, 0.51953125, 0.828125, 1.13671875, 1.4453125, 1.75390625, 2.0625, 2.37109375, 2.6796875, 2.98828125, 3.296875, 3.60546875, 3.9140625, 4.22265625, 4.53125, 4.83984375, 5.1484375, 5.45703125, 5.765625, 6.07421875, 6.3828125, 6.69140625, 7.0, 7.30859375, 7.6171875, 7.92578125, 8.234375, 8.54296875, 8.8515625, 9.16015625, 9.46875, 9.77734375, 10.0859375, 10.39453125, 10.703125, 11.01171875, 11.3203125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 8.0, 8.0, 12.0, 18.0, 23.0, 23.0, 30.0, 46.0, 39.0, 49.0, 37.0, 49.0, 46.0, 53.0, 45.0, 51.0, 62.0, 58.0, 43.0, 42.0, 28.0, 32.0, 33.0, 32.0, 19.0, 17.0, 15.0, 15.0, 10.0, 12.0, 6.0, 2.0, 6.0, 5.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-2.498046875, -2.428314208984375, -2.35858154296875, -2.288848876953125, -2.2191162109375, -2.149383544921875, -2.07965087890625, -2.009918212890625, -1.940185546875, -1.870452880859375, -1.80072021484375, -1.730987548828125, -1.6612548828125, -1.591522216796875, -1.52178955078125, -1.452056884765625, -1.38232421875, -1.312591552734375, -1.24285888671875, -1.173126220703125, -1.1033935546875, -1.033660888671875, -0.96392822265625, -0.894195556640625, -0.824462890625, -0.754730224609375, -0.68499755859375, -0.615264892578125, -0.5455322265625, -0.475799560546875, -0.40606689453125, -0.336334228515625, -0.2666015625, -0.196868896484375, -0.12713623046875, -0.057403564453125, 0.0123291015625, 0.082061767578125, 0.15179443359375, 0.221527099609375, 0.291259765625, 0.360992431640625, 0.43072509765625, 0.500457763671875, 0.5701904296875, 0.639923095703125, 0.70965576171875, 0.779388427734375, 0.84912109375, 0.918853759765625, 0.98858642578125, 1.058319091796875, 1.1280517578125, 1.197784423828125, 1.26751708984375, 1.337249755859375, 1.406982421875, 1.476715087890625, 1.54644775390625, 1.616180419921875, 1.6859130859375, 1.755645751953125, 1.82537841796875, 1.895111083984375, 1.96484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 2.0, 0.0, 5.0, 4.0, 3.0, 5.0, 8.0, 6.0, 17.0, 18.0, 27.0, 33.0, 39.0, 57.0, 59.0, 77.0, 116.0, 151.0, 174.0, 208.0, 354.0, 469.0, 727.0, 1285.0, 3080.0, 11619.0, 67514.0, 430131.0, 442980.0, 70207.0, 12103.0, 3063.0, 1334.0, 785.0, 507.0, 313.0, 232.0, 198.0, 149.0, 114.0, 99.0, 71.0, 52.0, 37.0, 25.0, 27.0, 17.0, 18.0, 13.0, 7.0, 9.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-13.7265625, -13.283935546875, -12.84130859375, -12.398681640625, -11.9560546875, -11.513427734375, -11.07080078125, -10.628173828125, -10.185546875, -9.742919921875, -9.30029296875, -8.857666015625, -8.4150390625, -7.972412109375, -7.52978515625, -7.087158203125, -6.64453125, -6.201904296875, -5.75927734375, -5.316650390625, -4.8740234375, -4.431396484375, -3.98876953125, -3.546142578125, -3.103515625, -2.660888671875, -2.21826171875, -1.775634765625, -1.3330078125, -0.890380859375, -0.44775390625, -0.005126953125, 0.4375, 0.880126953125, 1.32275390625, 1.765380859375, 2.2080078125, 2.650634765625, 3.09326171875, 3.535888671875, 3.978515625, 4.421142578125, 4.86376953125, 5.306396484375, 5.7490234375, 6.191650390625, 6.63427734375, 7.076904296875, 7.51953125, 7.962158203125, 8.40478515625, 8.847412109375, 9.2900390625, 9.732666015625, 10.17529296875, 10.617919921875, 11.060546875, 11.503173828125, 11.94580078125, 12.388427734375, 12.8310546875, 13.273681640625, 13.71630859375, 14.158935546875, 14.6015625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 6.0, 4.0, 5.0, 5.0, 7.0, 7.0, 11.0, 6.0, 17.0, 12.0, 17.0, 20.0, 22.0, 30.0, 29.0, 24.0, 44.0, 38.0, 41.0, 33.0, 45.0, 39.0, 37.0, 41.0, 54.0, 51.0, 46.0, 38.0, 38.0, 35.0, 27.0, 27.0, 26.0, 27.0, 22.0, 13.0, 16.0, 10.0, 9.0, 5.0, 7.0, 6.0, 4.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0703125, -7.7738037109375, -7.477294921875, -7.1807861328125, -6.88427734375, -6.5877685546875, -6.291259765625, -5.9947509765625, -5.6982421875, -5.4017333984375, -5.105224609375, -4.8087158203125, -4.51220703125, -4.2156982421875, -3.919189453125, -3.6226806640625, -3.326171875, -3.0296630859375, -2.733154296875, -2.4366455078125, -2.14013671875, -1.8436279296875, -1.547119140625, -1.2506103515625, -0.9541015625, -0.6575927734375, -0.361083984375, -0.0645751953125, 0.23193359375, 0.5284423828125, 0.824951171875, 1.1214599609375, 1.41796875, 1.7144775390625, 2.010986328125, 2.3074951171875, 2.60400390625, 2.9005126953125, 3.197021484375, 3.4935302734375, 3.7900390625, 4.0865478515625, 4.383056640625, 4.6795654296875, 4.97607421875, 5.2725830078125, 5.569091796875, 5.8656005859375, 6.162109375, 6.4586181640625, 6.755126953125, 7.0516357421875, 7.34814453125, 7.6446533203125, 7.941162109375, 8.2376708984375, 8.5341796875, 8.8306884765625, 9.127197265625, 9.4237060546875, 9.72021484375, 10.0167236328125, 10.313232421875, 10.6097412109375, 10.90625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 1.0, 4.0, 11.0, 8.0, 7.0, 26.0, 35.0, 83.0, 203.0, 542.0, 2439.0, 21764.0, 381120.0, 600378.0, 37199.0, 3621.0, 672.0, 226.0, 85.0, 47.0, 27.0, 11.0, 14.0, 11.0, 6.0, 9.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.5703125, -9.229736328125, -8.88916015625, -8.548583984375, -8.2080078125, -7.867431640625, -7.52685546875, -7.186279296875, -6.845703125, -6.505126953125, -6.16455078125, -5.823974609375, -5.4833984375, -5.142822265625, -4.80224609375, -4.461669921875, -4.12109375, -3.780517578125, -3.43994140625, -3.099365234375, -2.7587890625, -2.418212890625, -2.07763671875, -1.737060546875, -1.396484375, -1.055908203125, -0.71533203125, -0.374755859375, -0.0341796875, 0.306396484375, 0.64697265625, 0.987548828125, 1.328125, 1.668701171875, 2.00927734375, 2.349853515625, 2.6904296875, 3.031005859375, 3.37158203125, 3.712158203125, 4.052734375, 4.393310546875, 4.73388671875, 5.074462890625, 5.4150390625, 5.755615234375, 6.09619140625, 6.436767578125, 6.77734375, 7.117919921875, 7.45849609375, 7.799072265625, 8.1396484375, 8.480224609375, 8.82080078125, 9.161376953125, 9.501953125, 9.842529296875, 10.18310546875, 10.523681640625, 10.8642578125, 11.204833984375, 11.54541015625, 11.885986328125, 12.2265625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 4.0, 6.0, 9.0, 6.0, 9.0, 16.0, 19.0, 25.0, 29.0, 36.0, 51.0, 45.0, 53.0, 51.0, 72.0, 84.0, 85.0, 77.0, 55.0, 66.0, 34.0, 33.0, 27.0, 22.0, 23.0, 16.0, 8.0, 9.0, 10.0, 1.0, 4.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0007224082946777344, -0.0007015466690063477, -0.0006806850433349609, -0.0006598234176635742, -0.0006389617919921875, -0.0006181001663208008, -0.0005972385406494141, -0.0005763769149780273, -0.0005555152893066406, -0.0005346536636352539, -0.0005137920379638672, -0.0004929304122924805, -0.00047206878662109375, -0.00045120716094970703, -0.0004303455352783203, -0.0004094839096069336, -0.0003886222839355469, -0.00036776065826416016, -0.00034689903259277344, -0.0003260374069213867, -0.00030517578125, -0.0002843141555786133, -0.00026345252990722656, -0.00024259090423583984, -0.00022172927856445312, -0.0002008676528930664, -0.0001800060272216797, -0.00015914440155029297, -0.00013828277587890625, -0.00011742115020751953, -9.655952453613281e-05, -7.56978988647461e-05, -5.4836273193359375e-05, -3.3974647521972656e-05, -1.3113021850585938e-05, 7.748603820800781e-06, 2.86102294921875e-05, 4.947185516357422e-05, 7.033348083496094e-05, 9.119510650634766e-05, 0.00011205673217773438, 0.0001329183578491211, 0.0001537799835205078, 0.00017464160919189453, 0.00019550323486328125, 0.00021636486053466797, 0.0002372264862060547, 0.0002580881118774414, 0.0002789497375488281, 0.00029981136322021484, 0.00032067298889160156, 0.0003415346145629883, 0.000362396240234375, 0.0003832578659057617, 0.00040411949157714844, 0.00042498111724853516, 0.0004458427429199219, 0.0004667043685913086, 0.0004875659942626953, 0.000508427619934082, 0.0005292892456054688, 0.0005501508712768555, 0.0005710124969482422, 0.0005918741226196289, 0.0006127357482910156]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 8.0, 6.0, 5.0, 17.0, 20.0, 18.0, 30.0, 53.0, 48.0, 90.0, 123.0, 222.0, 317.0, 557.0, 1060.0, 2570.0, 8877.0, 54462.0, 431681.0, 471997.0, 61314.0, 9776.0, 2631.0, 1144.0, 538.0, 340.0, 207.0, 143.0, 101.0, 45.0, 50.0, 34.0, 20.0, 12.0, 9.0, 8.0, 3.0, 13.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.5234375, -8.286865234375, -8.05029296875, -7.813720703125, -7.5771484375, -7.340576171875, -7.10400390625, -6.867431640625, -6.630859375, -6.394287109375, -6.15771484375, -5.921142578125, -5.6845703125, -5.447998046875, -5.21142578125, -4.974853515625, -4.73828125, -4.501708984375, -4.26513671875, -4.028564453125, -3.7919921875, -3.555419921875, -3.31884765625, -3.082275390625, -2.845703125, -2.609130859375, -2.37255859375, -2.135986328125, -1.8994140625, -1.662841796875, -1.42626953125, -1.189697265625, -0.953125, -0.716552734375, -0.47998046875, -0.243408203125, -0.0068359375, 0.229736328125, 0.46630859375, 0.702880859375, 0.939453125, 1.176025390625, 1.41259765625, 1.649169921875, 1.8857421875, 2.122314453125, 2.35888671875, 2.595458984375, 2.83203125, 3.068603515625, 3.30517578125, 3.541748046875, 3.7783203125, 4.014892578125, 4.25146484375, 4.488037109375, 4.724609375, 4.961181640625, 5.19775390625, 5.434326171875, 5.6708984375, 5.907470703125, 6.14404296875, 6.380615234375, 6.6171875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 7.0, 2.0, 3.0, 3.0, 4.0, 9.0, 11.0, 18.0, 15.0, 28.0, 23.0, 27.0, 29.0, 46.0, 53.0, 74.0, 57.0, 74.0, 66.0, 64.0, 70.0, 47.0, 67.0, 41.0, 27.0, 28.0, 30.0, 20.0, 19.0, 9.0, 9.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.91015625, -4.779266357421875, -4.64837646484375, -4.517486572265625, -4.3865966796875, -4.255706787109375, -4.12481689453125, -3.993927001953125, -3.863037109375, -3.732147216796875, -3.60125732421875, -3.470367431640625, -3.3394775390625, -3.208587646484375, -3.07769775390625, -2.946807861328125, -2.81591796875, -2.685028076171875, -2.55413818359375, -2.423248291015625, -2.2923583984375, -2.161468505859375, -2.03057861328125, -1.899688720703125, -1.768798828125, -1.637908935546875, -1.50701904296875, -1.376129150390625, -1.2452392578125, -1.114349365234375, -0.98345947265625, -0.852569580078125, -0.7216796875, -0.590789794921875, -0.45989990234375, -0.329010009765625, -0.1981201171875, -0.067230224609375, 0.06365966796875, 0.194549560546875, 0.325439453125, 0.456329345703125, 0.58721923828125, 0.718109130859375, 0.8489990234375, 0.979888916015625, 1.11077880859375, 1.241668701171875, 1.37255859375, 1.503448486328125, 1.63433837890625, 1.765228271484375, 1.8961181640625, 2.027008056640625, 2.15789794921875, 2.288787841796875, 2.419677734375, 2.550567626953125, 2.68145751953125, 2.812347412109375, 2.9432373046875, 3.074127197265625, 3.20501708984375, 3.335906982421875, 3.466796875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 9.0, 11.0, 24.0, 48.0, 93.0, 140.0, 174.0, 159.0, 152.0, 90.0, 44.0, 34.0, 18.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.52593231201172, -37.353511810302734, -34.181095123291016, -31.00867462158203, -27.83625602722168, -24.663837432861328, -21.491416931152344, -18.318998336791992, -15.14657974243164, -11.974161148071289, -8.801741600036621, -5.629322052001953, -2.4569034576416016, 0.71551513671875, 3.8879356384277344, 7.060354232788086, 10.232772827148438, 13.405191421508789, 16.57761001586914, 19.750030517578125, 22.922449111938477, 26.094867706298828, 29.267288208007812, 32.43970489501953, 35.612125396728516, 38.7845458984375, 41.95696258544922, 45.1293830871582, 48.30180358886719, 51.474220275878906, 54.64664077758789, 57.819061279296875, 60.991485595703125, 64.16390228271484, 67.3363265991211, 70.50874328613281, 73.68115997314453, 76.85357666015625, 80.0260009765625, 83.19841766357422, 86.37083435058594, 89.54325103759766, 92.7156753540039, 95.88809204101562, 99.06050872802734, 102.23292541503906, 105.40534973144531, 108.57776641845703, 111.75019073486328, 114.922607421875, 118.09503173828125, 121.26744842529297, 124.43986511230469, 127.61228942871094, 130.78469848632812, 133.95712280273438, 137.12954711914062, 140.30197143554688, 143.47438049316406, 146.6468048095703, 149.81922912597656, 152.99163818359375, 156.1640625, 159.33648681640625, 162.50889587402344]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 6.0, 5.0, 11.0, 12.0, 11.0, 11.0, 10.0, 19.0, 22.0, 34.0, 32.0, 29.0, 51.0, 41.0, 43.0, 49.0, 42.0, 47.0, 43.0, 53.0, 52.0, 39.0, 42.0, 32.0, 42.0, 36.0, 31.0, 26.0, 21.0, 22.0, 13.0, 18.0, 15.0, 9.0, 10.0, 10.0, 6.0, 3.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.214202880859375, -51.633819580078125, -50.053436279296875, -48.473052978515625, -46.892669677734375, -45.31228256225586, -43.73189926147461, -42.15151596069336, -40.57113265991211, -38.99074935913086, -37.41036605834961, -35.82998275756836, -34.249595642089844, -32.669212341308594, -31.088829040527344, -29.508445739746094, -27.928062438964844, -26.347679138183594, -24.767295837402344, -23.18691062927246, -21.60652732849121, -20.02614402770996, -18.445758819580078, -16.865375518798828, -15.284992218017578, -13.704608917236328, -12.124224662780762, -10.543840408325195, -8.963457107543945, -7.383073329925537, -5.802689552307129, -4.2223052978515625, -2.6419219970703125, -1.0615382194519043, 0.5188455581665039, 2.099229335784912, 3.6796131134033203, 5.2599968910217285, 6.840380668640137, 8.420764923095703, 10.001148223876953, 11.581531524658203, 13.16191577911377, 14.742300033569336, 16.322683334350586, 17.903066635131836, 19.48345184326172, 21.06383514404297, 22.64421844482422, 24.22460174560547, 25.80498504638672, 27.3853702545166, 28.96575355529785, 30.5461368560791, 32.126522064208984, 33.706905364990234, 35.287288665771484, 36.867671966552734, 38.448055267333984, 40.028438568115234, 41.60882568359375, 43.189208984375, 44.76959228515625, 46.3499755859375, 47.93035888671875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 6.0, 6.0, 12.0, 18.0, 22.0, 34.0, 51.0, 88.0, 141.0, 241.0, 529.0, 1124.0, 3159.0, 13661.0, 187536.0, 3947898.0, 30919.0, 5566.0, 1718.0, 712.0, 328.0, 188.0, 114.0, 76.0, 43.0, 32.0, 17.0, 8.0, 12.0, 9.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.4375, -19.626708984375, -18.81591796875, -18.005126953125, -17.1943359375, -16.383544921875, -15.57275390625, -14.761962890625, -13.951171875, -13.140380859375, -12.32958984375, -11.518798828125, -10.7080078125, -9.897216796875, -9.08642578125, -8.275634765625, -7.46484375, -6.654052734375, -5.84326171875, -5.032470703125, -4.2216796875, -3.410888671875, -2.60009765625, -1.789306640625, -0.978515625, -0.167724609375, 0.64306640625, 1.453857421875, 2.2646484375, 3.075439453125, 3.88623046875, 4.697021484375, 5.5078125, 6.318603515625, 7.12939453125, 7.940185546875, 8.7509765625, 9.561767578125, 10.37255859375, 11.183349609375, 11.994140625, 12.804931640625, 13.61572265625, 14.426513671875, 15.2373046875, 16.048095703125, 16.85888671875, 17.669677734375, 18.48046875, 19.291259765625, 20.10205078125, 20.912841796875, 21.7236328125, 22.534423828125, 23.34521484375, 24.156005859375, 24.966796875, 25.777587890625, 26.58837890625, 27.399169921875, 28.2099609375, 29.020751953125, 29.83154296875, 30.642333984375, 31.453125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 8.0, 3.0, 7.0, 8.0, 5.0, 7.0, 8.0, 12.0, 12.0, 28.0, 28.0, 27.0, 37.0, 38.0, 49.0, 51.0, 53.0, 48.0, 49.0, 53.0, 52.0, 43.0, 36.0, 46.0, 42.0, 31.0, 36.0, 31.0, 21.0, 27.0, 18.0, 19.0, 13.0, 14.0, 12.0, 10.0, 10.0, 4.0, 2.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.625, -2.549560546875, -2.47412109375, -2.398681640625, -2.3232421875, -2.247802734375, -2.17236328125, -2.096923828125, -2.021484375, -1.946044921875, -1.87060546875, -1.795166015625, -1.7197265625, -1.644287109375, -1.56884765625, -1.493408203125, -1.41796875, -1.342529296875, -1.26708984375, -1.191650390625, -1.1162109375, -1.040771484375, -0.96533203125, -0.889892578125, -0.814453125, -0.739013671875, -0.66357421875, -0.588134765625, -0.5126953125, -0.437255859375, -0.36181640625, -0.286376953125, -0.2109375, -0.135498046875, -0.06005859375, 0.015380859375, 0.0908203125, 0.166259765625, 0.24169921875, 0.317138671875, 0.392578125, 0.468017578125, 0.54345703125, 0.618896484375, 0.6943359375, 0.769775390625, 0.84521484375, 0.920654296875, 0.99609375, 1.071533203125, 1.14697265625, 1.222412109375, 1.2978515625, 1.373291015625, 1.44873046875, 1.524169921875, 1.599609375, 1.675048828125, 1.75048828125, 1.825927734375, 1.9013671875, 1.976806640625, 2.05224609375, 2.127685546875, 2.203125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 9.0, 5.0, 13.0, 18.0, 23.0, 32.0, 42.0, 47.0, 74.0, 93.0, 150.0, 192.0, 317.0, 479.0, 709.0, 1134.0, 1954.0, 3432.0, 6593.0, 14675.0, 41752.0, 206909.0, 3690713.0, 160885.0, 36294.0, 13495.0, 6218.0, 3114.0, 1796.0, 1066.0, 713.0, 440.0, 262.0, 184.0, 136.0, 84.0, 66.0, 38.0, 38.0, 17.0, 19.0, 12.0, 10.0, 8.0, 7.0, 6.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0859375, -7.8203125, -7.5546875, -7.2890625, -7.0234375, -6.7578125, -6.4921875, -6.2265625, -5.9609375, -5.6953125, -5.4296875, -5.1640625, -4.8984375, -4.6328125, -4.3671875, -4.1015625, -3.8359375, -3.5703125, -3.3046875, -3.0390625, -2.7734375, -2.5078125, -2.2421875, -1.9765625, -1.7109375, -1.4453125, -1.1796875, -0.9140625, -0.6484375, -0.3828125, -0.1171875, 0.1484375, 0.4140625, 0.6796875, 0.9453125, 1.2109375, 1.4765625, 1.7421875, 2.0078125, 2.2734375, 2.5390625, 2.8046875, 3.0703125, 3.3359375, 3.6015625, 3.8671875, 4.1328125, 4.3984375, 4.6640625, 4.9296875, 5.1953125, 5.4609375, 5.7265625, 5.9921875, 6.2578125, 6.5234375, 6.7890625, 7.0546875, 7.3203125, 7.5859375, 7.8515625, 8.1171875, 8.3828125, 8.6484375, 8.9140625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 3.0, 6.0, 6.0, 9.0, 15.0, 13.0, 19.0, 20.0, 53.0, 98.0, 172.0, 482.0, 2619.0, 227.0, 126.0, 61.0, 34.0, 29.0, 27.0, 13.0, 11.0, 2.0, 4.0, 9.0, 1.0, 4.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.05859375, -1.998443603515625, -1.93829345703125, -1.878143310546875, -1.8179931640625, -1.757843017578125, -1.69769287109375, -1.637542724609375, -1.577392578125, -1.517242431640625, -1.45709228515625, -1.396942138671875, -1.3367919921875, -1.276641845703125, -1.21649169921875, -1.156341552734375, -1.09619140625, -1.036041259765625, -0.97589111328125, -0.915740966796875, -0.8555908203125, -0.795440673828125, -0.73529052734375, -0.675140380859375, -0.614990234375, -0.554840087890625, -0.49468994140625, -0.434539794921875, -0.3743896484375, -0.314239501953125, -0.25408935546875, -0.193939208984375, -0.1337890625, -0.073638916015625, -0.01348876953125, 0.046661376953125, 0.1068115234375, 0.166961669921875, 0.22711181640625, 0.287261962890625, 0.347412109375, 0.407562255859375, 0.46771240234375, 0.527862548828125, 0.5880126953125, 0.648162841796875, 0.70831298828125, 0.768463134765625, 0.82861328125, 0.888763427734375, 0.94891357421875, 1.009063720703125, 1.0692138671875, 1.129364013671875, 1.18951416015625, 1.249664306640625, 1.309814453125, 1.369964599609375, 1.43011474609375, 1.490264892578125, 1.5504150390625, 1.610565185546875, 1.67071533203125, 1.730865478515625, 1.791015625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 10.0, 8.0, 17.0, 34.0, 48.0, 72.0, 91.0, 115.0, 140.0, 95.0, 115.0, 78.0, 64.0, 46.0, 26.0, 10.0, 12.0, 8.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.410139083862305, -11.070477485656738, -10.730814933776855, -10.391153335571289, -10.051491737365723, -9.711830139160156, -9.372167587280273, -9.032505989074707, -8.69284439086914, -8.353182792663574, -8.013520240783691, -7.673858642578125, -7.334197044372559, -6.994534969329834, -6.654872894287109, -6.315211296081543, -5.97554874420166, -5.6358866691589355, -5.296225070953369, -4.9565629959106445, -4.616901397705078, -4.2772393226623535, -3.937577247619629, -3.5979154109954834, -3.258253574371338, -2.9185917377471924, -2.578929901123047, -2.2392678260803223, -1.8996059894561768, -1.5599441528320312, -1.2202820777893066, -0.8806202411651611, -0.5409584045410156, -0.20129650831222534, 0.13836538791656494, 0.47802734375, 0.8176891803741455, 1.157351016998291, 1.4970130920410156, 1.8366749286651611, 2.1763367652893066, 2.515998601913452, 2.8556604385375977, 3.1953225135803223, 3.5349843502044678, 3.8746461868286133, 4.214308261871338, 4.5539703369140625, 4.893631935119629, 5.2332940101623535, 5.57295560836792, 5.9126176834106445, 6.252279281616211, 6.5919413566589355, 6.93160343170166, 7.271265029907227, 7.610927104949951, 7.950589179992676, 8.290250778198242, 8.629913330078125, 8.969574928283691, 9.309236526489258, 9.64889907836914, 9.988560676574707, 10.328222274780273]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 7.0, 11.0, 18.0, 14.0, 24.0, 23.0, 23.0, 25.0, 23.0, 38.0, 27.0, 32.0, 31.0, 36.0, 47.0, 55.0, 47.0, 53.0, 36.0, 52.0, 41.0, 33.0, 33.0, 43.0, 21.0, 46.0, 28.0, 18.0, 22.0, 16.0, 13.0, 11.0, 5.0, 2.0, 5.0, 7.0, 8.0, 5.0, 4.0, 5.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.415430068969727, -4.279882907867432, -4.144335746765137, -4.008788585662842, -3.873241424560547, -3.737694263458252, -3.602147340774536, -3.466600179672241, -3.3310530185699463, -3.1955058574676514, -3.0599586963653564, -2.9244115352630615, -2.7888646125793457, -2.653317451477051, -2.517770290374756, -2.382223129272461, -2.246675968170166, -2.111128807067871, -1.9755816459655762, -1.8400346040725708, -1.7044874429702759, -1.568940281867981, -1.4333932399749756, -1.2978460788726807, -1.1622989177703857, -1.0267517566680908, -0.8912046551704407, -0.7556575536727905, -0.6201103925704956, -0.4845632314682007, -0.34901612997055054, -0.2134690284729004, -0.07792186737060547, 0.057625263929367065, 0.1931723952293396, 0.32871952652931213, 0.46426665782928467, 0.5998138189315796, 0.7353609204292297, 0.8709080219268799, 1.0064551830291748, 1.1420023441314697, 1.2775495052337646, 1.41309654712677, 1.548643708229065, 1.6841908693313599, 1.8197379112243652, 1.9552850723266602, 2.090832233428955, 2.22637939453125, 2.361926555633545, 2.49747371673584, 2.6330208778381348, 2.7685680389404297, 2.9041149616241455, 3.0396621227264404, 3.1752092838287354, 3.3107564449310303, 3.446303606033325, 3.58185076713562, 3.717397689819336, 3.852944850921631, 3.988492012023926, 4.124039173126221, 4.259586334228516]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 14.0, 8.0, 18.0, 30.0, 44.0, 63.0, 83.0, 173.0, 289.0, 557.0, 988.0, 2307.0, 5515.0, 14224.0, 38736.0, 106931.0, 247877.0, 321451.0, 190615.0, 74384.0, 26766.0, 9928.0, 4001.0, 1676.0, 867.0, 413.0, 229.0, 144.0, 83.0, 61.0, 19.0, 21.0, 15.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.93359375, -5.67913818359375, -5.4246826171875, -5.17022705078125, -4.915771484375, -4.66131591796875, -4.4068603515625, -4.15240478515625, -3.89794921875, -3.64349365234375, -3.3890380859375, -3.13458251953125, -2.880126953125, -2.62567138671875, -2.3712158203125, -2.11676025390625, -1.8623046875, -1.60784912109375, -1.3533935546875, -1.09893798828125, -0.844482421875, -0.59002685546875, -0.3355712890625, -0.08111572265625, 0.17333984375, 0.42779541015625, 0.6822509765625, 0.93670654296875, 1.191162109375, 1.44561767578125, 1.7000732421875, 1.95452880859375, 2.208984375, 2.46343994140625, 2.7178955078125, 2.97235107421875, 3.226806640625, 3.48126220703125, 3.7357177734375, 3.99017333984375, 4.24462890625, 4.49908447265625, 4.7535400390625, 5.00799560546875, 5.262451171875, 5.51690673828125, 5.7713623046875, 6.02581787109375, 6.2802734375, 6.53472900390625, 6.7891845703125, 7.04364013671875, 7.298095703125, 7.55255126953125, 7.8070068359375, 8.06146240234375, 8.31591796875, 8.57037353515625, 8.8248291015625, 9.07928466796875, 9.333740234375, 9.58819580078125, 9.8426513671875, 10.09710693359375, 10.3515625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 9.0, 11.0, 5.0, 9.0, 19.0, 13.0, 17.0, 32.0, 27.0, 41.0, 40.0, 51.0, 45.0, 43.0, 42.0, 42.0, 52.0, 46.0, 43.0, 37.0, 58.0, 48.0, 32.0, 31.0, 27.0, 25.0, 28.0, 22.0, 15.0, 12.0, 18.0, 11.0, 8.0, 8.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.609375, -2.532379150390625, -2.45538330078125, -2.378387451171875, -2.3013916015625, -2.224395751953125, -2.14739990234375, -2.070404052734375, -1.993408203125, -1.916412353515625, -1.83941650390625, -1.762420654296875, -1.6854248046875, -1.608428955078125, -1.53143310546875, -1.454437255859375, -1.37744140625, -1.300445556640625, -1.22344970703125, -1.146453857421875, -1.0694580078125, -0.992462158203125, -0.91546630859375, -0.838470458984375, -0.761474609375, -0.684478759765625, -0.60748291015625, -0.530487060546875, -0.4534912109375, -0.376495361328125, -0.29949951171875, -0.222503662109375, -0.1455078125, -0.068511962890625, 0.00848388671875, 0.085479736328125, 0.1624755859375, 0.239471435546875, 0.31646728515625, 0.393463134765625, 0.470458984375, 0.547454833984375, 0.62445068359375, 0.701446533203125, 0.7784423828125, 0.855438232421875, 0.93243408203125, 1.009429931640625, 1.08642578125, 1.163421630859375, 1.24041748046875, 1.317413330078125, 1.3944091796875, 1.471405029296875, 1.54840087890625, 1.625396728515625, 1.702392578125, 1.779388427734375, 1.85638427734375, 1.933380126953125, 2.0103759765625, 2.087371826171875, 2.16436767578125, 2.241363525390625, 2.318359375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 3.0, 5.0, 4.0, 2.0, 8.0, 11.0, 6.0, 24.0, 16.0, 43.0, 59.0, 68.0, 97.0, 137.0, 225.0, 308.0, 390.0, 620.0, 1021.0, 1820.0, 5869.0, 48450.0, 613377.0, 343209.0, 24620.0, 4020.0, 1460.0, 880.0, 556.0, 345.0, 232.0, 189.0, 132.0, 102.0, 76.0, 56.0, 29.0, 34.0, 12.0, 13.0, 5.0, 9.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-18.109375, -17.541015625, -16.97265625, -16.404296875, -15.8359375, -15.267578125, -14.69921875, -14.130859375, -13.5625, -12.994140625, -12.42578125, -11.857421875, -11.2890625, -10.720703125, -10.15234375, -9.583984375, -9.015625, -8.447265625, -7.87890625, -7.310546875, -6.7421875, -6.173828125, -5.60546875, -5.037109375, -4.46875, -3.900390625, -3.33203125, -2.763671875, -2.1953125, -1.626953125, -1.05859375, -0.490234375, 0.078125, 0.646484375, 1.21484375, 1.783203125, 2.3515625, 2.919921875, 3.48828125, 4.056640625, 4.625, 5.193359375, 5.76171875, 6.330078125, 6.8984375, 7.466796875, 8.03515625, 8.603515625, 9.171875, 9.740234375, 10.30859375, 10.876953125, 11.4453125, 12.013671875, 12.58203125, 13.150390625, 13.71875, 14.287109375, 14.85546875, 15.423828125, 15.9921875, 16.560546875, 17.12890625, 17.697265625, 18.265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 2.0, 4.0, 7.0, 9.0, 8.0, 7.0, 9.0, 13.0, 14.0, 25.0, 21.0, 21.0, 29.0, 28.0, 27.0, 41.0, 46.0, 45.0, 43.0, 45.0, 51.0, 46.0, 39.0, 38.0, 38.0, 38.0, 34.0, 31.0, 35.0, 28.0, 35.0, 17.0, 24.0, 26.0, 16.0, 8.0, 12.0, 11.0, 5.0, 7.0, 8.0, 2.0, 4.0, 3.0, 0.0, 0.0, 5.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-11.109375, -10.7779541015625, -10.446533203125, -10.1151123046875, -9.78369140625, -9.4522705078125, -9.120849609375, -8.7894287109375, -8.4580078125, -8.1265869140625, -7.795166015625, -7.4637451171875, -7.13232421875, -6.8009033203125, -6.469482421875, -6.1380615234375, -5.806640625, -5.4752197265625, -5.143798828125, -4.8123779296875, -4.48095703125, -4.1495361328125, -3.818115234375, -3.4866943359375, -3.1552734375, -2.8238525390625, -2.492431640625, -2.1610107421875, -1.82958984375, -1.4981689453125, -1.166748046875, -0.8353271484375, -0.50390625, -0.1724853515625, 0.158935546875, 0.4903564453125, 0.82177734375, 1.1531982421875, 1.484619140625, 1.8160400390625, 2.1474609375, 2.4788818359375, 2.810302734375, 3.1417236328125, 3.47314453125, 3.8045654296875, 4.135986328125, 4.4674072265625, 4.798828125, 5.1302490234375, 5.461669921875, 5.7930908203125, 6.12451171875, 6.4559326171875, 6.787353515625, 7.1187744140625, 7.4501953125, 7.7816162109375, 8.113037109375, 8.4444580078125, 8.77587890625, 9.1072998046875, 9.438720703125, 9.7701416015625, 10.1015625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 7.0, 8.0, 10.0, 17.0, 26.0, 23.0, 36.0, 40.0, 59.0, 103.0, 182.0, 377.0, 834.0, 2742.0, 12621.0, 105025.0, 691926.0, 206760.0, 21667.0, 3931.0, 1142.0, 426.0, 214.0, 126.0, 61.0, 50.0, 39.0, 23.0, 18.0, 10.0, 5.0, 11.0, 9.0, 7.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.28778076171875, -6.0325927734375, -5.77740478515625, -5.522216796875, -5.26702880859375, -5.0118408203125, -4.75665283203125, -4.50146484375, -4.24627685546875, -3.9910888671875, -3.73590087890625, -3.480712890625, -3.22552490234375, -2.9703369140625, -2.71514892578125, -2.4599609375, -2.20477294921875, -1.9495849609375, -1.69439697265625, -1.439208984375, -1.18402099609375, -0.9288330078125, -0.67364501953125, -0.41845703125, -0.16326904296875, 0.0919189453125, 0.34710693359375, 0.602294921875, 0.85748291015625, 1.1126708984375, 1.36785888671875, 1.623046875, 1.87823486328125, 2.1334228515625, 2.38861083984375, 2.643798828125, 2.89898681640625, 3.1541748046875, 3.40936279296875, 3.66455078125, 3.91973876953125, 4.1749267578125, 4.43011474609375, 4.685302734375, 4.94049072265625, 5.1956787109375, 5.45086669921875, 5.7060546875, 5.96124267578125, 6.2164306640625, 6.47161865234375, 6.726806640625, 6.98199462890625, 7.2371826171875, 7.49237060546875, 7.74755859375, 8.00274658203125, 8.2579345703125, 8.51312255859375, 8.768310546875, 9.02349853515625, 9.2786865234375, 9.53387451171875, 9.7890625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 8.0, 10.0, 7.0, 15.0, 21.0, 24.0, 54.0, 59.0, 62.0, 88.0, 84.0, 92.0, 88.0, 86.0, 69.0, 61.0, 46.0, 31.0, 23.0, 18.0, 11.0, 11.0, 5.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007295608520507812, -0.0007030069828033447, -0.0006764531135559082, -0.0006498992443084717, -0.0006233453750610352, -0.0005967915058135986, -0.0005702376365661621, -0.0005436837673187256, -0.0005171298980712891, -0.0004905760288238525, -0.000464022159576416, -0.0004374682903289795, -0.00041091442108154297, -0.00038436055183410645, -0.0003578066825866699, -0.0003312528133392334, -0.0003046989440917969, -0.00027814507484436035, -0.00025159120559692383, -0.0002250373363494873, -0.00019848346710205078, -0.00017192959785461426, -0.00014537572860717773, -0.00011882185935974121, -9.226799011230469e-05, -6.571412086486816e-05, -3.916025161743164e-05, -1.2606382369995117e-05, 1.3947486877441406e-05, 4.050135612487793e-05, 6.705522537231445e-05, 9.360909461975098e-05, 0.0001201629638671875, 0.00014671683311462402, 0.00017327070236206055, 0.00019982457160949707, 0.0002263784408569336, 0.0002529323101043701, 0.00027948617935180664, 0.00030604004859924316, 0.0003325939178466797, 0.0003591477870941162, 0.00038570165634155273, 0.00041225552558898926, 0.0004388093948364258, 0.0004653632640838623, 0.0004919171333312988, 0.0005184710025787354, 0.0005450248718261719, 0.0005715787410736084, 0.0005981326103210449, 0.0006246864795684814, 0.000651240348815918, 0.0006777942180633545, 0.000704348087310791, 0.0007309019565582275, 0.0007574558258056641, 0.0007840096950531006, 0.0008105635643005371, 0.0008371174335479736, 0.0008636713027954102, 0.0008902251720428467, 0.0009167790412902832, 0.0009433329105377197, 0.0009698867797851562]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 9.0, 4.0, 3.0, 11.0, 7.0, 16.0, 14.0, 22.0, 47.0, 64.0, 92.0, 151.0, 298.0, 584.0, 1307.0, 3646.0, 16533.0, 216654.0, 729916.0, 66842.0, 8067.0, 2255.0, 962.0, 446.0, 219.0, 120.0, 64.0, 57.0, 36.0, 28.0, 19.0, 18.0, 14.0, 9.0, 5.0, 5.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.6953125, -10.400634765625, -10.10595703125, -9.811279296875, -9.5166015625, -9.221923828125, -8.92724609375, -8.632568359375, -8.337890625, -8.043212890625, -7.74853515625, -7.453857421875, -7.1591796875, -6.864501953125, -6.56982421875, -6.275146484375, -5.98046875, -5.685791015625, -5.39111328125, -5.096435546875, -4.8017578125, -4.507080078125, -4.21240234375, -3.917724609375, -3.623046875, -3.328369140625, -3.03369140625, -2.739013671875, -2.4443359375, -2.149658203125, -1.85498046875, -1.560302734375, -1.265625, -0.970947265625, -0.67626953125, -0.381591796875, -0.0869140625, 0.207763671875, 0.50244140625, 0.797119140625, 1.091796875, 1.386474609375, 1.68115234375, 1.975830078125, 2.2705078125, 2.565185546875, 2.85986328125, 3.154541015625, 3.44921875, 3.743896484375, 4.03857421875, 4.333251953125, 4.6279296875, 4.922607421875, 5.21728515625, 5.511962890625, 5.806640625, 6.101318359375, 6.39599609375, 6.690673828125, 6.9853515625, 7.280029296875, 7.57470703125, 7.869384765625, 8.1640625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 3.0, 14.0, 14.0, 27.0, 44.0, 76.0, 80.0, 119.0, 114.0, 111.0, 119.0, 107.0, 50.0, 40.0, 26.0, 21.0, 14.0, 7.0, 3.0, 1.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.70703125, -7.45819091796875, -7.2093505859375, -6.96051025390625, -6.711669921875, -6.46282958984375, -6.2139892578125, -5.96514892578125, -5.71630859375, -5.46746826171875, -5.2186279296875, -4.96978759765625, -4.720947265625, -4.47210693359375, -4.2232666015625, -3.97442626953125, -3.7255859375, -3.47674560546875, -3.2279052734375, -2.97906494140625, -2.730224609375, -2.48138427734375, -2.2325439453125, -1.98370361328125, -1.73486328125, -1.48602294921875, -1.2371826171875, -0.98834228515625, -0.739501953125, -0.49066162109375, -0.2418212890625, 0.00701904296875, 0.255859375, 0.50469970703125, 0.7535400390625, 1.00238037109375, 1.251220703125, 1.50006103515625, 1.7489013671875, 1.99774169921875, 2.24658203125, 2.49542236328125, 2.7442626953125, 2.99310302734375, 3.241943359375, 3.49078369140625, 3.7396240234375, 3.98846435546875, 4.2373046875, 4.48614501953125, 4.7349853515625, 4.98382568359375, 5.232666015625, 5.48150634765625, 5.7303466796875, 5.97918701171875, 6.22802734375, 6.47686767578125, 6.7257080078125, 6.97454833984375, 7.223388671875, 7.47222900390625, 7.7210693359375, 7.96990966796875, 8.21875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 20.0, 35.0, 55.0, 114.0, 200.0, 185.0, 189.0, 108.0, 56.0, 24.0, 8.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.13990783691406, -140.05184936523438, -135.9637908935547, -131.875732421875, -127.78766632080078, -123.6996078491211, -119.61154174804688, -115.52348327636719, -111.4354248046875, -107.34736633300781, -103.25930786132812, -99.1712417602539, -95.08318328857422, -90.99512481689453, -86.90705871582031, -82.81900024414062, -78.73094177246094, -74.64288330078125, -70.55482482910156, -66.46675872802734, -62.378700256347656, -58.29064178466797, -54.202579498291016, -50.11451721191406, -46.026458740234375, -41.93840026855469, -37.850337982177734, -33.76227569580078, -29.674217224121094, -25.586156845092773, -21.498096466064453, -17.410036087036133, -13.321968078613281, -9.233907699584961, -5.145847320556641, -1.0577869415283203, 3.0302734375, 7.11833381652832, 11.20639419555664, 15.294454574584961, 19.38251495361328, 23.4705753326416, 27.558635711669922, 31.646696090698242, 35.73475646972656, 39.82281494140625, 43.9108772277832, 47.998939514160156, 52.086997985839844, 56.17505645751953, 60.263118743896484, 64.35118103027344, 68.43923950195312, 72.52729797363281, 76.6153564453125, 80.70342254638672, 84.7914810180664, 88.8795394897461, 92.96760559082031, 97.0556640625, 101.14372253417969, 105.23178100585938, 109.31983947753906, 113.40790557861328, 117.49596405029297]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 6.0, 6.0, 2.0, 7.0, 8.0, 7.0, 11.0, 12.0, 17.0, 14.0, 28.0, 37.0, 30.0, 30.0, 42.0, 40.0, 41.0, 47.0, 38.0, 56.0, 41.0, 47.0, 46.0, 48.0, 40.0, 39.0, 37.0, 32.0, 40.0, 29.0, 18.0, 17.0, 15.0, 16.0, 13.0, 12.0, 10.0, 10.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-55.38923645019531, -53.77009201049805, -52.15094757080078, -50.53179931640625, -48.912654876708984, -47.29351043701172, -45.67436599731445, -44.05522155761719, -42.436073303222656, -40.81692886352539, -39.197784423828125, -37.578636169433594, -35.95949172973633, -34.34034729003906, -32.7212028503418, -31.10205841064453, -29.482913970947266, -27.86376953125, -26.2446231842041, -24.625478744506836, -23.006332397460938, -21.387187957763672, -19.768043518066406, -18.14889907836914, -16.529752731323242, -14.91060733795166, -13.291461944580078, -11.672317504882812, -10.05317211151123, -8.434026718139648, -6.814882278442383, -5.195736885070801, -3.5765953063964844, -1.9574501514434814, -0.3383049964904785, 1.2808399200439453, 2.8999853134155273, 4.519130706787109, 6.138275146484375, 7.757420539855957, 9.376565933227539, 10.995711326599121, 12.614856719970703, 14.234001159667969, 15.85314655303955, 17.472291946411133, 19.0914363861084, 20.710582733154297, 22.329727172851562, 23.948871612548828, 25.568017959594727, 27.187162399291992, 28.80630874633789, 30.425453186035156, 32.04459762573242, 33.66374206542969, 35.28289031982422, 36.902034759521484, 38.52117919921875, 40.14032745361328, 41.75947189331055, 43.37861633300781, 44.99776077270508, 46.616905212402344, 48.23604965209961]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 3.0, 7.0, 6.0, 12.0, 13.0, 27.0, 47.0, 49.0, 93.0, 136.0, 239.0, 434.0, 856.0, 1779.0, 4173.0, 12804.0, 89582.0, 3971405.0, 91547.0, 13056.0, 4198.0, 1816.0, 849.0, 478.0, 258.0, 150.0, 76.0, 53.0, 33.0, 26.0, 18.0, 13.0, 10.0, 6.0, 4.0, 4.0, 6.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3125, -12.79052734375, -12.2685546875, -11.74658203125, -11.224609375, -10.70263671875, -10.1806640625, -9.65869140625, -9.13671875, -8.61474609375, -8.0927734375, -7.57080078125, -7.048828125, -6.52685546875, -6.0048828125, -5.48291015625, -4.9609375, -4.43896484375, -3.9169921875, -3.39501953125, -2.873046875, -2.35107421875, -1.8291015625, -1.30712890625, -0.78515625, -0.26318359375, 0.2587890625, 0.78076171875, 1.302734375, 1.82470703125, 2.3466796875, 2.86865234375, 3.390625, 3.91259765625, 4.4345703125, 4.95654296875, 5.478515625, 6.00048828125, 6.5224609375, 7.04443359375, 7.56640625, 8.08837890625, 8.6103515625, 9.13232421875, 9.654296875, 10.17626953125, 10.6982421875, 11.22021484375, 11.7421875, 12.26416015625, 12.7861328125, 13.30810546875, 13.830078125, 14.35205078125, 14.8740234375, 15.39599609375, 15.91796875, 16.43994140625, 16.9619140625, 17.48388671875, 18.005859375, 18.52783203125, 19.0498046875, 19.57177734375, 20.09375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 10.0, 11.0, 11.0, 20.0, 22.0, 22.0, 22.0, 33.0, 31.0, 29.0, 32.0, 46.0, 46.0, 53.0, 54.0, 44.0, 59.0, 45.0, 39.0, 40.0, 45.0, 36.0, 35.0, 29.0, 33.0, 15.0, 22.0, 21.0, 12.0, 16.0, 8.0, 9.0, 9.0, 10.0, 4.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.6328125, -2.5555419921875, -2.478271484375, -2.4010009765625, -2.32373046875, -2.2464599609375, -2.169189453125, -2.0919189453125, -2.0146484375, -1.9373779296875, -1.860107421875, -1.7828369140625, -1.70556640625, -1.6282958984375, -1.551025390625, -1.4737548828125, -1.396484375, -1.3192138671875, -1.241943359375, -1.1646728515625, -1.08740234375, -1.0101318359375, -0.932861328125, -0.8555908203125, -0.7783203125, -0.7010498046875, -0.623779296875, -0.5465087890625, -0.46923828125, -0.3919677734375, -0.314697265625, -0.2374267578125, -0.16015625, -0.0828857421875, -0.005615234375, 0.0716552734375, 0.14892578125, 0.2261962890625, 0.303466796875, 0.3807373046875, 0.4580078125, 0.5352783203125, 0.612548828125, 0.6898193359375, 0.76708984375, 0.8443603515625, 0.921630859375, 0.9989013671875, 1.076171875, 1.1534423828125, 1.230712890625, 1.3079833984375, 1.38525390625, 1.4625244140625, 1.539794921875, 1.6170654296875, 1.6943359375, 1.7716064453125, 1.848876953125, 1.9261474609375, 2.00341796875, 2.0806884765625, 2.157958984375, 2.2352294921875, 2.3125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 6.0, 7.0, 12.0, 12.0, 19.0, 17.0, 27.0, 27.0, 47.0, 48.0, 74.0, 112.0, 186.0, 242.0, 369.0, 543.0, 928.0, 1606.0, 3251.0, 7040.0, 21010.0, 102946.0, 3776841.0, 227750.0, 32016.0, 10010.0, 3969.0, 2069.0, 1093.0, 672.0, 388.0, 272.0, 157.0, 141.0, 113.0, 69.0, 50.0, 31.0, 33.0, 23.0, 13.0, 12.0, 3.0, 13.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-11.96875, -11.6131591796875, -11.257568359375, -10.9019775390625, -10.54638671875, -10.1907958984375, -9.835205078125, -9.4796142578125, -9.1240234375, -8.7684326171875, -8.412841796875, -8.0572509765625, -7.70166015625, -7.3460693359375, -6.990478515625, -6.6348876953125, -6.279296875, -5.9237060546875, -5.568115234375, -5.2125244140625, -4.85693359375, -4.5013427734375, -4.145751953125, -3.7901611328125, -3.4345703125, -3.0789794921875, -2.723388671875, -2.3677978515625, -2.01220703125, -1.6566162109375, -1.301025390625, -0.9454345703125, -0.58984375, -0.2342529296875, 0.121337890625, 0.4769287109375, 0.83251953125, 1.1881103515625, 1.543701171875, 1.8992919921875, 2.2548828125, 2.6104736328125, 2.966064453125, 3.3216552734375, 3.67724609375, 4.0328369140625, 4.388427734375, 4.7440185546875, 5.099609375, 5.4552001953125, 5.810791015625, 6.1663818359375, 6.52197265625, 6.8775634765625, 7.233154296875, 7.5887451171875, 7.9443359375, 8.2999267578125, 8.655517578125, 9.0111083984375, 9.36669921875, 9.7222900390625, 10.077880859375, 10.4334716796875, 10.7890625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 5.0, 6.0, 2.0, 7.0, 8.0, 19.0, 26.0, 48.0, 84.0, 160.0, 759.0, 2516.0, 221.0, 95.0, 40.0, 24.0, 24.0, 8.0, 8.0, 7.0, 1.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.908203125, -2.808197021484375, -2.70819091796875, -2.608184814453125, -2.5081787109375, -2.408172607421875, -2.30816650390625, -2.208160400390625, -2.108154296875, -2.008148193359375, -1.90814208984375, -1.808135986328125, -1.7081298828125, -1.608123779296875, -1.50811767578125, -1.408111572265625, -1.30810546875, -1.208099365234375, -1.10809326171875, -1.008087158203125, -0.9080810546875, -0.808074951171875, -0.70806884765625, -0.608062744140625, -0.508056640625, -0.408050537109375, -0.30804443359375, -0.208038330078125, -0.1080322265625, -0.008026123046875, 0.09197998046875, 0.191986083984375, 0.2919921875, 0.391998291015625, 0.49200439453125, 0.592010498046875, 0.6920166015625, 0.792022705078125, 0.89202880859375, 0.992034912109375, 1.092041015625, 1.192047119140625, 1.29205322265625, 1.392059326171875, 1.4920654296875, 1.592071533203125, 1.69207763671875, 1.792083740234375, 1.89208984375, 1.992095947265625, 2.09210205078125, 2.192108154296875, 2.2921142578125, 2.392120361328125, 2.49212646484375, 2.592132568359375, 2.692138671875, 2.792144775390625, 2.89215087890625, 2.992156982421875, 3.0921630859375, 3.192169189453125, 3.29217529296875, 3.392181396484375, 3.4921875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0, 7.0, 14.0, 12.0, 22.0, 18.0, 23.0, 29.0, 34.0, 52.0, 60.0, 69.0, 64.0, 69.0, 75.0, 69.0, 55.0, 62.0, 49.0, 41.0, 40.0, 36.0, 31.0, 19.0, 8.0, 10.0, 7.0, 4.0, 0.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.038154125213623, -6.782145023345947, -6.526135444641113, -6.2701263427734375, -6.0141167640686035, -5.758107662200928, -5.502098083496094, -5.246088981628418, -4.990079879760742, -4.734070777893066, -4.478061199188232, -4.222052097320557, -3.9660425186157227, -3.710033416748047, -3.454024076461792, -3.198014736175537, -2.942005157470703, -2.6859958171844482, -2.4299864768981934, -2.1739773750305176, -1.9179679155349731, -1.6619585752487183, -1.405949354171753, -1.149940013885498, -0.8939306735992432, -0.6379213333129883, -0.3819120526313782, -0.12590277194976807, 0.13010656833648682, 0.3861159086227417, 0.642125129699707, 0.8981344699859619, 1.1541433334350586, 1.4101526737213135, 1.6661620140075684, 1.9221712350845337, 2.178180694580078, 2.434189796447754, 2.690199136734009, 2.9462084770202637, 3.2022178173065186, 3.4582271575927734, 3.7142364978790283, 3.970245838165283, 4.226254940032959, 4.482264518737793, 4.738273620605469, 4.9942827224731445, 5.2502923011779785, 5.506301403045654, 5.762310981750488, 6.018320083618164, 6.274329662322998, 6.530338764190674, 6.786348342895508, 7.042357444763184, 7.298366546630859, 7.554375648498535, 7.810385227203369, 8.066394805908203, 8.322403907775879, 8.578413009643555, 8.83442211151123, 9.090431213378906, 9.346441268920898]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 5.0, 5.0, 20.0, 12.0, 12.0, 19.0, 11.0, 26.0, 22.0, 20.0, 29.0, 31.0, 35.0, 37.0, 37.0, 39.0, 35.0, 40.0, 53.0, 45.0, 58.0, 46.0, 30.0, 25.0, 35.0, 33.0, 32.0, 24.0, 20.0, 20.0, 29.0, 24.0, 14.0, 9.0, 11.0, 9.0, 7.0, 9.0, 6.0, 4.0, 4.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-6.410158157348633, -6.222423553466797, -6.034688949584961, -5.846954345703125, -5.659219741821289, -5.471485137939453, -5.283750534057617, -5.096015930175781, -4.908281326293945, -4.720546722412109, -4.532812118530273, -4.3450775146484375, -4.157342910766602, -3.9696083068847656, -3.781873941421509, -3.594139337539673, -3.406404972076416, -3.21867036819458, -3.030935764312744, -2.843201160430908, -2.6554665565490723, -2.4677319526672363, -2.2799975872039795, -2.0922629833221436, -1.9045283794403076, -1.7167937755584717, -1.5290591716766357, -1.3413246870040894, -1.1535900831222534, -0.9658554792404175, -0.7781209945678711, -0.5903863906860352, -0.4026517868041992, -0.21491721272468567, -0.02718263864517212, 0.16055190563201904, 0.348286509513855, 0.5360211133956909, 0.7237555980682373, 0.9114902019500732, 1.0992248058319092, 1.2869594097137451, 1.474694013595581, 1.6624284982681274, 1.8501631021499634, 2.0378975868225098, 2.2256321907043457, 2.4133667945861816, 2.6011013984680176, 2.7888360023498535, 2.9765706062316895, 3.1643052101135254, 3.3520398139953613, 3.5397744178771973, 3.727508783340454, 3.91524338722229, 4.102977752685547, 4.290712356567383, 4.478446960449219, 4.666181564331055, 4.853916168212891, 5.041650772094727, 5.2293853759765625, 5.417119979858398, 5.604854583740234]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 4.0, 6.0, 10.0, 10.0, 14.0, 20.0, 32.0, 48.0, 54.0, 96.0, 148.0, 257.0, 413.0, 696.0, 1193.0, 2198.0, 4321.0, 9469.0, 22358.0, 58429.0, 147224.0, 283885.0, 278959.0, 142129.0, 56388.0, 21825.0, 9199.0, 4166.0, 2170.0, 1134.0, 656.0, 393.0, 235.0, 150.0, 91.0, 53.0, 33.0, 27.0, 15.0, 20.0, 7.0, 11.0, 6.0, 3.0, 1.0, 0.0, 2.0, 4.0], "bins": [-7.05859375, -6.87274169921875, -6.6868896484375, -6.50103759765625, -6.315185546875, -6.12933349609375, -5.9434814453125, -5.75762939453125, -5.57177734375, -5.38592529296875, -5.2000732421875, -5.01422119140625, -4.828369140625, -4.64251708984375, -4.4566650390625, -4.27081298828125, -4.0849609375, -3.89910888671875, -3.7132568359375, -3.52740478515625, -3.341552734375, -3.15570068359375, -2.9698486328125, -2.78399658203125, -2.59814453125, -2.41229248046875, -2.2264404296875, -2.04058837890625, -1.854736328125, -1.66888427734375, -1.4830322265625, -1.29718017578125, -1.111328125, -0.92547607421875, -0.7396240234375, -0.55377197265625, -0.367919921875, -0.18206787109375, 0.0037841796875, 0.18963623046875, 0.37548828125, 0.56134033203125, 0.7471923828125, 0.93304443359375, 1.118896484375, 1.30474853515625, 1.4906005859375, 1.67645263671875, 1.8623046875, 2.04815673828125, 2.2340087890625, 2.41986083984375, 2.605712890625, 2.79156494140625, 2.9774169921875, 3.16326904296875, 3.34912109375, 3.53497314453125, 3.7208251953125, 3.90667724609375, 4.092529296875, 4.27838134765625, 4.4642333984375, 4.65008544921875, 4.8359375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 12.0, 8.0, 5.0, 8.0, 14.0, 11.0, 26.0, 17.0, 29.0, 27.0, 35.0, 35.0, 37.0, 35.0, 47.0, 40.0, 51.0, 56.0, 38.0, 48.0, 49.0, 41.0, 36.0, 39.0, 36.0, 25.0, 25.0, 23.0, 26.0, 18.0, 21.0, 15.0, 9.0, 15.0, 9.0, 12.0, 3.0, 3.0, 7.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.482421875, -2.4034423828125, -2.324462890625, -2.2454833984375, -2.16650390625, -2.0875244140625, -2.008544921875, -1.9295654296875, -1.8505859375, -1.7716064453125, -1.692626953125, -1.6136474609375, -1.53466796875, -1.4556884765625, -1.376708984375, -1.2977294921875, -1.21875, -1.1397705078125, -1.060791015625, -0.9818115234375, -0.90283203125, -0.8238525390625, -0.744873046875, -0.6658935546875, -0.5869140625, -0.5079345703125, -0.428955078125, -0.3499755859375, -0.27099609375, -0.1920166015625, -0.113037109375, -0.0340576171875, 0.044921875, 0.1239013671875, 0.202880859375, 0.2818603515625, 0.36083984375, 0.4398193359375, 0.518798828125, 0.5977783203125, 0.6767578125, 0.7557373046875, 0.834716796875, 0.9136962890625, 0.99267578125, 1.0716552734375, 1.150634765625, 1.2296142578125, 1.30859375, 1.3875732421875, 1.466552734375, 1.5455322265625, 1.62451171875, 1.7034912109375, 1.782470703125, 1.8614501953125, 1.9404296875, 2.0194091796875, 2.098388671875, 2.1773681640625, 2.25634765625, 2.3353271484375, 2.414306640625, 2.4932861328125, 2.572265625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 5.0, 10.0, 16.0, 21.0, 24.0, 24.0, 43.0, 49.0, 88.0, 94.0, 158.0, 232.0, 270.0, 440.0, 602.0, 863.0, 1381.0, 3098.0, 12630.0, 134399.0, 760477.0, 115099.0, 11352.0, 2986.0, 1385.0, 865.0, 574.0, 385.0, 263.0, 219.0, 107.0, 94.0, 84.0, 65.0, 35.0, 27.0, 17.0, 18.0, 12.0, 6.0, 10.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.703125, -12.2569580078125, -11.810791015625, -11.3646240234375, -10.91845703125, -10.4722900390625, -10.026123046875, -9.5799560546875, -9.1337890625, -8.6876220703125, -8.241455078125, -7.7952880859375, -7.34912109375, -6.9029541015625, -6.456787109375, -6.0106201171875, -5.564453125, -5.1182861328125, -4.672119140625, -4.2259521484375, -3.77978515625, -3.3336181640625, -2.887451171875, -2.4412841796875, -1.9951171875, -1.5489501953125, -1.102783203125, -0.6566162109375, -0.21044921875, 0.2357177734375, 0.681884765625, 1.1280517578125, 1.57421875, 2.0203857421875, 2.466552734375, 2.9127197265625, 3.35888671875, 3.8050537109375, 4.251220703125, 4.6973876953125, 5.1435546875, 5.5897216796875, 6.035888671875, 6.4820556640625, 6.92822265625, 7.3743896484375, 7.820556640625, 8.2667236328125, 8.712890625, 9.1590576171875, 9.605224609375, 10.0513916015625, 10.49755859375, 10.9437255859375, 11.389892578125, 11.8360595703125, 12.2822265625, 12.7283935546875, 13.174560546875, 13.6207275390625, 14.06689453125, 14.5130615234375, 14.959228515625, 15.4053955078125, 15.8515625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 7.0, 5.0, 15.0, 14.0, 7.0, 13.0, 16.0, 23.0, 23.0, 39.0, 30.0, 29.0, 27.0, 31.0, 43.0, 45.0, 56.0, 45.0, 50.0, 52.0, 42.0, 45.0, 35.0, 34.0, 38.0, 33.0, 29.0, 31.0, 19.0, 19.0, 17.0, 16.0, 15.0, 18.0, 9.0, 8.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0], "bins": [-12.875, -12.5174560546875, -12.159912109375, -11.8023681640625, -11.44482421875, -11.0872802734375, -10.729736328125, -10.3721923828125, -10.0146484375, -9.6571044921875, -9.299560546875, -8.9420166015625, -8.58447265625, -8.2269287109375, -7.869384765625, -7.5118408203125, -7.154296875, -6.7967529296875, -6.439208984375, -6.0816650390625, -5.72412109375, -5.3665771484375, -5.009033203125, -4.6514892578125, -4.2939453125, -3.9364013671875, -3.578857421875, -3.2213134765625, -2.86376953125, -2.5062255859375, -2.148681640625, -1.7911376953125, -1.43359375, -1.0760498046875, -0.718505859375, -0.3609619140625, -0.00341796875, 0.3541259765625, 0.711669921875, 1.0692138671875, 1.4267578125, 1.7843017578125, 2.141845703125, 2.4993896484375, 2.85693359375, 3.2144775390625, 3.572021484375, 3.9295654296875, 4.287109375, 4.6446533203125, 5.002197265625, 5.3597412109375, 5.71728515625, 6.0748291015625, 6.432373046875, 6.7899169921875, 7.1474609375, 7.5050048828125, 7.862548828125, 8.2200927734375, 8.57763671875, 8.9351806640625, 9.292724609375, 9.6502685546875, 10.0078125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 7.0, 6.0, 15.0, 23.0, 35.0, 53.0, 86.0, 174.0, 351.0, 905.0, 3515.0, 54568.0, 955350.0, 29509.0, 2580.0, 720.0, 285.0, 169.0, 82.0, 41.0, 19.0, 20.0, 11.0, 11.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3828125, -13.8582763671875, -13.333740234375, -12.8092041015625, -12.28466796875, -11.7601318359375, -11.235595703125, -10.7110595703125, -10.1865234375, -9.6619873046875, -9.137451171875, -8.6129150390625, -8.08837890625, -7.5638427734375, -7.039306640625, -6.5147705078125, -5.990234375, -5.4656982421875, -4.941162109375, -4.4166259765625, -3.89208984375, -3.3675537109375, -2.843017578125, -2.3184814453125, -1.7939453125, -1.2694091796875, -0.744873046875, -0.2203369140625, 0.30419921875, 0.8287353515625, 1.353271484375, 1.8778076171875, 2.40234375, 2.9268798828125, 3.451416015625, 3.9759521484375, 4.50048828125, 5.0250244140625, 5.549560546875, 6.0740966796875, 6.5986328125, 7.1231689453125, 7.647705078125, 8.1722412109375, 8.69677734375, 9.2213134765625, 9.745849609375, 10.2703857421875, 10.794921875, 11.3194580078125, 11.843994140625, 12.3685302734375, 12.89306640625, 13.4176025390625, 13.942138671875, 14.4666748046875, 14.9912109375, 15.5157470703125, 16.040283203125, 16.5648193359375, 17.08935546875, 17.6138916015625, 18.138427734375, 18.6629638671875, 19.1875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 9.0, 13.0, 12.0, 25.0, 31.0, 52.0, 84.0, 105.0, 171.0, 154.0, 109.0, 77.0, 49.0, 47.0, 25.0, 14.0, 10.0, 3.0, 5.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010347366333007812, -0.0009977370500564575, -0.0009607374668121338, -0.0009237378835678101, -0.0008867383003234863, -0.0008497387170791626, -0.0008127391338348389, -0.0007757395505905151, -0.0007387399673461914, -0.0007017403841018677, -0.0006647408008575439, -0.0006277412176132202, -0.0005907416343688965, -0.0005537420511245728, -0.000516742467880249, -0.0004797428846359253, -0.00044274330139160156, -0.00040574371814727783, -0.0003687441349029541, -0.00033174455165863037, -0.00029474496841430664, -0.0002577453851699829, -0.00022074580192565918, -0.00018374621868133545, -0.00014674663543701172, -0.00010974705219268799, -7.274746894836426e-05, -3.574788570404053e-05, 1.2516975402832031e-06, 3.8251280784606934e-05, 7.525086402893066e-05, 0.0001122504472732544, 0.00014925003051757812, 0.00018624961376190186, 0.00022324919700622559, 0.0002602487802505493, 0.00029724836349487305, 0.0003342479467391968, 0.0003712475299835205, 0.00040824711322784424, 0.00044524669647216797, 0.0004822462797164917, 0.0005192458629608154, 0.0005562454462051392, 0.0005932450294494629, 0.0006302446126937866, 0.0006672441959381104, 0.0007042437791824341, 0.0007412433624267578, 0.0007782429456710815, 0.0008152425289154053, 0.000852242112159729, 0.0008892416954040527, 0.0009262412786483765, 0.0009632408618927002, 0.001000240445137024, 0.0010372400283813477, 0.0010742396116256714, 0.0011112391948699951, 0.0011482387781143188, 0.0011852383613586426, 0.0012222379446029663, 0.00125923752784729, 0.0012962371110916138, 0.0013332366943359375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 9.0, 23.0, 18.0, 27.0, 33.0, 71.0, 140.0, 273.0, 785.0, 2718.0, 31832.0, 976543.0, 31933.0, 2826.0, 745.0, 291.0, 118.0, 77.0, 39.0, 19.0, 11.0, 3.0, 9.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.421875, -25.71728515625, -25.0126953125, -24.30810546875, -23.603515625, -22.89892578125, -22.1943359375, -21.48974609375, -20.78515625, -20.08056640625, -19.3759765625, -18.67138671875, -17.966796875, -17.26220703125, -16.5576171875, -15.85302734375, -15.1484375, -14.44384765625, -13.7392578125, -13.03466796875, -12.330078125, -11.62548828125, -10.9208984375, -10.21630859375, -9.51171875, -8.80712890625, -8.1025390625, -7.39794921875, -6.693359375, -5.98876953125, -5.2841796875, -4.57958984375, -3.875, -3.17041015625, -2.4658203125, -1.76123046875, -1.056640625, -0.35205078125, 0.3525390625, 1.05712890625, 1.76171875, 2.46630859375, 3.1708984375, 3.87548828125, 4.580078125, 5.28466796875, 5.9892578125, 6.69384765625, 7.3984375, 8.10302734375, 8.8076171875, 9.51220703125, 10.216796875, 10.92138671875, 11.6259765625, 12.33056640625, 13.03515625, 13.73974609375, 14.4443359375, 15.14892578125, 15.853515625, 16.55810546875, 17.2626953125, 17.96728515625, 18.671875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 9.0, 26.0, 24.0, 33.0, 48.0, 82.0, 104.0, 160.0, 150.0, 112.0, 89.0, 57.0, 31.0, 20.0, 24.0, 10.0, 5.0, 7.0, 6.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0859375, -10.740234375, -10.39453125, -10.048828125, -9.703125, -9.357421875, -9.01171875, -8.666015625, -8.3203125, -7.974609375, -7.62890625, -7.283203125, -6.9375, -6.591796875, -6.24609375, -5.900390625, -5.5546875, -5.208984375, -4.86328125, -4.517578125, -4.171875, -3.826171875, -3.48046875, -3.134765625, -2.7890625, -2.443359375, -2.09765625, -1.751953125, -1.40625, -1.060546875, -0.71484375, -0.369140625, -0.0234375, 0.322265625, 0.66796875, 1.013671875, 1.359375, 1.705078125, 2.05078125, 2.396484375, 2.7421875, 3.087890625, 3.43359375, 3.779296875, 4.125, 4.470703125, 4.81640625, 5.162109375, 5.5078125, 5.853515625, 6.19921875, 6.544921875, 6.890625, 7.236328125, 7.58203125, 7.927734375, 8.2734375, 8.619140625, 8.96484375, 9.310546875, 9.65625, 10.001953125, 10.34765625, 10.693359375, 11.0390625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 11.0, 20.0, 56.0, 156.0, 271.0, 284.0, 130.0, 50.0, 15.0, 9.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.652587890625, -127.0541763305664, -121.45575714111328, -115.85734558105469, -110.25892639160156, -104.66051483154297, -99.06210327148438, -93.46368408203125, -87.86526489257812, -82.26685333251953, -76.6684341430664, -71.07002258300781, -65.47160339355469, -59.873191833496094, -54.274776458740234, -48.676361083984375, -43.07794952392578, -37.47953414916992, -31.881118774414062, -26.282705307006836, -20.684289932250977, -15.085874557495117, -9.48746109008789, -3.8890457153320312, 1.7093696594238281, 7.307784557342529, 12.90619945526123, 18.504613876342773, 24.103029251098633, 29.701444625854492, 35.29985809326172, 40.89827346801758, 46.49668884277344, 52.0951042175293, 57.693519592285156, 63.29193115234375, 68.89035034179688, 74.48876190185547, 80.08717346191406, 85.68559265136719, 91.28401184082031, 96.8824234008789, 102.48084259033203, 108.07925415039062, 113.67767333984375, 119.27608489990234, 124.87449645996094, 130.47291564941406, 136.07131958007812, 141.66973876953125, 147.2681427001953, 152.86656188964844, 158.46498107910156, 164.0634002685547, 169.66180419921875, 175.26022338867188, 180.858642578125, 186.45706176757812, 192.0554656982422, 197.6538848876953, 203.25230407714844, 208.85072326660156, 214.44912719726562, 220.04754638671875, 225.64596557617188]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 11.0, 8.0, 7.0, 5.0, 17.0, 18.0, 15.0, 28.0, 36.0, 27.0, 33.0, 41.0, 42.0, 47.0, 53.0, 45.0, 41.0, 50.0, 41.0, 34.0, 45.0, 43.0, 40.0, 43.0, 24.0, 36.0, 32.0, 26.0, 24.0, 10.0, 20.0, 14.0, 11.0, 11.0, 3.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.297813415527344, -55.48482131958008, -53.67182922363281, -51.85883712768555, -50.04584503173828, -48.232852935791016, -46.41986083984375, -44.606868743896484, -42.79387664794922, -40.98088455200195, -39.16789245605469, -37.35490036010742, -35.541908264160156, -33.72891616821289, -31.915924072265625, -30.10293197631836, -28.28993797302246, -26.476945877075195, -24.66395378112793, -22.850961685180664, -21.0379695892334, -19.2249755859375, -17.411983489990234, -15.598992347717285, -13.78600025177002, -11.973008155822754, -10.160016059875488, -8.347023010253906, -6.534031391143799, -4.721038818359375, -2.9080467224121094, -1.0950546264648438, 0.7179374694824219, 2.5309295654296875, 4.343921661376953, 6.156914234161377, 7.969906330108643, 9.782898902893066, 11.595890998840332, 13.408883094787598, 15.221875190734863, 17.034868240356445, 18.84786033630371, 20.660852432250977, 22.473844528198242, 24.286836624145508, 26.099828720092773, 27.91282081604004, 29.725812911987305, 31.53880500793457, 33.35179901123047, 35.164791107177734, 36.977783203125, 38.790775299072266, 40.60376739501953, 42.4167594909668, 44.22975158691406, 46.04274368286133, 47.855735778808594, 49.66872787475586, 51.481719970703125, 53.29471206665039, 55.107704162597656, 56.92069625854492, 58.73368835449219]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 2.0, 3.0, 4.0, 9.0, 9.0, 14.0, 23.0, 49.0, 60.0, 105.0, 166.0, 249.0, 396.0, 716.0, 1306.0, 2677.0, 8370.0, 47398.0, 4059162.0, 58008.0, 9372.0, 2933.0, 1309.0, 788.0, 443.0, 275.0, 175.0, 86.0, 64.0, 33.0, 22.0, 21.0, 10.0, 9.0, 8.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.71875, -18.16064453125, -17.6025390625, -17.04443359375, -16.486328125, -15.92822265625, -15.3701171875, -14.81201171875, -14.25390625, -13.69580078125, -13.1376953125, -12.57958984375, -12.021484375, -11.46337890625, -10.9052734375, -10.34716796875, -9.7890625, -9.23095703125, -8.6728515625, -8.11474609375, -7.556640625, -6.99853515625, -6.4404296875, -5.88232421875, -5.32421875, -4.76611328125, -4.2080078125, -3.64990234375, -3.091796875, -2.53369140625, -1.9755859375, -1.41748046875, -0.859375, -0.30126953125, 0.2568359375, 0.81494140625, 1.373046875, 1.93115234375, 2.4892578125, 3.04736328125, 3.60546875, 4.16357421875, 4.7216796875, 5.27978515625, 5.837890625, 6.39599609375, 6.9541015625, 7.51220703125, 8.0703125, 8.62841796875, 9.1865234375, 9.74462890625, 10.302734375, 10.86083984375, 11.4189453125, 11.97705078125, 12.53515625, 13.09326171875, 13.6513671875, 14.20947265625, 14.767578125, 15.32568359375, 15.8837890625, 16.44189453125, 17.0]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 8.0, 4.0, 9.0, 13.0, 8.0, 22.0, 30.0, 31.0, 36.0, 46.0, 34.0, 53.0, 49.0, 54.0, 63.0, 58.0, 51.0, 56.0, 51.0, 49.0, 43.0, 33.0, 40.0, 30.0, 22.0, 18.0, 21.0, 8.0, 15.0, 9.0, 10.0, 5.0, 1.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.892578125, -2.79168701171875, -2.6907958984375, -2.58990478515625, -2.489013671875, -2.38812255859375, -2.2872314453125, -2.18634033203125, -2.08544921875, -1.98455810546875, -1.8836669921875, -1.78277587890625, -1.681884765625, -1.58099365234375, -1.4801025390625, -1.37921142578125, -1.2783203125, -1.17742919921875, -1.0765380859375, -0.97564697265625, -0.874755859375, -0.77386474609375, -0.6729736328125, -0.57208251953125, -0.47119140625, -0.37030029296875, -0.2694091796875, -0.16851806640625, -0.067626953125, 0.03326416015625, 0.1341552734375, 0.23504638671875, 0.3359375, 0.43682861328125, 0.5377197265625, 0.63861083984375, 0.739501953125, 0.84039306640625, 0.9412841796875, 1.04217529296875, 1.14306640625, 1.24395751953125, 1.3448486328125, 1.44573974609375, 1.546630859375, 1.64752197265625, 1.7484130859375, 1.84930419921875, 1.9501953125, 2.05108642578125, 2.1519775390625, 2.25286865234375, 2.353759765625, 2.45465087890625, 2.5555419921875, 2.65643310546875, 2.75732421875, 2.85821533203125, 2.9591064453125, 3.05999755859375, 3.160888671875, 3.26177978515625, 3.3626708984375, 3.46356201171875, 3.564453125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 4.0, 0.0, 6.0, 4.0, 3.0, 7.0, 6.0, 1.0, 8.0, 8.0, 5.0, 9.0, 12.0, 14.0, 18.0, 17.0, 32.0, 26.0, 43.0, 39.0, 69.0, 96.0, 147.0, 249.0, 520.0, 1158.0, 3204.0, 12547.0, 325323.0, 3828703.0, 15692.0, 3619.0, 1244.0, 575.0, 273.0, 150.0, 115.0, 74.0, 54.0, 32.0, 26.0, 23.0, 19.0, 19.0, 17.0, 15.0, 13.0, 11.0, 5.0, 12.0, 9.0, 3.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.609375, -19.966552734375, -19.32373046875, -18.680908203125, -18.0380859375, -17.395263671875, -16.75244140625, -16.109619140625, -15.466796875, -14.823974609375, -14.18115234375, -13.538330078125, -12.8955078125, -12.252685546875, -11.60986328125, -10.967041015625, -10.32421875, -9.681396484375, -9.03857421875, -8.395751953125, -7.7529296875, -7.110107421875, -6.46728515625, -5.824462890625, -5.181640625, -4.538818359375, -3.89599609375, -3.253173828125, -2.6103515625, -1.967529296875, -1.32470703125, -0.681884765625, -0.0390625, 0.603759765625, 1.24658203125, 1.889404296875, 2.5322265625, 3.175048828125, 3.81787109375, 4.460693359375, 5.103515625, 5.746337890625, 6.38916015625, 7.031982421875, 7.6748046875, 8.317626953125, 8.96044921875, 9.603271484375, 10.24609375, 10.888916015625, 11.53173828125, 12.174560546875, 12.8173828125, 13.460205078125, 14.10302734375, 14.745849609375, 15.388671875, 16.031494140625, 16.67431640625, 17.317138671875, 17.9599609375, 18.602783203125, 19.24560546875, 19.888427734375, 20.53125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 10.0, 23.0, 50.0, 197.0, 3541.0, 165.0, 40.0, 22.0, 8.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.263671875, -3.111541748046875, -2.95941162109375, -2.807281494140625, -2.6551513671875, -2.503021240234375, -2.35089111328125, -2.198760986328125, -2.046630859375, -1.894500732421875, -1.74237060546875, -1.590240478515625, -1.4381103515625, -1.285980224609375, -1.13385009765625, -0.981719970703125, -0.82958984375, -0.677459716796875, -0.52532958984375, -0.373199462890625, -0.2210693359375, -0.068939208984375, 0.08319091796875, 0.235321044921875, 0.387451171875, 0.539581298828125, 0.69171142578125, 0.843841552734375, 0.9959716796875, 1.148101806640625, 1.30023193359375, 1.452362060546875, 1.6044921875, 1.756622314453125, 1.90875244140625, 2.060882568359375, 2.2130126953125, 2.365142822265625, 2.51727294921875, 2.669403076171875, 2.821533203125, 2.973663330078125, 3.12579345703125, 3.277923583984375, 3.4300537109375, 3.582183837890625, 3.73431396484375, 3.886444091796875, 4.03857421875, 4.190704345703125, 4.34283447265625, 4.494964599609375, 4.6470947265625, 4.799224853515625, 4.95135498046875, 5.103485107421875, 5.255615234375, 5.407745361328125, 5.55987548828125, 5.712005615234375, 5.8641357421875, 6.016265869140625, 6.16839599609375, 6.320526123046875, 6.47265625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 8.0, 8.0, 8.0, 33.0, 57.0, 83.0, 126.0, 144.0, 148.0, 146.0, 95.0, 57.0, 39.0, 22.0, 15.0, 7.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.874612808227539, -15.409102439880371, -14.943591117858887, -14.478080749511719, -14.012569427490234, -13.547059059143066, -13.081548690795898, -12.616037368774414, -12.15052604675293, -11.685015678405762, -11.219504356384277, -10.75399398803711, -10.288482666015625, -9.822972297668457, -9.357461929321289, -8.891950607299805, -8.426440238952637, -7.9609293937683105, -7.495418548583984, -7.029908180236816, -6.564396858215332, -6.098886489868164, -5.633375644683838, -5.167864799499512, -4.7023539543151855, -4.236843109130859, -3.771332263946533, -3.305821657180786, -2.84031081199646, -2.374799966812134, -1.9092893600463867, -1.4437785148620605, -0.978266716003418, -0.5127559304237366, -0.047245144844055176, 0.41826558113098145, 0.8837764263153076, 1.3492872714996338, 1.8147978782653809, 2.280308723449707, 2.745819568634033, 3.2113304138183594, 3.6768412590026855, 4.142352104187012, 4.60786247253418, 5.073373794555664, 5.538884162902832, 6.004395008087158, 6.469905853271484, 6.9354166984558105, 7.400927543640137, 7.866437911987305, 8.331949234008789, 8.797459602355957, 9.262969970703125, 9.72848129272461, 10.193992614746094, 10.659502983093262, 11.125014305114746, 11.590524673461914, 12.056035995483398, 12.521546363830566, 12.987056732177734, 13.452568054199219, 13.918078422546387]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 9.0, 5.0, 12.0, 9.0, 10.0, 17.0, 16.0, 13.0, 26.0, 28.0, 31.0, 22.0, 35.0, 35.0, 35.0, 49.0, 35.0, 29.0, 39.0, 45.0, 40.0, 38.0, 27.0, 44.0, 36.0, 35.0, 22.0, 26.0, 38.0, 30.0, 28.0, 30.0, 12.0, 19.0, 14.0, 10.0, 7.0, 8.0, 6.0, 9.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-5.357210159301758, -5.199270248413086, -5.041330337524414, -4.8833909034729, -4.7254509925842285, -4.567511081695557, -4.409571647644043, -4.251631736755371, -4.093691825866699, -3.9357519149780273, -3.7778122425079346, -3.619872570037842, -3.46193265914917, -3.303992748260498, -3.1460530757904053, -2.9881134033203125, -2.8301734924316406, -2.6722335815429688, -2.514293909072876, -2.356354236602783, -2.1984143257141113, -2.0404744148254395, -1.8825347423553467, -1.7245949506759644, -1.566655158996582, -1.4087153673171997, -1.2507755756378174, -1.092835783958435, -0.9348959922790527, -0.7769562005996704, -0.6190164089202881, -0.46107661724090576, -0.30313634872436523, -0.1451965570449829, 0.012743234634399414, 0.17068302631378174, 0.32862281799316406, 0.4865626096725464, 0.6445024013519287, 0.802442193031311, 0.9603819847106934, 1.1183217763900757, 1.276261568069458, 1.4342013597488403, 1.5921411514282227, 1.750080943107605, 1.9080207347869873, 2.06596040725708, 2.223900318145752, 2.381840229034424, 2.5397799015045166, 2.6977195739746094, 2.8556594848632812, 3.013599395751953, 3.171539068222046, 3.3294787406921387, 3.4874186515808105, 3.6453585624694824, 3.803298234939575, 3.961237907409668, 4.11917781829834, 4.277117729187012, 4.435057640075684, 4.592997074127197, 4.750936985015869]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 11.0, 13.0, 20.0, 19.0, 20.0, 42.0, 75.0, 118.0, 191.0, 377.0, 735.0, 1694.0, 4536.0, 14710.0, 57599.0, 242718.0, 490131.0, 176305.0, 41805.0, 11161.0, 3546.0, 1328.0, 649.0, 318.0, 168.0, 82.0, 73.0, 29.0, 20.0, 23.0, 11.0, 8.0, 2.0, 3.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6171875, -9.34539794921875, -9.0736083984375, -8.80181884765625, -8.530029296875, -8.25823974609375, -7.9864501953125, -7.71466064453125, -7.44287109375, -7.17108154296875, -6.8992919921875, -6.62750244140625, -6.355712890625, -6.08392333984375, -5.8121337890625, -5.54034423828125, -5.2685546875, -4.99676513671875, -4.7249755859375, -4.45318603515625, -4.181396484375, -3.90960693359375, -3.6378173828125, -3.36602783203125, -3.09423828125, -2.82244873046875, -2.5506591796875, -2.27886962890625, -2.007080078125, -1.73529052734375, -1.4635009765625, -1.19171142578125, -0.919921875, -0.64813232421875, -0.3763427734375, -0.10455322265625, 0.167236328125, 0.43902587890625, 0.7108154296875, 0.98260498046875, 1.25439453125, 1.52618408203125, 1.7979736328125, 2.06976318359375, 2.341552734375, 2.61334228515625, 2.8851318359375, 3.15692138671875, 3.4287109375, 3.70050048828125, 3.9722900390625, 4.24407958984375, 4.515869140625, 4.78765869140625, 5.0594482421875, 5.33123779296875, 5.60302734375, 5.87481689453125, 6.1466064453125, 6.41839599609375, 6.690185546875, 6.96197509765625, 7.2337646484375, 7.50555419921875, 7.77734375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 7.0, 3.0, 7.0, 9.0, 9.0, 14.0, 17.0, 28.0, 32.0, 39.0, 38.0, 36.0, 48.0, 43.0, 52.0, 51.0, 59.0, 64.0, 59.0, 49.0, 52.0, 42.0, 43.0, 36.0, 34.0, 33.0, 19.0, 12.0, 14.0, 10.0, 13.0, 11.0, 6.0, 6.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.203125, -3.096527099609375, -2.98992919921875, -2.883331298828125, -2.7767333984375, -2.670135498046875, -2.56353759765625, -2.456939697265625, -2.350341796875, -2.243743896484375, -2.13714599609375, -2.030548095703125, -1.9239501953125, -1.817352294921875, -1.71075439453125, -1.604156494140625, -1.49755859375, -1.390960693359375, -1.28436279296875, -1.177764892578125, -1.0711669921875, -0.964569091796875, -0.85797119140625, -0.751373291015625, -0.644775390625, -0.538177490234375, -0.43157958984375, -0.324981689453125, -0.2183837890625, -0.111785888671875, -0.00518798828125, 0.101409912109375, 0.2080078125, 0.314605712890625, 0.42120361328125, 0.527801513671875, 0.6343994140625, 0.740997314453125, 0.84759521484375, 0.954193115234375, 1.060791015625, 1.167388916015625, 1.27398681640625, 1.380584716796875, 1.4871826171875, 1.593780517578125, 1.70037841796875, 1.806976318359375, 1.91357421875, 2.020172119140625, 2.12677001953125, 2.233367919921875, 2.3399658203125, 2.446563720703125, 2.55316162109375, 2.659759521484375, 2.766357421875, 2.872955322265625, 2.97955322265625, 3.086151123046875, 3.1927490234375, 3.299346923828125, 3.40594482421875, 3.512542724609375, 3.619140625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 4.0, 10.0, 19.0, 36.0, 57.0, 94.0, 170.0, 346.0, 637.0, 1643.0, 9568.0, 765231.0, 262785.0, 5484.0, 1329.0, 538.0, 255.0, 145.0, 68.0, 42.0, 38.0, 16.0, 10.0, 8.0, 7.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.375, -26.458984375, -25.54296875, -24.626953125, -23.7109375, -22.794921875, -21.87890625, -20.962890625, -20.046875, -19.130859375, -18.21484375, -17.298828125, -16.3828125, -15.466796875, -14.55078125, -13.634765625, -12.71875, -11.802734375, -10.88671875, -9.970703125, -9.0546875, -8.138671875, -7.22265625, -6.306640625, -5.390625, -4.474609375, -3.55859375, -2.642578125, -1.7265625, -0.810546875, 0.10546875, 1.021484375, 1.9375, 2.853515625, 3.76953125, 4.685546875, 5.6015625, 6.517578125, 7.43359375, 8.349609375, 9.265625, 10.181640625, 11.09765625, 12.013671875, 12.9296875, 13.845703125, 14.76171875, 15.677734375, 16.59375, 17.509765625, 18.42578125, 19.341796875, 20.2578125, 21.173828125, 22.08984375, 23.005859375, 23.921875, 24.837890625, 25.75390625, 26.669921875, 27.5859375, 28.501953125, 29.41796875, 30.333984375, 31.25]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 9.0, 15.0, 25.0, 23.0, 29.0, 43.0, 43.0, 58.0, 72.0, 83.0, 93.0, 67.0, 66.0, 66.0, 53.0, 47.0, 45.0, 34.0, 31.0, 28.0, 15.0, 16.0, 5.0, 13.0, 8.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.625, -18.95068359375, -18.2763671875, -17.60205078125, -16.927734375, -16.25341796875, -15.5791015625, -14.90478515625, -14.23046875, -13.55615234375, -12.8818359375, -12.20751953125, -11.533203125, -10.85888671875, -10.1845703125, -9.51025390625, -8.8359375, -8.16162109375, -7.4873046875, -6.81298828125, -6.138671875, -5.46435546875, -4.7900390625, -4.11572265625, -3.44140625, -2.76708984375, -2.0927734375, -1.41845703125, -0.744140625, -0.06982421875, 0.6044921875, 1.27880859375, 1.953125, 2.62744140625, 3.3017578125, 3.97607421875, 4.650390625, 5.32470703125, 5.9990234375, 6.67333984375, 7.34765625, 8.02197265625, 8.6962890625, 9.37060546875, 10.044921875, 10.71923828125, 11.3935546875, 12.06787109375, 12.7421875, 13.41650390625, 14.0908203125, 14.76513671875, 15.439453125, 16.11376953125, 16.7880859375, 17.46240234375, 18.13671875, 18.81103515625, 19.4853515625, 20.15966796875, 20.833984375, 21.50830078125, 22.1826171875, 22.85693359375, 23.53125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 3.0, 1.0, 3.0, 9.0, 7.0, 8.0, 10.0, 13.0, 26.0, 31.0, 42.0, 75.0, 104.0, 194.0, 388.0, 986.0, 3880.0, 36743.0, 941442.0, 57802.0, 4540.0, 1224.0, 440.0, 212.0, 140.0, 82.0, 48.0, 28.0, 21.0, 17.0, 7.0, 11.0, 3.0, 6.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9140625, -12.5048828125, -12.095703125, -11.6865234375, -11.27734375, -10.8681640625, -10.458984375, -10.0498046875, -9.640625, -9.2314453125, -8.822265625, -8.4130859375, -8.00390625, -7.5947265625, -7.185546875, -6.7763671875, -6.3671875, -5.9580078125, -5.548828125, -5.1396484375, -4.73046875, -4.3212890625, -3.912109375, -3.5029296875, -3.09375, -2.6845703125, -2.275390625, -1.8662109375, -1.45703125, -1.0478515625, -0.638671875, -0.2294921875, 0.1796875, 0.5888671875, 0.998046875, 1.4072265625, 1.81640625, 2.2255859375, 2.634765625, 3.0439453125, 3.453125, 3.8623046875, 4.271484375, 4.6806640625, 5.08984375, 5.4990234375, 5.908203125, 6.3173828125, 6.7265625, 7.1357421875, 7.544921875, 7.9541015625, 8.36328125, 8.7724609375, 9.181640625, 9.5908203125, 10.0, 10.4091796875, 10.818359375, 11.2275390625, 11.63671875, 12.0458984375, 12.455078125, 12.8642578125, 13.2734375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 4.0, 16.0, 16.0, 20.0, 46.0, 62.0, 117.0, 179.0, 253.0, 108.0, 60.0, 39.0, 30.0, 12.0, 18.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014667510986328125, -0.0014225691556930542, -0.001378387212753296, -0.0013342052698135376, -0.0012900233268737793, -0.001245841383934021, -0.0012016594409942627, -0.0011574774980545044, -0.001113295555114746, -0.0010691136121749878, -0.0010249316692352295, -0.0009807497262954712, -0.0009365677833557129, -0.0008923858404159546, -0.0008482038974761963, -0.000804021954536438, -0.0007598400115966797, -0.0007156580686569214, -0.0006714761257171631, -0.0006272941827774048, -0.0005831122398376465, -0.0005389302968978882, -0.0004947483539581299, -0.0004505664110183716, -0.0004063844680786133, -0.000362202525138855, -0.0003180205821990967, -0.0002738386392593384, -0.00022965669631958008, -0.00018547475337982178, -0.00014129281044006348, -9.711086750030518e-05, -5.2928924560546875e-05, -8.746981620788574e-06, 3.5434961318969727e-05, 7.961690425872803e-05, 0.00012379884719848633, 0.00016798079013824463, 0.00021216273307800293, 0.00025634467601776123, 0.00030052661895751953, 0.00034470856189727783, 0.00038889050483703613, 0.00043307244777679443, 0.00047725439071655273, 0.000521436333656311, 0.0005656182765960693, 0.0006098002195358276, 0.0006539821624755859, 0.0006981641054153442, 0.0007423460483551025, 0.0007865279912948608, 0.0008307099342346191, 0.0008748918771743774, 0.0009190738201141357, 0.000963255763053894, 0.0010074377059936523, 0.0010516196489334106, 0.001095801591873169, 0.0011399835348129272, 0.0011841654777526855, 0.0012283474206924438, 0.0012725293636322021, 0.0013167113065719604, 0.0013608932495117188]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 11.0, 11.0, 9.0, 17.0, 32.0, 50.0, 78.0, 119.0, 197.0, 349.0, 792.0, 1661.0, 5023.0, 28470.0, 630954.0, 353961.0, 19842.0, 3993.0, 1450.0, 695.0, 335.0, 183.0, 89.0, 73.0, 49.0, 36.0, 15.0, 11.0, 10.0, 13.0, 6.0, 2.0, 6.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4140625, -8.1014404296875, -7.788818359375, -7.4761962890625, -7.16357421875, -6.8509521484375, -6.538330078125, -6.2257080078125, -5.9130859375, -5.6004638671875, -5.287841796875, -4.9752197265625, -4.66259765625, -4.3499755859375, -4.037353515625, -3.7247314453125, -3.412109375, -3.0994873046875, -2.786865234375, -2.4742431640625, -2.16162109375, -1.8489990234375, -1.536376953125, -1.2237548828125, -0.9111328125, -0.5985107421875, -0.285888671875, 0.0267333984375, 0.33935546875, 0.6519775390625, 0.964599609375, 1.2772216796875, 1.58984375, 1.9024658203125, 2.215087890625, 2.5277099609375, 2.84033203125, 3.1529541015625, 3.465576171875, 3.7781982421875, 4.0908203125, 4.4034423828125, 4.716064453125, 5.0286865234375, 5.34130859375, 5.6539306640625, 5.966552734375, 6.2791748046875, 6.591796875, 6.9044189453125, 7.217041015625, 7.5296630859375, 7.84228515625, 8.1549072265625, 8.467529296875, 8.7801513671875, 9.0927734375, 9.4053955078125, 9.718017578125, 10.0306396484375, 10.34326171875, 10.6558837890625, 10.968505859375, 11.2811279296875, 11.59375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 0.0, 4.0, 3.0, 5.0, 12.0, 11.0, 15.0, 19.0, 28.0, 51.0, 62.0, 98.0, 140.0, 150.0, 102.0, 75.0, 64.0, 48.0, 26.0, 26.0, 21.0, 9.0, 7.0, 4.0, 3.0, 1.0, 4.0, 0.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7890625, -6.528564453125, -6.26806640625, -6.007568359375, -5.7470703125, -5.486572265625, -5.22607421875, -4.965576171875, -4.705078125, -4.444580078125, -4.18408203125, -3.923583984375, -3.6630859375, -3.402587890625, -3.14208984375, -2.881591796875, -2.62109375, -2.360595703125, -2.10009765625, -1.839599609375, -1.5791015625, -1.318603515625, -1.05810546875, -0.797607421875, -0.537109375, -0.276611328125, -0.01611328125, 0.244384765625, 0.5048828125, 0.765380859375, 1.02587890625, 1.286376953125, 1.546875, 1.807373046875, 2.06787109375, 2.328369140625, 2.5888671875, 2.849365234375, 3.10986328125, 3.370361328125, 3.630859375, 3.891357421875, 4.15185546875, 4.412353515625, 4.6728515625, 4.933349609375, 5.19384765625, 5.454345703125, 5.71484375, 5.975341796875, 6.23583984375, 6.496337890625, 6.7568359375, 7.017333984375, 7.27783203125, 7.538330078125, 7.798828125, 8.059326171875, 8.31982421875, 8.580322265625, 8.8408203125, 9.101318359375, 9.36181640625, 9.622314453125, 9.8828125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 11.0, 50.0, 152.0, 286.0, 291.0, 141.0, 44.0, 13.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.44915771484375, -137.2250213623047, -131.00086975097656, -124.77672576904297, -118.55258178710938, -112.32843780517578, -106.10429382324219, -99.88015747070312, -93.656005859375, -87.4318618774414, -81.20771789550781, -74.98357391357422, -68.75942993164062, -62.53528594970703, -56.3111457824707, -50.08700180053711, -43.86286163330078, -37.63871765136719, -31.414573669433594, -25.190431594848633, -18.96628761291504, -12.742143630981445, -6.518001556396484, -0.2938575744628906, 5.930286407470703, 12.154430389404297, 18.37857437133789, 24.60271644592285, 30.826860427856445, 37.051002502441406, 43.275146484375, 49.499290466308594, 55.72343444824219, 61.94757843017578, 68.17172241210938, 74.39586639404297, 80.62001037597656, 86.84415435791016, 93.06829833984375, 99.29243469238281, 105.51658630371094, 111.74073028564453, 117.96487426757812, 124.18901824951172, 130.4131622314453, 136.63729858398438, 142.8614501953125, 149.08558654785156, 155.30972290039062, 161.5338592529297, 167.7580108642578, 173.98214721679688, 180.206298828125, 186.43043518066406, 192.6545867919922, 198.87872314453125, 205.10287475585938, 211.32701110839844, 217.55116271972656, 223.77529907226562, 229.99945068359375, 236.2235870361328, 242.44773864746094, 248.671875, 254.89602661132812]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 4.0, 8.0, 11.0, 10.0, 13.0, 11.0, 14.0, 14.0, 33.0, 24.0, 30.0, 30.0, 56.0, 40.0, 43.0, 52.0, 43.0, 53.0, 62.0, 39.0, 53.0, 38.0, 47.0, 33.0, 34.0, 31.0, 30.0, 17.0, 21.0, 28.0, 16.0, 12.0, 13.0, 11.0, 6.0, 7.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.47263717651367, -61.5108757019043, -59.54911422729492, -57.58735275268555, -55.62559127807617, -53.6638298034668, -51.70207214355469, -49.74031066894531, -47.77854919433594, -45.81678771972656, -43.85502624511719, -41.89326477050781, -39.93150329589844, -37.96974182128906, -36.00798034667969, -34.04621887207031, -32.08445739746094, -30.122695922851562, -28.160934448242188, -26.199172973632812, -24.237411499023438, -22.275650024414062, -20.31389045715332, -18.352128982543945, -16.39036750793457, -14.428606033325195, -12.46684455871582, -10.505084037780762, -8.543322563171387, -6.581561088562012, -4.619800567626953, -2.658039093017578, -0.6962776184082031, 1.2654836177825928, 3.2272448539733887, 5.1890058517456055, 7.1507673263549805, 9.112528800964355, 11.074289321899414, 13.036050796508789, 14.997812271118164, 16.95957374572754, 18.921335220336914, 20.883094787597656, 22.84485626220703, 24.806617736816406, 26.76837921142578, 28.730140686035156, 30.69190216064453, 32.653663635253906, 34.61542510986328, 36.577186584472656, 38.53894805908203, 40.500709533691406, 42.46247100830078, 44.424232482910156, 46.38599395751953, 48.347755432128906, 50.30951690673828, 52.271278381347656, 54.23303985595703, 56.194801330566406, 58.15656280517578, 60.118324279785156, 62.080081939697266]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 4.0, 9.0, 8.0, 11.0, 15.0, 14.0, 40.0, 48.0, 57.0, 114.0, 163.0, 233.0, 388.0, 530.0, 975.0, 1627.0, 2937.0, 6700.0, 21905.0, 185031.0, 3892474.0, 58408.0, 12267.0, 4694.0, 2329.0, 1197.0, 765.0, 446.0, 288.0, 185.0, 125.0, 85.0, 68.0, 37.0, 32.0, 22.0, 11.0, 10.0, 9.0, 7.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.09375, -11.7071533203125, -11.320556640625, -10.9339599609375, -10.54736328125, -10.1607666015625, -9.774169921875, -9.3875732421875, -9.0009765625, -8.6143798828125, -8.227783203125, -7.8411865234375, -7.45458984375, -7.0679931640625, -6.681396484375, -6.2947998046875, -5.908203125, -5.5216064453125, -5.135009765625, -4.7484130859375, -4.36181640625, -3.9752197265625, -3.588623046875, -3.2020263671875, -2.8154296875, -2.4288330078125, -2.042236328125, -1.6556396484375, -1.26904296875, -0.8824462890625, -0.495849609375, -0.1092529296875, 0.27734375, 0.6639404296875, 1.050537109375, 1.4371337890625, 1.82373046875, 2.2103271484375, 2.596923828125, 2.9835205078125, 3.3701171875, 3.7567138671875, 4.143310546875, 4.5299072265625, 4.91650390625, 5.3031005859375, 5.689697265625, 6.0762939453125, 6.462890625, 6.8494873046875, 7.236083984375, 7.6226806640625, 8.00927734375, 8.3958740234375, 8.782470703125, 9.1690673828125, 9.5556640625, 9.9422607421875, 10.328857421875, 10.7154541015625, 11.10205078125, 11.4886474609375, 11.875244140625, 12.2618408203125, 12.6484375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 3.0, 6.0, 7.0, 12.0, 8.0, 15.0, 23.0, 19.0, 21.0, 34.0, 30.0, 41.0, 46.0, 37.0, 52.0, 70.0, 65.0, 59.0, 64.0, 43.0, 50.0, 38.0, 35.0, 43.0, 37.0, 33.0, 20.0, 21.0, 15.0, 13.0, 9.0, 9.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.23046875, -3.129852294921875, -3.02923583984375, -2.928619384765625, -2.8280029296875, -2.727386474609375, -2.62677001953125, -2.526153564453125, -2.425537109375, -2.324920654296875, -2.22430419921875, -2.123687744140625, -2.0230712890625, -1.922454833984375, -1.82183837890625, -1.721221923828125, -1.62060546875, -1.519989013671875, -1.41937255859375, -1.318756103515625, -1.2181396484375, -1.117523193359375, -1.01690673828125, -0.916290283203125, -0.815673828125, -0.715057373046875, -0.61444091796875, -0.513824462890625, -0.4132080078125, -0.312591552734375, -0.21197509765625, -0.111358642578125, -0.0107421875, 0.089874267578125, 0.19049072265625, 0.291107177734375, 0.3917236328125, 0.492340087890625, 0.59295654296875, 0.693572998046875, 0.794189453125, 0.894805908203125, 0.99542236328125, 1.096038818359375, 1.1966552734375, 1.297271728515625, 1.39788818359375, 1.498504638671875, 1.59912109375, 1.699737548828125, 1.80035400390625, 1.900970458984375, 2.0015869140625, 2.102203369140625, 2.20281982421875, 2.303436279296875, 2.404052734375, 2.504669189453125, 2.60528564453125, 2.705902099609375, 2.8065185546875, 2.907135009765625, 3.00775146484375, 3.108367919921875, 3.208984375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 5.0, 4.0, 8.0, 6.0, 12.0, 8.0, 15.0, 12.0, 16.0, 28.0, 26.0, 29.0, 69.0, 99.0, 182.0, 291.0, 648.0, 1394.0, 4048.0, 17027.0, 327715.0, 3807366.0, 26360.0, 5418.0, 1801.0, 760.0, 366.0, 198.0, 102.0, 64.0, 56.0, 31.0, 20.0, 13.0, 15.0, 11.0, 8.0, 9.0, 17.0, 5.0, 6.0, 3.0, 3.0, 7.0, 5.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.078125, -18.5499267578125, -18.021728515625, -17.4935302734375, -16.96533203125, -16.4371337890625, -15.908935546875, -15.3807373046875, -14.8525390625, -14.3243408203125, -13.796142578125, -13.2679443359375, -12.73974609375, -12.2115478515625, -11.683349609375, -11.1551513671875, -10.626953125, -10.0987548828125, -9.570556640625, -9.0423583984375, -8.51416015625, -7.9859619140625, -7.457763671875, -6.9295654296875, -6.4013671875, -5.8731689453125, -5.344970703125, -4.8167724609375, -4.28857421875, -3.7603759765625, -3.232177734375, -2.7039794921875, -2.17578125, -1.6475830078125, -1.119384765625, -0.5911865234375, -0.06298828125, 0.4652099609375, 0.993408203125, 1.5216064453125, 2.0498046875, 2.5780029296875, 3.106201171875, 3.6343994140625, 4.16259765625, 4.6907958984375, 5.218994140625, 5.7471923828125, 6.275390625, 6.8035888671875, 7.331787109375, 7.8599853515625, 8.38818359375, 8.9163818359375, 9.444580078125, 9.9727783203125, 10.5009765625, 11.0291748046875, 11.557373046875, 12.0855712890625, 12.61376953125, 13.1419677734375, 13.670166015625, 14.1983642578125, 14.7265625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 7.0, 11.0, 19.0, 38.0, 85.0, 273.0, 3154.0, 313.0, 89.0, 26.0, 19.0, 11.0, 10.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.91015625, -4.70159912109375, -4.4930419921875, -4.28448486328125, -4.075927734375, -3.86737060546875, -3.6588134765625, -3.45025634765625, -3.24169921875, -3.03314208984375, -2.8245849609375, -2.61602783203125, -2.407470703125, -2.19891357421875, -1.9903564453125, -1.78179931640625, -1.5732421875, -1.36468505859375, -1.1561279296875, -0.94757080078125, -0.739013671875, -0.53045654296875, -0.3218994140625, -0.11334228515625, 0.09521484375, 0.30377197265625, 0.5123291015625, 0.72088623046875, 0.929443359375, 1.13800048828125, 1.3465576171875, 1.55511474609375, 1.763671875, 1.97222900390625, 2.1807861328125, 2.38934326171875, 2.597900390625, 2.80645751953125, 3.0150146484375, 3.22357177734375, 3.43212890625, 3.64068603515625, 3.8492431640625, 4.05780029296875, 4.266357421875, 4.47491455078125, 4.6834716796875, 4.89202880859375, 5.1005859375, 5.30914306640625, 5.5177001953125, 5.72625732421875, 5.934814453125, 6.14337158203125, 6.3519287109375, 6.56048583984375, 6.76904296875, 6.97760009765625, 7.1861572265625, 7.39471435546875, 7.603271484375, 7.81182861328125, 8.0203857421875, 8.22894287109375, 8.4375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 6.0, 7.0, 9.0, 12.0, 21.0, 37.0, 55.0, 99.0, 130.0, 157.0, 158.0, 119.0, 75.0, 47.0, 34.0, 13.0, 13.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.69977569580078, -30.904190063476562, -30.10860252380371, -29.313016891479492, -28.517431259155273, -27.721845626831055, -26.926258087158203, -26.130672454833984, -25.335086822509766, -24.539501190185547, -23.743913650512695, -22.948328018188477, -22.152742385864258, -21.35715675354004, -20.561569213867188, -19.76598358154297, -18.97039794921875, -18.17481231689453, -17.37922477722168, -16.58363914489746, -15.788053512573242, -14.992466926574707, -14.196880340576172, -13.401294708251953, -12.605707168579102, -11.810120582580566, -11.014534950256348, -10.218948364257812, -9.423362731933594, -8.627776145935059, -7.832190036773682, -7.036603927612305, -6.241018295288086, -5.445432186126709, -4.649846076965332, -3.854259729385376, -3.058673620223999, -2.263087511062622, -1.467501163482666, -0.6719150543212891, 0.12367105484008789, 0.9192572236061096, 1.7148433923721313, 2.510429620742798, 3.306015729904175, 4.101601600646973, 4.897188186645508, 5.692774295806885, 6.488360404968262, 7.283946514129639, 8.079532623291016, 8.87511920928955, 9.67070484161377, 10.466291427612305, 11.261877059936523, 12.057463645935059, 12.853050231933594, 13.648636817932129, 14.444222450256348, 15.239809036254883, 16.0353946685791, 16.83098030090332, 17.626567840576172, 18.42215347290039, 19.21773910522461]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 5.0, 7.0, 3.0, 5.0, 9.0, 11.0, 6.0, 12.0, 16.0, 15.0, 15.0, 23.0, 46.0, 38.0, 41.0, 36.0, 41.0, 42.0, 36.0, 50.0, 32.0, 38.0, 35.0, 44.0, 40.0, 33.0, 37.0, 34.0, 52.0, 33.0, 22.0, 21.0, 20.0, 18.0, 16.0, 18.0, 13.0, 7.0, 6.0, 9.0, 4.0, 5.0, 4.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-9.77528190612793, -9.477632522583008, -9.179983139038086, -8.882333755493164, -8.584684371948242, -8.28703498840332, -7.989386081695557, -7.691737174987793, -7.394087791442871, -7.096438407897949, -6.798789024353027, -6.5011396408081055, -6.203490734100342, -5.90584135055542, -5.608191967010498, -5.310543060302734, -5.012893199920654, -4.715243816375732, -4.4175944328308105, -4.119945526123047, -3.822296142578125, -3.524646759033203, -3.2269973754882812, -2.9293482303619385, -2.6316988468170166, -2.3340494632720947, -2.036400318145752, -1.73875093460083, -1.4411016702651978, -1.1434524059295654, -0.8458030223846436, -0.5481538772583008, -0.2505044937133789, 0.047144800424575806, 0.3447940945625305, 0.6424434185028076, 0.9400926828384399, 1.2377419471740723, 1.5353913307189941, 1.833040475845337, 2.130689859390259, 2.4283392429351807, 2.7259883880615234, 3.0236377716064453, 3.321287155151367, 3.61893630027771, 3.916585683822632, 4.214234828948975, 4.5118842124938965, 4.809533596038818, 5.10718297958374, 5.404831886291504, 5.702481269836426, 6.000130653381348, 6.2977800369262695, 6.595429420471191, 6.893078804016113, 7.190728187561035, 7.488377571105957, 7.786026954650879, 8.0836763381958, 8.381324768066406, 8.678974151611328, 8.97662353515625, 9.274272918701172]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 7.0, 2.0, 9.0, 14.0, 17.0, 30.0, 55.0, 82.0, 179.0, 372.0, 679.0, 1513.0, 4020.0, 13001.0, 52889.0, 238275.0, 524980.0, 161407.0, 36063.0, 9444.0, 3058.0, 1264.0, 587.0, 258.0, 140.0, 82.0, 56.0, 27.0, 22.0, 10.0, 8.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.59375, -8.2095947265625, -7.825439453125, -7.4412841796875, -7.05712890625, -6.6729736328125, -6.288818359375, -5.9046630859375, -5.5205078125, -5.1363525390625, -4.752197265625, -4.3680419921875, -3.98388671875, -3.5997314453125, -3.215576171875, -2.8314208984375, -2.447265625, -2.0631103515625, -1.678955078125, -1.2947998046875, -0.91064453125, -0.5264892578125, -0.142333984375, 0.2418212890625, 0.6259765625, 1.0101318359375, 1.394287109375, 1.7784423828125, 2.16259765625, 2.5467529296875, 2.930908203125, 3.3150634765625, 3.69921875, 4.0833740234375, 4.467529296875, 4.8516845703125, 5.23583984375, 5.6199951171875, 6.004150390625, 6.3883056640625, 6.7724609375, 7.1566162109375, 7.540771484375, 7.9249267578125, 8.30908203125, 8.6932373046875, 9.077392578125, 9.4615478515625, 9.845703125, 10.2298583984375, 10.614013671875, 10.9981689453125, 11.38232421875, 11.7664794921875, 12.150634765625, 12.5347900390625, 12.9189453125, 13.3031005859375, 13.687255859375, 14.0714111328125, 14.45556640625, 14.8397216796875, 15.223876953125, 15.6080322265625, 15.9921875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 9.0, 10.0, 4.0, 10.0, 11.0, 14.0, 14.0, 16.0, 30.0, 30.0, 28.0, 47.0, 38.0, 42.0, 50.0, 52.0, 59.0, 50.0, 59.0, 55.0, 46.0, 45.0, 35.0, 40.0, 31.0, 47.0, 30.0, 16.0, 17.0, 12.0, 6.0, 9.0, 13.0, 6.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.005859375, -2.90740966796875, -2.8089599609375, -2.71051025390625, -2.612060546875, -2.51361083984375, -2.4151611328125, -2.31671142578125, -2.21826171875, -2.11981201171875, -2.0213623046875, -1.92291259765625, -1.824462890625, -1.72601318359375, -1.6275634765625, -1.52911376953125, -1.4306640625, -1.33221435546875, -1.2337646484375, -1.13531494140625, -1.036865234375, -0.93841552734375, -0.8399658203125, -0.74151611328125, -0.64306640625, -0.54461669921875, -0.4461669921875, -0.34771728515625, -0.249267578125, -0.15081787109375, -0.0523681640625, 0.04608154296875, 0.14453125, 0.24298095703125, 0.3414306640625, 0.43988037109375, 0.538330078125, 0.63677978515625, 0.7352294921875, 0.83367919921875, 0.93212890625, 1.03057861328125, 1.1290283203125, 1.22747802734375, 1.325927734375, 1.42437744140625, 1.5228271484375, 1.62127685546875, 1.7197265625, 1.81817626953125, 1.9166259765625, 2.01507568359375, 2.113525390625, 2.21197509765625, 2.3104248046875, 2.40887451171875, 2.50732421875, 2.60577392578125, 2.7042236328125, 2.80267333984375, 2.901123046875, 2.99957275390625, 3.0980224609375, 3.19647216796875, 3.294921875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 1.0, 5.0, 13.0, 10.0, 14.0, 17.0, 19.0, 41.0, 57.0, 73.0, 127.0, 170.0, 251.0, 484.0, 1008.0, 3317.0, 30820.0, 853500.0, 148323.0, 7006.0, 1604.0, 668.0, 358.0, 181.0, 161.0, 96.0, 71.0, 42.0, 27.0, 18.0, 11.0, 15.0, 13.0, 4.0, 5.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-28.40625, -27.563720703125, -26.72119140625, -25.878662109375, -25.0361328125, -24.193603515625, -23.35107421875, -22.508544921875, -21.666015625, -20.823486328125, -19.98095703125, -19.138427734375, -18.2958984375, -17.453369140625, -16.61083984375, -15.768310546875, -14.92578125, -14.083251953125, -13.24072265625, -12.398193359375, -11.5556640625, -10.713134765625, -9.87060546875, -9.028076171875, -8.185546875, -7.343017578125, -6.50048828125, -5.657958984375, -4.8154296875, -3.972900390625, -3.13037109375, -2.287841796875, -1.4453125, -0.602783203125, 0.23974609375, 1.082275390625, 1.9248046875, 2.767333984375, 3.60986328125, 4.452392578125, 5.294921875, 6.137451171875, 6.97998046875, 7.822509765625, 8.6650390625, 9.507568359375, 10.35009765625, 11.192626953125, 12.03515625, 12.877685546875, 13.72021484375, 14.562744140625, 15.4052734375, 16.247802734375, 17.09033203125, 17.932861328125, 18.775390625, 19.617919921875, 20.46044921875, 21.302978515625, 22.1455078125, 22.988037109375, 23.83056640625, 24.673095703125, 25.515625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 3.0, 6.0, 8.0, 17.0, 12.0, 13.0, 25.0, 34.0, 53.0, 49.0, 43.0, 61.0, 73.0, 77.0, 68.0, 60.0, 68.0, 59.0, 43.0, 54.0, 38.0, 28.0, 31.0, 19.0, 21.0, 8.0, 7.0, 7.0, 4.0, 2.0, 6.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.546875, -21.97607421875, -21.4052734375, -20.83447265625, -20.263671875, -19.69287109375, -19.1220703125, -18.55126953125, -17.98046875, -17.40966796875, -16.8388671875, -16.26806640625, -15.697265625, -15.12646484375, -14.5556640625, -13.98486328125, -13.4140625, -12.84326171875, -12.2724609375, -11.70166015625, -11.130859375, -10.56005859375, -9.9892578125, -9.41845703125, -8.84765625, -8.27685546875, -7.7060546875, -7.13525390625, -6.564453125, -5.99365234375, -5.4228515625, -4.85205078125, -4.28125, -3.71044921875, -3.1396484375, -2.56884765625, -1.998046875, -1.42724609375, -0.8564453125, -0.28564453125, 0.28515625, 0.85595703125, 1.4267578125, 1.99755859375, 2.568359375, 3.13916015625, 3.7099609375, 4.28076171875, 4.8515625, 5.42236328125, 5.9931640625, 6.56396484375, 7.134765625, 7.70556640625, 8.2763671875, 8.84716796875, 9.41796875, 9.98876953125, 10.5595703125, 11.13037109375, 11.701171875, 12.27197265625, 12.8427734375, 13.41357421875, 13.984375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 10.0, 11.0, 24.0, 20.0, 35.0, 59.0, 81.0, 155.0, 292.0, 620.0, 1584.0, 5752.0, 31440.0, 342556.0, 602933.0, 51424.0, 7924.0, 2075.0, 770.0, 348.0, 149.0, 94.0, 65.0, 36.0, 23.0, 18.0, 16.0, 9.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2265625, -6.02642822265625, -5.8262939453125, -5.62615966796875, -5.426025390625, -5.22589111328125, -5.0257568359375, -4.82562255859375, -4.62548828125, -4.42535400390625, -4.2252197265625, -4.02508544921875, -3.824951171875, -3.62481689453125, -3.4246826171875, -3.22454833984375, -3.0244140625, -2.82427978515625, -2.6241455078125, -2.42401123046875, -2.223876953125, -2.02374267578125, -1.8236083984375, -1.62347412109375, -1.42333984375, -1.22320556640625, -1.0230712890625, -0.82293701171875, -0.622802734375, -0.42266845703125, -0.2225341796875, -0.02239990234375, 0.177734375, 0.37786865234375, 0.5780029296875, 0.77813720703125, 0.978271484375, 1.17840576171875, 1.3785400390625, 1.57867431640625, 1.77880859375, 1.97894287109375, 2.1790771484375, 2.37921142578125, 2.579345703125, 2.77947998046875, 2.9796142578125, 3.17974853515625, 3.3798828125, 3.58001708984375, 3.7801513671875, 3.98028564453125, 4.180419921875, 4.38055419921875, 4.5806884765625, 4.78082275390625, 4.98095703125, 5.18109130859375, 5.3812255859375, 5.58135986328125, 5.781494140625, 5.98162841796875, 6.1817626953125, 6.38189697265625, 6.58203125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 5.0, 11.0, 5.0, 10.0, 14.0, 14.0, 23.0, 18.0, 42.0, 38.0, 48.0, 59.0, 112.0, 148.0, 117.0, 73.0, 55.0, 38.0, 27.0, 39.0, 31.0, 19.0, 9.0, 9.0, 2.0, 9.0, 6.0, 5.0, 3.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00104522705078125, -0.001012369990348816, -0.0009795129299163818, -0.0009466558694839478, -0.0009137988090515137, -0.0008809417486190796, -0.0008480846881866455, -0.0008152276277542114, -0.0007823705673217773, -0.0007495135068893433, -0.0007166564464569092, -0.0006837993860244751, -0.000650942325592041, -0.0006180852651596069, -0.0005852282047271729, -0.0005523711442947388, -0.0005195140838623047, -0.0004866570234298706, -0.0004537999629974365, -0.00042094290256500244, -0.00038808584213256836, -0.0003552287817001343, -0.0003223717212677002, -0.0002895146608352661, -0.00025665760040283203, -0.00022380053997039795, -0.00019094347953796387, -0.00015808641910552979, -0.0001252293586730957, -9.237229824066162e-05, -5.951523780822754e-05, -2.6658177375793457e-05, 6.198883056640625e-06, 3.905594348907471e-05, 7.191300392150879e-05, 0.00010477006435394287, 0.00013762712478637695, 0.00017048418521881104, 0.00020334124565124512, 0.0002361983060836792, 0.0002690553665161133, 0.00030191242694854736, 0.00033476948738098145, 0.00036762654781341553, 0.0004004836082458496, 0.0004333406686782837, 0.0004661977291107178, 0.0004990547895431519, 0.0005319118499755859, 0.00056476891040802, 0.0005976259708404541, 0.0006304830312728882, 0.0006633400917053223, 0.0006961971521377563, 0.0007290542125701904, 0.0007619112730026245, 0.0007947683334350586, 0.0008276253938674927, 0.0008604824542999268, 0.0008933395147323608, 0.0009261965751647949, 0.000959053635597229, 0.000991910696029663, 0.0010247677564620972, 0.0010576248168945312]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 5.0, 13.0, 15.0, 9.0, 21.0, 33.0, 38.0, 79.0, 102.0, 120.0, 222.0, 366.0, 601.0, 1372.0, 3890.0, 20518.0, 238107.0, 704697.0, 65677.0, 8246.0, 2319.0, 867.0, 469.0, 244.0, 183.0, 93.0, 56.0, 47.0, 51.0, 23.0, 21.0, 15.0, 7.0, 8.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.671875, -6.46502685546875, -6.2581787109375, -6.05133056640625, -5.844482421875, -5.63763427734375, -5.4307861328125, -5.22393798828125, -5.01708984375, -4.81024169921875, -4.6033935546875, -4.39654541015625, -4.189697265625, -3.98284912109375, -3.7760009765625, -3.56915283203125, -3.3623046875, -3.15545654296875, -2.9486083984375, -2.74176025390625, -2.534912109375, -2.32806396484375, -2.1212158203125, -1.91436767578125, -1.70751953125, -1.50067138671875, -1.2938232421875, -1.08697509765625, -0.880126953125, -0.67327880859375, -0.4664306640625, -0.25958251953125, -0.052734375, 0.15411376953125, 0.3609619140625, 0.56781005859375, 0.774658203125, 0.98150634765625, 1.1883544921875, 1.39520263671875, 1.60205078125, 1.80889892578125, 2.0157470703125, 2.22259521484375, 2.429443359375, 2.63629150390625, 2.8431396484375, 3.04998779296875, 3.2568359375, 3.46368408203125, 3.6705322265625, 3.87738037109375, 4.084228515625, 4.29107666015625, 4.4979248046875, 4.70477294921875, 4.91162109375, 5.11846923828125, 5.3253173828125, 5.53216552734375, 5.739013671875, 5.94586181640625, 6.1527099609375, 6.35955810546875, 6.56640625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 3.0, 7.0, 8.0, 9.0, 19.0, 5.0, 18.0, 25.0, 16.0, 29.0, 27.0, 28.0, 31.0, 29.0, 38.0, 57.0, 47.0, 59.0, 62.0, 53.0, 56.0, 46.0, 43.0, 37.0, 40.0, 33.0, 24.0, 19.0, 20.0, 16.0, 16.0, 10.0, 12.0, 12.0, 6.0, 5.0, 6.0, 5.0, 3.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.26171875, -3.16217041015625, -3.0626220703125, -2.96307373046875, -2.863525390625, -2.76397705078125, -2.6644287109375, -2.56488037109375, -2.46533203125, -2.36578369140625, -2.2662353515625, -2.16668701171875, -2.067138671875, -1.96759033203125, -1.8680419921875, -1.76849365234375, -1.6689453125, -1.56939697265625, -1.4698486328125, -1.37030029296875, -1.270751953125, -1.17120361328125, -1.0716552734375, -0.97210693359375, -0.87255859375, -0.77301025390625, -0.6734619140625, -0.57391357421875, -0.474365234375, -0.37481689453125, -0.2752685546875, -0.17572021484375, -0.076171875, 0.02337646484375, 0.1229248046875, 0.22247314453125, 0.322021484375, 0.42156982421875, 0.5211181640625, 0.62066650390625, 0.72021484375, 0.81976318359375, 0.9193115234375, 1.01885986328125, 1.118408203125, 1.21795654296875, 1.3175048828125, 1.41705322265625, 1.5166015625, 1.61614990234375, 1.7156982421875, 1.81524658203125, 1.914794921875, 2.01434326171875, 2.1138916015625, 2.21343994140625, 2.31298828125, 2.41253662109375, 2.5120849609375, 2.61163330078125, 2.711181640625, 2.81072998046875, 2.9102783203125, 3.00982666015625, 3.109375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 22.0, 38.0, 105.0, 186.0, 267.0, 199.0, 105.0, 42.0, 15.0, 6.0, 3.0, 2.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-189.07131958007812, -183.71221923828125, -178.35311889648438, -172.9940185546875, -167.6349334716797, -162.2758331298828, -156.91673278808594, -151.55763244628906, -146.19854736328125, -140.83944702148438, -135.4803466796875, -130.12124633789062, -124.76216125488281, -119.40306091308594, -114.04396057128906, -108.68486022949219, -103.32575988769531, -97.96665954589844, -92.6075668334961, -87.24846649169922, -81.88937377929688, -76.5302734375, -71.17117309570312, -65.81207275390625, -60.452980041503906, -55.0938835144043, -49.73478698730469, -44.37568664550781, -39.0165901184082, -33.657493591308594, -28.29839324951172, -22.93929672241211, -17.5802001953125, -12.221102714538574, -6.862005233764648, -1.5029067993164062, 3.856189727783203, 9.215286254882812, 14.574386596679688, 19.933483123779297, 25.292579650878906, 30.651676177978516, 36.010772705078125, 41.369873046875, 46.72896957397461, 52.08806610107422, 57.447166442871094, 62.8062629699707, 68.16535949707031, 73.52445983886719, 78.88355255126953, 84.2426528930664, 89.60174560546875, 94.96084594726562, 100.3199462890625, 105.67904663085938, 111.03813934326172, 116.3972396850586, 121.75633239746094, 127.11543273925781, 132.4745330810547, 137.8336181640625, 143.19271850585938, 148.55181884765625, 153.91091918945312]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 1.0, 4.0, 6.0, 4.0, 7.0, 11.0, 10.0, 14.0, 16.0, 16.0, 28.0, 29.0, 30.0, 51.0, 41.0, 50.0, 41.0, 59.0, 45.0, 52.0, 58.0, 38.0, 48.0, 40.0, 47.0, 27.0, 44.0, 32.0, 25.0, 28.0, 16.0, 16.0, 12.0, 14.0, 11.0, 7.0, 6.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-59.929161071777344, -58.04840850830078, -56.16765594482422, -54.286903381347656, -52.406150817871094, -50.52539825439453, -48.644649505615234, -46.76389694213867, -44.88314437866211, -43.00239181518555, -41.121639251708984, -39.24088668823242, -37.360137939453125, -35.47938537597656, -33.5986328125, -31.717880249023438, -29.837127685546875, -27.956375122070312, -26.07562255859375, -24.19487190246582, -22.314119338989258, -20.433366775512695, -18.552616119384766, -16.671863555908203, -14.79111099243164, -12.910358428955078, -11.029606819152832, -9.148855209350586, -7.268102645874023, -5.387350082397461, -3.506598472595215, -1.6258468627929688, 0.25490570068359375, 2.135657787322998, 4.016409873962402, 5.897161960601807, 7.777914047241211, 9.658666610717773, 11.53941822052002, 13.420169830322266, 15.300922393798828, 17.18167495727539, 19.062427520751953, 20.943178176879883, 22.823930740356445, 24.704683303833008, 26.585433959960938, 28.4661865234375, 30.346939086914062, 32.227691650390625, 34.10844421386719, 35.98919677734375, 37.86994934082031, 39.750701904296875, 41.63145065307617, 43.512203216552734, 45.3929557800293, 47.27370834350586, 49.15446090698242, 51.035213470458984, 52.91596221923828, 54.796714782714844, 56.677467346191406, 58.55821990966797, 60.43897247314453]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 7.0, 15.0, 16.0, 30.0, 51.0, 86.0, 133.0, 231.0, 413.0, 778.0, 1620.0, 3599.0, 9096.0, 26271.0, 107681.0, 1264759.0, 2557272.0, 166692.0, 36068.0, 11328.0, 4355.0, 1861.0, 841.0, 456.0, 266.0, 130.0, 90.0, 53.0, 33.0, 20.0, 11.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.45703125, -7.23187255859375, -7.0067138671875, -6.78155517578125, -6.556396484375, -6.33123779296875, -6.1060791015625, -5.88092041015625, -5.65576171875, -5.43060302734375, -5.2054443359375, -4.98028564453125, -4.755126953125, -4.52996826171875, -4.3048095703125, -4.07965087890625, -3.8544921875, -3.62933349609375, -3.4041748046875, -3.17901611328125, -2.953857421875, -2.72869873046875, -2.5035400390625, -2.27838134765625, -2.05322265625, -1.82806396484375, -1.6029052734375, -1.37774658203125, -1.152587890625, -0.92742919921875, -0.7022705078125, -0.47711181640625, -0.251953125, -0.02679443359375, 0.1983642578125, 0.42352294921875, 0.648681640625, 0.87384033203125, 1.0989990234375, 1.32415771484375, 1.54931640625, 1.77447509765625, 1.9996337890625, 2.22479248046875, 2.449951171875, 2.67510986328125, 2.9002685546875, 3.12542724609375, 3.3505859375, 3.57574462890625, 3.8009033203125, 4.02606201171875, 4.251220703125, 4.47637939453125, 4.7015380859375, 4.92669677734375, 5.15185546875, 5.37701416015625, 5.6021728515625, 5.82733154296875, 6.052490234375, 6.27764892578125, 6.5028076171875, 6.72796630859375, 6.953125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 6.0, 6.0, 6.0, 7.0, 8.0, 13.0, 14.0, 20.0, 21.0, 18.0, 33.0, 52.0, 36.0, 43.0, 54.0, 60.0, 57.0, 61.0, 56.0, 56.0, 49.0, 44.0, 45.0, 38.0, 49.0, 31.0, 26.0, 23.0, 18.0, 20.0, 9.0, 9.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.806640625, -3.70263671875, -3.5986328125, -3.49462890625, -3.390625, -3.28662109375, -3.1826171875, -3.07861328125, -2.974609375, -2.87060546875, -2.7666015625, -2.66259765625, -2.55859375, -2.45458984375, -2.3505859375, -2.24658203125, -2.142578125, -2.03857421875, -1.9345703125, -1.83056640625, -1.7265625, -1.62255859375, -1.5185546875, -1.41455078125, -1.310546875, -1.20654296875, -1.1025390625, -0.99853515625, -0.89453125, -0.79052734375, -0.6865234375, -0.58251953125, -0.478515625, -0.37451171875, -0.2705078125, -0.16650390625, -0.0625, 0.04150390625, 0.1455078125, 0.24951171875, 0.353515625, 0.45751953125, 0.5615234375, 0.66552734375, 0.76953125, 0.87353515625, 0.9775390625, 1.08154296875, 1.185546875, 1.28955078125, 1.3935546875, 1.49755859375, 1.6015625, 1.70556640625, 1.8095703125, 1.91357421875, 2.017578125, 2.12158203125, 2.2255859375, 2.32958984375, 2.43359375, 2.53759765625, 2.6416015625, 2.74560546875, 2.849609375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 5.0, 13.0, 9.0, 21.0, 51.0, 92.0, 178.0, 447.0, 1430.0, 5442.0, 29708.0, 405270.0, 3624568.0, 108096.0, 14249.0, 3145.0, 902.0, 319.0, 143.0, 86.0, 24.0, 29.0, 15.0, 9.0, 7.0, 2.0, 7.0, 2.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.828125, -14.4195556640625, -14.010986328125, -13.6024169921875, -13.19384765625, -12.7852783203125, -12.376708984375, -11.9681396484375, -11.5595703125, -11.1510009765625, -10.742431640625, -10.3338623046875, -9.92529296875, -9.5167236328125, -9.108154296875, -8.6995849609375, -8.291015625, -7.8824462890625, -7.473876953125, -7.0653076171875, -6.65673828125, -6.2481689453125, -5.839599609375, -5.4310302734375, -5.0224609375, -4.6138916015625, -4.205322265625, -3.7967529296875, -3.38818359375, -2.9796142578125, -2.571044921875, -2.1624755859375, -1.75390625, -1.3453369140625, -0.936767578125, -0.5281982421875, -0.11962890625, 0.2889404296875, 0.697509765625, 1.1060791015625, 1.5146484375, 1.9232177734375, 2.331787109375, 2.7403564453125, 3.14892578125, 3.5574951171875, 3.966064453125, 4.3746337890625, 4.783203125, 5.1917724609375, 5.600341796875, 6.0089111328125, 6.41748046875, 6.8260498046875, 7.234619140625, 7.6431884765625, 8.0517578125, 8.4603271484375, 8.868896484375, 9.2774658203125, 9.68603515625, 10.0946044921875, 10.503173828125, 10.9117431640625, 11.3203125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 4.0, 7.0, 7.0, 5.0, 14.0, 26.0, 34.0, 52.0, 59.0, 86.0, 140.0, 281.0, 628.0, 1045.0, 787.0, 377.0, 174.0, 108.0, 64.0, 48.0, 35.0, 22.0, 21.0, 10.0, 11.0, 1.0, 4.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3984375, -8.115478515625, -7.83251953125, -7.549560546875, -7.2666015625, -6.983642578125, -6.70068359375, -6.417724609375, -6.134765625, -5.851806640625, -5.56884765625, -5.285888671875, -5.0029296875, -4.719970703125, -4.43701171875, -4.154052734375, -3.87109375, -3.588134765625, -3.30517578125, -3.022216796875, -2.7392578125, -2.456298828125, -2.17333984375, -1.890380859375, -1.607421875, -1.324462890625, -1.04150390625, -0.758544921875, -0.4755859375, -0.192626953125, 0.09033203125, 0.373291015625, 0.65625, 0.939208984375, 1.22216796875, 1.505126953125, 1.7880859375, 2.071044921875, 2.35400390625, 2.636962890625, 2.919921875, 3.202880859375, 3.48583984375, 3.768798828125, 4.0517578125, 4.334716796875, 4.61767578125, 4.900634765625, 5.18359375, 5.466552734375, 5.74951171875, 6.032470703125, 6.3154296875, 6.598388671875, 6.88134765625, 7.164306640625, 7.447265625, 7.730224609375, 8.01318359375, 8.296142578125, 8.5791015625, 8.862060546875, 9.14501953125, 9.427978515625, 9.7109375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 12.0, 8.0, 19.0, 52.0, 100.0, 217.0, 238.0, 183.0, 99.0, 32.0, 14.0, 12.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.02342224121094, -89.48925018310547, -85.95508575439453, -82.42091369628906, -78.88674926757812, -75.35257720947266, -71.81840515136719, -68.28424072265625, -64.75006866455078, -61.21590042114258, -57.681732177734375, -54.147560119628906, -50.6133918762207, -47.0792236328125, -43.5450553894043, -40.010887145996094, -36.47671890258789, -32.94255065917969, -29.40838050842285, -25.87421226501465, -22.340042114257812, -18.80587387084961, -15.271705627441406, -11.73753547668457, -8.203367233276367, -4.669198036193848, -1.1350293159484863, 2.399139404296875, 5.9333086013793945, 9.467477798461914, 13.001646041870117, 16.535816192626953, 20.069984436035156, 23.60415267944336, 27.138322830200195, 30.6724910736084, 34.206661224365234, 37.74082946777344, 41.27499771118164, 44.809165954589844, 48.34333801269531, 51.877506256103516, 55.41167449951172, 58.94584655761719, 62.48001480102539, 66.0141830444336, 69.54835510253906, 73.08251953125, 76.61668395996094, 80.1508560180664, 83.68502044677734, 87.21919250488281, 90.75335693359375, 94.28752899169922, 97.82170104980469, 101.35586547851562, 104.8900375366211, 108.42420959472656, 111.9583740234375, 115.49254608154297, 119.0267105102539, 122.56088256835938, 126.09504699707031, 129.6292266845703, 133.16339111328125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 3.0, 5.0, 3.0, 12.0, 13.0, 14.0, 6.0, 11.0, 21.0, 21.0, 24.0, 30.0, 35.0, 35.0, 35.0, 48.0, 41.0, 57.0, 42.0, 49.0, 55.0, 42.0, 41.0, 48.0, 43.0, 38.0, 34.0, 23.0, 27.0, 19.0, 27.0, 24.0, 19.0, 16.0, 7.0, 5.0, 7.0, 5.0, 4.0, 2.0, 1.0, 5.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-37.557533264160156, -36.48500442504883, -35.412471771240234, -34.339942932128906, -33.26741409301758, -32.194881439208984, -31.122352600097656, -30.049821853637695, -28.977291107177734, -27.904760360717773, -26.832231521606445, -25.759700775146484, -24.687170028686523, -23.614639282226562, -22.542110443115234, -21.469579696655273, -20.397050857543945, -19.324520111083984, -18.251991271972656, -17.179460525512695, -16.106929779052734, -15.03439998626709, -13.961870193481445, -12.889339447021484, -11.81680965423584, -10.744279861450195, -9.671749114990234, -8.59921932220459, -7.526689052581787, -6.454158782958984, -5.38162899017334, -4.309098720550537, -3.236570358276367, -2.1640400886535645, -1.0915100574493408, -0.018980026245117188, 1.0535502433776855, 2.1260805130004883, 3.198610305786133, 4.2711405754089355, 5.343670845031738, 6.416201114654541, 7.488731384277344, 8.561261177062988, 9.633790969848633, 10.706321716308594, 11.778851509094238, 12.851381301879883, 13.923912048339844, 14.996441841125488, 16.068971633911133, 17.141502380371094, 18.214033126831055, 19.286563873291016, 20.359092712402344, 21.431623458862305, 22.504154205322266, 23.576684951782227, 24.649213790893555, 25.721744537353516, 26.794275283813477, 27.866806030273438, 28.939334869384766, 30.011865615844727, 31.084394454956055]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 6.0, 8.0, 8.0, 19.0, 24.0, 36.0, 68.0, 85.0, 160.0, 232.0, 367.0, 640.0, 1051.0, 1803.0, 3281.0, 6007.0, 12021.0, 24831.0, 55095.0, 133859.0, 343133.0, 277241.0, 102737.0, 44168.0, 20144.0, 9715.0, 5128.0, 2652.0, 1573.0, 923.0, 556.0, 349.0, 224.0, 151.0, 75.0, 49.0, 36.0, 27.0, 20.0, 19.0, 10.0, 3.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-6.28125, -6.0841064453125, -5.886962890625, -5.6898193359375, -5.49267578125, -5.2955322265625, -5.098388671875, -4.9012451171875, -4.7041015625, -4.5069580078125, -4.309814453125, -4.1126708984375, -3.91552734375, -3.7183837890625, -3.521240234375, -3.3240966796875, -3.126953125, -2.9298095703125, -2.732666015625, -2.5355224609375, -2.33837890625, -2.1412353515625, -1.944091796875, -1.7469482421875, -1.5498046875, -1.3526611328125, -1.155517578125, -0.9583740234375, -0.76123046875, -0.5640869140625, -0.366943359375, -0.1697998046875, 0.02734375, 0.2244873046875, 0.421630859375, 0.6187744140625, 0.81591796875, 1.0130615234375, 1.210205078125, 1.4073486328125, 1.6044921875, 1.8016357421875, 1.998779296875, 2.1959228515625, 2.39306640625, 2.5902099609375, 2.787353515625, 2.9844970703125, 3.181640625, 3.3787841796875, 3.575927734375, 3.7730712890625, 3.97021484375, 4.1673583984375, 4.364501953125, 4.5616455078125, 4.7587890625, 4.9559326171875, 5.153076171875, 5.3502197265625, 5.54736328125, 5.7445068359375, 5.941650390625, 6.1387939453125, 6.3359375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0, 8.0, 6.0, 7.0, 6.0, 15.0, 15.0, 6.0, 17.0, 22.0, 25.0, 29.0, 31.0, 26.0, 32.0, 37.0, 48.0, 41.0, 61.0, 47.0, 43.0, 50.0, 44.0, 48.0, 40.0, 41.0, 29.0, 31.0, 27.0, 23.0, 29.0, 21.0, 21.0, 16.0, 15.0, 9.0, 9.0, 5.0, 4.0, 4.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.4921875, -2.4073486328125, -2.322509765625, -2.2376708984375, -2.15283203125, -2.0679931640625, -1.983154296875, -1.8983154296875, -1.8134765625, -1.7286376953125, -1.643798828125, -1.5589599609375, -1.47412109375, -1.3892822265625, -1.304443359375, -1.2196044921875, -1.134765625, -1.0499267578125, -0.965087890625, -0.8802490234375, -0.79541015625, -0.7105712890625, -0.625732421875, -0.5408935546875, -0.4560546875, -0.3712158203125, -0.286376953125, -0.2015380859375, -0.11669921875, -0.0318603515625, 0.052978515625, 0.1378173828125, 0.22265625, 0.3074951171875, 0.392333984375, 0.4771728515625, 0.56201171875, 0.6468505859375, 0.731689453125, 0.8165283203125, 0.9013671875, 0.9862060546875, 1.071044921875, 1.1558837890625, 1.24072265625, 1.3255615234375, 1.410400390625, 1.4952392578125, 1.580078125, 1.6649169921875, 1.749755859375, 1.8345947265625, 1.91943359375, 2.0042724609375, 2.089111328125, 2.1739501953125, 2.2587890625, 2.3436279296875, 2.428466796875, 2.5133056640625, 2.59814453125, 2.6829833984375, 2.767822265625, 2.8526611328125, 2.9375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 8.0, 6.0, 10.0, 11.0, 20.0, 20.0, 27.0, 38.0, 64.0, 96.0, 114.0, 183.0, 318.0, 573.0, 1520.0, 5880.0, 88029.0, 904499.0, 40662.0, 4034.0, 1145.0, 493.0, 258.0, 168.0, 104.0, 78.0, 47.0, 33.0, 27.0, 14.0, 18.0, 12.0, 11.0, 7.0, 2.0, 8.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.15625, -21.375732421875, -20.59521484375, -19.814697265625, -19.0341796875, -18.253662109375, -17.47314453125, -16.692626953125, -15.912109375, -15.131591796875, -14.35107421875, -13.570556640625, -12.7900390625, -12.009521484375, -11.22900390625, -10.448486328125, -9.66796875, -8.887451171875, -8.10693359375, -7.326416015625, -6.5458984375, -5.765380859375, -4.98486328125, -4.204345703125, -3.423828125, -2.643310546875, -1.86279296875, -1.082275390625, -0.3017578125, 0.478759765625, 1.25927734375, 2.039794921875, 2.8203125, 3.600830078125, 4.38134765625, 5.161865234375, 5.9423828125, 6.722900390625, 7.50341796875, 8.283935546875, 9.064453125, 9.844970703125, 10.62548828125, 11.406005859375, 12.1865234375, 12.967041015625, 13.74755859375, 14.528076171875, 15.30859375, 16.089111328125, 16.86962890625, 17.650146484375, 18.4306640625, 19.211181640625, 19.99169921875, 20.772216796875, 21.552734375, 22.333251953125, 23.11376953125, 23.894287109375, 24.6748046875, 25.455322265625, 26.23583984375, 27.016357421875, 27.796875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 3.0, 6.0, 5.0, 9.0, 9.0, 18.0, 15.0, 15.0, 17.0, 19.0, 25.0, 21.0, 32.0, 31.0, 41.0, 36.0, 49.0, 40.0, 42.0, 48.0, 43.0, 45.0, 41.0, 46.0, 37.0, 35.0, 41.0, 32.0, 27.0, 17.0, 15.0, 18.0, 19.0, 20.0, 11.0, 10.0, 13.0, 10.0, 6.0, 6.0, 7.0, 2.0, 5.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-11.7734375, -11.4317626953125, -11.090087890625, -10.7484130859375, -10.40673828125, -10.0650634765625, -9.723388671875, -9.3817138671875, -9.0400390625, -8.6983642578125, -8.356689453125, -8.0150146484375, -7.67333984375, -7.3316650390625, -6.989990234375, -6.6483154296875, -6.306640625, -5.9649658203125, -5.623291015625, -5.2816162109375, -4.93994140625, -4.5982666015625, -4.256591796875, -3.9149169921875, -3.5732421875, -3.2315673828125, -2.889892578125, -2.5482177734375, -2.20654296875, -1.8648681640625, -1.523193359375, -1.1815185546875, -0.83984375, -0.4981689453125, -0.156494140625, 0.1851806640625, 0.52685546875, 0.8685302734375, 1.210205078125, 1.5518798828125, 1.8935546875, 2.2352294921875, 2.576904296875, 2.9185791015625, 3.26025390625, 3.6019287109375, 3.943603515625, 4.2852783203125, 4.626953125, 4.9686279296875, 5.310302734375, 5.6519775390625, 5.99365234375, 6.3353271484375, 6.677001953125, 7.0186767578125, 7.3603515625, 7.7020263671875, 8.043701171875, 8.3853759765625, 8.72705078125, 9.0687255859375, 9.410400390625, 9.7520751953125, 10.09375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 1.0, 1.0, 6.0, 16.0, 10.0, 14.0, 23.0, 34.0, 44.0, 74.0, 158.0, 263.0, 657.0, 2252.0, 12520.0, 232739.0, 768008.0, 26440.0, 3552.0, 966.0, 336.0, 185.0, 93.0, 63.0, 31.0, 17.0, 17.0, 8.0, 7.0, 3.0, 1.0, 1.0, 0.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.91015625, -7.62921142578125, -7.3482666015625, -7.06732177734375, -6.786376953125, -6.50543212890625, -6.2244873046875, -5.94354248046875, -5.66259765625, -5.38165283203125, -5.1007080078125, -4.81976318359375, -4.538818359375, -4.25787353515625, -3.9769287109375, -3.69598388671875, -3.4150390625, -3.13409423828125, -2.8531494140625, -2.57220458984375, -2.291259765625, -2.01031494140625, -1.7293701171875, -1.44842529296875, -1.16748046875, -0.88653564453125, -0.6055908203125, -0.32464599609375, -0.043701171875, 0.23724365234375, 0.5181884765625, 0.79913330078125, 1.080078125, 1.36102294921875, 1.6419677734375, 1.92291259765625, 2.203857421875, 2.48480224609375, 2.7657470703125, 3.04669189453125, 3.32763671875, 3.60858154296875, 3.8895263671875, 4.17047119140625, 4.451416015625, 4.73236083984375, 5.0133056640625, 5.29425048828125, 5.5751953125, 5.85614013671875, 6.1370849609375, 6.41802978515625, 6.698974609375, 6.97991943359375, 7.2608642578125, 7.54180908203125, 7.82275390625, 8.10369873046875, 8.3846435546875, 8.66558837890625, 8.946533203125, 9.22747802734375, 9.5084228515625, 9.78936767578125, 10.0703125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 4.0, 8.0, 5.0, 8.0, 12.0, 7.0, 17.0, 17.0, 24.0, 24.0, 43.0, 45.0, 68.0, 109.0, 147.0, 127.0, 75.0, 53.0, 26.0, 28.0, 17.0, 24.0, 18.0, 15.0, 17.0, 13.0, 13.0, 6.0, 7.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008487701416015625, -0.0008218884468078613, -0.0007950067520141602, -0.000768125057220459, -0.0007412433624267578, -0.0007143616676330566, -0.0006874799728393555, -0.0006605982780456543, -0.0006337165832519531, -0.000606834888458252, -0.0005799531936645508, -0.0005530714988708496, -0.0005261898040771484, -0.0004993081092834473, -0.0004724264144897461, -0.0004455447196960449, -0.00041866302490234375, -0.0003917813301086426, -0.0003648996353149414, -0.00033801794052124023, -0.00031113624572753906, -0.0002842545509338379, -0.0002573728561401367, -0.00023049116134643555, -0.00020360946655273438, -0.0001767277717590332, -0.00014984607696533203, -0.00012296438217163086, -9.608268737792969e-05, -6.920099258422852e-05, -4.2319297790527344e-05, -1.5437602996826172e-05, 1.1444091796875e-05, 3.832578659057617e-05, 6.520748138427734e-05, 9.208917617797852e-05, 0.00011897087097167969, 0.00014585256576538086, 0.00017273426055908203, 0.0001996159553527832, 0.00022649765014648438, 0.00025337934494018555, 0.0002802610397338867, 0.0003071427345275879, 0.00033402442932128906, 0.00036090612411499023, 0.0003877878189086914, 0.0004146695137023926, 0.00044155120849609375, 0.0004684329032897949, 0.0004953145980834961, 0.0005221962928771973, 0.0005490779876708984, 0.0005759596824645996, 0.0006028413772583008, 0.000629723072052002, 0.0006566047668457031, 0.0006834864616394043, 0.0007103681564331055, 0.0007372498512268066, 0.0007641315460205078, 0.000791013240814209, 0.0008178949356079102, 0.0008447766304016113, 0.0008716583251953125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 7.0, 9.0, 9.0, 14.0, 16.0, 33.0, 25.0, 44.0, 72.0, 128.0, 177.0, 330.0, 675.0, 1602.0, 5338.0, 36323.0, 766925.0, 216643.0, 14692.0, 3141.0, 1112.0, 517.0, 255.0, 167.0, 103.0, 51.0, 42.0, 43.0, 16.0, 16.0, 10.0, 4.0, 5.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.70703125, -6.45672607421875, -6.2064208984375, -5.95611572265625, -5.705810546875, -5.45550537109375, -5.2052001953125, -4.95489501953125, -4.70458984375, -4.45428466796875, -4.2039794921875, -3.95367431640625, -3.703369140625, -3.45306396484375, -3.2027587890625, -2.95245361328125, -2.7021484375, -2.45184326171875, -2.2015380859375, -1.95123291015625, -1.700927734375, -1.45062255859375, -1.2003173828125, -0.95001220703125, -0.69970703125, -0.44940185546875, -0.1990966796875, 0.05120849609375, 0.301513671875, 0.55181884765625, 0.8021240234375, 1.05242919921875, 1.302734375, 1.55303955078125, 1.8033447265625, 2.05364990234375, 2.303955078125, 2.55426025390625, 2.8045654296875, 3.05487060546875, 3.30517578125, 3.55548095703125, 3.8057861328125, 4.05609130859375, 4.306396484375, 4.55670166015625, 4.8070068359375, 5.05731201171875, 5.3076171875, 5.55792236328125, 5.8082275390625, 6.05853271484375, 6.308837890625, 6.55914306640625, 6.8094482421875, 7.05975341796875, 7.31005859375, 7.56036376953125, 7.8106689453125, 8.06097412109375, 8.311279296875, 8.56158447265625, 8.8118896484375, 9.06219482421875, 9.3125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 10.0, 8.0, 9.0, 7.0, 18.0, 28.0, 22.0, 48.0, 64.0, 79.0, 105.0, 107.0, 121.0, 79.0, 76.0, 48.0, 36.0, 36.0, 21.0, 22.0, 12.0, 11.0, 12.0, 6.0, 2.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.9375, -3.77142333984375, -3.6053466796875, -3.43927001953125, -3.273193359375, -3.10711669921875, -2.9410400390625, -2.77496337890625, -2.60888671875, -2.44281005859375, -2.2767333984375, -2.11065673828125, -1.944580078125, -1.77850341796875, -1.6124267578125, -1.44635009765625, -1.2802734375, -1.11419677734375, -0.9481201171875, -0.78204345703125, -0.615966796875, -0.44989013671875, -0.2838134765625, -0.11773681640625, 0.04833984375, 0.21441650390625, 0.3804931640625, 0.54656982421875, 0.712646484375, 0.87872314453125, 1.0447998046875, 1.21087646484375, 1.376953125, 1.54302978515625, 1.7091064453125, 1.87518310546875, 2.041259765625, 2.20733642578125, 2.3734130859375, 2.53948974609375, 2.70556640625, 2.87164306640625, 3.0377197265625, 3.20379638671875, 3.369873046875, 3.53594970703125, 3.7020263671875, 3.86810302734375, 4.0341796875, 4.20025634765625, 4.3663330078125, 4.53240966796875, 4.698486328125, 4.86456298828125, 5.0306396484375, 5.19671630859375, 5.36279296875, 5.52886962890625, 5.6949462890625, 5.86102294921875, 6.027099609375, 6.19317626953125, 6.3592529296875, 6.52532958984375, 6.69140625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 7.0, 6.0, 11.0, 35.0, 83.0, 170.0, 259.0, 238.0, 101.0, 42.0, 16.0, 14.0, 6.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-123.66731262207031, -119.63440704345703, -115.60150146484375, -111.56859588623047, -107.53569030761719, -103.5027847290039, -99.46987915039062, -95.43698120117188, -91.40406799316406, -87.37116241455078, -83.3382568359375, -79.30535125732422, -75.27244567871094, -71.23954010009766, -67.20663452148438, -63.17373275756836, -59.140830993652344, -55.10792541503906, -51.07501983642578, -47.0421142578125, -43.00920867919922, -38.97630310058594, -34.94340133666992, -30.91049575805664, -26.87759017944336, -22.844684600830078, -18.811779022216797, -14.778875350952148, -10.745969772338867, -6.713064193725586, -2.6801605224609375, 1.3527450561523438, 5.385650634765625, 9.418556213378906, 13.451460838317871, 17.484365463256836, 21.517271041870117, 25.5501766204834, 29.583080291748047, 33.61598587036133, 37.64889144897461, 41.68179702758789, 45.71470260620117, 49.74760437011719, 53.78050994873047, 57.81341552734375, 61.84632110595703, 65.87922668457031, 69.9121322631836, 73.94503784179688, 77.97794342041016, 82.01084899902344, 86.04375457763672, 90.07666015625, 94.10955810546875, 98.14247131347656, 102.17536926269531, 106.2082748413086, 110.24118041992188, 114.27408599853516, 118.30699157714844, 122.33989715576172, 126.372802734375, 130.40570068359375, 134.43861389160156]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 1.0, 6.0, 6.0, 9.0, 14.0, 10.0, 20.0, 19.0, 37.0, 23.0, 26.0, 36.0, 36.0, 42.0, 47.0, 66.0, 46.0, 58.0, 66.0, 48.0, 44.0, 58.0, 41.0, 42.0, 38.0, 34.0, 23.0, 22.0, 24.0, 12.0, 8.0, 9.0, 3.0, 10.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.27438735961914, -38.66165542602539, -37.04892349243164, -35.436187744140625, -33.823455810546875, -32.210723876953125, -30.597991943359375, -28.985260009765625, -27.372526168823242, -25.759794235229492, -24.14706039428711, -22.53432846069336, -20.92159652709961, -19.308862686157227, -17.696130752563477, -16.083396911621094, -14.470664978027344, -12.857932090759277, -11.245199203491211, -9.632467269897461, -8.019734382629395, -6.407001495361328, -4.794269561767578, -3.1815366744995117, -1.5688037872314453, 0.04392886161804199, 1.6566615104675293, 3.2693939208984375, 4.882126808166504, 6.49485969543457, 8.10759162902832, 9.720324516296387, 11.333053588867188, 12.945786476135254, 14.55851936340332, 16.17125129699707, 17.783985137939453, 19.396717071533203, 21.009449005126953, 22.622180938720703, 24.234914779663086, 25.847646713256836, 27.46038055419922, 29.07311248779297, 30.68584442138672, 32.29857635498047, 33.91130828857422, 35.524044036865234, 37.136775970458984, 38.749507904052734, 40.362239837646484, 41.9749755859375, 43.58770751953125, 45.200439453125, 46.81317138671875, 48.4259033203125, 50.03863525390625, 51.6513671875, 53.26409912109375, 54.8768310546875, 56.489566802978516, 58.102298736572266, 59.715030670166016, 61.327762603759766, 62.94049835205078]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 7.0, 4.0, 15.0, 12.0, 19.0, 20.0, 19.0, 19.0, 32.0, 58.0, 59.0, 56.0, 88.0, 133.0, 153.0, 305.0, 1097.0, 13700.0, 4053043.0, 121080.0, 2984.0, 547.0, 233.0, 156.0, 95.0, 78.0, 57.0, 47.0, 40.0, 27.0, 18.0, 22.0, 12.0, 11.0, 4.0, 8.0, 4.0, 4.0, 4.0, 1.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.46875, -20.694580078125, -19.92041015625, -19.146240234375, -18.3720703125, -17.597900390625, -16.82373046875, -16.049560546875, -15.275390625, -14.501220703125, -13.72705078125, -12.952880859375, -12.1787109375, -11.404541015625, -10.63037109375, -9.856201171875, -9.08203125, -8.307861328125, -7.53369140625, -6.759521484375, -5.9853515625, -5.211181640625, -4.43701171875, -3.662841796875, -2.888671875, -2.114501953125, -1.34033203125, -0.566162109375, 0.2080078125, 0.982177734375, 1.75634765625, 2.530517578125, 3.3046875, 4.078857421875, 4.85302734375, 5.627197265625, 6.4013671875, 7.175537109375, 7.94970703125, 8.723876953125, 9.498046875, 10.272216796875, 11.04638671875, 11.820556640625, 12.5947265625, 13.368896484375, 14.14306640625, 14.917236328125, 15.69140625, 16.465576171875, 17.23974609375, 18.013916015625, 18.7880859375, 19.562255859375, 20.33642578125, 21.110595703125, 21.884765625, 22.658935546875, 23.43310546875, 24.207275390625, 24.9814453125, 25.755615234375, 26.52978515625, 27.303955078125, 28.078125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 9.0, 6.0, 3.0, 8.0, 13.0, 24.0, 24.0, 33.0, 41.0, 53.0, 54.0, 86.0, 90.0, 95.0, 92.0, 74.0, 74.0, 72.0, 39.0, 34.0, 27.0, 22.0, 16.0, 12.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.41015625, -5.25823974609375, -5.1063232421875, -4.95440673828125, -4.802490234375, -4.65057373046875, -4.4986572265625, -4.34674072265625, -4.19482421875, -4.04290771484375, -3.8909912109375, -3.73907470703125, -3.587158203125, -3.43524169921875, -3.2833251953125, -3.13140869140625, -2.9794921875, -2.82757568359375, -2.6756591796875, -2.52374267578125, -2.371826171875, -2.21990966796875, -2.0679931640625, -1.91607666015625, -1.76416015625, -1.61224365234375, -1.4603271484375, -1.30841064453125, -1.156494140625, -1.00457763671875, -0.8526611328125, -0.70074462890625, -0.548828125, -0.39691162109375, -0.2449951171875, -0.09307861328125, 0.058837890625, 0.21075439453125, 0.3626708984375, 0.51458740234375, 0.66650390625, 0.81842041015625, 0.9703369140625, 1.12225341796875, 1.274169921875, 1.42608642578125, 1.5780029296875, 1.72991943359375, 1.8818359375, 2.03375244140625, 2.1856689453125, 2.33758544921875, 2.489501953125, 2.64141845703125, 2.7933349609375, 2.94525146484375, 3.09716796875, 3.24908447265625, 3.4010009765625, 3.55291748046875, 3.704833984375, 3.85675048828125, 4.0086669921875, 4.16058349609375, 4.3125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 6.0, 9.0, 11.0, 16.0, 27.0, 50.0, 104.0, 206.0, 434.0, 858.0, 1800.0, 4175.0, 10360.0, 31446.0, 150956.0, 2469850.0, 1380529.0, 102452.0, 24516.0, 8740.0, 3857.0, 1858.0, 927.0, 507.0, 274.0, 136.0, 76.0, 44.0, 25.0, 14.0, 6.0, 5.0, 7.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.23828125, -7.0308837890625, -6.823486328125, -6.6160888671875, -6.40869140625, -6.2012939453125, -5.993896484375, -5.7864990234375, -5.5791015625, -5.3717041015625, -5.164306640625, -4.9569091796875, -4.74951171875, -4.5421142578125, -4.334716796875, -4.1273193359375, -3.919921875, -3.7125244140625, -3.505126953125, -3.2977294921875, -3.09033203125, -2.8829345703125, -2.675537109375, -2.4681396484375, -2.2607421875, -2.0533447265625, -1.845947265625, -1.6385498046875, -1.43115234375, -1.2237548828125, -1.016357421875, -0.8089599609375, -0.6015625, -0.3941650390625, -0.186767578125, 0.0206298828125, 0.22802734375, 0.4354248046875, 0.642822265625, 0.8502197265625, 1.0576171875, 1.2650146484375, 1.472412109375, 1.6798095703125, 1.88720703125, 2.0946044921875, 2.302001953125, 2.5093994140625, 2.716796875, 2.9241943359375, 3.131591796875, 3.3389892578125, 3.54638671875, 3.7537841796875, 3.961181640625, 4.1685791015625, 4.3759765625, 4.5833740234375, 4.790771484375, 4.9981689453125, 5.20556640625, 5.4129638671875, 5.620361328125, 5.8277587890625, 6.03515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 8.0, 6.0, 4.0, 7.0, 16.0, 11.0, 17.0, 28.0, 43.0, 54.0, 93.0, 165.0, 242.0, 479.0, 822.0, 775.0, 532.0, 293.0, 179.0, 84.0, 54.0, 47.0, 29.0, 16.0, 10.0, 9.0, 12.0, 6.0, 7.0, 1.0, 5.0, 6.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.46484375, -5.26318359375, -5.0615234375, -4.85986328125, -4.658203125, -4.45654296875, -4.2548828125, -4.05322265625, -3.8515625, -3.64990234375, -3.4482421875, -3.24658203125, -3.044921875, -2.84326171875, -2.6416015625, -2.43994140625, -2.23828125, -2.03662109375, -1.8349609375, -1.63330078125, -1.431640625, -1.22998046875, -1.0283203125, -0.82666015625, -0.625, -0.42333984375, -0.2216796875, -0.02001953125, 0.181640625, 0.38330078125, 0.5849609375, 0.78662109375, 0.98828125, 1.18994140625, 1.3916015625, 1.59326171875, 1.794921875, 1.99658203125, 2.1982421875, 2.39990234375, 2.6015625, 2.80322265625, 3.0048828125, 3.20654296875, 3.408203125, 3.60986328125, 3.8115234375, 4.01318359375, 4.21484375, 4.41650390625, 4.6181640625, 4.81982421875, 5.021484375, 5.22314453125, 5.4248046875, 5.62646484375, 5.828125, 6.02978515625, 6.2314453125, 6.43310546875, 6.634765625, 6.83642578125, 7.0380859375, 7.23974609375, 7.44140625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 0.0, 0.0, 3.0, 2.0, 6.0, 8.0, 17.0, 32.0, 68.0, 102.0, 208.0, 239.0, 173.0, 86.0, 29.0, 14.0, 8.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-107.73631286621094, -105.00628662109375, -102.2762680053711, -99.54624938964844, -96.81622314453125, -94.08619689941406, -91.3561782836914, -88.62615966796875, -85.89613342285156, -83.16610717773438, -80.43608856201172, -77.70606994628906, -74.97604370117188, -72.24601745605469, -69.51599884033203, -66.78598022460938, -64.05595397949219, -61.325931549072266, -58.595909118652344, -55.86588668823242, -53.1358642578125, -50.40584182739258, -47.675819396972656, -44.945796966552734, -42.21577453613281, -39.48575210571289, -36.75572967529297, -34.02570724487305, -31.295684814453125, -28.565662384033203, -25.83563995361328, -23.10561752319336, -20.375587463378906, -17.645565032958984, -14.915542602539062, -12.18552017211914, -9.455497741699219, -6.725475311279297, -3.995452880859375, -1.2654304504394531, 1.4645919799804688, 4.194614410400391, 6.9246368408203125, 9.654659271240234, 12.384681701660156, 15.114704132080078, 17.8447265625, 20.574748992919922, 23.304771423339844, 26.034793853759766, 28.764816284179688, 31.49483871459961, 34.22486114501953, 36.95488357543945, 39.684906005859375, 42.4149284362793, 45.14495086669922, 47.87497329711914, 50.60499572753906, 53.335018157958984, 56.065040588378906, 58.79506301879883, 61.52508544921875, 64.25511169433594, 66.9851303100586]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 6.0, 9.0, 9.0, 9.0, 15.0, 10.0, 18.0, 25.0, 28.0, 34.0, 33.0, 44.0, 43.0, 38.0, 52.0, 62.0, 49.0, 61.0, 56.0, 66.0, 41.0, 38.0, 28.0, 27.0, 36.0, 29.0, 31.0, 22.0, 13.0, 21.0, 15.0, 8.0, 10.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-30.920757293701172, -30.000701904296875, -29.080646514892578, -28.16058921813965, -27.24053382873535, -26.320478439331055, -25.400421142578125, -24.480365753173828, -23.56031036376953, -22.640254974365234, -21.720199584960938, -20.800142288208008, -19.88008689880371, -18.960031509399414, -18.039974212646484, -17.119918823242188, -16.19986343383789, -15.279808044433594, -14.35975170135498, -13.439695358276367, -12.51963996887207, -11.599584579467773, -10.67952823638916, -9.759471893310547, -8.83941650390625, -7.919360637664795, -6.99930477142334, -6.079248905181885, -5.15919303894043, -4.239137172698975, -3.3190813064575195, -2.3990254402160645, -1.4789695739746094, -0.5589137077331543, 0.3611421585083008, 1.2811980247497559, 2.201253890991211, 3.121309757232666, 4.041365623474121, 4.961421489715576, 5.881477355957031, 6.801533222198486, 7.721589088439941, 8.641645431518555, 9.561700820922852, 10.481756210327148, 11.401812553405762, 12.321868896484375, 13.241924285888672, 14.161979675292969, 15.082036018371582, 16.002092361450195, 16.922147750854492, 17.84220314025879, 18.76226043701172, 19.682315826416016, 20.602371215820312, 21.52242660522461, 22.442481994628906, 23.362539291381836, 24.282594680786133, 25.20265007019043, 26.12270736694336, 27.042762756347656, 27.962818145751953]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 2.0, 6.0, 14.0, 21.0, 27.0, 42.0, 68.0, 108.0, 177.0, 313.0, 591.0, 1042.0, 2092.0, 4260.0, 9477.0, 22316.0, 57484.0, 168194.0, 422462.0, 232522.0, 76062.0, 28543.0, 12028.0, 5340.0, 2595.0, 1292.0, 608.0, 361.0, 198.0, 117.0, 62.0, 52.0, 20.0, 27.0, 6.0, 10.0, 7.0, 7.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83203125, -5.63525390625, -5.4384765625, -5.24169921875, -5.044921875, -4.84814453125, -4.6513671875, -4.45458984375, -4.2578125, -4.06103515625, -3.8642578125, -3.66748046875, -3.470703125, -3.27392578125, -3.0771484375, -2.88037109375, -2.68359375, -2.48681640625, -2.2900390625, -2.09326171875, -1.896484375, -1.69970703125, -1.5029296875, -1.30615234375, -1.109375, -0.91259765625, -0.7158203125, -0.51904296875, -0.322265625, -0.12548828125, 0.0712890625, 0.26806640625, 0.46484375, 0.66162109375, 0.8583984375, 1.05517578125, 1.251953125, 1.44873046875, 1.6455078125, 1.84228515625, 2.0390625, 2.23583984375, 2.4326171875, 2.62939453125, 2.826171875, 3.02294921875, 3.2197265625, 3.41650390625, 3.61328125, 3.81005859375, 4.0068359375, 4.20361328125, 4.400390625, 4.59716796875, 4.7939453125, 4.99072265625, 5.1875, 5.38427734375, 5.5810546875, 5.77783203125, 5.974609375, 6.17138671875, 6.3681640625, 6.56494140625, 6.76171875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 8.0, 6.0, 5.0, 11.0, 10.0, 13.0, 15.0, 7.0, 21.0, 19.0, 17.0, 37.0, 38.0, 39.0, 42.0, 40.0, 49.0, 57.0, 60.0, 50.0, 49.0, 50.0, 50.0, 39.0, 40.0, 29.0, 35.0, 31.0, 22.0, 23.0, 16.0, 11.0, 19.0, 6.0, 9.0, 11.0, 2.0, 6.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.748046875, -2.6590576171875, -2.570068359375, -2.4810791015625, -2.39208984375, -2.3031005859375, -2.214111328125, -2.1251220703125, -2.0361328125, -1.9471435546875, -1.858154296875, -1.7691650390625, -1.68017578125, -1.5911865234375, -1.502197265625, -1.4132080078125, -1.32421875, -1.2352294921875, -1.146240234375, -1.0572509765625, -0.96826171875, -0.8792724609375, -0.790283203125, -0.7012939453125, -0.6123046875, -0.5233154296875, -0.434326171875, -0.3453369140625, -0.25634765625, -0.1673583984375, -0.078369140625, 0.0106201171875, 0.099609375, 0.1885986328125, 0.277587890625, 0.3665771484375, 0.45556640625, 0.5445556640625, 0.633544921875, 0.7225341796875, 0.8115234375, 0.9005126953125, 0.989501953125, 1.0784912109375, 1.16748046875, 1.2564697265625, 1.345458984375, 1.4344482421875, 1.5234375, 1.6124267578125, 1.701416015625, 1.7904052734375, 1.87939453125, 1.9683837890625, 2.057373046875, 2.1463623046875, 2.2353515625, 2.3243408203125, 2.413330078125, 2.5023193359375, 2.59130859375, 2.6802978515625, 2.769287109375, 2.8582763671875, 2.947265625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 1.0, 2.0, 6.0, 7.0, 9.0, 20.0, 17.0, 51.0, 62.0, 136.0, 229.0, 450.0, 1157.0, 4387.0, 38469.0, 776206.0, 210383.0, 13136.0, 2290.0, 765.0, 346.0, 166.0, 85.0, 61.0, 34.0, 25.0, 20.0, 13.0, 7.0, 4.0, 8.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.390625, -17.82958984375, -17.2685546875, -16.70751953125, -16.146484375, -15.58544921875, -15.0244140625, -14.46337890625, -13.90234375, -13.34130859375, -12.7802734375, -12.21923828125, -11.658203125, -11.09716796875, -10.5361328125, -9.97509765625, -9.4140625, -8.85302734375, -8.2919921875, -7.73095703125, -7.169921875, -6.60888671875, -6.0478515625, -5.48681640625, -4.92578125, -4.36474609375, -3.8037109375, -3.24267578125, -2.681640625, -2.12060546875, -1.5595703125, -0.99853515625, -0.4375, 0.12353515625, 0.6845703125, 1.24560546875, 1.806640625, 2.36767578125, 2.9287109375, 3.48974609375, 4.05078125, 4.61181640625, 5.1728515625, 5.73388671875, 6.294921875, 6.85595703125, 7.4169921875, 7.97802734375, 8.5390625, 9.10009765625, 9.6611328125, 10.22216796875, 10.783203125, 11.34423828125, 11.9052734375, 12.46630859375, 13.02734375, 13.58837890625, 14.1494140625, 14.71044921875, 15.271484375, 15.83251953125, 16.3935546875, 16.95458984375, 17.515625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 6.0, 2.0, 6.0, 3.0, 6.0, 8.0, 9.0, 14.0, 16.0, 20.0, 18.0, 26.0, 31.0, 20.0, 32.0, 47.0, 37.0, 51.0, 49.0, 57.0, 47.0, 38.0, 52.0, 42.0, 43.0, 37.0, 34.0, 27.0, 34.0, 29.0, 26.0, 21.0, 19.0, 18.0, 18.0, 15.0, 6.0, 3.0, 8.0, 4.0, 2.0, 8.0, 5.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.34375, -9.033935546875, -8.72412109375, -8.414306640625, -8.1044921875, -7.794677734375, -7.48486328125, -7.175048828125, -6.865234375, -6.555419921875, -6.24560546875, -5.935791015625, -5.6259765625, -5.316162109375, -5.00634765625, -4.696533203125, -4.38671875, -4.076904296875, -3.76708984375, -3.457275390625, -3.1474609375, -2.837646484375, -2.52783203125, -2.218017578125, -1.908203125, -1.598388671875, -1.28857421875, -0.978759765625, -0.6689453125, -0.359130859375, -0.04931640625, 0.260498046875, 0.5703125, 0.880126953125, 1.18994140625, 1.499755859375, 1.8095703125, 2.119384765625, 2.42919921875, 2.739013671875, 3.048828125, 3.358642578125, 3.66845703125, 3.978271484375, 4.2880859375, 4.597900390625, 4.90771484375, 5.217529296875, 5.52734375, 5.837158203125, 6.14697265625, 6.456787109375, 6.7666015625, 7.076416015625, 7.38623046875, 7.696044921875, 8.005859375, 8.315673828125, 8.62548828125, 8.935302734375, 9.2451171875, 9.554931640625, 9.86474609375, 10.174560546875, 10.484375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 6.0, 10.0, 15.0, 23.0, 42.0, 43.0, 96.0, 217.0, 647.0, 2544.0, 23619.0, 967395.0, 48950.0, 3561.0, 788.0, 260.0, 123.0, 65.0, 43.0, 29.0, 20.0, 11.0, 12.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.1640625, -13.754638671875, -13.34521484375, -12.935791015625, -12.5263671875, -12.116943359375, -11.70751953125, -11.298095703125, -10.888671875, -10.479248046875, -10.06982421875, -9.660400390625, -9.2509765625, -8.841552734375, -8.43212890625, -8.022705078125, -7.61328125, -7.203857421875, -6.79443359375, -6.385009765625, -5.9755859375, -5.566162109375, -5.15673828125, -4.747314453125, -4.337890625, -3.928466796875, -3.51904296875, -3.109619140625, -2.7001953125, -2.290771484375, -1.88134765625, -1.471923828125, -1.0625, -0.653076171875, -0.24365234375, 0.165771484375, 0.5751953125, 0.984619140625, 1.39404296875, 1.803466796875, 2.212890625, 2.622314453125, 3.03173828125, 3.441162109375, 3.8505859375, 4.260009765625, 4.66943359375, 5.078857421875, 5.48828125, 5.897705078125, 6.30712890625, 6.716552734375, 7.1259765625, 7.535400390625, 7.94482421875, 8.354248046875, 8.763671875, 9.173095703125, 9.58251953125, 9.991943359375, 10.4013671875, 10.810791015625, 11.22021484375, 11.629638671875, 12.0390625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 7.0, 3.0, 8.0, 5.0, 3.0, 14.0, 9.0, 16.0, 18.0, 24.0, 29.0, 36.0, 59.0, 50.0, 80.0, 90.0, 106.0, 96.0, 82.0, 47.0, 43.0, 24.0, 28.0, 24.0, 10.0, 17.0, 10.0, 13.0, 11.0, 8.0, 4.0, 6.0, 3.0, 4.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0006394386291503906, -0.0006213411688804626, -0.0006032437086105347, -0.0005851462483406067, -0.0005670487880706787, -0.0005489513278007507, -0.0005308538675308228, -0.0005127564072608948, -0.0004946589469909668, -0.0004765614867210388, -0.00045846402645111084, -0.00044036656618118286, -0.0004222691059112549, -0.0004041716456413269, -0.0003860741853713989, -0.00036797672510147095, -0.00034987926483154297, -0.000331781804561615, -0.000313684344291687, -0.00029558688402175903, -0.00027748942375183105, -0.0002593919634819031, -0.0002412945032119751, -0.00022319704294204712, -0.00020509958267211914, -0.00018700212240219116, -0.00016890466213226318, -0.0001508072018623352, -0.00013270974159240723, -0.00011461228132247925, -9.651482105255127e-05, -7.841736078262329e-05, -6.031990051269531e-05, -4.2222440242767334e-05, -2.4124979972839355e-05, -6.027519702911377e-06, 1.2069940567016602e-05, 3.016740083694458e-05, 4.826486110687256e-05, 6.636232137680054e-05, 8.445978164672852e-05, 0.0001025572419166565, 0.00012065470218658447, 0.00013875216245651245, 0.00015684962272644043, 0.0001749470829963684, 0.0001930445432662964, 0.00021114200353622437, 0.00022923946380615234, 0.0002473369240760803, 0.0002654343843460083, 0.0002835318446159363, 0.00030162930488586426, 0.00031972676515579224, 0.0003378242254257202, 0.0003559216856956482, 0.00037401914596557617, 0.00039211660623550415, 0.00041021406650543213, 0.0004283115267753601, 0.0004464089870452881, 0.00046450644731521606, 0.00048260390758514404, 0.000500701367855072, 0.000518798828125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 3.0, 8.0, 5.0, 9.0, 10.0, 17.0, 32.0, 34.0, 51.0, 89.0, 140.0, 218.0, 349.0, 695.0, 1492.0, 3492.0, 12651.0, 103249.0, 790575.0, 114887.0, 13630.0, 3696.0, 1528.0, 694.0, 370.0, 239.0, 107.0, 90.0, 55.0, 31.0, 26.0, 16.0, 20.0, 7.0, 6.0, 6.0, 9.0, 5.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.04296875, -4.86614990234375, -4.6893310546875, -4.51251220703125, -4.335693359375, -4.15887451171875, -3.9820556640625, -3.80523681640625, -3.62841796875, -3.45159912109375, -3.2747802734375, -3.09796142578125, -2.921142578125, -2.74432373046875, -2.5675048828125, -2.39068603515625, -2.2138671875, -2.03704833984375, -1.8602294921875, -1.68341064453125, -1.506591796875, -1.32977294921875, -1.1529541015625, -0.97613525390625, -0.79931640625, -0.62249755859375, -0.4456787109375, -0.26885986328125, -0.092041015625, 0.08477783203125, 0.2615966796875, 0.43841552734375, 0.615234375, 0.79205322265625, 0.9688720703125, 1.14569091796875, 1.322509765625, 1.49932861328125, 1.6761474609375, 1.85296630859375, 2.02978515625, 2.20660400390625, 2.3834228515625, 2.56024169921875, 2.737060546875, 2.91387939453125, 3.0906982421875, 3.26751708984375, 3.4443359375, 3.62115478515625, 3.7979736328125, 3.97479248046875, 4.151611328125, 4.32843017578125, 4.5052490234375, 4.68206787109375, 4.85888671875, 5.03570556640625, 5.2125244140625, 5.38934326171875, 5.566162109375, 5.74298095703125, 5.9197998046875, 6.09661865234375, 6.2734375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 6.0, 9.0, 8.0, 15.0, 14.0, 17.0, 31.0, 38.0, 51.0, 53.0, 78.0, 69.0, 90.0, 95.0, 82.0, 78.0, 61.0, 48.0, 40.0, 27.0, 27.0, 16.0, 13.0, 13.0, 10.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.4375, -4.320404052734375, -4.20330810546875, -4.086212158203125, -3.9691162109375, -3.852020263671875, -3.73492431640625, -3.617828369140625, -3.500732421875, -3.383636474609375, -3.26654052734375, -3.149444580078125, -3.0323486328125, -2.915252685546875, -2.79815673828125, -2.681060791015625, -2.56396484375, -2.446868896484375, -2.32977294921875, -2.212677001953125, -2.0955810546875, -1.978485107421875, -1.86138916015625, -1.744293212890625, -1.627197265625, -1.510101318359375, -1.39300537109375, -1.275909423828125, -1.1588134765625, -1.041717529296875, -0.92462158203125, -0.807525634765625, -0.6904296875, -0.573333740234375, -0.45623779296875, -0.339141845703125, -0.2220458984375, -0.104949951171875, 0.01214599609375, 0.129241943359375, 0.246337890625, 0.363433837890625, 0.48052978515625, 0.597625732421875, 0.7147216796875, 0.831817626953125, 0.94891357421875, 1.066009521484375, 1.18310546875, 1.300201416015625, 1.41729736328125, 1.534393310546875, 1.6514892578125, 1.768585205078125, 1.88568115234375, 2.002777099609375, 2.119873046875, 2.236968994140625, 2.35406494140625, 2.471160888671875, 2.5882568359375, 2.705352783203125, 2.82244873046875, 2.939544677734375, 3.056640625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 12.0, 11.0, 17.0, 80.0, 195.0, 348.0, 231.0, 73.0, 20.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.63168334960938, -139.75608825683594, -134.8804931640625, -130.00489807128906, -125.12930297851562, -120.25370788574219, -115.37811279296875, -110.50251770019531, -105.62692260742188, -100.75132751464844, -95.875732421875, -91.00013732910156, -86.12454223632812, -81.24894714355469, -76.37335205078125, -71.49775695800781, -66.62215423583984, -61.746559143066406, -56.87096405029297, -51.99536895751953, -47.119773864746094, -42.244178771972656, -37.36857986450195, -32.492984771728516, -27.617389678955078, -22.74179458618164, -17.866199493408203, -12.990602493286133, -8.115007400512695, -3.239412307739258, 1.6361846923828125, 6.51177978515625, 11.387374877929688, 16.262969970703125, 21.138565063476562, 26.014162063598633, 30.88975715637207, 35.765350341796875, 40.64094924926758, 45.516544342041016, 50.39213943481445, 55.26773452758789, 60.14332962036133, 65.01892852783203, 69.89452362060547, 74.7701187133789, 79.64571380615234, 84.52130889892578, 89.39690399169922, 94.27249908447266, 99.1480941772461, 104.02368927001953, 108.89928436279297, 113.7748794555664, 118.65048217773438, 123.52607727050781, 128.40167236328125, 133.2772674560547, 138.15286254882812, 143.02845764160156, 147.904052734375, 152.77964782714844, 157.65524291992188, 162.5308380126953, 167.40643310546875]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 8.0, 9.0, 9.0, 14.0, 9.0, 15.0, 17.0, 25.0, 24.0, 21.0, 32.0, 30.0, 36.0, 63.0, 65.0, 54.0, 54.0, 67.0, 58.0, 60.0, 51.0, 34.0, 39.0, 24.0, 24.0, 25.0, 20.0, 18.0, 15.0, 19.0, 11.0, 9.0, 15.0, 11.0, 5.0, 6.0, 1.0, 6.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0], "bins": [-54.15583801269531, -52.63431930541992, -51.112796783447266, -49.591278076171875, -48.069759368896484, -46.54823684692383, -45.02671813964844, -43.50519561767578, -41.98367691040039, -40.462158203125, -38.940635681152344, -37.41911697387695, -35.89759826660156, -34.376075744628906, -32.854557037353516, -31.333036422729492, -29.8115177154541, -28.289997100830078, -26.768478393554688, -25.246957778930664, -23.72543716430664, -22.20391845703125, -20.682397842407227, -19.160877227783203, -17.639358520507812, -16.11783790588379, -14.596318244934082, -13.074798583984375, -11.553277969360352, -10.031758308410645, -8.510238647460938, -6.988718032836914, -5.467197418212891, -3.9456772804260254, -2.4241573810577393, -0.9026374816894531, 0.6188826560974121, 2.1404027938842773, 3.6619224548339844, 5.183443069458008, 6.704962730407715, 8.226482391357422, 9.748003005981445, 11.269522666931152, 12.79104232788086, 14.312562942504883, 15.83408260345459, 17.355602264404297, 18.87712287902832, 20.398643493652344, 21.920162200927734, 23.441682815551758, 24.96320343017578, 26.484722137451172, 28.006242752075195, 29.52776336669922, 31.04928207397461, 32.57080078125, 34.092323303222656, 35.61384201049805, 37.13536071777344, 38.656883239746094, 40.178401947021484, 41.699920654296875, 43.22144317626953]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 7.0, 7.0, 7.0, 16.0, 21.0, 36.0, 65.0, 100.0, 223.0, 507.0, 1694.0, 7806.0, 48856.0, 827523.0, 3122828.0, 161965.0, 17480.0, 3466.0, 940.0, 338.0, 139.0, 96.0, 52.0, 20.0, 21.0, 22.0, 9.0, 3.0, 4.0, 10.0, 4.0, 2.0, 0.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.9639892578125, -7.717041015625, -7.4700927734375, -7.22314453125, -6.9761962890625, -6.729248046875, -6.4822998046875, -6.2353515625, -5.9884033203125, -5.741455078125, -5.4945068359375, -5.24755859375, -5.0006103515625, -4.753662109375, -4.5067138671875, -4.259765625, -4.0128173828125, -3.765869140625, -3.5189208984375, -3.27197265625, -3.0250244140625, -2.778076171875, -2.5311279296875, -2.2841796875, -2.0372314453125, -1.790283203125, -1.5433349609375, -1.29638671875, -1.0494384765625, -0.802490234375, -0.5555419921875, -0.30859375, -0.0616455078125, 0.185302734375, 0.4322509765625, 0.67919921875, 0.9261474609375, 1.173095703125, 1.4200439453125, 1.6669921875, 1.9139404296875, 2.160888671875, 2.4078369140625, 2.65478515625, 2.9017333984375, 3.148681640625, 3.3956298828125, 3.642578125, 3.8895263671875, 4.136474609375, 4.3834228515625, 4.63037109375, 4.8773193359375, 5.124267578125, 5.3712158203125, 5.6181640625, 5.8651123046875, 6.112060546875, 6.3590087890625, 6.60595703125, 6.8529052734375, 7.099853515625, 7.3468017578125, 7.59375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 4.0, 3.0, 9.0, 9.0, 20.0, 6.0, 32.0, 23.0, 39.0, 59.0, 61.0, 65.0, 95.0, 75.0, 76.0, 85.0, 82.0, 63.0, 56.0, 35.0, 38.0, 23.0, 18.0, 12.0, 10.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.234375, -2.10333251953125, -1.9722900390625, -1.84124755859375, -1.710205078125, -1.57916259765625, -1.4481201171875, -1.31707763671875, -1.18603515625, -1.05499267578125, -0.9239501953125, -0.79290771484375, -0.661865234375, -0.53082275390625, -0.3997802734375, -0.26873779296875, -0.1376953125, -0.00665283203125, 0.1243896484375, 0.25543212890625, 0.386474609375, 0.51751708984375, 0.6485595703125, 0.77960205078125, 0.91064453125, 1.04168701171875, 1.1727294921875, 1.30377197265625, 1.434814453125, 1.56585693359375, 1.6968994140625, 1.82794189453125, 1.958984375, 2.09002685546875, 2.2210693359375, 2.35211181640625, 2.483154296875, 2.61419677734375, 2.7452392578125, 2.87628173828125, 3.00732421875, 3.13836669921875, 3.2694091796875, 3.40045166015625, 3.531494140625, 3.66253662109375, 3.7935791015625, 3.92462158203125, 4.0556640625, 4.18670654296875, 4.3177490234375, 4.44879150390625, 4.579833984375, 4.71087646484375, 4.8419189453125, 4.97296142578125, 5.10400390625, 5.23504638671875, 5.3660888671875, 5.49713134765625, 5.628173828125, 5.75921630859375, 5.8902587890625, 6.02130126953125, 6.15234375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 4.0, 10.0, 16.0, 27.0, 27.0, 38.0, 63.0, 120.0, 210.0, 385.0, 842.0, 1845.0, 4776.0, 13803.0, 49158.0, 248095.0, 2394157.0, 1266631.0, 154282.0, 38782.0, 12275.0, 4724.0, 1984.0, 885.0, 455.0, 255.0, 139.0, 91.0, 53.0, 41.0, 22.0, 21.0, 12.0, 17.0, 13.0, 9.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.18359375, -5.00994873046875, -4.8363037109375, -4.66265869140625, -4.489013671875, -4.31536865234375, -4.1417236328125, -3.96807861328125, -3.79443359375, -3.62078857421875, -3.4471435546875, -3.27349853515625, -3.099853515625, -2.92620849609375, -2.7525634765625, -2.57891845703125, -2.4052734375, -2.23162841796875, -2.0579833984375, -1.88433837890625, -1.710693359375, -1.53704833984375, -1.3634033203125, -1.18975830078125, -1.01611328125, -0.84246826171875, -0.6688232421875, -0.49517822265625, -0.321533203125, -0.14788818359375, 0.0257568359375, 0.19940185546875, 0.373046875, 0.54669189453125, 0.7203369140625, 0.89398193359375, 1.067626953125, 1.24127197265625, 1.4149169921875, 1.58856201171875, 1.76220703125, 1.93585205078125, 2.1094970703125, 2.28314208984375, 2.456787109375, 2.63043212890625, 2.8040771484375, 2.97772216796875, 3.1513671875, 3.32501220703125, 3.4986572265625, 3.67230224609375, 3.845947265625, 4.01959228515625, 4.1932373046875, 4.36688232421875, 4.54052734375, 4.71417236328125, 4.8878173828125, 5.06146240234375, 5.235107421875, 5.40875244140625, 5.5823974609375, 5.75604248046875, 5.9296875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 4.0, 4.0, 8.0, 15.0, 8.0, 11.0, 18.0, 21.0, 31.0, 42.0, 66.0, 86.0, 97.0, 147.0, 191.0, 286.0, 409.0, 478.0, 506.0, 397.0, 308.0, 225.0, 151.0, 114.0, 76.0, 73.0, 59.0, 46.0, 40.0, 35.0, 20.0, 17.0, 11.0, 11.0, 15.0, 9.0, 11.0, 5.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.03125, -3.86480712890625, -3.6983642578125, -3.53192138671875, -3.365478515625, -3.19903564453125, -3.0325927734375, -2.86614990234375, -2.69970703125, -2.53326416015625, -2.3668212890625, -2.20037841796875, -2.033935546875, -1.86749267578125, -1.7010498046875, -1.53460693359375, -1.3681640625, -1.20172119140625, -1.0352783203125, -0.86883544921875, -0.702392578125, -0.53594970703125, -0.3695068359375, -0.20306396484375, -0.03662109375, 0.12982177734375, 0.2962646484375, 0.46270751953125, 0.629150390625, 0.79559326171875, 0.9620361328125, 1.12847900390625, 1.294921875, 1.46136474609375, 1.6278076171875, 1.79425048828125, 1.960693359375, 2.12713623046875, 2.2935791015625, 2.46002197265625, 2.62646484375, 2.79290771484375, 2.9593505859375, 3.12579345703125, 3.292236328125, 3.45867919921875, 3.6251220703125, 3.79156494140625, 3.9580078125, 4.12445068359375, 4.2908935546875, 4.45733642578125, 4.623779296875, 4.79022216796875, 4.9566650390625, 5.12310791015625, 5.28955078125, 5.45599365234375, 5.6224365234375, 5.78887939453125, 5.955322265625, 6.12176513671875, 6.2882080078125, 6.45465087890625, 6.62109375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 10.0, 41.0, 134.0, 278.0, 321.0, 141.0, 54.0, 9.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.74945068359375, -102.31724548339844, -97.88504791259766, -93.45284271240234, -89.02064514160156, -84.58843994140625, -80.15623474121094, -75.72402954101562, -71.29183197021484, -66.85962677001953, -62.42742919921875, -57.99522399902344, -53.56302261352539, -49.130821228027344, -44.69861602783203, -40.266414642333984, -35.83421325683594, -31.40201187133789, -26.96980857849121, -22.53760528564453, -18.105403900146484, -13.673202514648438, -9.240999221801758, -4.808795928955078, -0.37659454345703125, 4.055607795715332, 8.487810134887695, 12.920012474060059, 17.352214813232422, 21.78441619873047, 26.21661949157715, 30.648822784423828, 35.081024169921875, 39.51322555541992, 43.94542694091797, 48.37763214111328, 52.80983352661133, 57.242034912109375, 61.67424011230469, 66.1064453125, 70.53864288330078, 74.9708480834961, 79.40304565429688, 83.83525085449219, 88.2674560546875, 92.69965362548828, 97.1318588256836, 101.56405639648438, 105.99626159667969, 110.428466796875, 114.86066436767578, 119.2928695678711, 123.72506713867188, 128.1572723388672, 132.5894775390625, 137.0216827392578, 141.45388793945312, 145.88609313964844, 150.31829833984375, 154.75048828125, 159.1826934814453, 163.61489868164062, 168.04710388183594, 172.47930908203125, 176.9114990234375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 7.0, 6.0, 8.0, 10.0, 10.0, 20.0, 23.0, 25.0, 33.0, 27.0, 48.0, 48.0, 50.0, 47.0, 68.0, 49.0, 54.0, 61.0, 55.0, 43.0, 62.0, 38.0, 38.0, 30.0, 29.0, 26.0, 24.0, 20.0, 17.0, 5.0, 3.0, 7.0, 7.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-54.768924713134766, -53.43083572387695, -52.09274673461914, -50.75465774536133, -49.416568756103516, -48.07848358154297, -46.740394592285156, -45.402305603027344, -44.06421661376953, -42.72612762451172, -41.388038635253906, -40.049949645996094, -38.71186065673828, -37.37377166748047, -36.035682678222656, -34.69759750366211, -33.35950469970703, -32.02141571044922, -30.683326721191406, -29.345237731933594, -28.007150650024414, -26.6690616607666, -25.33097267150879, -23.99288558959961, -22.654796600341797, -21.316707611083984, -19.978618621826172, -18.64052963256836, -17.30244255065918, -15.964353561401367, -14.626264572143555, -13.288176536560059, -11.950088500976562, -10.61199951171875, -9.273911476135254, -7.935822486877441, -6.597733974456787, -5.259645462036133, -3.9215564727783203, -2.583468437194824, -1.2453794479370117, 0.09270918369293213, 1.430797815322876, 2.7688865661621094, 4.106975078582764, 5.445063591003418, 6.7831525802612305, 8.121240615844727, 9.459329605102539, 10.797418594360352, 12.135506629943848, 13.47359561920166, 14.811683654785156, 16.14977264404297, 17.48786163330078, 18.825950622558594, 20.164039611816406, 21.50212860107422, 22.84021759033203, 24.178306579589844, 25.516393661499023, 26.854482650756836, 28.19257164001465, 29.530658721923828, 30.86874771118164]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 9.0, 9.0, 16.0, 26.0, 52.0, 61.0, 138.0, 204.0, 347.0, 609.0, 1236.0, 2533.0, 5862.0, 15779.0, 46153.0, 138796.0, 388171.0, 297527.0, 98109.0, 32701.0, 11543.0, 4418.0, 2087.0, 984.0, 497.0, 253.0, 143.0, 91.0, 77.0, 37.0, 22.0, 22.0, 11.0, 7.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.56640625, -6.34637451171875, -6.1263427734375, -5.90631103515625, -5.686279296875, -5.46624755859375, -5.2462158203125, -5.02618408203125, -4.80615234375, -4.58612060546875, -4.3660888671875, -4.14605712890625, -3.926025390625, -3.70599365234375, -3.4859619140625, -3.26593017578125, -3.0458984375, -2.82586669921875, -2.6058349609375, -2.38580322265625, -2.165771484375, -1.94573974609375, -1.7257080078125, -1.50567626953125, -1.28564453125, -1.06561279296875, -0.8455810546875, -0.62554931640625, -0.405517578125, -0.18548583984375, 0.0345458984375, 0.25457763671875, 0.474609375, 0.69464111328125, 0.9146728515625, 1.13470458984375, 1.354736328125, 1.57476806640625, 1.7947998046875, 2.01483154296875, 2.23486328125, 2.45489501953125, 2.6749267578125, 2.89495849609375, 3.114990234375, 3.33502197265625, 3.5550537109375, 3.77508544921875, 3.9951171875, 4.21514892578125, 4.4351806640625, 4.65521240234375, 4.875244140625, 5.09527587890625, 5.3153076171875, 5.53533935546875, 5.75537109375, 5.97540283203125, 6.1954345703125, 6.41546630859375, 6.635498046875, 6.85552978515625, 7.0755615234375, 7.29559326171875, 7.515625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 12.0, 11.0, 13.0, 18.0, 11.0, 21.0, 20.0, 28.0, 33.0, 34.0, 37.0, 39.0, 47.0, 41.0, 47.0, 61.0, 58.0, 42.0, 44.0, 47.0, 42.0, 40.0, 37.0, 34.0, 23.0, 25.0, 18.0, 23.0, 19.0, 13.0, 14.0, 9.0, 5.0, 8.0, 3.0, 6.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.310546875, -2.232391357421875, -2.15423583984375, -2.076080322265625, -1.9979248046875, -1.919769287109375, -1.84161376953125, -1.763458251953125, -1.685302734375, -1.607147216796875, -1.52899169921875, -1.450836181640625, -1.3726806640625, -1.294525146484375, -1.21636962890625, -1.138214111328125, -1.06005859375, -0.981903076171875, -0.90374755859375, -0.825592041015625, -0.7474365234375, -0.669281005859375, -0.59112548828125, -0.512969970703125, -0.434814453125, -0.356658935546875, -0.27850341796875, -0.200347900390625, -0.1221923828125, -0.044036865234375, 0.03411865234375, 0.112274169921875, 0.1904296875, 0.268585205078125, 0.34674072265625, 0.424896240234375, 0.5030517578125, 0.581207275390625, 0.65936279296875, 0.737518310546875, 0.815673828125, 0.893829345703125, 0.97198486328125, 1.050140380859375, 1.1282958984375, 1.206451416015625, 1.28460693359375, 1.362762451171875, 1.44091796875, 1.519073486328125, 1.59722900390625, 1.675384521484375, 1.7535400390625, 1.831695556640625, 1.90985107421875, 1.988006591796875, 2.066162109375, 2.144317626953125, 2.22247314453125, 2.300628662109375, 2.3787841796875, 2.456939697265625, 2.53509521484375, 2.613250732421875, 2.69140625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 2.0, 7.0, 4.0, 5.0, 11.0, 20.0, 18.0, 31.0, 35.0, 43.0, 89.0, 116.0, 179.0, 276.0, 481.0, 942.0, 2212.0, 7619.0, 97878.0, 876056.0, 53119.0, 5631.0, 1778.0, 834.0, 435.0, 255.0, 136.0, 102.0, 64.0, 56.0, 35.0, 23.0, 16.0, 13.0, 8.0, 5.0, 7.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.671875, -19.02490234375, -18.3779296875, -17.73095703125, -17.083984375, -16.43701171875, -15.7900390625, -15.14306640625, -14.49609375, -13.84912109375, -13.2021484375, -12.55517578125, -11.908203125, -11.26123046875, -10.6142578125, -9.96728515625, -9.3203125, -8.67333984375, -8.0263671875, -7.37939453125, -6.732421875, -6.08544921875, -5.4384765625, -4.79150390625, -4.14453125, -3.49755859375, -2.8505859375, -2.20361328125, -1.556640625, -0.90966796875, -0.2626953125, 0.38427734375, 1.03125, 1.67822265625, 2.3251953125, 2.97216796875, 3.619140625, 4.26611328125, 4.9130859375, 5.56005859375, 6.20703125, 6.85400390625, 7.5009765625, 8.14794921875, 8.794921875, 9.44189453125, 10.0888671875, 10.73583984375, 11.3828125, 12.02978515625, 12.6767578125, 13.32373046875, 13.970703125, 14.61767578125, 15.2646484375, 15.91162109375, 16.55859375, 17.20556640625, 17.8525390625, 18.49951171875, 19.146484375, 19.79345703125, 20.4404296875, 21.08740234375, 21.734375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 2.0, 5.0, 6.0, 8.0, 5.0, 6.0, 8.0, 14.0, 17.0, 16.0, 17.0, 18.0, 26.0, 28.0, 27.0, 33.0, 32.0, 37.0, 38.0, 50.0, 52.0, 38.0, 47.0, 46.0, 46.0, 44.0, 35.0, 48.0, 35.0, 31.0, 33.0, 23.0, 22.0, 15.0, 21.0, 19.0, 10.0, 7.0, 7.0, 9.0, 2.0, 5.0, 3.0, 6.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-11.6796875, -11.337158203125, -10.99462890625, -10.652099609375, -10.3095703125, -9.967041015625, -9.62451171875, -9.281982421875, -8.939453125, -8.596923828125, -8.25439453125, -7.911865234375, -7.5693359375, -7.226806640625, -6.88427734375, -6.541748046875, -6.19921875, -5.856689453125, -5.51416015625, -5.171630859375, -4.8291015625, -4.486572265625, -4.14404296875, -3.801513671875, -3.458984375, -3.116455078125, -2.77392578125, -2.431396484375, -2.0888671875, -1.746337890625, -1.40380859375, -1.061279296875, -0.71875, -0.376220703125, -0.03369140625, 0.308837890625, 0.6513671875, 0.993896484375, 1.33642578125, 1.678955078125, 2.021484375, 2.364013671875, 2.70654296875, 3.049072265625, 3.3916015625, 3.734130859375, 4.07666015625, 4.419189453125, 4.76171875, 5.104248046875, 5.44677734375, 5.789306640625, 6.1318359375, 6.474365234375, 6.81689453125, 7.159423828125, 7.501953125, 7.844482421875, 8.18701171875, 8.529541015625, 8.8720703125, 9.214599609375, 9.55712890625, 9.899658203125, 10.2421875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 8.0, 3.0, 6.0, 11.0, 12.0, 14.0, 22.0, 30.0, 60.0, 71.0, 169.0, 345.0, 768.0, 2171.0, 8678.0, 91603.0, 864385.0, 69318.0, 7481.0, 1951.0, 677.0, 325.0, 161.0, 79.0, 65.0, 33.0, 16.0, 16.0, 20.0, 11.0, 5.0, 7.0, 7.0, 2.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0], "bins": [-7.69140625, -7.46148681640625, -7.2315673828125, -7.00164794921875, -6.771728515625, -6.54180908203125, -6.3118896484375, -6.08197021484375, -5.85205078125, -5.62213134765625, -5.3922119140625, -5.16229248046875, -4.932373046875, -4.70245361328125, -4.4725341796875, -4.24261474609375, -4.0126953125, -3.78277587890625, -3.5528564453125, -3.32293701171875, -3.093017578125, -2.86309814453125, -2.6331787109375, -2.40325927734375, -2.17333984375, -1.94342041015625, -1.7135009765625, -1.48358154296875, -1.253662109375, -1.02374267578125, -0.7938232421875, -0.56390380859375, -0.333984375, -0.10406494140625, 0.1258544921875, 0.35577392578125, 0.585693359375, 0.81561279296875, 1.0455322265625, 1.27545166015625, 1.50537109375, 1.73529052734375, 1.9652099609375, 2.19512939453125, 2.425048828125, 2.65496826171875, 2.8848876953125, 3.11480712890625, 3.3447265625, 3.57464599609375, 3.8045654296875, 4.03448486328125, 4.264404296875, 4.49432373046875, 4.7242431640625, 4.95416259765625, 5.18408203125, 5.41400146484375, 5.6439208984375, 5.87384033203125, 6.103759765625, 6.33367919921875, 6.5635986328125, 6.79351806640625, 7.0234375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 4.0, 6.0, 10.0, 14.0, 10.0, 9.0, 28.0, 20.0, 29.0, 36.0, 49.0, 43.0, 69.0, 110.0, 141.0, 119.0, 55.0, 46.0, 27.0, 36.0, 27.0, 16.0, 19.0, 13.0, 14.0, 8.0, 7.0, 10.0, 5.0, 6.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0008974075317382812, -0.0008689090609550476, -0.000840410590171814, -0.0008119121193885803, -0.0007834136486053467, -0.000754915177822113, -0.0007264167070388794, -0.0006979182362556458, -0.0006694197654724121, -0.0006409212946891785, -0.0006124228239059448, -0.0005839243531227112, -0.0005554258823394775, -0.0005269274115562439, -0.0004984289407730103, -0.0004699304699897766, -0.00044143199920654297, -0.0004129335284233093, -0.0003844350576400757, -0.00035593658685684204, -0.0003274381160736084, -0.00029893964529037476, -0.0002704411745071411, -0.00024194270372390747, -0.00021344423294067383, -0.00018494576215744019, -0.00015644729137420654, -0.0001279488205909729, -9.945034980773926e-05, -7.095187902450562e-05, -4.245340824127197e-05, -1.395493745803833e-05, 1.4543533325195312e-05, 4.3042004108428955e-05, 7.15404748916626e-05, 0.00010003894567489624, 0.00012853741645812988, 0.00015703588724136353, 0.00018553435802459717, 0.0002140328288078308, 0.00024253129959106445, 0.0002710297703742981, 0.00029952824115753174, 0.0003280267119407654, 0.000356525182723999, 0.00038502365350723267, 0.0004135221242904663, 0.00044202059507369995, 0.0004705190658569336, 0.0004990175366401672, 0.0005275160074234009, 0.0005560144782066345, 0.0005845129489898682, 0.0006130114197731018, 0.0006415098905563354, 0.0006700083613395691, 0.0006985068321228027, 0.0007270053029060364, 0.00075550377368927, 0.0007840022444725037, 0.0008125007152557373, 0.000840999186038971, 0.0008694976568222046, 0.0008979961276054382, 0.0009264945983886719]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 9.0, 4.0, 8.0, 11.0, 12.0, 22.0, 17.0, 34.0, 51.0, 63.0, 83.0, 166.0, 257.0, 484.0, 1026.0, 2534.0, 8574.0, 55348.0, 828955.0, 131100.0, 13446.0, 3506.0, 1330.0, 614.0, 342.0, 222.0, 110.0, 64.0, 43.0, 33.0, 27.0, 13.0, 16.0, 10.0, 2.0, 5.0, 8.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.12890625, -5.928955078125, -5.72900390625, -5.529052734375, -5.3291015625, -5.129150390625, -4.92919921875, -4.729248046875, -4.529296875, -4.329345703125, -4.12939453125, -3.929443359375, -3.7294921875, -3.529541015625, -3.32958984375, -3.129638671875, -2.9296875, -2.729736328125, -2.52978515625, -2.329833984375, -2.1298828125, -1.929931640625, -1.72998046875, -1.530029296875, -1.330078125, -1.130126953125, -0.93017578125, -0.730224609375, -0.5302734375, -0.330322265625, -0.13037109375, 0.069580078125, 0.26953125, 0.469482421875, 0.66943359375, 0.869384765625, 1.0693359375, 1.269287109375, 1.46923828125, 1.669189453125, 1.869140625, 2.069091796875, 2.26904296875, 2.468994140625, 2.6689453125, 2.868896484375, 3.06884765625, 3.268798828125, 3.46875, 3.668701171875, 3.86865234375, 4.068603515625, 4.2685546875, 4.468505859375, 4.66845703125, 4.868408203125, 5.068359375, 5.268310546875, 5.46826171875, 5.668212890625, 5.8681640625, 6.068115234375, 6.26806640625, 6.468017578125, 6.66796875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 8.0, 8.0, 13.0, 13.0, 16.0, 28.0, 41.0, 68.0, 68.0, 96.0, 129.0, 106.0, 104.0, 67.0, 53.0, 48.0, 32.0, 22.0, 14.0, 19.0, 10.0, 5.0, 9.0, 1.0, 4.0, 0.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.25390625, -6.08905029296875, -5.9241943359375, -5.75933837890625, -5.594482421875, -5.42962646484375, -5.2647705078125, -5.09991455078125, -4.93505859375, -4.77020263671875, -4.6053466796875, -4.44049072265625, -4.275634765625, -4.11077880859375, -3.9459228515625, -3.78106689453125, -3.6162109375, -3.45135498046875, -3.2864990234375, -3.12164306640625, -2.956787109375, -2.79193115234375, -2.6270751953125, -2.46221923828125, -2.29736328125, -2.13250732421875, -1.9676513671875, -1.80279541015625, -1.637939453125, -1.47308349609375, -1.3082275390625, -1.14337158203125, -0.978515625, -0.81365966796875, -0.6488037109375, -0.48394775390625, -0.319091796875, -0.15423583984375, 0.0106201171875, 0.17547607421875, 0.34033203125, 0.50518798828125, 0.6700439453125, 0.83489990234375, 0.999755859375, 1.16461181640625, 1.3294677734375, 1.49432373046875, 1.6591796875, 1.82403564453125, 1.9888916015625, 2.15374755859375, 2.318603515625, 2.48345947265625, 2.6483154296875, 2.81317138671875, 2.97802734375, 3.14288330078125, 3.3077392578125, 3.47259521484375, 3.637451171875, 3.80230712890625, 3.9671630859375, 4.13201904296875, 4.296875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 6.0, 16.0, 43.0, 73.0, 160.0, 265.0, 235.0, 119.0, 44.0, 19.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.18270874023438, -170.46676635742188, -166.75083923339844, -163.03489685058594, -159.3189697265625, -155.60302734375, -151.8870849609375, -148.17115783691406, -144.45521545410156, -140.73927307128906, -137.02334594726562, -133.30740356445312, -129.5914764404297, -125.87553405761719, -122.15959930419922, -118.44366455078125, -114.72772216796875, -111.01178741455078, -107.29585266113281, -103.57991027832031, -99.86397552490234, -96.14804077148438, -92.4321060180664, -88.71617126464844, -85.00023651123047, -81.2843017578125, -77.56836700439453, -73.85242462158203, -70.13648986816406, -66.4205551147461, -62.704620361328125, -58.98868179321289, -55.27273941040039, -51.55680465698242, -47.84086608886719, -44.12493133544922, -40.408992767333984, -36.693058013916016, -32.97711944580078, -29.261184692382812, -25.54524803161621, -21.82931137084961, -18.113374710083008, -14.397439002990723, -10.681502342224121, -6.965566635131836, -3.2496299743652344, 0.4663066864013672, 4.182243347167969, 7.89818000793457, 11.614116668701172, 15.330052375793457, 19.045989990234375, 22.761924743652344, 26.477861404418945, 30.193798065185547, 33.90973663330078, 37.62567138671875, 41.341609954833984, 45.05754470825195, 48.77348327636719, 52.489418029785156, 56.205352783203125, 59.92129135131836, 63.63722610473633]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 8.0, 4.0, 3.0, 8.0, 8.0, 10.0, 8.0, 14.0, 15.0, 11.0, 11.0, 18.0, 22.0, 27.0, 46.0, 47.0, 41.0, 43.0, 53.0, 77.0, 81.0, 78.0, 53.0, 34.0, 43.0, 24.0, 34.0, 29.0, 25.0, 24.0, 13.0, 23.0, 9.0, 12.0, 13.0, 11.0, 4.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.00893783569336, -45.45629119873047, -43.90364074707031, -42.35099411010742, -40.798343658447266, -39.245697021484375, -37.69304656982422, -36.14039993286133, -34.58775329589844, -33.03510665893555, -31.48245620727539, -29.9298095703125, -28.377159118652344, -26.824512481689453, -25.27186393737793, -23.719215393066406, -22.16656494140625, -20.613916397094727, -19.061267852783203, -17.508621215820312, -15.955971717834473, -14.40332317352295, -12.850675582885742, -11.298027038574219, -9.745378494262695, -8.192729949951172, -6.640081882476807, -5.087433815002441, -3.534785270690918, -1.9821367263793945, -0.4294891357421875, 1.123159408569336, 2.675811767578125, 4.228460311889648, 5.781108379364014, 7.333756446838379, 8.886404991149902, 10.439053535461426, 11.991701126098633, 13.544349670410156, 15.09699821472168, 16.649646759033203, 18.202295303344727, 19.75494384765625, 21.30759048461914, 22.860240936279297, 24.412887573242188, 25.96553611755371, 27.518184661865234, 29.070833206176758, 30.62348175048828, 32.17612838745117, 33.72877883911133, 35.28142547607422, 36.834075927734375, 38.386722564697266, 39.939369201660156, 41.49201583862305, 43.0446662902832, 44.597312927246094, 46.14996337890625, 47.70261001586914, 49.25525665283203, 50.80790710449219, 52.360557556152344]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 7.0, 11.0, 16.0, 21.0, 34.0, 70.0, 95.0, 183.0, 348.0, 703.0, 1717.0, 4714.0, 17269.0, 88455.0, 1157674.0, 2689196.0, 191897.0, 29661.0, 7543.0, 2577.0, 1017.0, 525.0, 226.0, 129.0, 82.0, 44.0, 31.0, 11.0, 8.0, 7.0, 4.0, 7.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7421875, -5.56378173828125, -5.3853759765625, -5.20697021484375, -5.028564453125, -4.85015869140625, -4.6717529296875, -4.49334716796875, -4.31494140625, -4.13653564453125, -3.9581298828125, -3.77972412109375, -3.601318359375, -3.42291259765625, -3.2445068359375, -3.06610107421875, -2.8876953125, -2.70928955078125, -2.5308837890625, -2.35247802734375, -2.174072265625, -1.99566650390625, -1.8172607421875, -1.63885498046875, -1.46044921875, -1.28204345703125, -1.1036376953125, -0.92523193359375, -0.746826171875, -0.56842041015625, -0.3900146484375, -0.21160888671875, -0.033203125, 0.14520263671875, 0.3236083984375, 0.50201416015625, 0.680419921875, 0.85882568359375, 1.0372314453125, 1.21563720703125, 1.39404296875, 1.57244873046875, 1.7508544921875, 1.92926025390625, 2.107666015625, 2.28607177734375, 2.4644775390625, 2.64288330078125, 2.8212890625, 2.99969482421875, 3.1781005859375, 3.35650634765625, 3.534912109375, 3.71331787109375, 3.8917236328125, 4.07012939453125, 4.24853515625, 4.42694091796875, 4.6053466796875, 4.78375244140625, 4.962158203125, 5.14056396484375, 5.3189697265625, 5.49737548828125, 5.67578125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 9.0, 7.0, 12.0, 15.0, 11.0, 21.0, 31.0, 31.0, 33.0, 41.0, 52.0, 47.0, 62.0, 52.0, 57.0, 54.0, 70.0, 48.0, 51.0, 33.0, 55.0, 41.0, 34.0, 25.0, 25.0, 22.0, 19.0, 8.0, 13.0, 8.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8671875, -2.76934814453125, -2.6715087890625, -2.57366943359375, -2.475830078125, -2.37799072265625, -2.2801513671875, -2.18231201171875, -2.08447265625, -1.98663330078125, -1.8887939453125, -1.79095458984375, -1.693115234375, -1.59527587890625, -1.4974365234375, -1.39959716796875, -1.3017578125, -1.20391845703125, -1.1060791015625, -1.00823974609375, -0.910400390625, -0.81256103515625, -0.7147216796875, -0.61688232421875, -0.51904296875, -0.42120361328125, -0.3233642578125, -0.22552490234375, -0.127685546875, -0.02984619140625, 0.0679931640625, 0.16583251953125, 0.263671875, 0.36151123046875, 0.4593505859375, 0.55718994140625, 0.655029296875, 0.75286865234375, 0.8507080078125, 0.94854736328125, 1.04638671875, 1.14422607421875, 1.2420654296875, 1.33990478515625, 1.437744140625, 1.53558349609375, 1.6334228515625, 1.73126220703125, 1.8291015625, 1.92694091796875, 2.0247802734375, 2.12261962890625, 2.220458984375, 2.31829833984375, 2.4161376953125, 2.51397705078125, 2.61181640625, 2.70965576171875, 2.8074951171875, 2.90533447265625, 3.003173828125, 3.10101318359375, 3.1988525390625, 3.29669189453125, 3.39453125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 16.0, 14.0, 26.0, 51.0, 46.0, 88.0, 129.0, 225.0, 476.0, 1017.0, 3274.0, 20689.0, 497659.0, 3571612.0, 86116.0, 9273.0, 2033.0, 730.0, 332.0, 180.0, 93.0, 68.0, 42.0, 21.0, 29.0, 10.0, 6.0, 9.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.15625, -14.7796630859375, -14.403076171875, -14.0264892578125, -13.64990234375, -13.2733154296875, -12.896728515625, -12.5201416015625, -12.1435546875, -11.7669677734375, -11.390380859375, -11.0137939453125, -10.63720703125, -10.2606201171875, -9.884033203125, -9.5074462890625, -9.130859375, -8.7542724609375, -8.377685546875, -8.0010986328125, -7.62451171875, -7.2479248046875, -6.871337890625, -6.4947509765625, -6.1181640625, -5.7415771484375, -5.364990234375, -4.9884033203125, -4.61181640625, -4.2352294921875, -3.858642578125, -3.4820556640625, -3.10546875, -2.7288818359375, -2.352294921875, -1.9757080078125, -1.59912109375, -1.2225341796875, -0.845947265625, -0.4693603515625, -0.0927734375, 0.2838134765625, 0.660400390625, 1.0369873046875, 1.41357421875, 1.7901611328125, 2.166748046875, 2.5433349609375, 2.919921875, 3.2965087890625, 3.673095703125, 4.0496826171875, 4.42626953125, 4.8028564453125, 5.179443359375, 5.5560302734375, 5.9326171875, 6.3092041015625, 6.685791015625, 7.0623779296875, 7.43896484375, 7.8155517578125, 8.192138671875, 8.5687255859375, 8.9453125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 10.0, 12.0, 15.0, 11.0, 20.0, 40.0, 46.0, 114.0, 167.0, 311.0, 556.0, 871.0, 761.0, 435.0, 245.0, 141.0, 95.0, 53.0, 44.0, 35.0, 22.0, 15.0, 14.0, 13.0, 7.0, 3.0, 4.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.0234375, -7.7628173828125, -7.502197265625, -7.2415771484375, -6.98095703125, -6.7203369140625, -6.459716796875, -6.1990966796875, -5.9384765625, -5.6778564453125, -5.417236328125, -5.1566162109375, -4.89599609375, -4.6353759765625, -4.374755859375, -4.1141357421875, -3.853515625, -3.5928955078125, -3.332275390625, -3.0716552734375, -2.81103515625, -2.5504150390625, -2.289794921875, -2.0291748046875, -1.7685546875, -1.5079345703125, -1.247314453125, -0.9866943359375, -0.72607421875, -0.4654541015625, -0.204833984375, 0.0557861328125, 0.31640625, 0.5770263671875, 0.837646484375, 1.0982666015625, 1.35888671875, 1.6195068359375, 1.880126953125, 2.1407470703125, 2.4013671875, 2.6619873046875, 2.922607421875, 3.1832275390625, 3.44384765625, 3.7044677734375, 3.965087890625, 4.2257080078125, 4.486328125, 4.7469482421875, 5.007568359375, 5.2681884765625, 5.52880859375, 5.7894287109375, 6.050048828125, 6.3106689453125, 6.5712890625, 6.8319091796875, 7.092529296875, 7.3531494140625, 7.61376953125, 7.8743896484375, 8.135009765625, 8.3956298828125, 8.65625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 30.0, 78.0, 227.0, 348.0, 200.0, 64.0, 25.0, 6.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.24658966064453, -60.713897705078125, -56.18120574951172, -51.64851379394531, -47.115821838378906, -42.5831298828125, -38.05044174194336, -33.51774978637695, -28.985057830810547, -24.45236587524414, -19.919673919677734, -15.386983871459961, -10.854291915893555, -6.321599960327148, -1.788909912109375, 2.7437820434570312, 7.2764739990234375, 11.809165954589844, 16.34185791015625, 20.874547958374023, 25.40723991394043, 29.939931869506836, 34.47262191772461, 39.005313873291016, 43.53800582885742, 48.07069778442383, 52.603389739990234, 57.136077880859375, 61.66876983642578, 66.20146179199219, 70.7341537475586, 75.266845703125, 79.79954528808594, 84.33223724365234, 88.86492919921875, 93.39762115478516, 97.93031311035156, 102.46300506591797, 106.99569702148438, 111.52838134765625, 116.06108093261719, 120.5937728881836, 125.12646484375, 129.65914916992188, 134.1918487548828, 138.7245330810547, 143.25723266601562, 147.7899169921875, 152.32260131835938, 156.85528564453125, 161.3879852294922, 165.92066955566406, 170.453369140625, 174.98605346679688, 179.5187530517578, 184.0514373779297, 188.58413696289062, 193.1168212890625, 197.64952087402344, 202.1822052001953, 206.71490478515625, 211.24758911132812, 215.78028869628906, 220.31297302246094, 224.84567260742188]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 3.0, 5.0, 8.0, 6.0, 14.0, 9.0, 19.0, 26.0, 21.0, 25.0, 30.0, 40.0, 46.0, 50.0, 56.0, 51.0, 57.0, 75.0, 54.0, 54.0, 49.0, 43.0, 48.0, 38.0, 38.0, 29.0, 26.0, 19.0, 12.0, 16.0, 11.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.97605514526367, -34.665931701660156, -33.355804443359375, -32.04568099975586, -30.735557556152344, -29.425434112548828, -28.11530876159668, -26.80518341064453, -25.495059967041016, -24.1849365234375, -22.87481117248535, -21.564685821533203, -20.254562377929688, -18.944438934326172, -17.634313583374023, -16.324188232421875, -15.01406478881836, -13.703940391540527, -12.393815994262695, -11.083691596984863, -9.773567199707031, -8.4634428024292, -7.153318405151367, -5.843194007873535, -4.533069610595703, -3.222945213317871, -1.912820816040039, -0.602696418762207, 0.707427978515625, 2.017552375793457, 3.327676773071289, 4.637801170349121, 5.947929382324219, 7.258053779602051, 8.568178176879883, 9.878302574157715, 11.188426971435547, 12.498551368713379, 13.808675765991211, 15.118800163269043, 16.428924560546875, 17.73904800415039, 19.04917335510254, 20.359298706054688, 21.669422149658203, 22.97954559326172, 24.289670944213867, 25.599796295166016, 26.90991973876953, 28.220043182373047, 29.530168533325195, 30.840293884277344, 32.15041732788086, 33.460540771484375, 34.770668029785156, 36.08079147338867, 37.39091491699219, 38.7010383605957, 40.01116180419922, 41.3212890625, 42.631412506103516, 43.94153594970703, 45.25166320800781, 46.56178665161133, 47.871910095214844]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 8.0, 11.0, 19.0, 17.0, 39.0, 51.0, 86.0, 122.0, 239.0, 412.0, 870.0, 1781.0, 3842.0, 9402.0, 25101.0, 79635.0, 303053.0, 435641.0, 127588.0, 37541.0, 13001.0, 5342.0, 2335.0, 1135.0, 569.0, 298.0, 163.0, 100.0, 67.0, 36.0, 28.0, 14.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.796875, -6.56396484375, -6.3310546875, -6.09814453125, -5.865234375, -5.63232421875, -5.3994140625, -5.16650390625, -4.93359375, -4.70068359375, -4.4677734375, -4.23486328125, -4.001953125, -3.76904296875, -3.5361328125, -3.30322265625, -3.0703125, -2.83740234375, -2.6044921875, -2.37158203125, -2.138671875, -1.90576171875, -1.6728515625, -1.43994140625, -1.20703125, -0.97412109375, -0.7412109375, -0.50830078125, -0.275390625, -0.04248046875, 0.1904296875, 0.42333984375, 0.65625, 0.88916015625, 1.1220703125, 1.35498046875, 1.587890625, 1.82080078125, 2.0537109375, 2.28662109375, 2.51953125, 2.75244140625, 2.9853515625, 3.21826171875, 3.451171875, 3.68408203125, 3.9169921875, 4.14990234375, 4.3828125, 4.61572265625, 4.8486328125, 5.08154296875, 5.314453125, 5.54736328125, 5.7802734375, 6.01318359375, 6.24609375, 6.47900390625, 6.7119140625, 6.94482421875, 7.177734375, 7.41064453125, 7.6435546875, 7.87646484375, 8.109375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 10.0, 7.0, 5.0, 8.0, 15.0, 15.0, 12.0, 18.0, 20.0, 18.0, 16.0, 23.0, 33.0, 29.0, 31.0, 35.0, 34.0, 50.0, 49.0, 35.0, 38.0, 45.0, 40.0, 54.0, 33.0, 30.0, 31.0, 28.0, 24.0, 31.0, 31.0, 26.0, 23.0, 17.0, 18.0, 8.0, 11.0, 11.0, 8.0, 6.0, 4.0, 7.0, 6.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0], "bins": [-2.36328125, -2.289337158203125, -2.21539306640625, -2.141448974609375, -2.0675048828125, -1.993560791015625, -1.91961669921875, -1.845672607421875, -1.771728515625, -1.697784423828125, -1.62384033203125, -1.549896240234375, -1.4759521484375, -1.402008056640625, -1.32806396484375, -1.254119873046875, -1.18017578125, -1.106231689453125, -1.03228759765625, -0.958343505859375, -0.8843994140625, -0.810455322265625, -0.73651123046875, -0.662567138671875, -0.588623046875, -0.514678955078125, -0.44073486328125, -0.366790771484375, -0.2928466796875, -0.218902587890625, -0.14495849609375, -0.071014404296875, 0.0029296875, 0.076873779296875, 0.15081787109375, 0.224761962890625, 0.2987060546875, 0.372650146484375, 0.44659423828125, 0.520538330078125, 0.594482421875, 0.668426513671875, 0.74237060546875, 0.816314697265625, 0.8902587890625, 0.964202880859375, 1.03814697265625, 1.112091064453125, 1.18603515625, 1.259979248046875, 1.33392333984375, 1.407867431640625, 1.4818115234375, 1.555755615234375, 1.62969970703125, 1.703643798828125, 1.777587890625, 1.851531982421875, 1.92547607421875, 1.999420166015625, 2.0733642578125, 2.147308349609375, 2.22125244140625, 2.295196533203125, 2.369140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 6.0, 3.0, 4.0, 8.0, 9.0, 16.0, 26.0, 33.0, 47.0, 91.0, 155.0, 250.0, 497.0, 1030.0, 2760.0, 11814.0, 167894.0, 819683.0, 35681.0, 5285.0, 1709.0, 699.0, 348.0, 198.0, 127.0, 63.0, 41.0, 21.0, 19.0, 11.0, 4.0, 7.0, 2.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.46875, -17.81494140625, -17.1611328125, -16.50732421875, -15.853515625, -15.19970703125, -14.5458984375, -13.89208984375, -13.23828125, -12.58447265625, -11.9306640625, -11.27685546875, -10.623046875, -9.96923828125, -9.3154296875, -8.66162109375, -8.0078125, -7.35400390625, -6.7001953125, -6.04638671875, -5.392578125, -4.73876953125, -4.0849609375, -3.43115234375, -2.77734375, -2.12353515625, -1.4697265625, -0.81591796875, -0.162109375, 0.49169921875, 1.1455078125, 1.79931640625, 2.453125, 3.10693359375, 3.7607421875, 4.41455078125, 5.068359375, 5.72216796875, 6.3759765625, 7.02978515625, 7.68359375, 8.33740234375, 8.9912109375, 9.64501953125, 10.298828125, 10.95263671875, 11.6064453125, 12.26025390625, 12.9140625, 13.56787109375, 14.2216796875, 14.87548828125, 15.529296875, 16.18310546875, 16.8369140625, 17.49072265625, 18.14453125, 18.79833984375, 19.4521484375, 20.10595703125, 20.759765625, 21.41357421875, 22.0673828125, 22.72119140625, 23.375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 2.0, 7.0, 8.0, 6.0, 5.0, 14.0, 12.0, 17.0, 18.0, 16.0, 17.0, 25.0, 30.0, 37.0, 32.0, 41.0, 41.0, 35.0, 56.0, 48.0, 35.0, 43.0, 43.0, 40.0, 40.0, 40.0, 30.0, 45.0, 31.0, 28.0, 22.0, 15.0, 16.0, 15.0, 23.0, 10.0, 6.0, 8.0, 8.0, 8.0, 5.0, 7.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-10.421875, -10.111328125, -9.80078125, -9.490234375, -9.1796875, -8.869140625, -8.55859375, -8.248046875, -7.9375, -7.626953125, -7.31640625, -7.005859375, -6.6953125, -6.384765625, -6.07421875, -5.763671875, -5.453125, -5.142578125, -4.83203125, -4.521484375, -4.2109375, -3.900390625, -3.58984375, -3.279296875, -2.96875, -2.658203125, -2.34765625, -2.037109375, -1.7265625, -1.416015625, -1.10546875, -0.794921875, -0.484375, -0.173828125, 0.13671875, 0.447265625, 0.7578125, 1.068359375, 1.37890625, 1.689453125, 2.0, 2.310546875, 2.62109375, 2.931640625, 3.2421875, 3.552734375, 3.86328125, 4.173828125, 4.484375, 4.794921875, 5.10546875, 5.416015625, 5.7265625, 6.037109375, 6.34765625, 6.658203125, 6.96875, 7.279296875, 7.58984375, 7.900390625, 8.2109375, 8.521484375, 8.83203125, 9.142578125, 9.453125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 9.0, 2.0, 11.0, 1.0, 6.0, 11.0, 13.0, 20.0, 26.0, 41.0, 81.0, 87.0, 155.0, 257.0, 447.0, 745.0, 1336.0, 2671.0, 5524.0, 13145.0, 40006.0, 341814.0, 571211.0, 44849.0, 13865.0, 5837.0, 2884.0, 1500.0, 826.0, 409.0, 267.0, 170.0, 125.0, 70.0, 38.0, 30.0, 17.0, 15.0, 13.0, 5.0, 2.0, 4.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.10546875, -5.9022216796875, -5.698974609375, -5.4957275390625, -5.29248046875, -5.0892333984375, -4.885986328125, -4.6827392578125, -4.4794921875, -4.2762451171875, -4.072998046875, -3.8697509765625, -3.66650390625, -3.4632568359375, -3.260009765625, -3.0567626953125, -2.853515625, -2.6502685546875, -2.447021484375, -2.2437744140625, -2.04052734375, -1.8372802734375, -1.634033203125, -1.4307861328125, -1.2275390625, -1.0242919921875, -0.821044921875, -0.6177978515625, -0.41455078125, -0.2113037109375, -0.008056640625, 0.1951904296875, 0.3984375, 0.6016845703125, 0.804931640625, 1.0081787109375, 1.21142578125, 1.4146728515625, 1.617919921875, 1.8211669921875, 2.0244140625, 2.2276611328125, 2.430908203125, 2.6341552734375, 2.83740234375, 3.0406494140625, 3.243896484375, 3.4471435546875, 3.650390625, 3.8536376953125, 4.056884765625, 4.2601318359375, 4.46337890625, 4.6666259765625, 4.869873046875, 5.0731201171875, 5.2763671875, 5.4796142578125, 5.682861328125, 5.8861083984375, 6.08935546875, 6.2926025390625, 6.495849609375, 6.6990966796875, 6.90234375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 8.0, 14.0, 21.0, 35.0, 35.0, 74.0, 157.0, 274.0, 134.0, 67.0, 42.0, 34.0, 22.0, 17.0, 11.0, 6.0, 7.0, 2.0, 1.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0027599334716796875, -0.002688109874725342, -0.002616286277770996, -0.0025444626808166504, -0.0024726390838623047, -0.002400815486907959, -0.0023289918899536133, -0.0022571682929992676, -0.002185344696044922, -0.002113521099090576, -0.0020416975021362305, -0.0019698739051818848, -0.001898050308227539, -0.0018262267112731934, -0.0017544031143188477, -0.001682579517364502, -0.0016107559204101562, -0.0015389323234558105, -0.0014671087265014648, -0.0013952851295471191, -0.0013234615325927734, -0.0012516379356384277, -0.001179814338684082, -0.0011079907417297363, -0.0010361671447753906, -0.0009643435478210449, -0.0008925199508666992, -0.0008206963539123535, -0.0007488727569580078, -0.0006770491600036621, -0.0006052255630493164, -0.0005334019660949707, -0.000461578369140625, -0.0003897547721862793, -0.0003179311752319336, -0.0002461075782775879, -0.0001742839813232422, -0.00010246038436889648, -3.063678741455078e-05, 4.118680953979492e-05, 0.00011301040649414062, 0.00018483400344848633, 0.00025665760040283203, 0.00032848119735717773, 0.00040030479431152344, 0.00047212839126586914, 0.0005439519882202148, 0.0006157755851745605, 0.0006875991821289062, 0.000759422779083252, 0.0008312463760375977, 0.0009030699729919434, 0.0009748935699462891, 0.0010467171669006348, 0.0011185407638549805, 0.0011903643608093262, 0.0012621879577636719, 0.0013340115547180176, 0.0014058351516723633, 0.001477658748626709, 0.0015494823455810547, 0.0016213059425354004, 0.001693129539489746, 0.0017649531364440918, 0.0018367767333984375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 6.0, 9.0, 3.0, 9.0, 12.0, 7.0, 27.0, 36.0, 49.0, 70.0, 95.0, 150.0, 203.0, 316.0, 529.0, 883.0, 1630.0, 3021.0, 6047.0, 13238.0, 37292.0, 240036.0, 649567.0, 60866.0, 18306.0, 7498.0, 3788.0, 1936.0, 1094.0, 636.0, 407.0, 269.0, 152.0, 106.0, 74.0, 45.0, 49.0, 21.0, 24.0, 12.0, 8.0, 12.0, 3.0, 2.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0], "bins": [-5.7109375, -5.55303955078125, -5.3951416015625, -5.23724365234375, -5.079345703125, -4.92144775390625, -4.7635498046875, -4.60565185546875, -4.44775390625, -4.28985595703125, -4.1319580078125, -3.97406005859375, -3.816162109375, -3.65826416015625, -3.5003662109375, -3.34246826171875, -3.1845703125, -3.02667236328125, -2.8687744140625, -2.71087646484375, -2.552978515625, -2.39508056640625, -2.2371826171875, -2.07928466796875, -1.92138671875, -1.76348876953125, -1.6055908203125, -1.44769287109375, -1.289794921875, -1.13189697265625, -0.9739990234375, -0.81610107421875, -0.658203125, -0.50030517578125, -0.3424072265625, -0.18450927734375, -0.026611328125, 0.13128662109375, 0.2891845703125, 0.44708251953125, 0.60498046875, 0.76287841796875, 0.9207763671875, 1.07867431640625, 1.236572265625, 1.39447021484375, 1.5523681640625, 1.71026611328125, 1.8681640625, 2.02606201171875, 2.1839599609375, 2.34185791015625, 2.499755859375, 2.65765380859375, 2.8155517578125, 2.97344970703125, 3.13134765625, 3.28924560546875, 3.4471435546875, 3.60504150390625, 3.762939453125, 3.92083740234375, 4.0787353515625, 4.23663330078125, 4.39453125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 5.0, 8.0, 5.0, 10.0, 18.0, 10.0, 18.0, 21.0, 23.0, 29.0, 38.0, 42.0, 59.0, 96.0, 92.0, 122.0, 89.0, 45.0, 51.0, 40.0, 33.0, 25.0, 17.0, 15.0, 19.0, 7.0, 10.0, 8.0, 6.0, 4.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.8828125, -3.76202392578125, -3.6412353515625, -3.52044677734375, -3.399658203125, -3.27886962890625, -3.1580810546875, -3.03729248046875, -2.91650390625, -2.79571533203125, -2.6749267578125, -2.55413818359375, -2.433349609375, -2.31256103515625, -2.1917724609375, -2.07098388671875, -1.9501953125, -1.82940673828125, -1.7086181640625, -1.58782958984375, -1.467041015625, -1.34625244140625, -1.2254638671875, -1.10467529296875, -0.98388671875, -0.86309814453125, -0.7423095703125, -0.62152099609375, -0.500732421875, -0.37994384765625, -0.2591552734375, -0.13836669921875, -0.017578125, 0.10321044921875, 0.2239990234375, 0.34478759765625, 0.465576171875, 0.58636474609375, 0.7071533203125, 0.82794189453125, 0.94873046875, 1.06951904296875, 1.1903076171875, 1.31109619140625, 1.431884765625, 1.55267333984375, 1.6734619140625, 1.79425048828125, 1.9150390625, 2.03582763671875, 2.1566162109375, 2.27740478515625, 2.398193359375, 2.51898193359375, 2.6397705078125, 2.76055908203125, 2.88134765625, 3.00213623046875, 3.1229248046875, 3.24371337890625, 3.364501953125, 3.48529052734375, 3.6060791015625, 3.72686767578125, 3.84765625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 10.0, 11.0, 15.0, 24.0, 48.0, 61.0, 99.0, 176.0, 247.0, 134.0, 67.0, 37.0, 21.0, 15.0, 8.0, 5.0, 1.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-128.41885375976562, -124.98292541503906, -121.5469970703125, -118.11106872558594, -114.6751480102539, -111.23921966552734, -107.80329132080078, -104.36736297607422, -100.93144226074219, -97.49551391601562, -94.05958557128906, -90.6236572265625, -87.18773651123047, -83.7518081665039, -80.31587982177734, -76.87995147705078, -73.44402313232422, -70.00809478759766, -66.5721664428711, -63.1362419128418, -59.7003173828125, -56.26438903808594, -52.828460693359375, -49.39253234863281, -45.956607818603516, -42.52067947387695, -39.084754943847656, -35.648826599121094, -32.21289825439453, -28.776973724365234, -25.341045379638672, -21.905118942260742, -18.469192504882812, -15.033266067504883, -11.597338676452637, -8.16141128540039, -4.725484848022461, -1.2895584106445312, 2.1463699340820312, 5.582296371459961, 9.01822280883789, 12.45414924621582, 15.890076637268066, 19.326004028320312, 22.761930465698242, 26.197856903076172, 29.633785247802734, 33.06970977783203, 36.505638122558594, 39.941566467285156, 43.37749099731445, 46.813419342041016, 50.24934387207031, 53.685272216796875, 57.12120056152344, 60.55712890625, 63.9930534362793, 67.4289779663086, 70.86490631103516, 74.30083465576172, 77.73676300048828, 81.17268371582031, 84.60861206054688, 88.04454040527344, 91.48046875]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 3.0, 6.0, 5.0, 5.0, 4.0, 7.0, 14.0, 19.0, 15.0, 7.0, 14.0, 15.0, 21.0, 33.0, 26.0, 29.0, 26.0, 28.0, 45.0, 59.0, 68.0, 53.0, 69.0, 60.0, 49.0, 33.0, 35.0, 31.0, 35.0, 28.0, 24.0, 16.0, 16.0, 13.0, 15.0, 8.0, 12.0, 12.0, 10.0, 9.0, 8.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.85874557495117, -37.50409698486328, -36.149444580078125, -34.794795989990234, -33.44014358520508, -32.08549499511719, -30.730844497680664, -29.37619400024414, -28.021543502807617, -26.666893005371094, -25.31224250793457, -23.957592010498047, -22.602943420410156, -21.248291015625, -19.89364242553711, -18.538991928100586, -17.184341430664062, -15.829690933227539, -14.475040435791016, -13.120390892028809, -11.765740394592285, -10.411089897155762, -9.056440353393555, -7.701789855957031, -6.347139358520508, -4.992488861083984, -3.637838840484619, -2.283188819885254, -0.9285383224487305, 0.42611217498779297, 1.78076171875, 3.1354122161865234, 4.4900665283203125, 5.844717025756836, 7.199367046356201, 8.554017066955566, 9.90866756439209, 11.263318061828613, 12.61796760559082, 13.972618103027344, 15.327268600463867, 16.68191909790039, 18.036569595336914, 19.391220092773438, 20.745868682861328, 22.100521087646484, 23.455169677734375, 24.8098201751709, 26.164470672607422, 27.519121170043945, 28.87377166748047, 30.22842025756836, 31.583072662353516, 32.937721252441406, 34.29237365722656, 35.64702224731445, 37.001670837402344, 38.356319427490234, 39.71097183227539, 41.06562042236328, 42.42027282714844, 43.77492141723633, 45.12957000732422, 46.484222412109375, 47.83887481689453]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 7.0, 6.0, 21.0, 15.0, 17.0, 33.0, 54.0, 87.0, 143.0, 324.0, 762.0, 2350.0, 10810.0, 156071.0, 3866026.0, 142854.0, 10752.0, 2361.0, 789.0, 364.0, 158.0, 95.0, 53.0, 37.0, 28.0, 15.0, 12.0, 10.0, 9.0, 5.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1484375, -10.8052978515625, -10.462158203125, -10.1190185546875, -9.77587890625, -9.4327392578125, -9.089599609375, -8.7464599609375, -8.4033203125, -8.0601806640625, -7.717041015625, -7.3739013671875, -7.03076171875, -6.6876220703125, -6.344482421875, -6.0013427734375, -5.658203125, -5.3150634765625, -4.971923828125, -4.6287841796875, -4.28564453125, -3.9425048828125, -3.599365234375, -3.2562255859375, -2.9130859375, -2.5699462890625, -2.226806640625, -1.8836669921875, -1.54052734375, -1.1973876953125, -0.854248046875, -0.5111083984375, -0.16796875, 0.1751708984375, 0.518310546875, 0.8614501953125, 1.20458984375, 1.5477294921875, 1.890869140625, 2.2340087890625, 2.5771484375, 2.9202880859375, 3.263427734375, 3.6065673828125, 3.94970703125, 4.2928466796875, 4.635986328125, 4.9791259765625, 5.322265625, 5.6654052734375, 6.008544921875, 6.3516845703125, 6.69482421875, 7.0379638671875, 7.381103515625, 7.7242431640625, 8.0673828125, 8.4105224609375, 8.753662109375, 9.0968017578125, 9.43994140625, 9.7830810546875, 10.126220703125, 10.4693603515625, 10.8125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 5.0, 8.0, 10.0, 5.0, 17.0, 12.0, 25.0, 26.0, 30.0, 32.0, 35.0, 41.0, 49.0, 52.0, 62.0, 57.0, 57.0, 53.0, 49.0, 49.0, 51.0, 48.0, 48.0, 35.0, 40.0, 27.0, 21.0, 18.0, 3.0, 11.0, 10.0, 3.0, 5.0, 8.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.736328125, -3.6343994140625, -3.532470703125, -3.4305419921875, -3.32861328125, -3.2266845703125, -3.124755859375, -3.0228271484375, -2.9208984375, -2.8189697265625, -2.717041015625, -2.6151123046875, -2.51318359375, -2.4112548828125, -2.309326171875, -2.2073974609375, -2.10546875, -2.0035400390625, -1.901611328125, -1.7996826171875, -1.69775390625, -1.5958251953125, -1.493896484375, -1.3919677734375, -1.2900390625, -1.1881103515625, -1.086181640625, -0.9842529296875, -0.88232421875, -0.7803955078125, -0.678466796875, -0.5765380859375, -0.474609375, -0.3726806640625, -0.270751953125, -0.1688232421875, -0.06689453125, 0.0350341796875, 0.136962890625, 0.2388916015625, 0.3408203125, 0.4427490234375, 0.544677734375, 0.6466064453125, 0.74853515625, 0.8504638671875, 0.952392578125, 1.0543212890625, 1.15625, 1.2581787109375, 1.360107421875, 1.4620361328125, 1.56396484375, 1.6658935546875, 1.767822265625, 1.8697509765625, 1.9716796875, 2.0736083984375, 2.175537109375, 2.2774658203125, 2.37939453125, 2.4813232421875, 2.583251953125, 2.6851806640625, 2.787109375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 9.0, 24.0, 21.0, 42.0, 77.0, 124.0, 206.0, 393.0, 1052.0, 4769.0, 141823.0, 4024308.0, 18276.0, 2005.0, 590.0, 250.0, 149.0, 73.0, 42.0, 19.0, 11.0, 3.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.78125, -22.968505859375, -22.15576171875, -21.343017578125, -20.5302734375, -19.717529296875, -18.90478515625, -18.092041015625, -17.279296875, -16.466552734375, -15.65380859375, -14.841064453125, -14.0283203125, -13.215576171875, -12.40283203125, -11.590087890625, -10.77734375, -9.964599609375, -9.15185546875, -8.339111328125, -7.5263671875, -6.713623046875, -5.90087890625, -5.088134765625, -4.275390625, -3.462646484375, -2.64990234375, -1.837158203125, -1.0244140625, -0.211669921875, 0.60107421875, 1.413818359375, 2.2265625, 3.039306640625, 3.85205078125, 4.664794921875, 5.4775390625, 6.290283203125, 7.10302734375, 7.915771484375, 8.728515625, 9.541259765625, 10.35400390625, 11.166748046875, 11.9794921875, 12.792236328125, 13.60498046875, 14.417724609375, 15.23046875, 16.043212890625, 16.85595703125, 17.668701171875, 18.4814453125, 19.294189453125, 20.10693359375, 20.919677734375, 21.732421875, 22.545166015625, 23.35791015625, 24.170654296875, 24.9833984375, 25.796142578125, 26.60888671875, 27.421630859375, 28.234375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 7.0, 7.0, 14.0, 39.0, 75.0, 257.0, 1119.0, 1802.0, 492.0, 133.0, 59.0, 29.0, 19.0, 9.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.734375, -24.1197509765625, -23.505126953125, -22.8905029296875, -22.27587890625, -21.6612548828125, -21.046630859375, -20.4320068359375, -19.8173828125, -19.2027587890625, -18.588134765625, -17.9735107421875, -17.35888671875, -16.7442626953125, -16.129638671875, -15.5150146484375, -14.900390625, -14.2857666015625, -13.671142578125, -13.0565185546875, -12.44189453125, -11.8272705078125, -11.212646484375, -10.5980224609375, -9.9833984375, -9.3687744140625, -8.754150390625, -8.1395263671875, -7.52490234375, -6.9102783203125, -6.295654296875, -5.6810302734375, -5.06640625, -4.4517822265625, -3.837158203125, -3.2225341796875, -2.60791015625, -1.9932861328125, -1.378662109375, -0.7640380859375, -0.1494140625, 0.4652099609375, 1.079833984375, 1.6944580078125, 2.30908203125, 2.9237060546875, 3.538330078125, 4.1529541015625, 4.767578125, 5.3822021484375, 5.996826171875, 6.6114501953125, 7.22607421875, 7.8406982421875, 8.455322265625, 9.0699462890625, 9.6845703125, 10.2991943359375, 10.913818359375, 11.5284423828125, 12.14306640625, 12.7576904296875, 13.372314453125, 13.9869384765625, 14.6015625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 12.0, 17.0, 40.0, 182.0, 428.0, 233.0, 56.0, 19.0, 6.0, 5.0, 1.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-342.37353515625, -335.4742736816406, -328.5749816894531, -321.67572021484375, -314.7764587402344, -307.8771667480469, -300.9779052734375, -294.0786437988281, -287.1793518066406, -280.28009033203125, -273.38079833984375, -266.4815368652344, -259.582275390625, -252.68299865722656, -245.78372192382812, -238.88446044921875, -231.98519897460938, -225.08592224121094, -218.18666076660156, -211.28738403320312, -204.3881072998047, -197.4888458251953, -190.58956909179688, -183.6903076171875, -176.791015625, -169.89173889160156, -162.9924774169922, -156.09320068359375, -149.1939239501953, -142.29466247558594, -135.3953857421875, -128.49612426757812, -121.59684753417969, -114.69757843017578, -107.79830169677734, -100.89903259277344, -93.99976348876953, -87.10049438476562, -80.20121765136719, -73.30194854736328, -66.40267944335938, -59.5034065246582, -52.6041374206543, -45.704864501953125, -38.80559539794922, -31.906322479248047, -25.007049560546875, -18.10778045654297, -11.208503723144531, -4.309232234954834, 2.5900392532348633, 9.489311218261719, 16.388582229614258, 23.287853240966797, 30.18712615966797, 37.086395263671875, 43.98566818237305, 50.88494110107422, 57.784210205078125, 64.68348693847656, 71.58275604248047, 78.48202514648438, 85.38130187988281, 92.28056335449219, 99.17984008789062]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 9.0, 6.0, 12.0, 29.0, 25.0, 32.0, 50.0, 55.0, 91.0, 100.0, 81.0, 104.0, 79.0, 83.0, 63.0, 51.0, 34.0, 24.0, 19.0, 19.0, 12.0, 3.0, 7.0, 7.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.29466247558594, -62.9083137512207, -60.52196502685547, -58.13561248779297, -55.749263763427734, -53.3629150390625, -50.976566314697266, -48.59021759033203, -46.20386505126953, -43.8175163269043, -41.43116760253906, -39.04481506347656, -36.65846633911133, -34.272117614746094, -31.88576889038086, -29.499418258666992, -27.11307144165039, -24.726722717285156, -22.34037208557129, -19.954023361206055, -17.567672729492188, -15.181324005126953, -12.794975280761719, -10.408624649047852, -8.022275924682617, -5.635926246643066, -3.249577045440674, -0.8632278442382812, 1.5231218338012695, 3.9094715118408203, 6.295820236206055, 8.682170867919922, 11.068519592285156, 13.454869270324707, 15.841218948364258, 18.227567672729492, 20.61391830444336, 23.000267028808594, 25.386615753173828, 27.772966384887695, 30.15931510925293, 32.5456657409668, 34.93201446533203, 37.318363189697266, 39.7047119140625, 42.091064453125, 44.47740936279297, 46.86376190185547, 49.2501106262207, 51.63645935058594, 54.02280807495117, 56.409156799316406, 58.795509338378906, 61.18185806274414, 63.568206787109375, 65.95455932617188, 68.34090423583984, 70.72725677490234, 73.11360168457031, 75.49995422363281, 77.88629913330078, 80.27265167236328, 82.65899658203125, 85.04534912109375, 87.43170166015625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 0.0, 6.0, 2.0, 9.0, 17.0, 27.0, 50.0, 65.0, 150.0, 252.0, 626.0, 1575.0, 4573.0, 15747.0, 73804.0, 361716.0, 453379.0, 105767.0, 21451.0, 5897.0, 1976.0, 819.0, 324.0, 150.0, 77.0, 33.0, 27.0, 15.0, 9.0, 8.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.265625, -6.025634765625, -5.78564453125, -5.545654296875, -5.3056640625, -5.065673828125, -4.82568359375, -4.585693359375, -4.345703125, -4.105712890625, -3.86572265625, -3.625732421875, -3.3857421875, -3.145751953125, -2.90576171875, -2.665771484375, -2.42578125, -2.185791015625, -1.94580078125, -1.705810546875, -1.4658203125, -1.225830078125, -0.98583984375, -0.745849609375, -0.505859375, -0.265869140625, -0.02587890625, 0.214111328125, 0.4541015625, 0.694091796875, 0.93408203125, 1.174072265625, 1.4140625, 1.654052734375, 1.89404296875, 2.134033203125, 2.3740234375, 2.614013671875, 2.85400390625, 3.093994140625, 3.333984375, 3.573974609375, 3.81396484375, 4.053955078125, 4.2939453125, 4.533935546875, 4.77392578125, 5.013916015625, 5.25390625, 5.493896484375, 5.73388671875, 5.973876953125, 6.2138671875, 6.453857421875, 6.69384765625, 6.933837890625, 7.173828125, 7.413818359375, 7.65380859375, 7.893798828125, 8.1337890625, 8.373779296875, 8.61376953125, 8.853759765625, 9.09375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 5.0, 10.0, 9.0, 15.0, 22.0, 23.0, 28.0, 30.0, 45.0, 54.0, 54.0, 76.0, 74.0, 68.0, 81.0, 61.0, 69.0, 56.0, 46.0, 48.0, 33.0, 25.0, 24.0, 16.0, 9.0, 9.0, 6.0, 2.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.48046875, -3.334716796875, -3.18896484375, -3.043212890625, -2.8974609375, -2.751708984375, -2.60595703125, -2.460205078125, -2.314453125, -2.168701171875, -2.02294921875, -1.877197265625, -1.7314453125, -1.585693359375, -1.43994140625, -1.294189453125, -1.1484375, -1.002685546875, -0.85693359375, -0.711181640625, -0.5654296875, -0.419677734375, -0.27392578125, -0.128173828125, 0.017578125, 0.163330078125, 0.30908203125, 0.454833984375, 0.6005859375, 0.746337890625, 0.89208984375, 1.037841796875, 1.18359375, 1.329345703125, 1.47509765625, 1.620849609375, 1.7666015625, 1.912353515625, 2.05810546875, 2.203857421875, 2.349609375, 2.495361328125, 2.64111328125, 2.786865234375, 2.9326171875, 3.078369140625, 3.22412109375, 3.369873046875, 3.515625, 3.661376953125, 3.80712890625, 3.952880859375, 4.0986328125, 4.244384765625, 4.39013671875, 4.535888671875, 4.681640625, 4.827392578125, 4.97314453125, 5.118896484375, 5.2646484375, 5.410400390625, 5.55615234375, 5.701904296875, 5.84765625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 4.0, 6.0, 4.0, 6.0, 12.0, 9.0, 19.0, 33.0, 38.0, 52.0, 87.0, 153.0, 246.0, 521.0, 1001.0, 2619.0, 7526.0, 33484.0, 213308.0, 654861.0, 107166.0, 18867.0, 4987.0, 1812.0, 805.0, 370.0, 203.0, 118.0, 60.0, 63.0, 27.0, 22.0, 17.0, 16.0, 11.0, 4.0, 10.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.8515625, -9.5467529296875, -9.241943359375, -8.9371337890625, -8.63232421875, -8.3275146484375, -8.022705078125, -7.7178955078125, -7.4130859375, -7.1082763671875, -6.803466796875, -6.4986572265625, -6.19384765625, -5.8890380859375, -5.584228515625, -5.2794189453125, -4.974609375, -4.6697998046875, -4.364990234375, -4.0601806640625, -3.75537109375, -3.4505615234375, -3.145751953125, -2.8409423828125, -2.5361328125, -2.2313232421875, -1.926513671875, -1.6217041015625, -1.31689453125, -1.0120849609375, -0.707275390625, -0.4024658203125, -0.09765625, 0.2071533203125, 0.511962890625, 0.8167724609375, 1.12158203125, 1.4263916015625, 1.731201171875, 2.0360107421875, 2.3408203125, 2.6456298828125, 2.950439453125, 3.2552490234375, 3.56005859375, 3.8648681640625, 4.169677734375, 4.4744873046875, 4.779296875, 5.0841064453125, 5.388916015625, 5.6937255859375, 5.99853515625, 6.3033447265625, 6.608154296875, 6.9129638671875, 7.2177734375, 7.5225830078125, 7.827392578125, 8.1322021484375, 8.43701171875, 8.7418212890625, 9.046630859375, 9.3514404296875, 9.65625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 4.0, 2.0, 8.0, 13.0, 7.0, 11.0, 21.0, 24.0, 23.0, 44.0, 23.0, 43.0, 44.0, 56.0, 57.0, 61.0, 49.0, 65.0, 57.0, 47.0, 46.0, 51.0, 33.0, 55.0, 32.0, 28.0, 21.0, 22.0, 11.0, 17.0, 7.0, 9.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.484375, -14.016357421875, -13.54833984375, -13.080322265625, -12.6123046875, -12.144287109375, -11.67626953125, -11.208251953125, -10.740234375, -10.272216796875, -9.80419921875, -9.336181640625, -8.8681640625, -8.400146484375, -7.93212890625, -7.464111328125, -6.99609375, -6.528076171875, -6.06005859375, -5.592041015625, -5.1240234375, -4.656005859375, -4.18798828125, -3.719970703125, -3.251953125, -2.783935546875, -2.31591796875, -1.847900390625, -1.3798828125, -0.911865234375, -0.44384765625, 0.024169921875, 0.4921875, 0.960205078125, 1.42822265625, 1.896240234375, 2.3642578125, 2.832275390625, 3.30029296875, 3.768310546875, 4.236328125, 4.704345703125, 5.17236328125, 5.640380859375, 6.1083984375, 6.576416015625, 7.04443359375, 7.512451171875, 7.98046875, 8.448486328125, 8.91650390625, 9.384521484375, 9.8525390625, 10.320556640625, 10.78857421875, 11.256591796875, 11.724609375, 12.192626953125, 12.66064453125, 13.128662109375, 13.5966796875, 14.064697265625, 14.53271484375, 15.000732421875, 15.46875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 3.0, 9.0, 5.0, 9.0, 12.0, 24.0, 24.0, 58.0, 68.0, 102.0, 139.0, 247.0, 361.0, 586.0, 1068.0, 1879.0, 3518.0, 7019.0, 16125.0, 47420.0, 232192.0, 610915.0, 82617.0, 24015.0, 9742.0, 4570.0, 2395.0, 1340.0, 788.0, 454.0, 322.0, 185.0, 118.0, 62.0, 51.0, 37.0, 33.0, 16.0, 10.0, 10.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.744140625, -3.64349365234375, -3.5428466796875, -3.44219970703125, -3.341552734375, -3.24090576171875, -3.1402587890625, -3.03961181640625, -2.93896484375, -2.83831787109375, -2.7376708984375, -2.63702392578125, -2.536376953125, -2.43572998046875, -2.3350830078125, -2.23443603515625, -2.1337890625, -2.03314208984375, -1.9324951171875, -1.83184814453125, -1.731201171875, -1.63055419921875, -1.5299072265625, -1.42926025390625, -1.32861328125, -1.22796630859375, -1.1273193359375, -1.02667236328125, -0.926025390625, -0.82537841796875, -0.7247314453125, -0.62408447265625, -0.5234375, -0.42279052734375, -0.3221435546875, -0.22149658203125, -0.120849609375, -0.02020263671875, 0.0804443359375, 0.18109130859375, 0.28173828125, 0.38238525390625, 0.4830322265625, 0.58367919921875, 0.684326171875, 0.78497314453125, 0.8856201171875, 0.98626708984375, 1.0869140625, 1.18756103515625, 1.2882080078125, 1.38885498046875, 1.489501953125, 1.59014892578125, 1.6907958984375, 1.79144287109375, 1.89208984375, 1.99273681640625, 2.0933837890625, 2.19403076171875, 2.294677734375, 2.39532470703125, 2.4959716796875, 2.59661865234375, 2.697265625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 5.0, 11.0, 37.0, 66.0, 206.0, 401.0, 148.0, 46.0, 20.0, 16.0, 8.0, 7.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00295257568359375, -0.0028793662786483765, -0.002806156873703003, -0.0027329474687576294, -0.002659738063812256, -0.0025865286588668823, -0.002513319253921509, -0.0024401098489761353, -0.0023669004440307617, -0.002293691039085388, -0.0022204816341400146, -0.002147272229194641, -0.0020740628242492676, -0.002000853419303894, -0.0019276440143585205, -0.001854434609413147, -0.0017812252044677734, -0.0017080157995224, -0.0016348063945770264, -0.0015615969896316528, -0.0014883875846862793, -0.0014151781797409058, -0.0013419687747955322, -0.0012687593698501587, -0.0011955499649047852, -0.0011223405599594116, -0.001049131155014038, -0.0009759217500686646, -0.000902712345123291, -0.0008295029401779175, -0.0007562935352325439, -0.0006830841302871704, -0.0006098747253417969, -0.0005366653203964233, -0.0004634559154510498, -0.00039024651050567627, -0.00031703710556030273, -0.0002438277006149292, -0.00017061829566955566, -9.740889072418213e-05, -2.4199485778808594e-05, 4.900991916656494e-05, 0.00012221932411193848, 0.000195428729057312, 0.00026863813400268555, 0.0003418475389480591, 0.0004150569438934326, 0.00048826634883880615, 0.0005614757537841797, 0.0006346851587295532, 0.0007078945636749268, 0.0007811039686203003, 0.0008543133735656738, 0.0009275227785110474, 0.001000732183456421, 0.0010739415884017944, 0.001147150993347168, 0.0012203603982925415, 0.001293569803237915, 0.0013667792081832886, 0.0014399886131286621, 0.0015131980180740356, 0.0015864074230194092, 0.0016596168279647827, 0.0017328262329101562]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 7.0, 9.0, 14.0, 12.0, 24.0, 26.0, 58.0, 66.0, 90.0, 164.0, 289.0, 526.0, 1105.0, 2181.0, 4938.0, 12212.0, 35859.0, 158578.0, 660466.0, 122740.0, 30300.0, 10507.0, 4245.0, 1960.0, 962.0, 483.0, 277.0, 154.0, 103.0, 60.0, 35.0, 25.0, 13.0, 8.0, 13.0, 8.0, 9.0, 5.0, 5.0, 2.0, 2.0, 0.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.13671875, -3.030120849609375, -2.92352294921875, -2.816925048828125, -2.7103271484375, -2.603729248046875, -2.49713134765625, -2.390533447265625, -2.283935546875, -2.177337646484375, -2.07073974609375, -1.964141845703125, -1.8575439453125, -1.750946044921875, -1.64434814453125, -1.537750244140625, -1.43115234375, -1.324554443359375, -1.21795654296875, -1.111358642578125, -1.0047607421875, -0.898162841796875, -0.79156494140625, -0.684967041015625, -0.578369140625, -0.471771240234375, -0.36517333984375, -0.258575439453125, -0.1519775390625, -0.045379638671875, 0.06121826171875, 0.167816162109375, 0.2744140625, 0.381011962890625, 0.48760986328125, 0.594207763671875, 0.7008056640625, 0.807403564453125, 0.91400146484375, 1.020599365234375, 1.127197265625, 1.233795166015625, 1.34039306640625, 1.446990966796875, 1.5535888671875, 1.660186767578125, 1.76678466796875, 1.873382568359375, 1.97998046875, 2.086578369140625, 2.19317626953125, 2.299774169921875, 2.4063720703125, 2.512969970703125, 2.61956787109375, 2.726165771484375, 2.832763671875, 2.939361572265625, 3.04595947265625, 3.152557373046875, 3.2591552734375, 3.365753173828125, 3.47235107421875, 3.578948974609375, 3.685546875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0, 7.0, 7.0, 18.0, 21.0, 19.0, 26.0, 37.0, 49.0, 60.0, 83.0, 98.0, 98.0, 103.0, 87.0, 67.0, 46.0, 46.0, 24.0, 18.0, 11.0, 14.0, 12.0, 6.0, 9.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.109375, -3.993896484375, -3.87841796875, -3.762939453125, -3.6474609375, -3.531982421875, -3.41650390625, -3.301025390625, -3.185546875, -3.070068359375, -2.95458984375, -2.839111328125, -2.7236328125, -2.608154296875, -2.49267578125, -2.377197265625, -2.26171875, -2.146240234375, -2.03076171875, -1.915283203125, -1.7998046875, -1.684326171875, -1.56884765625, -1.453369140625, -1.337890625, -1.222412109375, -1.10693359375, -0.991455078125, -0.8759765625, -0.760498046875, -0.64501953125, -0.529541015625, -0.4140625, -0.298583984375, -0.18310546875, -0.067626953125, 0.0478515625, 0.163330078125, 0.27880859375, 0.394287109375, 0.509765625, 0.625244140625, 0.74072265625, 0.856201171875, 0.9716796875, 1.087158203125, 1.20263671875, 1.318115234375, 1.43359375, 1.549072265625, 1.66455078125, 1.780029296875, 1.8955078125, 2.010986328125, 2.12646484375, 2.241943359375, 2.357421875, 2.472900390625, 2.58837890625, 2.703857421875, 2.8193359375, 2.934814453125, 3.05029296875, 3.165771484375, 3.28125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 9.0, 24.0, 42.0, 85.0, 184.0, 277.0, 166.0, 85.0, 61.0, 25.0, 16.0, 7.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.4755859375, -59.53202819824219, -56.588470458984375, -53.64491271972656, -50.70135498046875, -47.75779724121094, -44.81423568725586, -41.87067794799805, -38.927120208740234, -35.98356246948242, -33.04000473022461, -30.096445083618164, -27.15288734436035, -24.20932960510254, -21.265769958496094, -18.32221221923828, -15.378654479980469, -12.435096740722656, -9.491538047790527, -6.547979354858398, -3.604421615600586, -0.6608638763427734, 2.282695770263672, 5.226253509521484, 8.169811248779297, 11.11336898803711, 14.056927680969238, 17.000486373901367, 19.94404411315918, 22.887601852416992, 25.831161499023438, 28.77471923828125, 31.71826934814453, 34.661827087402344, 37.605384826660156, 40.54894256591797, 43.49250030517578, 46.436058044433594, 49.37961959838867, 52.323177337646484, 55.2667350769043, 58.21029281616211, 61.15385055541992, 64.097412109375, 67.04096984863281, 69.98452758789062, 72.92808532714844, 75.87164306640625, 78.81520080566406, 81.75875854492188, 84.70231628417969, 87.6458740234375, 90.58943176269531, 93.53298950195312, 96.47654724121094, 99.42010498046875, 102.36366271972656, 105.30722045898438, 108.25077819824219, 111.1943359375, 114.13789367675781, 117.08145141601562, 120.02500915527344, 122.96856689453125, 125.9121322631836]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 8.0, 5.0, 8.0, 7.0, 11.0, 14.0, 14.0, 11.0, 6.0, 25.0, 27.0, 35.0, 38.0, 38.0, 44.0, 65.0, 73.0, 95.0, 104.0, 50.0, 55.0, 29.0, 40.0, 35.0, 29.0, 22.0, 21.0, 11.0, 18.0, 11.0, 10.0, 9.0, 8.0, 5.0, 5.0, 4.0, 3.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-60.09502410888672, -58.31275939941406, -56.530494689941406, -54.74822998046875, -52.96596908569336, -51.1837043762207, -49.40143966674805, -47.61917495727539, -45.8369140625, -44.054649353027344, -42.27238464355469, -40.49011993408203, -38.70785903930664, -36.925594329833984, -35.14332962036133, -33.36106491088867, -31.578800201416016, -29.79653549194336, -28.014272689819336, -26.23200798034668, -24.449745178222656, -22.66748046875, -20.885215759277344, -19.102951049804688, -17.320688247680664, -15.538424491882324, -13.756160736083984, -11.973896026611328, -10.191632270812988, -8.409368515014648, -6.627103805541992, -4.844840049743652, -3.062572479248047, -1.280308485031128, 0.501955509185791, 2.284219741821289, 4.066483497619629, 5.848747253417969, 7.631011962890625, 9.413275718688965, 11.195539474487305, 12.977803230285645, 14.760066986083984, 16.54233169555664, 18.324596405029297, 20.10685920715332, 21.889123916625977, 23.67138671875, 25.453651428222656, 27.235916137695312, 29.018178939819336, 30.800443649291992, 32.582706451416016, 34.36497116088867, 36.14723587036133, 37.929500579833984, 39.711761474609375, 41.49402618408203, 43.27629089355469, 45.058555603027344, 46.840816497802734, 48.62308120727539, 50.40534591674805, 52.1876106262207, 53.96987533569336]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 11.0, 19.0, 17.0, 38.0, 50.0, 85.0, 138.0, 237.0, 469.0, 894.0, 1932.0, 5856.0, 25745.0, 301410.0, 3163251.0, 638962.0, 42279.0, 7871.0, 2579.0, 1157.0, 548.0, 302.0, 172.0, 95.0, 67.0, 38.0, 24.0, 17.0, 4.0, 6.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.4146728515625, -4.227783203125, -4.0408935546875, -3.85400390625, -3.6671142578125, -3.480224609375, -3.2933349609375, -3.1064453125, -2.9195556640625, -2.732666015625, -2.5457763671875, -2.35888671875, -2.1719970703125, -1.985107421875, -1.7982177734375, -1.611328125, -1.4244384765625, -1.237548828125, -1.0506591796875, -0.86376953125, -0.6768798828125, -0.489990234375, -0.3031005859375, -0.1162109375, 0.0706787109375, 0.257568359375, 0.4444580078125, 0.63134765625, 0.8182373046875, 1.005126953125, 1.1920166015625, 1.37890625, 1.5657958984375, 1.752685546875, 1.9395751953125, 2.12646484375, 2.3133544921875, 2.500244140625, 2.6871337890625, 2.8740234375, 3.0609130859375, 3.247802734375, 3.4346923828125, 3.62158203125, 3.8084716796875, 3.995361328125, 4.1822509765625, 4.369140625, 4.5560302734375, 4.742919921875, 4.9298095703125, 5.11669921875, 5.3035888671875, 5.490478515625, 5.6773681640625, 5.8642578125, 6.0511474609375, 6.238037109375, 6.4249267578125, 6.61181640625, 6.7987060546875, 6.985595703125, 7.1724853515625, 7.359375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 0.0, 2.0, 6.0, 8.0, 8.0, 8.0, 6.0, 5.0, 17.0, 10.0, 21.0, 18.0, 27.0, 20.0, 40.0, 43.0, 36.0, 35.0, 56.0, 60.0, 52.0, 49.0, 59.0, 42.0, 41.0, 48.0, 31.0, 41.0, 24.0, 30.0, 24.0, 25.0, 16.0, 15.0, 18.0, 14.0, 8.0, 7.0, 10.0, 3.0, 8.0, 4.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.427734375, -3.328765869140625, -3.22979736328125, -3.130828857421875, -3.0318603515625, -2.932891845703125, -2.83392333984375, -2.734954833984375, -2.635986328125, -2.537017822265625, -2.43804931640625, -2.339080810546875, -2.2401123046875, -2.141143798828125, -2.04217529296875, -1.943206787109375, -1.84423828125, -1.745269775390625, -1.64630126953125, -1.547332763671875, -1.4483642578125, -1.349395751953125, -1.25042724609375, -1.151458740234375, -1.052490234375, -0.953521728515625, -0.85455322265625, -0.755584716796875, -0.6566162109375, -0.557647705078125, -0.45867919921875, -0.359710693359375, -0.2607421875, -0.161773681640625, -0.06280517578125, 0.036163330078125, 0.1351318359375, 0.234100341796875, 0.33306884765625, 0.432037353515625, 0.531005859375, 0.629974365234375, 0.72894287109375, 0.827911376953125, 0.9268798828125, 1.025848388671875, 1.12481689453125, 1.223785400390625, 1.32275390625, 1.421722412109375, 1.52069091796875, 1.619659423828125, 1.7186279296875, 1.817596435546875, 1.91656494140625, 2.015533447265625, 2.114501953125, 2.213470458984375, 2.31243896484375, 2.411407470703125, 2.5103759765625, 2.609344482421875, 2.70831298828125, 2.807281494140625, 2.90625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 10.0, 11.0, 37.0, 37.0, 76.0, 104.0, 250.0, 517.0, 1535.0, 13374.0, 3686654.0, 483704.0, 6049.0, 1004.0, 446.0, 205.0, 97.0, 67.0, 41.0, 25.0, 16.0, 8.0, 5.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.625, -21.97607421875, -21.3271484375, -20.67822265625, -20.029296875, -19.38037109375, -18.7314453125, -18.08251953125, -17.43359375, -16.78466796875, -16.1357421875, -15.48681640625, -14.837890625, -14.18896484375, -13.5400390625, -12.89111328125, -12.2421875, -11.59326171875, -10.9443359375, -10.29541015625, -9.646484375, -8.99755859375, -8.3486328125, -7.69970703125, -7.05078125, -6.40185546875, -5.7529296875, -5.10400390625, -4.455078125, -3.80615234375, -3.1572265625, -2.50830078125, -1.859375, -1.21044921875, -0.5615234375, 0.08740234375, 0.736328125, 1.38525390625, 2.0341796875, 2.68310546875, 3.33203125, 3.98095703125, 4.6298828125, 5.27880859375, 5.927734375, 6.57666015625, 7.2255859375, 7.87451171875, 8.5234375, 9.17236328125, 9.8212890625, 10.47021484375, 11.119140625, 11.76806640625, 12.4169921875, 13.06591796875, 13.71484375, 14.36376953125, 15.0126953125, 15.66162109375, 16.310546875, 16.95947265625, 17.6083984375, 18.25732421875, 18.90625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 10.0, 15.0, 13.0, 26.0, 45.0, 78.0, 233.0, 620.0, 1390.0, 1001.0, 380.0, 132.0, 51.0, 37.0, 18.0, 8.0, 6.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8125, -11.41552734375, -11.0185546875, -10.62158203125, -10.224609375, -9.82763671875, -9.4306640625, -9.03369140625, -8.63671875, -8.23974609375, -7.8427734375, -7.44580078125, -7.048828125, -6.65185546875, -6.2548828125, -5.85791015625, -5.4609375, -5.06396484375, -4.6669921875, -4.27001953125, -3.873046875, -3.47607421875, -3.0791015625, -2.68212890625, -2.28515625, -1.88818359375, -1.4912109375, -1.09423828125, -0.697265625, -0.30029296875, 0.0966796875, 0.49365234375, 0.890625, 1.28759765625, 1.6845703125, 2.08154296875, 2.478515625, 2.87548828125, 3.2724609375, 3.66943359375, 4.06640625, 4.46337890625, 4.8603515625, 5.25732421875, 5.654296875, 6.05126953125, 6.4482421875, 6.84521484375, 7.2421875, 7.63916015625, 8.0361328125, 8.43310546875, 8.830078125, 9.22705078125, 9.6240234375, 10.02099609375, 10.41796875, 10.81494140625, 11.2119140625, 11.60888671875, 12.005859375, 12.40283203125, 12.7998046875, 13.19677734375, 13.59375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 4.0, 9.0, 29.0, 35.0, 55.0, 101.0, 148.0, 195.0, 146.0, 116.0, 62.0, 43.0, 20.0, 10.0, 9.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-93.1906509399414, -91.10945129394531, -89.02825927734375, -86.94705963134766, -84.86585998535156, -82.78466796875, -80.7034683227539, -78.62227630615234, -76.54107666015625, -74.45987701416016, -72.3786849975586, -70.2974853515625, -68.21629333496094, -66.13509368896484, -64.05389404296875, -61.97269821166992, -59.891502380371094, -57.810306549072266, -55.72911071777344, -53.647911071777344, -51.566715240478516, -49.48551940917969, -47.404319763183594, -45.323123931884766, -43.24192810058594, -41.16073226928711, -39.07953643798828, -36.99833679199219, -34.91714096069336, -32.83594512939453, -30.75474739074707, -28.67354965209961, -26.592361450195312, -24.511165618896484, -22.429967880249023, -20.348770141601562, -18.267574310302734, -16.186378479003906, -14.105180740356445, -12.0239839553833, -9.942787170410156, -7.861590385437012, -5.780393600463867, -3.6991968154907227, -1.6180000305175781, 0.4631967544555664, 2.544393539428711, 4.6255903244018555, 6.706787109375, 8.787983894348145, 10.869180679321289, 12.950377464294434, 15.031574249267578, 17.112770080566406, 19.193967819213867, 21.275165557861328, 23.356361389160156, 25.437557220458984, 27.518754959106445, 29.599952697753906, 31.681148529052734, 33.76234436035156, 35.843544006347656, 37.924739837646484, 40.00593566894531]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 4.0, 5.0, 7.0, 8.0, 11.0, 9.0, 20.0, 19.0, 31.0, 20.0, 34.0, 40.0, 37.0, 39.0, 33.0, 39.0, 46.0, 59.0, 44.0, 47.0, 43.0, 52.0, 38.0, 41.0, 42.0, 40.0, 33.0, 31.0, 27.0, 22.0, 19.0, 7.0, 11.0, 7.0, 7.0, 7.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-34.533119201660156, -33.586387634277344, -32.6396598815918, -31.692928314208984, -30.746196746826172, -29.799467086791992, -28.852737426757812, -27.906005859375, -26.95927619934082, -26.01254653930664, -25.065814971923828, -24.11908531188965, -23.17235565185547, -22.225624084472656, -21.278894424438477, -20.332164764404297, -19.385433197021484, -18.438703536987305, -17.491971969604492, -16.545242309570312, -15.598511695861816, -14.65178108215332, -13.70505142211914, -12.758320808410645, -11.811590194702148, -10.864859580993652, -9.918128967285156, -8.971399307250977, -8.02466869354248, -7.077938079833984, -6.1312079429626465, -5.184477806091309, -4.2377471923828125, -3.2910168170928955, -2.3442864418029785, -1.3975560665130615, -0.45082569122314453, 0.49590492248535156, 1.4426350593566895, 2.3893651962280273, 3.3360958099365234, 4.2828264236450195, 5.229556560516357, 6.176286697387695, 7.123017311096191, 8.069747924804688, 9.016477584838867, 9.963208198547363, 10.90993881225586, 11.856669425964355, 12.803400039672852, 13.750129699707031, 14.696860313415527, 15.643590927124023, 16.590320587158203, 17.537052154541016, 18.483781814575195, 19.430511474609375, 20.377243041992188, 21.323972702026367, 22.270702362060547, 23.21743392944336, 24.16416358947754, 25.11089324951172, 26.05762481689453]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 5.0, 2.0, 17.0, 15.0, 48.0, 64.0, 97.0, 160.0, 278.0, 552.0, 1193.0, 2513.0, 5763.0, 14742.0, 42189.0, 135846.0, 377062.0, 313678.0, 101533.0, 32254.0, 11627.0, 4663.0, 2149.0, 970.0, 499.0, 279.0, 124.0, 80.0, 62.0, 35.0, 24.0, 12.0, 10.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.453125, -4.29339599609375, -4.1336669921875, -3.97393798828125, -3.814208984375, -3.65447998046875, -3.4947509765625, -3.33502197265625, -3.17529296875, -3.01556396484375, -2.8558349609375, -2.69610595703125, -2.536376953125, -2.37664794921875, -2.2169189453125, -2.05718994140625, -1.8974609375, -1.73773193359375, -1.5780029296875, -1.41827392578125, -1.258544921875, -1.09881591796875, -0.9390869140625, -0.77935791015625, -0.61962890625, -0.45989990234375, -0.3001708984375, -0.14044189453125, 0.019287109375, 0.17901611328125, 0.3387451171875, 0.49847412109375, 0.658203125, 0.81793212890625, 0.9776611328125, 1.13739013671875, 1.297119140625, 1.45684814453125, 1.6165771484375, 1.77630615234375, 1.93603515625, 2.09576416015625, 2.2554931640625, 2.41522216796875, 2.574951171875, 2.73468017578125, 2.8944091796875, 3.05413818359375, 3.2138671875, 3.37359619140625, 3.5333251953125, 3.69305419921875, 3.852783203125, 4.01251220703125, 4.1722412109375, 4.33197021484375, 4.49169921875, 4.65142822265625, 4.8111572265625, 4.97088623046875, 5.130615234375, 5.29034423828125, 5.4500732421875, 5.60980224609375, 5.76953125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 4.0, 7.0, 7.0, 4.0, 9.0, 14.0, 11.0, 13.0, 12.0, 20.0, 24.0, 23.0, 46.0, 35.0, 41.0, 46.0, 44.0, 54.0, 57.0, 61.0, 59.0, 41.0, 46.0, 45.0, 35.0, 36.0, 29.0, 22.0, 32.0, 29.0, 17.0, 19.0, 10.0, 7.0, 12.0, 7.0, 11.0, 3.0, 5.0, 0.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.494140625, -3.38336181640625, -3.2725830078125, -3.16180419921875, -3.051025390625, -2.94024658203125, -2.8294677734375, -2.71868896484375, -2.60791015625, -2.49713134765625, -2.3863525390625, -2.27557373046875, -2.164794921875, -2.05401611328125, -1.9432373046875, -1.83245849609375, -1.7216796875, -1.61090087890625, -1.5001220703125, -1.38934326171875, -1.278564453125, -1.16778564453125, -1.0570068359375, -0.94622802734375, -0.83544921875, -0.72467041015625, -0.6138916015625, -0.50311279296875, -0.392333984375, -0.28155517578125, -0.1707763671875, -0.05999755859375, 0.05078125, 0.16156005859375, 0.2723388671875, 0.38311767578125, 0.493896484375, 0.60467529296875, 0.7154541015625, 0.82623291015625, 0.93701171875, 1.04779052734375, 1.1585693359375, 1.26934814453125, 1.380126953125, 1.49090576171875, 1.6016845703125, 1.71246337890625, 1.8232421875, 1.93402099609375, 2.0447998046875, 2.15557861328125, 2.266357421875, 2.37713623046875, 2.4879150390625, 2.59869384765625, 2.70947265625, 2.82025146484375, 2.9310302734375, 3.04180908203125, 3.152587890625, 3.26336669921875, 3.3741455078125, 3.48492431640625, 3.595703125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 5.0, 18.0, 18.0, 21.0, 24.0, 36.0, 50.0, 82.0, 91.0, 153.0, 234.0, 372.0, 717.0, 1457.0, 3888.0, 15240.0, 91688.0, 728362.0, 171968.0, 24266.0, 5625.0, 1956.0, 923.0, 481.0, 279.0, 177.0, 133.0, 68.0, 61.0, 44.0, 33.0, 23.0, 10.0, 17.0, 10.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.25, -9.93603515625, -9.6220703125, -9.30810546875, -8.994140625, -8.68017578125, -8.3662109375, -8.05224609375, -7.73828125, -7.42431640625, -7.1103515625, -6.79638671875, -6.482421875, -6.16845703125, -5.8544921875, -5.54052734375, -5.2265625, -4.91259765625, -4.5986328125, -4.28466796875, -3.970703125, -3.65673828125, -3.3427734375, -3.02880859375, -2.71484375, -2.40087890625, -2.0869140625, -1.77294921875, -1.458984375, -1.14501953125, -0.8310546875, -0.51708984375, -0.203125, 0.11083984375, 0.4248046875, 0.73876953125, 1.052734375, 1.36669921875, 1.6806640625, 1.99462890625, 2.30859375, 2.62255859375, 2.9365234375, 3.25048828125, 3.564453125, 3.87841796875, 4.1923828125, 4.50634765625, 4.8203125, 5.13427734375, 5.4482421875, 5.76220703125, 6.076171875, 6.39013671875, 6.7041015625, 7.01806640625, 7.33203125, 7.64599609375, 7.9599609375, 8.27392578125, 8.587890625, 8.90185546875, 9.2158203125, 9.52978515625, 9.84375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 3.0, 10.0, 6.0, 7.0, 13.0, 12.0, 18.0, 28.0, 25.0, 39.0, 26.0, 39.0, 64.0, 58.0, 59.0, 50.0, 53.0, 80.0, 50.0, 55.0, 46.0, 43.0, 42.0, 22.0, 37.0, 21.0, 27.0, 12.0, 12.0, 13.0, 8.0, 8.0, 6.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.734375, -15.27783203125, -14.8212890625, -14.36474609375, -13.908203125, -13.45166015625, -12.9951171875, -12.53857421875, -12.08203125, -11.62548828125, -11.1689453125, -10.71240234375, -10.255859375, -9.79931640625, -9.3427734375, -8.88623046875, -8.4296875, -7.97314453125, -7.5166015625, -7.06005859375, -6.603515625, -6.14697265625, -5.6904296875, -5.23388671875, -4.77734375, -4.32080078125, -3.8642578125, -3.40771484375, -2.951171875, -2.49462890625, -2.0380859375, -1.58154296875, -1.125, -0.66845703125, -0.2119140625, 0.24462890625, 0.701171875, 1.15771484375, 1.6142578125, 2.07080078125, 2.52734375, 2.98388671875, 3.4404296875, 3.89697265625, 4.353515625, 4.81005859375, 5.2666015625, 5.72314453125, 6.1796875, 6.63623046875, 7.0927734375, 7.54931640625, 8.005859375, 8.46240234375, 8.9189453125, 9.37548828125, 9.83203125, 10.28857421875, 10.7451171875, 11.20166015625, 11.658203125, 12.11474609375, 12.5712890625, 13.02783203125, 13.484375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 7.0, 10.0, 21.0, 22.0, 43.0, 56.0, 108.0, 186.0, 322.0, 608.0, 1217.0, 2637.0, 6521.0, 18532.0, 74848.0, 759821.0, 140047.0, 27937.0, 8861.0, 3453.0, 1580.0, 759.0, 408.0, 208.0, 131.0, 73.0, 44.0, 36.0, 16.0, 12.0, 9.0, 4.0, 8.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.505859375, -3.398529052734375, -3.29119873046875, -3.183868408203125, -3.0765380859375, -2.969207763671875, -2.86187744140625, -2.754547119140625, -2.647216796875, -2.539886474609375, -2.43255615234375, -2.325225830078125, -2.2178955078125, -2.110565185546875, -2.00323486328125, -1.895904541015625, -1.78857421875, -1.681243896484375, -1.57391357421875, -1.466583251953125, -1.3592529296875, -1.251922607421875, -1.14459228515625, -1.037261962890625, -0.929931640625, -0.822601318359375, -0.71527099609375, -0.607940673828125, -0.5006103515625, -0.393280029296875, -0.28594970703125, -0.178619384765625, -0.0712890625, 0.036041259765625, 0.14337158203125, 0.250701904296875, 0.3580322265625, 0.465362548828125, 0.57269287109375, 0.680023193359375, 0.787353515625, 0.894683837890625, 1.00201416015625, 1.109344482421875, 1.2166748046875, 1.324005126953125, 1.43133544921875, 1.538665771484375, 1.64599609375, 1.753326416015625, 1.86065673828125, 1.967987060546875, 2.0753173828125, 2.182647705078125, 2.28997802734375, 2.397308349609375, 2.504638671875, 2.611968994140625, 2.71929931640625, 2.826629638671875, 2.9339599609375, 3.041290283203125, 3.14862060546875, 3.255950927734375, 3.36328125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 6.0, 0.0, 6.0, 13.0, 17.0, 16.0, 36.0, 54.0, 95.0, 179.0, 285.0, 120.0, 50.0, 36.0, 32.0, 18.0, 6.0, 8.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010776519775390625, -0.0010408610105514526, -0.0010040700435638428, -0.0009672790765762329, -0.000930488109588623, -0.0008936971426010132, -0.0008569061756134033, -0.0008201152086257935, -0.0007833242416381836, -0.0007465332746505737, -0.0007097423076629639, -0.000672951340675354, -0.0006361603736877441, -0.0005993694067001343, -0.0005625784397125244, -0.0005257874727249146, -0.0004889965057373047, -0.0004522055387496948, -0.00041541457176208496, -0.0003786236047744751, -0.00034183263778686523, -0.00030504167079925537, -0.0002682507038116455, -0.00023145973682403564, -0.00019466876983642578, -0.00015787780284881592, -0.00012108683586120605, -8.429586887359619e-05, -4.750490188598633e-05, -1.0713934898376465e-05, 2.60770320892334e-05, 6.286799907684326e-05, 9.965896606445312e-05, 0.000136449933052063, 0.00017324090003967285, 0.00021003186702728271, 0.0002468228340148926, 0.00028361380100250244, 0.0003204047679901123, 0.00035719573497772217, 0.00039398670196533203, 0.0004307776689529419, 0.00046756863594055176, 0.0005043596029281616, 0.0005411505699157715, 0.0005779415369033813, 0.0006147325038909912, 0.0006515234708786011, 0.0006883144378662109, 0.0007251054048538208, 0.0007618963718414307, 0.0007986873388290405, 0.0008354783058166504, 0.0008722692728042603, 0.0009090602397918701, 0.00094585120677948, 0.0009826421737670898, 0.0010194331407546997, 0.0010562241077423096, 0.0010930150747299194, 0.0011298060417175293, 0.0011665970087051392, 0.001203387975692749, 0.0012401789426803589, 0.0012769699096679688]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 8.0, 20.0, 27.0, 34.0, 65.0, 124.0, 279.0, 684.0, 1735.0, 5351.0, 24953.0, 316848.0, 659040.0, 29851.0, 6120.0, 1953.0, 720.0, 346.0, 172.0, 96.0, 45.0, 24.0, 16.0, 14.0, 6.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2421875, -5.0733642578125, -4.904541015625, -4.7357177734375, -4.56689453125, -4.3980712890625, -4.229248046875, -4.0604248046875, -3.8916015625, -3.7227783203125, -3.553955078125, -3.3851318359375, -3.21630859375, -3.0474853515625, -2.878662109375, -2.7098388671875, -2.541015625, -2.3721923828125, -2.203369140625, -2.0345458984375, -1.86572265625, -1.6968994140625, -1.528076171875, -1.3592529296875, -1.1904296875, -1.0216064453125, -0.852783203125, -0.6839599609375, -0.51513671875, -0.3463134765625, -0.177490234375, -0.0086669921875, 0.16015625, 0.3289794921875, 0.497802734375, 0.6666259765625, 0.83544921875, 1.0042724609375, 1.173095703125, 1.3419189453125, 1.5107421875, 1.6795654296875, 1.848388671875, 2.0172119140625, 2.18603515625, 2.3548583984375, 2.523681640625, 2.6925048828125, 2.861328125, 3.0301513671875, 3.198974609375, 3.3677978515625, 3.53662109375, 3.7054443359375, 3.874267578125, 4.0430908203125, 4.2119140625, 4.3807373046875, 4.549560546875, 4.7183837890625, 4.88720703125, 5.0560302734375, 5.224853515625, 5.3936767578125, 5.5625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 5.0, 6.0, 18.0, 13.0, 22.0, 37.0, 63.0, 89.0, 163.0, 176.0, 138.0, 85.0, 64.0, 31.0, 31.0, 17.0, 15.0, 9.0, 5.0, 5.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.60546875, -4.4544677734375, -4.303466796875, -4.1524658203125, -4.00146484375, -3.8504638671875, -3.699462890625, -3.5484619140625, -3.3974609375, -3.2464599609375, -3.095458984375, -2.9444580078125, -2.79345703125, -2.6424560546875, -2.491455078125, -2.3404541015625, -2.189453125, -2.0384521484375, -1.887451171875, -1.7364501953125, -1.58544921875, -1.4344482421875, -1.283447265625, -1.1324462890625, -0.9814453125, -0.8304443359375, -0.679443359375, -0.5284423828125, -0.37744140625, -0.2264404296875, -0.075439453125, 0.0755615234375, 0.2265625, 0.3775634765625, 0.528564453125, 0.6795654296875, 0.83056640625, 0.9815673828125, 1.132568359375, 1.2835693359375, 1.4345703125, 1.5855712890625, 1.736572265625, 1.8875732421875, 2.03857421875, 2.1895751953125, 2.340576171875, 2.4915771484375, 2.642578125, 2.7935791015625, 2.944580078125, 3.0955810546875, 3.24658203125, 3.3975830078125, 3.548583984375, 3.6995849609375, 3.8505859375, 4.0015869140625, 4.152587890625, 4.3035888671875, 4.45458984375, 4.6055908203125, 4.756591796875, 4.9075927734375, 5.05859375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 9.0, 23.0, 44.0, 125.0, 367.0, 250.0, 112.0, 37.0, 17.0, 10.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-140.16384887695312, -136.2601318359375, -132.3563995361328, -128.4526824951172, -124.54895782470703, -120.64523315429688, -116.74151611328125, -112.8377914428711, -108.93406677246094, -105.03034210205078, -101.12662506103516, -97.222900390625, -93.31917572021484, -89.41545104980469, -85.51173400878906, -81.6080093383789, -77.70428466796875, -73.8005599975586, -69.89684295654297, -65.99311828613281, -62.089393615722656, -58.185672760009766, -54.281951904296875, -50.37822723388672, -46.474510192871094, -42.5707893371582, -38.66706466674805, -34.763343811035156, -30.859619140625, -26.95589828491211, -23.052175521850586, -19.148452758789062, -15.244728088378906, -11.341005325317383, -7.437283039093018, -3.5335607528686523, 0.3701620101928711, 4.273883819580078, 8.177606582641602, 12.081329345703125, 15.985052108764648, 19.888774871826172, 23.792497634887695, 27.69622039794922, 31.59994125366211, 35.503662109375, 39.407386779785156, 43.31111145019531, 47.2148323059082, 51.118553161621094, 55.02227783203125, 58.92599868774414, 62.8297233581543, 66.73344421386719, 70.63716888427734, 74.5408935546875, 78.44461059570312, 82.34833526611328, 86.2520523071289, 90.15577697753906, 94.05950164794922, 97.96322631835938, 101.866943359375, 105.77066802978516, 109.67439270019531]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 8.0, 3.0, 9.0, 6.0, 6.0, 11.0, 5.0, 10.0, 8.0, 13.0, 24.0, 20.0, 17.0, 24.0, 26.0, 39.0, 35.0, 31.0, 36.0, 53.0, 77.0, 104.0, 84.0, 37.0, 46.0, 29.0, 19.0, 24.0, 23.0, 17.0, 27.0, 21.0, 20.0, 9.0, 15.0, 9.0, 5.0, 11.0, 6.0, 8.0, 5.0, 9.0, 3.0, 3.0, 3.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.3431396484375, -37.967628479003906, -36.59211730957031, -35.21660232543945, -33.84109115600586, -32.465579986572266, -31.090068817138672, -29.714555740356445, -28.33904266357422, -26.963531494140625, -25.5880184173584, -24.212507247924805, -22.836994171142578, -21.461483001708984, -20.08597183227539, -18.710458755493164, -17.33494758605957, -15.95943546295166, -14.58392333984375, -13.208412170410156, -11.83289909362793, -10.457387924194336, -9.081875801086426, -7.706363677978516, -6.3308515548706055, -4.955339431762695, -3.5798275470733643, -2.204315662384033, -0.828803539276123, 0.5467085838317871, 1.922220230102539, 3.297732353210449, 4.673244476318359, 6.0487565994262695, 7.42426872253418, 8.799779891967773, 10.17529296875, 11.550804138183594, 12.926316261291504, 14.301828384399414, 15.677340507507324, 17.052852630615234, 18.428363800048828, 19.803876876831055, 21.17938804626465, 22.554901123046875, 23.93041229248047, 25.305923461914062, 26.68143653869629, 28.056947708129883, 29.43246078491211, 30.807971954345703, 32.1834831237793, 33.558998107910156, 34.93450927734375, 36.310020446777344, 37.68553161621094, 39.06104278564453, 40.436553955078125, 41.812068939208984, 43.18758010864258, 44.56309127807617, 45.938602447509766, 47.314117431640625, 48.68962860107422]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 4.0, 14.0, 10.0, 15.0, 22.0, 23.0, 50.0, 57.0, 80.0, 144.0, 206.0, 318.0, 608.0, 1130.0, 2336.0, 5147.0, 14899.0, 65149.0, 508961.0, 2612558.0, 850565.0, 99557.0, 20184.0, 6456.0, 2672.0, 1268.0, 692.0, 407.0, 257.0, 159.0, 97.0, 62.0, 44.0, 28.0, 35.0, 20.0, 16.0, 8.0, 10.0, 4.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.97265625, -4.81536865234375, -4.6580810546875, -4.50079345703125, -4.343505859375, -4.18621826171875, -4.0289306640625, -3.87164306640625, -3.71435546875, -3.55706787109375, -3.3997802734375, -3.24249267578125, -3.085205078125, -2.92791748046875, -2.7706298828125, -2.61334228515625, -2.4560546875, -2.29876708984375, -2.1414794921875, -1.98419189453125, -1.826904296875, -1.66961669921875, -1.5123291015625, -1.35504150390625, -1.19775390625, -1.04046630859375, -0.8831787109375, -0.72589111328125, -0.568603515625, -0.41131591796875, -0.2540283203125, -0.09674072265625, 0.060546875, 0.21783447265625, 0.3751220703125, 0.53240966796875, 0.689697265625, 0.84698486328125, 1.0042724609375, 1.16156005859375, 1.31884765625, 1.47613525390625, 1.6334228515625, 1.79071044921875, 1.947998046875, 2.10528564453125, 2.2625732421875, 2.41986083984375, 2.5771484375, 2.73443603515625, 2.8917236328125, 3.04901123046875, 3.206298828125, 3.36358642578125, 3.5208740234375, 3.67816162109375, 3.83544921875, 3.99273681640625, 4.1500244140625, 4.30731201171875, 4.464599609375, 4.62188720703125, 4.7791748046875, 4.93646240234375, 5.09375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 1.0, 2.0, 6.0, 6.0, 7.0, 6.0, 14.0, 12.0, 15.0, 17.0, 18.0, 17.0, 21.0, 21.0, 37.0, 38.0, 39.0, 35.0, 34.0, 46.0, 54.0, 37.0, 44.0, 46.0, 42.0, 47.0, 39.0, 33.0, 32.0, 35.0, 27.0, 24.0, 20.0, 22.0, 19.0, 15.0, 13.0, 10.0, 7.0, 11.0, 7.0, 12.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8671875, -2.775909423828125, -2.68463134765625, -2.593353271484375, -2.5020751953125, -2.410797119140625, -2.31951904296875, -2.228240966796875, -2.136962890625, -2.045684814453125, -1.95440673828125, -1.863128662109375, -1.7718505859375, -1.680572509765625, -1.58929443359375, -1.498016357421875, -1.40673828125, -1.315460205078125, -1.22418212890625, -1.132904052734375, -1.0416259765625, -0.950347900390625, -0.85906982421875, -0.767791748046875, -0.676513671875, -0.585235595703125, -0.49395751953125, -0.402679443359375, -0.3114013671875, -0.220123291015625, -0.12884521484375, -0.037567138671875, 0.0537109375, 0.144989013671875, 0.23626708984375, 0.327545166015625, 0.4188232421875, 0.510101318359375, 0.60137939453125, 0.692657470703125, 0.783935546875, 0.875213623046875, 0.96649169921875, 1.057769775390625, 1.1490478515625, 1.240325927734375, 1.33160400390625, 1.422882080078125, 1.51416015625, 1.605438232421875, 1.69671630859375, 1.787994384765625, 1.8792724609375, 1.970550537109375, 2.06182861328125, 2.153106689453125, 2.244384765625, 2.335662841796875, 2.42694091796875, 2.518218994140625, 2.6094970703125, 2.700775146484375, 2.79205322265625, 2.883331298828125, 2.974609375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 14.0, 19.0, 22.0, 36.0, 59.0, 93.0, 149.0, 295.0, 1210.0, 11293.0, 3010223.0, 1160799.0, 8378.0, 1018.0, 330.0, 142.0, 74.0, 41.0, 32.0, 19.0, 10.0, 8.0, 9.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.171875, -20.4404296875, -19.708984375, -18.9775390625, -18.24609375, -17.5146484375, -16.783203125, -16.0517578125, -15.3203125, -14.5888671875, -13.857421875, -13.1259765625, -12.39453125, -11.6630859375, -10.931640625, -10.2001953125, -9.46875, -8.7373046875, -8.005859375, -7.2744140625, -6.54296875, -5.8115234375, -5.080078125, -4.3486328125, -3.6171875, -2.8857421875, -2.154296875, -1.4228515625, -0.69140625, 0.0400390625, 0.771484375, 1.5029296875, 2.234375, 2.9658203125, 3.697265625, 4.4287109375, 5.16015625, 5.8916015625, 6.623046875, 7.3544921875, 8.0859375, 8.8173828125, 9.548828125, 10.2802734375, 11.01171875, 11.7431640625, 12.474609375, 13.2060546875, 13.9375, 14.6689453125, 15.400390625, 16.1318359375, 16.86328125, 17.5947265625, 18.326171875, 19.0576171875, 19.7890625, 20.5205078125, 21.251953125, 21.9833984375, 22.71484375, 23.4462890625, 24.177734375, 24.9091796875, 25.640625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 8.0, 9.0, 35.0, 38.0, 57.0, 118.0, 213.0, 419.0, 854.0, 1059.0, 633.0, 288.0, 140.0, 69.0, 45.0, 29.0, 21.0, 12.0, 10.0, 5.0, 5.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-17.390625, -17.006591796875, -16.62255859375, -16.238525390625, -15.8544921875, -15.470458984375, -15.08642578125, -14.702392578125, -14.318359375, -13.934326171875, -13.55029296875, -13.166259765625, -12.7822265625, -12.398193359375, -12.01416015625, -11.630126953125, -11.24609375, -10.862060546875, -10.47802734375, -10.093994140625, -9.7099609375, -9.325927734375, -8.94189453125, -8.557861328125, -8.173828125, -7.789794921875, -7.40576171875, -7.021728515625, -6.6376953125, -6.253662109375, -5.86962890625, -5.485595703125, -5.1015625, -4.717529296875, -4.33349609375, -3.949462890625, -3.5654296875, -3.181396484375, -2.79736328125, -2.413330078125, -2.029296875, -1.645263671875, -1.26123046875, -0.877197265625, -0.4931640625, -0.109130859375, 0.27490234375, 0.658935546875, 1.04296875, 1.427001953125, 1.81103515625, 2.195068359375, 2.5791015625, 2.963134765625, 3.34716796875, 3.731201171875, 4.115234375, 4.499267578125, 4.88330078125, 5.267333984375, 5.6513671875, 6.035400390625, 6.41943359375, 6.803466796875, 7.1875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 0.0, 3.0, 4.0, 10.0, 24.0, 33.0, 56.0, 63.0, 97.0, 121.0, 137.0, 161.0, 91.0, 66.0, 28.0, 38.0, 19.0, 9.0, 7.0, 5.0, 7.0, 7.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.34293746948242, -47.481319427490234, -45.61970520019531, -43.758087158203125, -41.89646911621094, -40.03485107421875, -38.17323684692383, -36.31161880493164, -34.45000457763672, -32.58838653564453, -30.726770401000977, -28.865154266357422, -27.003536224365234, -25.14192008972168, -23.280303955078125, -21.418685913085938, -19.55706787109375, -17.695451736450195, -15.833833694458008, -13.972217559814453, -12.110600471496582, -10.248983383178711, -8.387367248535156, -6.525750160217285, -4.664133071899414, -2.802516222000122, -0.9408993721008301, 0.9207172393798828, 2.782334327697754, 4.643951416015625, 6.50556755065918, 8.36718463897705, 10.228797912597656, 12.090415000915527, 13.952032089233398, 15.813648223876953, 17.67526626586914, 19.536882400512695, 21.39849853515625, 23.260116577148438, 25.121732711791992, 26.983348846435547, 28.844966888427734, 30.70658302307129, 32.568199157714844, 34.42981719970703, 36.29143524169922, 38.15304946899414, 40.01466751098633, 41.876285552978516, 43.73789978027344, 45.599517822265625, 47.46113586425781, 49.32275390625, 51.18436813354492, 53.04598617553711, 54.90760040283203, 56.76921844482422, 58.63083267211914, 60.49245071411133, 62.354068756103516, 64.21568298339844, 66.07730102539062, 67.93891906738281, 69.800537109375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 6.0, 6.0, 8.0, 7.0, 11.0, 13.0, 20.0, 20.0, 23.0, 35.0, 40.0, 48.0, 47.0, 48.0, 51.0, 60.0, 62.0, 56.0, 69.0, 59.0, 41.0, 44.0, 36.0, 39.0, 39.0, 23.0, 12.0, 19.0, 15.0, 10.0, 13.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.907562255859375, -37.520904541015625, -36.13424301147461, -34.74758529663086, -33.360923767089844, -31.974266052246094, -30.58760643005371, -29.200946807861328, -27.814289093017578, -26.427629470825195, -25.040969848632812, -23.654312133789062, -22.26765251159668, -20.880992889404297, -19.494333267211914, -18.10767364501953, -16.72101402282715, -15.334354400634766, -13.9476957321167, -12.561036109924316, -11.17437744140625, -9.787717819213867, -8.401058197021484, -7.014399528503418, -5.627739906311035, -4.2410807609558105, -2.854421377182007, -1.4677619934082031, -0.08110284805297852, 1.305556297302246, 2.692215919494629, 4.078874588012695, 5.465534210205078, 6.852193355560303, 8.238852500915527, 9.62551212310791, 11.012170791625977, 12.39883041381836, 13.785490036010742, 15.172148704528809, 16.558807373046875, 17.945466995239258, 19.33212661743164, 20.71878433227539, 22.105443954467773, 23.492103576660156, 24.87876319885254, 26.265422821044922, 27.652082443237305, 29.038742065429688, 30.42540168762207, 31.812061309814453, 33.1987190246582, 34.58538055419922, 35.97203826904297, 37.35869598388672, 38.745357513427734, 40.132015228271484, 41.5186767578125, 42.90533447265625, 44.291996002197266, 45.678653717041016, 47.06531524658203, 48.45197296142578, 49.83863067626953]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 5.0, 7.0, 10.0, 11.0, 29.0, 54.0, 96.0, 162.0, 322.0, 577.0, 1142.0, 2283.0, 4807.0, 10552.0, 25984.0, 68747.0, 192895.0, 394685.0, 218155.0, 76849.0, 29092.0, 11852.0, 5241.0, 2474.0, 1195.0, 570.0, 330.0, 175.0, 99.0, 61.0, 34.0, 34.0, 11.0, 8.0, 4.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.59375, -5.431884765625, -5.27001953125, -5.108154296875, -4.9462890625, -4.784423828125, -4.62255859375, -4.460693359375, -4.298828125, -4.136962890625, -3.97509765625, -3.813232421875, -3.6513671875, -3.489501953125, -3.32763671875, -3.165771484375, -3.00390625, -2.842041015625, -2.68017578125, -2.518310546875, -2.3564453125, -2.194580078125, -2.03271484375, -1.870849609375, -1.708984375, -1.547119140625, -1.38525390625, -1.223388671875, -1.0615234375, -0.899658203125, -0.73779296875, -0.575927734375, -0.4140625, -0.252197265625, -0.09033203125, 0.071533203125, 0.2333984375, 0.395263671875, 0.55712890625, 0.718994140625, 0.880859375, 1.042724609375, 1.20458984375, 1.366455078125, 1.5283203125, 1.690185546875, 1.85205078125, 2.013916015625, 2.17578125, 2.337646484375, 2.49951171875, 2.661376953125, 2.8232421875, 2.985107421875, 3.14697265625, 3.308837890625, 3.470703125, 3.632568359375, 3.79443359375, 3.956298828125, 4.1181640625, 4.280029296875, 4.44189453125, 4.603759765625, 4.765625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 0.0, 0.0, 3.0, 9.0, 5.0, 15.0, 10.0, 11.0, 14.0, 12.0, 21.0, 28.0, 26.0, 31.0, 25.0, 40.0, 37.0, 31.0, 33.0, 37.0, 42.0, 46.0, 42.0, 27.0, 40.0, 36.0, 40.0, 38.0, 39.0, 32.0, 29.0, 32.0, 26.0, 26.0, 19.0, 15.0, 11.0, 8.0, 14.0, 8.0, 11.0, 7.0, 11.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.951171875, -2.858123779296875, -2.76507568359375, -2.672027587890625, -2.5789794921875, -2.485931396484375, -2.39288330078125, -2.299835205078125, -2.206787109375, -2.113739013671875, -2.02069091796875, -1.927642822265625, -1.8345947265625, -1.741546630859375, -1.64849853515625, -1.555450439453125, -1.46240234375, -1.369354248046875, -1.27630615234375, -1.183258056640625, -1.0902099609375, -0.997161865234375, -0.90411376953125, -0.811065673828125, -0.718017578125, -0.624969482421875, -0.53192138671875, -0.438873291015625, -0.3458251953125, -0.252777099609375, -0.15972900390625, -0.066680908203125, 0.0263671875, 0.119415283203125, 0.21246337890625, 0.305511474609375, 0.3985595703125, 0.491607666015625, 0.58465576171875, 0.677703857421875, 0.770751953125, 0.863800048828125, 0.95684814453125, 1.049896240234375, 1.1429443359375, 1.235992431640625, 1.32904052734375, 1.422088623046875, 1.51513671875, 1.608184814453125, 1.70123291015625, 1.794281005859375, 1.8873291015625, 1.980377197265625, 2.07342529296875, 2.166473388671875, 2.259521484375, 2.352569580078125, 2.44561767578125, 2.538665771484375, 2.6317138671875, 2.724761962890625, 2.81781005859375, 2.910858154296875, 3.00390625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 8.0, 11.0, 7.0, 18.0, 14.0, 24.0, 24.0, 40.0, 69.0, 89.0, 110.0, 194.0, 272.0, 381.0, 625.0, 1024.0, 1899.0, 5051.0, 20485.0, 156625.0, 767096.0, 74843.0, 12098.0, 3524.0, 1549.0, 888.0, 534.0, 311.0, 207.0, 154.0, 110.0, 78.0, 42.0, 50.0, 26.0, 18.0, 20.0, 11.0, 10.0, 10.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.875, -11.5389404296875, -11.202880859375, -10.8668212890625, -10.53076171875, -10.1947021484375, -9.858642578125, -9.5225830078125, -9.1865234375, -8.8504638671875, -8.514404296875, -8.1783447265625, -7.84228515625, -7.5062255859375, -7.170166015625, -6.8341064453125, -6.498046875, -6.1619873046875, -5.825927734375, -5.4898681640625, -5.15380859375, -4.8177490234375, -4.481689453125, -4.1456298828125, -3.8095703125, -3.4735107421875, -3.137451171875, -2.8013916015625, -2.46533203125, -2.1292724609375, -1.793212890625, -1.4571533203125, -1.12109375, -0.7850341796875, -0.448974609375, -0.1129150390625, 0.22314453125, 0.5592041015625, 0.895263671875, 1.2313232421875, 1.5673828125, 1.9034423828125, 2.239501953125, 2.5755615234375, 2.91162109375, 3.2476806640625, 3.583740234375, 3.9197998046875, 4.255859375, 4.5919189453125, 4.927978515625, 5.2640380859375, 5.60009765625, 5.9361572265625, 6.272216796875, 6.6082763671875, 6.9443359375, 7.2803955078125, 7.616455078125, 7.9525146484375, 8.28857421875, 8.6246337890625, 8.960693359375, 9.2967529296875, 9.6328125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 8.0, 10.0, 11.0, 9.0, 18.0, 19.0, 23.0, 31.0, 53.0, 48.0, 50.0, 82.0, 64.0, 58.0, 67.0, 78.0, 70.0, 52.0, 43.0, 44.0, 39.0, 34.0, 26.0, 15.0, 12.0, 14.0, 9.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.515625, -20.9686279296875, -20.421630859375, -19.8746337890625, -19.32763671875, -18.7806396484375, -18.233642578125, -17.6866455078125, -17.1396484375, -16.5926513671875, -16.045654296875, -15.4986572265625, -14.95166015625, -14.4046630859375, -13.857666015625, -13.3106689453125, -12.763671875, -12.2166748046875, -11.669677734375, -11.1226806640625, -10.57568359375, -10.0286865234375, -9.481689453125, -8.9346923828125, -8.3876953125, -7.8406982421875, -7.293701171875, -6.7467041015625, -6.19970703125, -5.6527099609375, -5.105712890625, -4.5587158203125, -4.01171875, -3.4647216796875, -2.917724609375, -2.3707275390625, -1.82373046875, -1.2767333984375, -0.729736328125, -0.1827392578125, 0.3642578125, 0.9112548828125, 1.458251953125, 2.0052490234375, 2.55224609375, 3.0992431640625, 3.646240234375, 4.1932373046875, 4.740234375, 5.2872314453125, 5.834228515625, 6.3812255859375, 6.92822265625, 7.4752197265625, 8.022216796875, 8.5692138671875, 9.1162109375, 9.6632080078125, 10.210205078125, 10.7572021484375, 11.30419921875, 11.8511962890625, 12.398193359375, 12.9451904296875, 13.4921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 11.0, 7.0, 9.0, 10.0, 16.0, 26.0, 55.0, 67.0, 102.0, 239.0, 555.0, 1593.0, 6985.0, 66482.0, 924843.0, 40169.0, 5130.0, 1273.0, 408.0, 218.0, 113.0, 58.0, 48.0, 31.0, 24.0, 20.0, 5.0, 12.0, 5.0, 4.0, 6.0, 3.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.4609375, -5.30224609375, -5.1435546875, -4.98486328125, -4.826171875, -4.66748046875, -4.5087890625, -4.35009765625, -4.19140625, -4.03271484375, -3.8740234375, -3.71533203125, -3.556640625, -3.39794921875, -3.2392578125, -3.08056640625, -2.921875, -2.76318359375, -2.6044921875, -2.44580078125, -2.287109375, -2.12841796875, -1.9697265625, -1.81103515625, -1.65234375, -1.49365234375, -1.3349609375, -1.17626953125, -1.017578125, -0.85888671875, -0.7001953125, -0.54150390625, -0.3828125, -0.22412109375, -0.0654296875, 0.09326171875, 0.251953125, 0.41064453125, 0.5693359375, 0.72802734375, 0.88671875, 1.04541015625, 1.2041015625, 1.36279296875, 1.521484375, 1.68017578125, 1.8388671875, 1.99755859375, 2.15625, 2.31494140625, 2.4736328125, 2.63232421875, 2.791015625, 2.94970703125, 3.1083984375, 3.26708984375, 3.42578125, 3.58447265625, 3.7431640625, 3.90185546875, 4.060546875, 4.21923828125, 4.3779296875, 4.53662109375, 4.6953125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 10.0, 8.0, 16.0, 13.0, 17.0, 14.0, 30.0, 30.0, 37.0, 90.0, 155.0, 213.0, 109.0, 59.0, 50.0, 25.0, 15.0, 22.0, 22.0, 7.0, 9.0, 2.0, 8.0, 7.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0007781982421875, -0.0007507205009460449, -0.0007232427597045898, -0.0006957650184631348, -0.0006682872772216797, -0.0006408095359802246, -0.0006133317947387695, -0.0005858540534973145, -0.0005583763122558594, -0.0005308985710144043, -0.0005034208297729492, -0.00047594308853149414, -0.00044846534729003906, -0.000420987606048584, -0.0003935098648071289, -0.00036603212356567383, -0.00033855438232421875, -0.00031107664108276367, -0.0002835988998413086, -0.0002561211585998535, -0.00022864341735839844, -0.00020116567611694336, -0.00017368793487548828, -0.0001462101936340332, -0.00011873245239257812, -9.125471115112305e-05, -6.377696990966797e-05, -3.629922866821289e-05, -8.821487426757812e-06, 1.8656253814697266e-05, 4.6133995056152344e-05, 7.361173629760742e-05, 0.0001010894775390625, 0.00012856721878051758, 0.00015604496002197266, 0.00018352270126342773, 0.0002110004425048828, 0.0002384781837463379, 0.00026595592498779297, 0.00029343366622924805, 0.0003209114074707031, 0.0003483891487121582, 0.0003758668899536133, 0.00040334463119506836, 0.00043082237243652344, 0.0004583001136779785, 0.0004857778549194336, 0.0005132555961608887, 0.0005407333374023438, 0.0005682110786437988, 0.0005956888198852539, 0.000623166561126709, 0.0006506443023681641, 0.0006781220436096191, 0.0007055997848510742, 0.0007330775260925293, 0.0007605552673339844, 0.0007880330085754395, 0.0008155107498168945, 0.0008429884910583496, 0.0008704662322998047, 0.0008979439735412598, 0.0009254217147827148, 0.0009528994560241699, 0.000980377197265625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 9.0, 6.0, 9.0, 20.0, 37.0, 36.0, 57.0, 92.0, 117.0, 198.0, 334.0, 567.0, 1194.0, 2630.0, 6710.0, 22599.0, 116138.0, 765448.0, 100745.0, 20355.0, 6145.0, 2428.0, 1154.0, 591.0, 299.0, 201.0, 134.0, 76.0, 61.0, 38.0, 42.0, 13.0, 14.0, 7.0, 10.0, 13.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.85546875, -2.772613525390625, -2.68975830078125, -2.606903076171875, -2.5240478515625, -2.441192626953125, -2.35833740234375, -2.275482177734375, -2.192626953125, -2.109771728515625, -2.02691650390625, -1.944061279296875, -1.8612060546875, -1.778350830078125, -1.69549560546875, -1.612640380859375, -1.52978515625, -1.446929931640625, -1.36407470703125, -1.281219482421875, -1.1983642578125, -1.115509033203125, -1.03265380859375, -0.949798583984375, -0.866943359375, -0.784088134765625, -0.70123291015625, -0.618377685546875, -0.5355224609375, -0.452667236328125, -0.36981201171875, -0.286956787109375, -0.2041015625, -0.121246337890625, -0.03839111328125, 0.044464111328125, 0.1273193359375, 0.210174560546875, 0.29302978515625, 0.375885009765625, 0.458740234375, 0.541595458984375, 0.62445068359375, 0.707305908203125, 0.7901611328125, 0.873016357421875, 0.95587158203125, 1.038726806640625, 1.12158203125, 1.204437255859375, 1.28729248046875, 1.370147705078125, 1.4530029296875, 1.535858154296875, 1.61871337890625, 1.701568603515625, 1.784423828125, 1.867279052734375, 1.95013427734375, 2.032989501953125, 2.1158447265625, 2.198699951171875, 2.28155517578125, 2.364410400390625, 2.447265625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 13.0, 11.0, 15.0, 21.0, 35.0, 47.0, 76.0, 108.0, 126.0, 151.0, 105.0, 71.0, 60.0, 38.0, 23.0, 22.0, 19.0, 15.0, 10.0, 6.0, 6.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.953125, -2.8582763671875, -2.763427734375, -2.6685791015625, -2.57373046875, -2.4788818359375, -2.384033203125, -2.2891845703125, -2.1943359375, -2.0994873046875, -2.004638671875, -1.9097900390625, -1.81494140625, -1.7200927734375, -1.625244140625, -1.5303955078125, -1.435546875, -1.3406982421875, -1.245849609375, -1.1510009765625, -1.05615234375, -0.9613037109375, -0.866455078125, -0.7716064453125, -0.6767578125, -0.5819091796875, -0.487060546875, -0.3922119140625, -0.29736328125, -0.2025146484375, -0.107666015625, -0.0128173828125, 0.08203125, 0.1768798828125, 0.271728515625, 0.3665771484375, 0.46142578125, 0.5562744140625, 0.651123046875, 0.7459716796875, 0.8408203125, 0.9356689453125, 1.030517578125, 1.1253662109375, 1.22021484375, 1.3150634765625, 1.409912109375, 1.5047607421875, 1.599609375, 1.6944580078125, 1.789306640625, 1.8841552734375, 1.97900390625, 2.0738525390625, 2.168701171875, 2.2635498046875, 2.3583984375, 2.4532470703125, 2.548095703125, 2.6429443359375, 2.73779296875, 2.8326416015625, 2.927490234375, 3.0223388671875, 3.1171875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 7.0, 13.0, 33.0, 116.0, 491.0, 236.0, 70.0, 18.0, 7.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.6720962524414, -114.6357650756836, -109.59943389892578, -104.56310272216797, -99.52677154541016, -94.49044036865234, -89.45410919189453, -84.41777801513672, -79.3814468383789, -74.3451156616211, -69.30878448486328, -64.27245330810547, -59.236122131347656, -54.199790954589844, -49.16345977783203, -44.12712860107422, -39.090797424316406, -34.054466247558594, -29.01813507080078, -23.98180389404297, -18.945472717285156, -13.909141540527344, -8.872810363769531, -3.8364791870117188, 1.1998519897460938, 6.236183166503906, 11.272514343261719, 16.30884552001953, 21.345176696777344, 26.381507873535156, 31.41783905029297, 36.45417022705078, 41.490509033203125, 46.52684020996094, 51.56317138671875, 56.59950256347656, 61.635833740234375, 66.67216491699219, 71.70849609375, 76.74482727050781, 81.78115844726562, 86.81748962402344, 91.85382080078125, 96.89015197753906, 101.92648315429688, 106.96281433105469, 111.9991455078125, 117.03547668457031, 122.07180786132812, 127.10813903808594, 132.14447021484375, 137.18080139160156, 142.21713256835938, 147.2534637451172, 152.289794921875, 157.3261260986328, 162.36245727539062, 167.39878845214844, 172.43511962890625, 177.47145080566406, 182.50778198242188, 187.5441131591797, 192.5804443359375, 197.6167755126953, 202.65310668945312]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 2.0, 7.0, 7.0, 4.0, 9.0, 10.0, 14.0, 13.0, 11.0, 16.0, 19.0, 21.0, 27.0, 37.0, 30.0, 24.0, 36.0, 52.0, 128.0, 154.0, 70.0, 40.0, 35.0, 23.0, 28.0, 23.0, 24.0, 27.0, 18.0, 14.0, 12.0, 12.0, 9.0, 8.0, 5.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-56.93780517578125, -55.3607177734375, -53.783626556396484, -52.206539154052734, -50.62944793701172, -49.05236053466797, -47.47527313232422, -45.89818572998047, -44.32109451293945, -42.7440071105957, -41.16691589355469, -39.58982849121094, -38.01274108886719, -36.43564987182617, -34.85856246948242, -33.281471252441406, -31.704383850097656, -30.127294540405273, -28.55020523071289, -26.97311782836914, -25.396028518676758, -23.818939208984375, -22.241851806640625, -20.664762496948242, -19.08767318725586, -17.510583877563477, -15.93349552154541, -14.356407165527344, -12.779317855834961, -11.202228546142578, -9.625140190124512, -8.048051834106445, -6.4709625244140625, -4.893873691558838, -3.3167848587036133, -1.7396960258483887, -0.16260719299316406, 1.4144816398620605, 2.991570472717285, 4.568658828735352, 6.145748138427734, 7.722836971282959, 9.299925804138184, 10.87701416015625, 12.454103469848633, 14.031192779541016, 15.608281135559082, 17.18536949157715, 18.76245880126953, 20.339548110961914, 21.916637420654297, 23.493724822998047, 25.07081413269043, 26.647903442382812, 28.224990844726562, 29.802080154418945, 31.379169464111328, 32.95625686645508, 34.533348083496094, 36.110435485839844, 37.687522888183594, 39.26461410522461, 40.84170150756836, 42.418792724609375, 43.995880126953125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 5.0, 12.0, 7.0, 7.0, 19.0, 20.0, 28.0, 44.0, 70.0, 97.0, 142.0, 245.0, 368.0, 607.0, 1024.0, 1928.0, 3849.0, 8776.0, 24282.0, 99219.0, 646034.0, 2308881.0, 912529.0, 136179.0, 29837.0, 10402.0, 4372.0, 2192.0, 1254.0, 673.0, 399.0, 269.0, 172.0, 98.0, 73.0, 52.0, 33.0, 32.0, 17.0, 13.0, 12.0, 4.0, 2.0, 4.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.5234375, -5.3428955078125, -5.162353515625, -4.9818115234375, -4.80126953125, -4.6207275390625, -4.440185546875, -4.2596435546875, -4.0791015625, -3.8985595703125, -3.718017578125, -3.5374755859375, -3.35693359375, -3.1763916015625, -2.995849609375, -2.8153076171875, -2.634765625, -2.4542236328125, -2.273681640625, -2.0931396484375, -1.91259765625, -1.7320556640625, -1.551513671875, -1.3709716796875, -1.1904296875, -1.0098876953125, -0.829345703125, -0.6488037109375, -0.46826171875, -0.2877197265625, -0.107177734375, 0.0733642578125, 0.25390625, 0.4344482421875, 0.614990234375, 0.7955322265625, 0.97607421875, 1.1566162109375, 1.337158203125, 1.5177001953125, 1.6982421875, 1.8787841796875, 2.059326171875, 2.2398681640625, 2.42041015625, 2.6009521484375, 2.781494140625, 2.9620361328125, 3.142578125, 3.3231201171875, 3.503662109375, 3.6842041015625, 3.86474609375, 4.0452880859375, 4.225830078125, 4.4063720703125, 4.5869140625, 4.7674560546875, 4.947998046875, 5.1285400390625, 5.30908203125, 5.4896240234375, 5.670166015625, 5.8507080078125, 6.03125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 8.0, 8.0, 13.0, 5.0, 13.0, 14.0, 16.0, 16.0, 35.0, 21.0, 24.0, 36.0, 38.0, 25.0, 33.0, 41.0, 45.0, 46.0, 40.0, 39.0, 42.0, 53.0, 33.0, 41.0, 36.0, 35.0, 28.0, 37.0, 25.0, 22.0, 28.0, 11.0, 16.0, 9.0, 4.0, 7.0, 7.0, 5.0, 10.0, 7.0, 5.0, 5.0, 6.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.65234375, -2.567138671875, -2.48193359375, -2.396728515625, -2.3115234375, -2.226318359375, -2.14111328125, -2.055908203125, -1.970703125, -1.885498046875, -1.80029296875, -1.715087890625, -1.6298828125, -1.544677734375, -1.45947265625, -1.374267578125, -1.2890625, -1.203857421875, -1.11865234375, -1.033447265625, -0.9482421875, -0.863037109375, -0.77783203125, -0.692626953125, -0.607421875, -0.522216796875, -0.43701171875, -0.351806640625, -0.2666015625, -0.181396484375, -0.09619140625, -0.010986328125, 0.07421875, 0.159423828125, 0.24462890625, 0.329833984375, 0.4150390625, 0.500244140625, 0.58544921875, 0.670654296875, 0.755859375, 0.841064453125, 0.92626953125, 1.011474609375, 1.0966796875, 1.181884765625, 1.26708984375, 1.352294921875, 1.4375, 1.522705078125, 1.60791015625, 1.693115234375, 1.7783203125, 1.863525390625, 1.94873046875, 2.033935546875, 2.119140625, 2.204345703125, 2.28955078125, 2.374755859375, 2.4599609375, 2.545166015625, 2.63037109375, 2.715576171875, 2.80078125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 8.0, 9.0, 10.0, 31.0, 26.0, 48.0, 70.0, 131.0, 216.0, 372.0, 826.0, 2411.0, 20429.0, 4044546.0, 117929.0, 4775.0, 1250.0, 509.0, 264.0, 150.0, 91.0, 56.0, 33.0, 23.0, 15.0, 10.0, 7.0, 9.0, 1.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.9375, -28.89453125, -27.8515625, -26.80859375, -25.765625, -24.72265625, -23.6796875, -22.63671875, -21.59375, -20.55078125, -19.5078125, -18.46484375, -17.421875, -16.37890625, -15.3359375, -14.29296875, -13.25, -12.20703125, -11.1640625, -10.12109375, -9.078125, -8.03515625, -6.9921875, -5.94921875, -4.90625, -3.86328125, -2.8203125, -1.77734375, -0.734375, 0.30859375, 1.3515625, 2.39453125, 3.4375, 4.48046875, 5.5234375, 6.56640625, 7.609375, 8.65234375, 9.6953125, 10.73828125, 11.78125, 12.82421875, 13.8671875, 14.91015625, 15.953125, 16.99609375, 18.0390625, 19.08203125, 20.125, 21.16796875, 22.2109375, 23.25390625, 24.296875, 25.33984375, 26.3828125, 27.42578125, 28.46875, 29.51171875, 30.5546875, 31.59765625, 32.640625, 33.68359375, 34.7265625, 35.76953125, 36.8125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 20.0, 22.0, 21.0, 53.0, 88.0, 177.0, 368.0, 1002.0, 1276.0, 582.0, 230.0, 107.0, 60.0, 31.0, 9.0, 13.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.515625, -19.812744140625, -19.10986328125, -18.406982421875, -17.7041015625, -17.001220703125, -16.29833984375, -15.595458984375, -14.892578125, -14.189697265625, -13.48681640625, -12.783935546875, -12.0810546875, -11.378173828125, -10.67529296875, -9.972412109375, -9.26953125, -8.566650390625, -7.86376953125, -7.160888671875, -6.4580078125, -5.755126953125, -5.05224609375, -4.349365234375, -3.646484375, -2.943603515625, -2.24072265625, -1.537841796875, -0.8349609375, -0.132080078125, 0.57080078125, 1.273681640625, 1.9765625, 2.679443359375, 3.38232421875, 4.085205078125, 4.7880859375, 5.490966796875, 6.19384765625, 6.896728515625, 7.599609375, 8.302490234375, 9.00537109375, 9.708251953125, 10.4111328125, 11.114013671875, 11.81689453125, 12.519775390625, 13.22265625, 13.925537109375, 14.62841796875, 15.331298828125, 16.0341796875, 16.737060546875, 17.43994140625, 18.142822265625, 18.845703125, 19.548583984375, 20.25146484375, 20.954345703125, 21.6572265625, 22.360107421875, 23.06298828125, 23.765869140625, 24.46875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 7.0, 4.0, 7.0, 12.0, 25.0, 34.0, 45.0, 117.0, 226.0, 241.0, 144.0, 73.0, 28.0, 10.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.3430938720703, -158.51947021484375, -152.6958465576172, -146.87222290039062, -141.04859924316406, -135.2249755859375, -129.4013671875, -123.5777359008789, -117.75411224365234, -111.93048858642578, -106.10686492919922, -100.28324890136719, -94.45962524414062, -88.63600158691406, -82.8123779296875, -76.98875427246094, -71.16513061523438, -65.34150695800781, -59.51788330078125, -53.69426345825195, -47.87063980102539, -42.04701614379883, -36.22339630126953, -30.39977264404297, -24.576148986816406, -18.752525329589844, -12.928903579711914, -7.105281829833984, -1.2816581726074219, 4.541965484619141, 10.365585327148438, 16.189208984375, 22.012847900390625, 27.836471557617188, 33.66009521484375, 39.48371505737305, 45.30733871459961, 51.13096237182617, 56.95458221435547, 62.77820587158203, 68.6018295288086, 74.42545318603516, 80.24907684326172, 86.07269287109375, 91.89631652832031, 97.71994018554688, 103.54356384277344, 109.3671875, 115.19081115722656, 121.01443481445312, 126.83805847167969, 132.66168212890625, 138.4853057861328, 144.30892944335938, 150.13253784179688, 155.9561767578125, 161.77978515625, 167.60340881347656, 173.42703247070312, 179.2506561279297, 185.07427978515625, 190.8979034423828, 196.72152709960938, 202.54513549804688, 208.3687744140625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 10.0, 9.0, 5.0, 11.0, 20.0, 34.0, 38.0, 58.0, 61.0, 73.0, 71.0, 85.0, 83.0, 91.0, 61.0, 58.0, 51.0, 36.0, 29.0, 29.0, 25.0, 16.0, 13.0, 7.0, 5.0, 6.0, 2.0, 3.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-99.46734619140625, -96.44294738769531, -93.41854858398438, -90.39414978027344, -87.3697509765625, -84.34534454345703, -81.3209457397461, -78.29654693603516, -75.27214813232422, -72.24774932861328, -69.22335052490234, -66.1989517211914, -63.1745491027832, -60.150150299072266, -57.12574768066406, -54.101348876953125, -51.07695007324219, -48.05255126953125, -45.02815246582031, -42.00374984741211, -38.97935104370117, -35.954952239990234, -32.93054962158203, -29.906150817871094, -26.881752014160156, -23.85735321044922, -20.83295249938965, -17.808551788330078, -14.78415298461914, -11.759753227233887, -8.735353469848633, -5.7109527587890625, -2.6865615844726562, 0.33783817291259766, 3.3622379302978516, 6.3866376876831055, 9.41103744506836, 12.435437202453613, 15.459836959838867, 18.484237670898438, 21.508636474609375, 24.533035278320312, 27.557435989379883, 30.581836700439453, 33.60623550415039, 36.63063430786133, 39.65503692626953, 42.67943572998047, 45.703834533691406, 48.728233337402344, 51.75263214111328, 54.777034759521484, 57.80143356323242, 60.82583236694336, 63.85023498535156, 66.8746337890625, 69.89903259277344, 72.92343139648438, 75.94783020019531, 78.97222900390625, 81.99662780761719, 85.02103424072266, 88.0454330444336, 91.06983184814453, 94.09423065185547]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 7.0, 10.0, 25.0, 23.0, 37.0, 45.0, 57.0, 66.0, 114.0, 182.0, 234.0, 372.0, 580.0, 842.0, 1289.0, 2007.0, 3529.0, 5958.0, 10996.0, 21867.0, 48110.0, 120887.0, 354096.0, 291513.0, 101111.0, 41497.0, 19227.0, 9805.0, 5401.0, 3125.0, 1924.0, 1234.0, 767.0, 493.0, 349.0, 237.0, 146.0, 120.0, 86.0, 57.0, 42.0, 23.0, 14.0, 11.0, 10.0, 6.0, 3.0, 5.0, 6.0, 3.0, 3.0, 2.0], "bins": [-4.51171875, -4.382476806640625, -4.25323486328125, -4.123992919921875, -3.9947509765625, -3.865509033203125, -3.73626708984375, -3.607025146484375, -3.477783203125, -3.348541259765625, -3.21929931640625, -3.090057373046875, -2.9608154296875, -2.831573486328125, -2.70233154296875, -2.573089599609375, -2.44384765625, -2.314605712890625, -2.18536376953125, -2.056121826171875, -1.9268798828125, -1.797637939453125, -1.66839599609375, -1.539154052734375, -1.409912109375, -1.280670166015625, -1.15142822265625, -1.022186279296875, -0.8929443359375, -0.763702392578125, -0.63446044921875, -0.505218505859375, -0.3759765625, -0.246734619140625, -0.11749267578125, 0.011749267578125, 0.1409912109375, 0.270233154296875, 0.39947509765625, 0.528717041015625, 0.657958984375, 0.787200927734375, 0.91644287109375, 1.045684814453125, 1.1749267578125, 1.304168701171875, 1.43341064453125, 1.562652587890625, 1.69189453125, 1.821136474609375, 1.95037841796875, 2.079620361328125, 2.2088623046875, 2.338104248046875, 2.46734619140625, 2.596588134765625, 2.725830078125, 2.855072021484375, 2.98431396484375, 3.113555908203125, 3.2427978515625, 3.372039794921875, 3.50128173828125, 3.630523681640625, 3.759765625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 7.0, 5.0, 4.0, 4.0, 2.0, 11.0, 19.0, 18.0, 13.0, 27.0, 39.0, 37.0, 32.0, 51.0, 52.0, 43.0, 45.0, 51.0, 60.0, 48.0, 55.0, 46.0, 61.0, 41.0, 42.0, 38.0, 34.0, 27.0, 22.0, 17.0, 14.0, 12.0, 5.0, 5.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.27734375, -4.1414794921875, -4.005615234375, -3.8697509765625, -3.73388671875, -3.5980224609375, -3.462158203125, -3.3262939453125, -3.1904296875, -3.0545654296875, -2.918701171875, -2.7828369140625, -2.64697265625, -2.5111083984375, -2.375244140625, -2.2393798828125, -2.103515625, -1.9676513671875, -1.831787109375, -1.6959228515625, -1.56005859375, -1.4241943359375, -1.288330078125, -1.1524658203125, -1.0166015625, -0.8807373046875, -0.744873046875, -0.6090087890625, -0.47314453125, -0.3372802734375, -0.201416015625, -0.0655517578125, 0.0703125, 0.2061767578125, 0.342041015625, 0.4779052734375, 0.61376953125, 0.7496337890625, 0.885498046875, 1.0213623046875, 1.1572265625, 1.2930908203125, 1.428955078125, 1.5648193359375, 1.70068359375, 1.8365478515625, 1.972412109375, 2.1082763671875, 2.244140625, 2.3800048828125, 2.515869140625, 2.6517333984375, 2.78759765625, 2.9234619140625, 3.059326171875, 3.1951904296875, 3.3310546875, 3.4669189453125, 3.602783203125, 3.7386474609375, 3.87451171875, 4.0103759765625, 4.146240234375, 4.2821044921875, 4.41796875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 4.0, 5.0, 8.0, 8.0, 9.0, 6.0, 16.0, 22.0, 22.0, 41.0, 54.0, 56.0, 73.0, 97.0, 168.0, 269.0, 383.0, 810.0, 1812.0, 5321.0, 23781.0, 234301.0, 721511.0, 46078.0, 8614.0, 2480.0, 1050.0, 502.0, 315.0, 217.0, 125.0, 95.0, 64.0, 50.0, 41.0, 28.0, 23.0, 20.0, 16.0, 15.0, 11.0, 12.0, 7.0, 4.0, 4.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.38671875, -7.15716552734375, -6.9276123046875, -6.69805908203125, -6.468505859375, -6.23895263671875, -6.0093994140625, -5.77984619140625, -5.55029296875, -5.32073974609375, -5.0911865234375, -4.86163330078125, -4.632080078125, -4.40252685546875, -4.1729736328125, -3.94342041015625, -3.7138671875, -3.48431396484375, -3.2547607421875, -3.02520751953125, -2.795654296875, -2.56610107421875, -2.3365478515625, -2.10699462890625, -1.87744140625, -1.64788818359375, -1.4183349609375, -1.18878173828125, -0.959228515625, -0.72967529296875, -0.5001220703125, -0.27056884765625, -0.041015625, 0.18853759765625, 0.4180908203125, 0.64764404296875, 0.877197265625, 1.10675048828125, 1.3363037109375, 1.56585693359375, 1.79541015625, 2.02496337890625, 2.2545166015625, 2.48406982421875, 2.713623046875, 2.94317626953125, 3.1727294921875, 3.40228271484375, 3.6318359375, 3.86138916015625, 4.0909423828125, 4.32049560546875, 4.550048828125, 4.77960205078125, 5.0091552734375, 5.23870849609375, 5.46826171875, 5.69781494140625, 5.9273681640625, 6.15692138671875, 6.386474609375, 6.61602783203125, 6.8455810546875, 7.07513427734375, 7.3046875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 4.0, 6.0, 12.0, 8.0, 8.0, 9.0, 13.0, 17.0, 25.0, 14.0, 29.0, 26.0, 26.0, 41.0, 52.0, 64.0, 69.0, 81.0, 74.0, 76.0, 52.0, 51.0, 39.0, 33.0, 16.0, 24.0, 22.0, 13.0, 15.0, 13.0, 11.0, 15.0, 8.0, 8.0, 4.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7578125, -15.2735595703125, -14.789306640625, -14.3050537109375, -13.82080078125, -13.3365478515625, -12.852294921875, -12.3680419921875, -11.8837890625, -11.3995361328125, -10.915283203125, -10.4310302734375, -9.94677734375, -9.4625244140625, -8.978271484375, -8.4940185546875, -8.009765625, -7.5255126953125, -7.041259765625, -6.5570068359375, -6.07275390625, -5.5885009765625, -5.104248046875, -4.6199951171875, -4.1357421875, -3.6514892578125, -3.167236328125, -2.6829833984375, -2.19873046875, -1.7144775390625, -1.230224609375, -0.7459716796875, -0.26171875, 0.2225341796875, 0.706787109375, 1.1910400390625, 1.67529296875, 2.1595458984375, 2.643798828125, 3.1280517578125, 3.6123046875, 4.0965576171875, 4.580810546875, 5.0650634765625, 5.54931640625, 6.0335693359375, 6.517822265625, 7.0020751953125, 7.486328125, 7.9705810546875, 8.454833984375, 8.9390869140625, 9.42333984375, 9.9075927734375, 10.391845703125, 10.8760986328125, 11.3603515625, 11.8446044921875, 12.328857421875, 12.8131103515625, 13.29736328125, 13.7816162109375, 14.265869140625, 14.7501220703125, 15.234375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 3.0, 7.0, 6.0, 12.0, 18.0, 27.0, 30.0, 65.0, 102.0, 135.0, 273.0, 520.0, 1041.0, 2476.0, 7462.0, 32240.0, 800992.0, 173478.0, 20453.0, 5510.0, 1919.0, 773.0, 417.0, 208.0, 122.0, 82.0, 52.0, 39.0, 28.0, 16.0, 9.0, 13.0, 7.0, 7.0, 2.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.2294921875, -1.1896514892578125, -1.149810791015625, -1.1099700927734375, -1.07012939453125, -1.0302886962890625, -0.990447998046875, -0.9506072998046875, -0.9107666015625, -0.8709259033203125, -0.831085205078125, -0.7912445068359375, -0.75140380859375, -0.7115631103515625, -0.671722412109375, -0.6318817138671875, -0.592041015625, -0.5522003173828125, -0.512359619140625, -0.4725189208984375, -0.43267822265625, -0.3928375244140625, -0.352996826171875, -0.3131561279296875, -0.2733154296875, -0.2334747314453125, -0.193634033203125, -0.1537933349609375, -0.11395263671875, -0.0741119384765625, -0.034271240234375, 0.0055694580078125, 0.04541015625, 0.0852508544921875, 0.125091552734375, 0.1649322509765625, 0.20477294921875, 0.2446136474609375, 0.284454345703125, 0.3242950439453125, 0.3641357421875, 0.4039764404296875, 0.443817138671875, 0.4836578369140625, 0.52349853515625, 0.5633392333984375, 0.603179931640625, 0.6430206298828125, 0.682861328125, 0.7227020263671875, 0.762542724609375, 0.8023834228515625, 0.84222412109375, 0.8820648193359375, 0.921905517578125, 0.9617462158203125, 1.0015869140625, 1.0414276123046875, 1.081268310546875, 1.1211090087890625, 1.16094970703125, 1.2007904052734375, 1.240631103515625, 1.2804718017578125, 1.3203125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 7.0, 5.0, 15.0, 12.0, 9.0, 24.0, 28.0, 30.0, 42.0, 81.0, 91.0, 126.0, 165.0, 111.0, 68.0, 45.0, 29.0, 24.0, 14.0, 14.0, 12.0, 8.0, 7.0, 4.0, 9.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003459453582763672, -0.0003336705267429352, -0.0003213956952095032, -0.00030912086367607117, -0.00029684603214263916, -0.00028457120060920715, -0.00027229636907577515, -0.00026002153754234314, -0.00024774670600891113, -0.00023547187447547913, -0.00022319704294204712, -0.0002109222114086151, -0.0001986473798751831, -0.0001863725483417511, -0.0001740977168083191, -0.00016182288527488708, -0.00014954805374145508, -0.00013727322220802307, -0.00012499839067459106, -0.00011272355914115906, -0.00010044872760772705, -8.817389607429504e-05, -7.589906454086304e-05, -6.362423300743103e-05, -5.1349401473999023e-05, -3.9074569940567017e-05, -2.679973840713501e-05, -1.4524906873703003e-05, -2.250075340270996e-06, 1.002475619316101e-05, 2.2299587726593018e-05, 3.4574419260025024e-05, 4.684925079345703e-05, 5.912408232688904e-05, 7.139891386032104e-05, 8.367374539375305e-05, 9.594857692718506e-05, 0.00010822340846061707, 0.00012049823999404907, 0.00013277307152748108, 0.00014504790306091309, 0.0001573227345943451, 0.0001695975661277771, 0.0001818723976612091, 0.0001941472291946411, 0.00020642206072807312, 0.00021869689226150513, 0.00023097172379493713, 0.00024324655532836914, 0.00025552138686180115, 0.00026779621839523315, 0.00028007104992866516, 0.00029234588146209717, 0.0003046207129955292, 0.0003168955445289612, 0.0003291703760623932, 0.0003414452075958252, 0.0003537200391292572, 0.0003659948706626892, 0.0003782697021961212, 0.0003905445337295532, 0.00040281936526298523, 0.00041509419679641724, 0.00042736902832984924, 0.00043964385986328125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 1.0, 6.0, 11.0, 13.0, 11.0, 28.0, 23.0, 39.0, 49.0, 76.0, 136.0, 232.0, 387.0, 698.0, 1355.0, 2651.0, 5584.0, 13678.0, 39809.0, 268637.0, 637377.0, 48883.0, 16115.0, 6568.0, 2900.0, 1445.0, 773.0, 399.0, 271.0, 136.0, 95.0, 50.0, 43.0, 26.0, 9.0, 14.0, 9.0, 3.0, 4.0, 3.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96728515625, -0.9351272583007812, -0.9029693603515625, -0.8708114624023438, -0.838653564453125, -0.8064956665039062, -0.7743377685546875, -0.7421798706054688, -0.71002197265625, -0.6778640747070312, -0.6457061767578125, -0.6135482788085938, -0.581390380859375, -0.5492324829101562, -0.5170745849609375, -0.48491668701171875, -0.4527587890625, -0.42060089111328125, -0.3884429931640625, -0.35628509521484375, -0.324127197265625, -0.29196929931640625, -0.2598114013671875, -0.22765350341796875, -0.19549560546875, -0.16333770751953125, -0.1311798095703125, -0.09902191162109375, -0.066864013671875, -0.03470611572265625, -0.0025482177734375, 0.02960968017578125, 0.061767578125, 0.09392547607421875, 0.1260833740234375, 0.15824127197265625, 0.190399169921875, 0.22255706787109375, 0.2547149658203125, 0.28687286376953125, 0.31903076171875, 0.35118865966796875, 0.3833465576171875, 0.41550445556640625, 0.447662353515625, 0.47982025146484375, 0.5119781494140625, 0.5441360473632812, 0.5762939453125, 0.6084518432617188, 0.6406097412109375, 0.6727676391601562, 0.704925537109375, 0.7370834350585938, 0.7692413330078125, 0.8013992309570312, 0.83355712890625, 0.8657150268554688, 0.8978729248046875, 0.9300308227539062, 0.962188720703125, 0.9943466186523438, 1.0265045166015625, 1.0586624145507812, 1.0908203125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 5.0, 9.0, 5.0, 10.0, 6.0, 13.0, 17.0, 17.0, 25.0, 69.0, 82.0, 110.0, 144.0, 141.0, 107.0, 77.0, 37.0, 33.0, 16.0, 10.0, 16.0, 11.0, 5.0, 4.0, 4.0, 5.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.7490234375, -1.702728271484375, -1.65643310546875, -1.610137939453125, -1.5638427734375, -1.517547607421875, -1.47125244140625, -1.424957275390625, -1.378662109375, -1.332366943359375, -1.28607177734375, -1.239776611328125, -1.1934814453125, -1.147186279296875, -1.10089111328125, -1.054595947265625, -1.00830078125, -0.962005615234375, -0.91571044921875, -0.869415283203125, -0.8231201171875, -0.776824951171875, -0.73052978515625, -0.684234619140625, -0.637939453125, -0.591644287109375, -0.54534912109375, -0.499053955078125, -0.4527587890625, -0.406463623046875, -0.36016845703125, -0.313873291015625, -0.267578125, -0.221282958984375, -0.17498779296875, -0.128692626953125, -0.0823974609375, -0.036102294921875, 0.01019287109375, 0.056488037109375, 0.102783203125, 0.149078369140625, 0.19537353515625, 0.241668701171875, 0.2879638671875, 0.334259033203125, 0.38055419921875, 0.426849365234375, 0.47314453125, 0.519439697265625, 0.56573486328125, 0.612030029296875, 0.6583251953125, 0.704620361328125, 0.75091552734375, 0.797210693359375, 0.843505859375, 0.889801025390625, 0.93609619140625, 0.982391357421875, 1.0286865234375, 1.074981689453125, 1.12127685546875, 1.167572021484375, 1.2138671875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 12.0, 52.0, 96.0, 531.0, 192.0, 80.0, 23.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.45187377929688, -104.05889129638672, -100.66590881347656, -97.2729263305664, -93.87994384765625, -90.48696899414062, -87.09397888183594, -83.70100402832031, -80.30802154541016, -76.9150390625, -73.52205657958984, -70.12907409667969, -66.73609161376953, -63.34311294555664, -59.950130462646484, -56.557151794433594, -53.16416549682617, -49.771183013916016, -46.37820053100586, -42.98522186279297, -39.59223937988281, -36.199256896972656, -32.8062744140625, -29.413293838500977, -26.02031135559082, -22.627328872680664, -19.23434829711914, -15.841365814208984, -12.448384284973145, -9.055402755737305, -5.662420272827148, -2.269439697265625, 1.1235427856445312, 4.516524314880371, 7.909506320953369, 11.302488327026367, 14.695469856262207, 18.088451385498047, 21.481433868408203, 24.874414443969727, 28.267396926879883, 31.66037940979004, 35.05335998535156, 38.44634246826172, 41.839324951171875, 45.23230743408203, 48.62528991699219, 52.01826858520508, 55.411251068115234, 58.80423355102539, 62.19721603393555, 65.59019470214844, 68.9831771850586, 72.37615966796875, 75.7691421508789, 79.16212463378906, 82.55510711669922, 85.94808959960938, 89.34107208251953, 92.73405456542969, 96.12703704833984, 99.52001953125, 102.91299438476562, 106.30597686767578, 109.69895935058594]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 9.0, 7.0, 11.0, 11.0, 13.0, 11.0, 14.0, 25.0, 22.0, 21.0, 17.0, 34.0, 22.0, 129.0, 134.0, 48.0, 68.0, 139.0, 48.0, 35.0, 20.0, 16.0, 18.0, 15.0, 17.0, 13.0, 10.0, 12.0, 7.0, 6.0, 8.0, 4.0, 7.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-50.79786682128906, -49.41446304321289, -48.031063079833984, -46.64765930175781, -45.264259338378906, -43.880855560302734, -42.49745178222656, -41.114051818847656, -39.730648040771484, -38.34724426269531, -36.963844299316406, -35.580440521240234, -34.19704055786133, -32.813636779785156, -31.430234909057617, -30.046833038330078, -28.66343116760254, -27.280029296875, -25.89662742614746, -24.513225555419922, -23.12982177734375, -21.74641990661621, -20.363018035888672, -18.9796142578125, -17.596214294433594, -16.212812423706055, -14.8294095993042, -13.44600772857666, -12.062604904174805, -10.679203033447266, -9.295801162719727, -7.912398338317871, -6.528995513916016, -5.145593166351318, -3.7621910572052, -2.378788948059082, -0.9953866004943848, 0.3880157470703125, 1.7714176177978516, 3.154820442199707, 4.538222312927246, 5.921624660491943, 7.305027008056641, 8.68842887878418, 10.071830749511719, 11.455233573913574, 12.838635444641113, 14.222038269042969, 15.605440139770508, 16.988842010498047, 18.372243881225586, 19.755645751953125, 21.139049530029297, 22.522451400756836, 23.905853271484375, 25.289257049560547, 26.672657012939453, 28.056058883666992, 29.43946075439453, 30.822864532470703, 32.20626449584961, 33.58966827392578, 34.97306823730469, 36.35647201538086, 37.73987579345703]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 17.0, 9.0, 15.0, 20.0, 34.0, 52.0, 37.0, 54.0, 111.0, 344.0, 79.0, 62.0, 40.0, 34.0, 34.0, 19.0, 16.0, 2.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.3515625, -9.1136474609375, -8.875732421875, -8.6378173828125, -8.39990234375, -8.1619873046875, -7.924072265625, -7.6861572265625, -7.4482421875, -7.2103271484375, -6.972412109375, -6.7344970703125, -6.49658203125, -6.2586669921875, -6.020751953125, -5.7828369140625, -5.544921875, -5.3070068359375, -5.069091796875, -4.8311767578125, -4.59326171875, -4.3553466796875, -4.117431640625, -3.8795166015625, -3.6416015625, -3.4036865234375, -3.165771484375, -2.9278564453125, -2.68994140625, -2.4520263671875, -2.214111328125, -1.9761962890625, -1.73828125, -1.5003662109375, -1.262451171875, -1.0245361328125, -0.78662109375, -0.5487060546875, -0.310791015625, -0.0728759765625, 0.1650390625, 0.4029541015625, 0.640869140625, 0.8787841796875, 1.11669921875, 1.3546142578125, 1.592529296875, 1.8304443359375, 2.068359375, 2.3062744140625, 2.544189453125, 2.7821044921875, 3.02001953125, 3.2579345703125, 3.495849609375, 3.7337646484375, 3.9716796875, 4.2095947265625, 4.447509765625, 4.6854248046875, 4.92333984375, 5.1612548828125, 5.399169921875, 5.6370849609375, 5.875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 9.0, 11.0, 19.0, 16.0, 8.0, 13.0, 23.0, 32.0, 75.0, 84.0, 129.0, 243.0, 410.0, 868.0, 2506.0, 10594.0, 8305511.0, 59722.0, 5268.0, 1558.0, 626.0, 271.0, 208.0, 120.0, 81.0, 45.0, 35.0, 23.0, 19.0, 17.0, 7.0, 7.0, 7.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-54.406837463378906, -52.967220306396484, -51.52760696411133, -50.087989807128906, -48.64837646484375, -47.20875930786133, -45.769142150878906, -44.32952880859375, -42.88991165161133, -41.450294494628906, -40.01068115234375, -38.57106399536133, -37.131446838378906, -35.69183349609375, -34.25221633911133, -32.812599182128906, -31.37298583984375, -29.93337059020996, -28.493755340576172, -27.05413818359375, -25.61452293395996, -24.174907684326172, -22.73529052734375, -21.29567527770996, -19.856060028076172, -18.416444778442383, -16.976829528808594, -15.537212371826172, -14.097597122192383, -12.657981872558594, -11.218365669250488, -9.778749465942383, -8.339130401611328, -6.899514675140381, -5.459898948669434, -4.020283222198486, -2.580667495727539, -1.1410517692565918, 0.29856395721435547, 1.738180160522461, 3.17779541015625, 4.617411136627197, 6.0570268630981445, 7.496642589569092, 8.936258316040039, 10.375873565673828, 11.815489768981934, 13.255105972290039, 14.694721221923828, 16.134336471557617, 17.573951721191406, 19.013568878173828, 20.453184127807617, 21.892799377441406, 23.332416534423828, 24.772031784057617, 26.211647033691406, 27.651262283325195, 29.090877532958984, 30.530494689941406, 31.970109939575195, 33.409725189208984, 34.849342346191406, 36.28895568847656, 37.728572845458984]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 0.0, 1.0, 5.0, 4.0, 4.0, 5.0, 1.0, 6.0, 4.0, 4.0, 1.0, 10.0, 4.0, 5.0, 5.0, 4.0, 5.0, 5.0, 6.0, 4.0, 3.0, 4.0, 0.0, 5.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.792640686035156, -45.144046783447266, -42.495452880859375, -39.84686279296875, -37.19826889038086, -34.54967498779297, -31.90108299255371, -29.252490997314453, -26.603897094726562, -23.955303192138672, -21.306711196899414, -18.658119201660156, -16.009525299072266, -13.360932350158691, -10.712339401245117, -8.06374740600586, -5.415153503417969, -2.7665605545043945, -0.11796760559082031, 2.530625343322754, 5.179218292236328, 7.827811241149902, 10.476404190063477, 13.124996185302734, 15.773590087890625, 18.422183990478516, 21.070775985717773, 23.71936798095703, 26.367961883544922, 29.016555786132812, 31.66514778137207, 34.31373977661133, 36.96234130859375, 39.61093521118164, 42.25952911376953, 44.908119201660156, 47.55671310424805, 50.20530700683594, 52.85389709472656, 55.50249099731445, 58.151084899902344, 60.799678802490234, 63.448272705078125, 66.09686279296875, 68.74545288085938, 71.39405059814453, 74.04264068603516, 76.69123840332031, 79.33982849121094, 81.98841857910156, 84.63701629638672, 87.28560638427734, 89.9342041015625, 92.58279418945312, 95.23138427734375, 97.87997436523438, 100.52857208251953, 103.17716217041016, 105.82575988769531, 108.47434997558594, 111.12294006347656, 113.77153778076172, 116.42012786865234, 119.0687255859375, 121.71731567382812]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 6.0, 1.0, 4.0, 4.0, 4.0, 4.0, 8.0, 10.0, 13.0, 9.0, 17.0, 23.0, 26.0, 35.0, 36.0, 52.0, 71.0, 109.0, 147.0, 202.0, 280.0, 464.0, 703.0, 1184.0, 1978.0, 3248.0, 5947.0, 11949.0, 24309.0, 51950.0, 108293.0, 144897.0, 86700.0, 39839.0, 19073.0, 9605.0, 5069.0, 2924.0, 1693.0, 1109.0, 649.0, 517.0, 320.0, 207.0, 158.0, 125.0, 78.0, 60.0, 41.0, 39.0, 31.0, 21.0, 8.0, 5.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0], "bins": [-28.15625, -27.359375, -26.5625, -25.765625, -24.96875, -24.171875, -23.375, -22.578125, -21.78125, -20.984375, -20.1875, -19.390625, -18.59375, -17.796875, -17.0, -16.203125, -15.40625, -14.609375, -13.8125, -13.015625, -12.21875, -11.421875, -10.625, -9.828125, -9.03125, -8.234375, -7.4375, -6.640625, -5.84375, -5.046875, -4.25, -3.453125, -2.65625, -1.859375, -1.0625, -0.265625, 0.53125, 1.328125, 2.125, 2.921875, 3.71875, 4.515625, 5.3125, 6.109375, 6.90625, 7.703125, 8.5, 9.296875, 10.09375, 10.890625, 11.6875, 12.484375, 13.28125, 14.078125, 14.875, 15.671875, 16.46875, 17.265625, 18.0625, 18.859375, 19.65625, 20.453125, 21.25, 22.046875, 22.84375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 1.0, 6.0, 8.0, 10.0, 16.0, 16.0, 17.0, 21.0, 28.0, 54.0, 51.0, 71.0, 90.0, 71.0, 73.0, 80.0, 62.0, 59.0, 62.0, 49.0, 30.0, 35.0, 19.0, 20.0, 12.0, 8.0, 13.0, 5.0, 6.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8515625, -4.667236328125, -4.48291015625, -4.298583984375, -4.1142578125, -3.929931640625, -3.74560546875, -3.561279296875, -3.376953125, -3.192626953125, -3.00830078125, -2.823974609375, -2.6396484375, -2.455322265625, -2.27099609375, -2.086669921875, -1.90234375, -1.718017578125, -1.53369140625, -1.349365234375, -1.1650390625, -0.980712890625, -0.79638671875, -0.612060546875, -0.427734375, -0.243408203125, -0.05908203125, 0.125244140625, 0.3095703125, 0.493896484375, 0.67822265625, 0.862548828125, 1.046875, 1.231201171875, 1.41552734375, 1.599853515625, 1.7841796875, 1.968505859375, 2.15283203125, 2.337158203125, 2.521484375, 2.705810546875, 2.89013671875, 3.074462890625, 3.2587890625, 3.443115234375, 3.62744140625, 3.811767578125, 3.99609375, 4.180419921875, 4.36474609375, 4.549072265625, 4.7333984375, 4.917724609375, 5.10205078125, 5.286376953125, 5.470703125, 5.655029296875, 5.83935546875, 6.023681640625, 6.2080078125, 6.392333984375, 6.57666015625, 6.760986328125, 6.9453125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 3.0, 10.0, 19.0, 24.0, 65.0, 97.0, 116.0, 65.0, 32.0, 20.0, 9.0, 7.0, 8.0, 1.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-73.39955139160156, -71.52816772460938, -69.65678405761719, -67.78539276123047, -65.91400909423828, -64.0426254272461, -62.171241760253906, -60.29985427856445, -58.428466796875, -56.55708312988281, -54.68569564819336, -52.81431198120117, -50.94292449951172, -49.07154083251953, -47.200157165527344, -45.32876968383789, -43.4573860168457, -41.586002349853516, -39.71461486816406, -37.843231201171875, -35.97184371948242, -34.100460052490234, -32.22907257080078, -30.357688903808594, -28.486303329467773, -26.614917755126953, -24.743532180786133, -22.872146606445312, -21.000762939453125, -19.129375457763672, -17.257991790771484, -15.386606216430664, -13.515220642089844, -11.643835067749023, -9.772449493408203, -7.901064872741699, -6.029679298400879, -4.158293724060059, -2.2869091033935547, -0.4155235290527344, 1.455862045288086, 3.327247381210327, 5.198632717132568, 7.0700178146362305, 8.94140338897705, 10.812788963317871, 12.684173583984375, 14.555559158325195, 16.426944732666016, 18.298330307006836, 20.169715881347656, 22.041099548339844, 23.912487030029297, 25.783870697021484, 27.655256271362305, 29.526641845703125, 31.398027420043945, 33.269412994384766, 35.14079666137695, 37.012184143066406, 38.883567810058594, 40.75495529174805, 42.626338958740234, 44.49772644042969, 46.369110107421875]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 2.0, 5.0, 3.0, 12.0, 7.0, 4.0, 14.0, 21.0, 15.0, 30.0, 42.0, 47.0, 51.0, 48.0, 32.0, 28.0, 20.0, 31.0, 19.0, 8.0, 6.0, 5.0, 5.0, 3.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.70725440979004, -21.948942184448242, -21.190629959106445, -20.43231773376465, -19.67400550842285, -18.915693283081055, -18.157379150390625, -17.399066925048828, -16.64075469970703, -15.882442474365234, -15.124130249023438, -14.36581802368164, -13.607505798339844, -12.849193572998047, -12.090880393981934, -11.332568168640137, -10.574256896972656, -9.81594467163086, -9.057632446289062, -8.299320220947266, -7.5410075187683105, -6.782695293426514, -6.024382591247559, -5.266070365905762, -4.507758140563965, -3.749445915222168, -2.991133451461792, -2.232820987701416, -1.4745087623596191, -0.7161965370178223, 0.04211616516113281, 0.8004283905029297, 1.5587406158447266, 2.3170528411865234, 3.0753653049468994, 3.8336777687072754, 4.591989994049072, 5.350302219390869, 6.108614921569824, 6.866927146911621, 7.625239372253418, 8.383551597595215, 9.141863822937012, 9.900177001953125, 10.658489227294922, 11.416801452636719, 12.175113677978516, 12.933425903320312, 13.69173812866211, 14.450050354003906, 15.208362579345703, 15.9666748046875, 16.724987030029297, 17.483299255371094, 18.24161148071289, 18.999923706054688, 19.758235931396484, 20.51654815673828, 21.274860382080078, 22.033172607421875, 22.791484832763672, 23.54979705810547, 24.308109283447266, 25.066421508789062, 25.824735641479492]}, "eval/loss": 1.837830901145935, "eval/wer": 0.2812177707259024, "eval/runtime": 833.3263, "eval/samples_per_second": 3.17, "eval/steps_per_second": 0.397} \ No newline at end of file